wp1.7-soa-benchmark/plot_benchmarks.py at main · cern-nextgen/wp1.7-soa-benchmark · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
import matplotlib.pyplot as plt
from matplotlib.ticker import FuncFormatter
import pandas as pd
import subprocess
import sys
import os
import json
import math
import re

def read_data(filename):
    """
    Reads the Google Benchmark data from a JSON file and returns a DataFrame.

    Only rows whose "run_type" is "aggregate" are kept. A "benchmark" column
    is added, derived from each row's "name": the second '/'-separated
    component is taken, and from it the second '_'-separated token
    (e.g. "fixture/BM_stencil/1024_mean" -> "stencil").

    Args:
        filename: Path of the JSON file; it must contain a top-level
            "benchmarks" list whose entries have "real_time", "run_type"
            and "name" fields.

    Returns:
        A new DataFrame of the aggregate rows, with "real_time" cast to
        float and the extra "benchmark" column.

    Raises:
        IndexError: If an aggregate row's name does not have the
            "<a>/<b>_<benchmark>..." shape described above.
    """
    # JSON is UTF-8 by specification; do not depend on the locale default.
    with open(filename, "r", encoding="utf-8") as read_file:
        data = json.load(read_file)

    df = pd.DataFrame.from_dict(data["benchmarks"]).astype({"real_time": float})
    # Take an explicit copy of the filtered rows: assigning a new column to a
    # boolean-mask selection otherwise triggers pandas' SettingWithCopyWarning.
    df = df[df["run_type"] == "aggregate"].copy()
    df["benchmark"] = df["name"].apply(lambda x: x.split('/')[1].split('_')[1])
    return df

def plot_per_benchmark(all_data, out_dir):
    """
    Generates one plot per benchmark, comparing all SoA variants.

    For every benchmark name found in any of the DataFrames, the "mean"
    rows of each variant are drawn as one line (real time against number of
    elements) with the "stddev" rows as error bars, and the figure is saved
    as "<out_dir>/<benchmark>_comparison.png".

    Args:
        all_data: Sequence of (DataFrame, label) pairs. It is iterated more
            than once, so it must not be a one-shot iterator. Each DataFrame
            needs the columns "benchmark", "aggregate_name", "n_elem",
            "real_time" and "time_unit".
        out_dir: Directory the PNG files are written to.
    """
    all_benchmarks = set()
    for df, _ in all_data:
        all_benchmarks.update(df["benchmark"].unique())

    # Sorted so files are produced in a reproducible order (set order is not).
    for benchmark in sorted(all_benchmarks):
        # Collect what will be drawn first, so ticks and units are taken from
        # the variants actually plotted rather than from whichever variant
        # happened to be iterated last.
        series = []
        for df, soa_label in all_data:
            is_benchmark = df["benchmark"] == benchmark
            df_mean = df[is_benchmark & (df["aggregate_name"] == "mean")]
            df_std = df[is_benchmark & (df["aggregate_name"] == "stddev")]

            if df_mean.empty:
                continue

            series.append((soa_label, df_mean, df_std))

        if not series:
            # No variant has mean rows for this benchmark: nothing to draw.
            continue

        fig, ax = plt.subplots(figsize=(10, 6))

        x_ticks = set()
        for soa_label, df_mean, df_std in series:
            ax.errorbar(df_mean['n_elem'], df_mean['real_time'], yerr=df_std["real_time"],
                        ls="-", marker="o", label=soa_label)
            x_ticks.update(df_mean['n_elem'].unique())
        x_ticks = sorted(x_ticks)

        ax.set_title(f'{benchmark}')
        ax.set_xlabel('Number of Elements')
        ax.set_xscale('symlog')
        # One tick per measured size, across all plotted variants.
        ax.set_xticks(x_ticks, labels=["{:g}".format(x) for x in x_ticks], minor=False)

        # The unit is read from the first plotted variant.
        time_unit = series[0][1]["time_unit"].iloc[0]
        ax.set_ylabel(f'Real Time ({time_unit})')
        ax.set_yscale('log')
        ax.yaxis.set_major_formatter(FuncFormatter(lambda y, _: '{:g}'.format(y)))

        ax.legend()

        out_file = f'{out_dir}/{benchmark}_comparison.png'
        fig.savefig(out_file)
        # Release the figure; otherwise one figure per benchmark stays alive
        # in pyplot's registry for the rest of the run.
        plt.close(fig)
        print(f"Saved to {out_file}")


def plot_per_version(df, title, out_dir, min_y=-0.000001, max_y=1000):
    """
    Generates one plot per version, comparing all benchmarks.

    Each benchmark in ``df`` is drawn as one line (mean real time against
    number of elements) with the "stddev" rows as error bars. The figure is
    saved as "<out_dir>/<title with spaces replaced by underscores>.png".

    Args:
        df: DataFrame with the columns "benchmark", "aggregate_name",
            "n_elem", "real_time" and "time_unit".
        title: Plot title; also used to build the output file name.
        out_dir: Directory the PNG file is written to.
        min_y: Lower y-axis limit. Non-positive values (including the
            default) cannot be shown on the logarithmic axis, so the lower
            limit is then left to matplotlib's autoscaling.
        max_y: Upper y-axis limit, handled the same way.
    """
    df_all_means = df[df["aggregate_name"] == "mean"]
    if df_all_means.empty:
        # Nothing can be drawn, and ticks/units cannot be derived either.
        print(f"No mean results to plot for {title}")
        return

    # Set the figure size
    fig, ax = plt.subplots(figsize=(10, 6))

    # Plot the data
    for bm in df["benchmark"].unique():
        # Filter the DataFrame for the current benchmark
        df_mean = df[(df["benchmark"] == bm) & (df["aggregate_name"] == "mean")]
        df_std = df[(df["benchmark"] == bm) & (df["aggregate_name"] == "stddev")]

        if df_mean.empty:
            continue

        ax.errorbar(df_mean['n_elem'].astype(int), df_mean['real_time'], yerr=df_std["real_time"],
                    ls="-", marker="o", label=bm)

    # Set the title and labels
    ax.set_title(title)
    ax.set_xlabel('Number of Elements')
    ax.set_xscale('symlog')
    # Ticks cover the sizes of every benchmark, not only the last one drawn.
    x_ticks = sorted(df_all_means['n_elem'].unique())
    ax.set_xticks(x_ticks, labels=["{:g}".format(x) for x in x_ticks], minor=False)

    ax.set_ylabel(f'Real Time ({df["time_unit"].iloc[0]})')
    ax.set_yscale('log')
    ax.yaxis.set_major_formatter(FuncFormatter(lambda y, _: '{:g}'.format(y)))
    # A log axis rejects non-positive limits (matplotlib warns and ignores
    # them); pass None instead so that limit is simply left automatic.
    bottom = min_y if min_y is not None and min_y > 0 else None
    top = max_y if max_y is not None and max_y > 0 else None
    ax.set_ylim(bottom=bottom, top=top)

    # Add a legend
    ax.legend()

    # Save the plot and release the figure
    out_file = f'{out_dir}/{title.replace(" ", "_")}.png'
    fig.savefig(out_file)
    plt.close(fig)
    print(f"Saved to {out_file}")

def main(argv=None):
    """
    Command-line entry point: plots every result set listed in a CSV file.

    The CSV file must have a "version" column (JSON file name without the
    ".json" suffix, looked up inside the output directory) and a "label"
    column (legend/title text). One comparison plot per benchmark and one
    plot per version are written to the output directory.

    Args:
        argv: Argument list in ``sys.argv`` layout
            (program name, output_dir, csvfile). Defaults to ``sys.argv``.

    Raises:
        SystemExit: With status 1 when the arguments are missing or the CSV
            file lists no result sets.
    """
    argv = sys.argv if argv is None else argv

    # Validate the arguments before touching argv[1]; otherwise a bare
    # invocation dies with IndexError instead of showing the usage text.
    if len(argv) < 3:
        print("python plot_benchmarks.py <output_dir> <csvfile>")
        print("Provide a CSV file with the SoA Json files to plot and their labels")
        sys.exit(1)

    print("Plotting the benchmark results...")

    output_dir, csvfile = argv[1], argv[2]

    soa_versions = pd.read_csv(csvfile)
    all_results = []
    for _, row in soa_versions.iterrows():
        df = read_data(f"{output_dir}/{row['version']}.json")
        # Labels become titles and file names, so make sure they are text.
        all_results.append((df, str(row['label'])))

    if not all_results:
        print(f"No SoA versions listed in {csvfile}")
        sys.exit(1)

    plot_per_benchmark(all_results, output_dir)

    # Gather the positive mean timings of all versions. NaN (a version
    # without mean rows) and zero are dropped because log10 cannot take them.
    mean_times = [
        t
        for df, _ in all_results
        for t in df.loc[df["aggregate_name"] == "mean", "real_time"]
        if t > 0
    ]
    if not mean_times:
        print("No positive mean timings found; skipping the per-version plots")
        return

    # Round the y-axis up/down to the nearest power of 10
    max_y = 10 ** math.ceil(math.log10(max(mean_times)))
    min_y = 10 ** math.floor(math.log10(min(mean_times)))
    for df, label in all_results:
        plot_per_version(df, label, output_dir, min_y, max_y)


if __name__ == "__main__":
    main()