-
Notifications
You must be signed in to change notification settings - Fork 1
/
plot_copy_at_scale_benchmark.py
61 lines (47 loc) · 2.14 KB
/
plot_copy_at_scale_benchmark.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
import argparse
from pathlib import Path
import numpy as np
import pandas as pd
import matplotlib as mpl
import matplotlib.pyplot as plt
def parse_args():
parser = argparse.ArgumentParser(
description="Plot results from copy-at-scale benchmarks."
)
parser.add_argument(
"--benchmarks-file",
type=str,
help="Filepath to a benchmarks CSV file.",
required=True
)
return parser.parse_args()
def num_to_kM(val, pos):
if val < 1e3:
return f"{val:.0f}"
if 1e3 <= val < 1e6:
return f"{val/1e3:.0f}k"
elif 1e6 <= val < 1e9:
return f"{val/1e6:.0f}M"
def main(args):
df = pd.read_csv(args.benchmarks_file)
def plot(ax, method, rate, table_type, label, color):
dfq = df.query(f"method == '{method}' and table_type == '{table_type}'").sort_values(by="hour")
rows_inserted = dfq["num_rows"].cumsum() / 1e6
insert_rate = dfq[rate]
insert_rate_smoothed = insert_rate.rolling(window=10, min_periods=1).mean()
ax.scatter(rows_inserted, insert_rate, marker=".", color=color, alpha=0.2)
ax.hlines(dfq[rate].mean(), 0, rows_inserted.max(), color=color, alpha=0.5)
ax.plot(rows_inserted, insert_rate_smoothed, color=color, label=label)
fig, ax = plt.subplots(figsize=(8, 6))
plot(ax, "psycopg3", "rate_full", "regular", label="psycopg3 (regular table)", color="tab:blue")
plot(ax, "psycopg3", "rate_full", "hyper", label="psycopg3 (hypertable)", color="tab:orange")
plot(ax, "copy_csv", "rate_full", "regular", label="copy_csv (regular table)", color="tab:green")
plot(ax, "copy_csv", "rate_full", "hyper", label="copy_csv (hypertable)", color="tab:red")
ax.yaxis.set_major_formatter(mpl.ticker.FuncFormatter(num_to_kM))
ax.set_xlabel("Rows inserted (millions)")
ax.set_ylabel("Overall insert rate (rows per second)")
ax.legend(frameon=False, ncol=2, loc="upper center", bbox_to_anchor=(0.5, 1.15))
output_filename = Path(args.benchmarks_file).with_suffix(".png")
fig.savefig(output_filename, dpi=200, transparent=False, bbox_inches="tight")
if __name__ == "__main__":
main(parse_args())