Benchmark stats v2 #542

Open · wants to merge 27 commits into base: main
Commits (27)
2c47332
working on benchmark framework with t-test analysis
Erotemic May 9, 2022
da64282
Working on benchmarks with details statistical analysis
Erotemic May 23, 2022
d036df2
Port datasets
Erotemic May 26, 2022
daf8913
log scale
Erotemic May 26, 2022
68c4a55
Reorganize as separate module
Erotemic May 26, 2022
a89bc27
add support for loads and complex object bench
Erotemic May 26, 2022
4d0f705
wip
Erotemic May 27, 2022
3159c00
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 27, 2022
78cbf7e
tweaks
Erotemic May 29, 2022
470f440
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 29, 2022
3b29b74
wip
Erotemic May 29, 2022
a2fbbf1
Merge branch 'benchmark_stats_v2' of github.com:Erotemic/ultrajson in…
Erotemic May 29, 2022
283b5e5
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 29, 2022
03ae1b8
use aggregate mean std to plot errors
Erotemic May 29, 2022
eee2a5f
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 29, 2022
bd592fd
Refactor core into measures and analysis submodules
Erotemic May 29, 2022
2b2aedb
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 29, 2022
b0bc25a
Add simd libraries
Erotemic May 29, 2022
80d0960
Fix cysimdjson
Erotemic May 29, 2022
7dbb203
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 29, 2022
9358a54
name fix
Erotemic May 29, 2022
10ed58b
wip
Erotemic May 29, 2022
9196d05
wip
Erotemic May 29, 2022
2f3070d
wip
Erotemic May 29, 2022
ac5b143
stats for fix-encode-surrogates
Erotemic May 31, 2022
fd951a3
[pre-commit.ci] auto fixes from pre-commit.com hooks
pre-commit-ci[bot] May 31, 2022
a580404
Fixed bug
Erotemic Jan 17, 2024
Empty file added: json_benchmarks/__init__.py
8 changes: 8 additions & 0 deletions json_benchmarks/__main__.py
@@ -0,0 +1,8 @@
if __name__ == "__main__":
    """
    CommandLine:
        python -m json_benchmarks
    """
    from json_benchmarks import core

    core.main()
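
For orientation: this entry point only requires that json_benchmarks.core expose a main() callable. A minimal illustrative stand-in is sketched below; it is not the PR's actual core module (which this page does not show), just the interface __main__.py relies on.

# json_benchmarks/core.py -- illustrative stub only, not the module added by this PR
def main():
    # The real main() runs the benchmark suite; this stub merely satisfies the interface.
    print("json_benchmarks: nothing to do in this stub")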
116 changes: 116 additions & 0 deletions json_benchmarks/analysis.py
@@ -0,0 +1,116 @@
"""
The analysis of the measurements
"""
import scriptconfig as scfg
import ubelt as ub


class AnalysisConfig(scfg.Config):
    default = {
        "cache_dir": scfg.Value(
            None,
            help=ub.paragraph(
                """
                Location for benchmark cache.
                Defaults to $XDG_CACHE/ujson/benchmark_results/
                """
            ),
        ),
    }

    def normalize(self):
        dpath = self["cache_dir"]
        if dpath is None:
            dpath = ub.Path.appdir("ujson/benchmark_results")
        dpath = ub.Path(dpath)
        self["cache_dir"] = dpath


def analyze_results(result_fpaths):
    import json

    from json_benchmarks import benchmarker
    from json_benchmarks.benchmarker import util_stats

    results = []
    for fpath in ub.ProgIter(result_fpaths, desc="load results"):
        data = json.loads(fpath.read_text())
        for row in data["rows"]:
            result = benchmarker.BenchmarkerResult.load(fpath)
            results.extend(result.to_result_list())

    RECORD_ALL = 0
    metric_key = "time" if RECORD_ALL else "mean_time"

    # results = benchmark.result.to_result_list()

    analysis = benchmarker.result_analysis.ResultAnalysis(
        results,
        metrics=[metric_key],
        params=["impl", "impl_version"],
        metric_objectives={
            "min_time": "min",
            "mean_time": "min",
            "time": "min",
        },
    )
    analysis.analysis()

    table = analysis.table
    stats_table = util_stats.aggregate_stats(
        table, suffix="_time", group_keys=["name", "impl_version"]
    )

    single_size = stats_table[
        (stats_table["size"] == 256) | stats_table["size"].isnull()
    ]
    # single_size_combo = aggregate_stats(single_size, None)
    single_size_combo = util_stats.aggregate_stats(
        single_size, suffix="_time", group_keys=["name", "impl_version"]
    )

    param_group = ["impl", "impl_version"]
    single_size_combo["calls/sec"] = 1 / single_size_combo["mean_time"]
    # _single_size_combo = single_size_combo.copy()
    time_piv = single_size_combo.pivot(["input", "func"], param_group, "mean_time")

    hz_piv = 1 / time_piv
    # hzstr_piv = (1 / time_piv).applymap(lambda x: f"{x:,.02f}")
    print("Table for size=256")
    # print(hzstr_piv.to_markdown())
    print(hz_piv.to_markdown(floatfmt=",.02f"))
    print("")
    print("Above metrics are in call/sec, larger is better.")

    speedup_piv = hz_piv / hz_piv["json"].values
    print(speedup_piv.to_markdown(floatfmt=",.02g"))

    analysis.abalate(param_group)
    # benchmark_analysis(rows, xlabel, group_labels, basis, RECORD_ALL)

    xlabel = "size"
    # Set these to empty lists if they are not used
    group_labels = {
        "fig": ["input"],
        "col": ["func"],
        # "fig": [],
        # "col": ["func" "input"],
        "hue": ["impl", "impl_version"],
        "size": [],
    }
    import kwplot

    kwplot.autosns()
    self = analysis  # NOQA

    data = stats_table
    plots = analysis.plot(
        xlabel,
        metric_key,
        group_labels,
        xscale="log",
        yscale="log",
        data=data,
    )
    plots
    kwplot.show_if_requested()
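
A minimal sketch of driving the analysis above directly, assuming results have already been cached. The explicit normalize() call and the *.json glob pattern are assumptions for illustration; in the PR it is the core module that wires measurement and analysis together.

from json_benchmarks.analysis import AnalysisConfig, analyze_results

config = AnalysisConfig()
config.normalize()  # resolves cache_dir to $XDG_CACHE/ujson/benchmark_results/ when unset
# Hypothetical naming pattern; the real filenames come from the benchmarker's serializer.
result_fpaths = sorted(config["cache_dir"].glob("*.json"))
if result_fpaths:
    analyze_results(result_fpaths)
else:
    print(f"no cached results under {config['cache_dir']}")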
68 changes: 68 additions & 0 deletions json_benchmarks/benchmarker/__init__.py
@@ -0,0 +1,68 @@
"""
A helper module for executing, serializing, combining, and comparing benchmarks
"""

__mkinit__ = """
# Autogenerate this file
mkinit ~/code/ultrajson/json_benchmarks/benchmarker/__init__.py -w
"""

__version__ = "0.1.0"

from json_benchmarks.benchmarker import (
    benchmarker,
    process_context,
    result_analysis,
    util_json,
    util_stats,
    visualize,
)
from json_benchmarks.benchmarker.benchmarker import (
    Benchmarker,
    BenchmarkerConfig,
    BenchmarkerResult,
)
from json_benchmarks.benchmarker.process_context import ProcessContext
from json_benchmarks.benchmarker.result_analysis import (
    DEFAULT_METRIC_TO_OBJECTIVE,
    Result,
    ResultAnalysis,
    SkillTracker,
)
from json_benchmarks.benchmarker.util_json import (
    ensure_json_serializable,
    find_json_unserializable,
    indexable_allclose,
)
from json_benchmarks.benchmarker.util_stats import (
    aggregate_stats,
    combine_stats,
    combine_stats_arrs,
    stats_dict,
)
from json_benchmarks.benchmarker.visualize import benchmark_analysis

__all__ = [
    "Benchmarker",
    "BenchmarkerConfig",
    "BenchmarkerResult",
    "DEFAULT_METRIC_TO_OBJECTIVE",
    "ProcessContext",
    "Result",
    "ResultAnalysis",
    "SkillTracker",
    "aggregate_stats",
    "benchmark_analysis",
    "benchmarker",
    "combine_stats",
    "combine_stats_arrs",
    "ensure_json_serializable",
    "find_json_unserializable",
    "indexable_allclose",
    "process_context",
    "result_analysis",
    "stats_dict",
    "util_json",
    "util_stats",
    "visualize",
]
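
Because this __init__ is autogenerated with mkinit, the flat re-exports are the same objects as the submodule attributes. A quick sanity-check sketch (assuming the repository root is on the Python path):

from json_benchmarks.benchmarker import ResultAnalysis, aggregate_stats
from json_benchmarks.benchmarker import result_analysis, util_stats

# The flattened names point at the originals, so either import style can be used.
assert ResultAnalysis is result_analysis.ResultAnalysis
assert aggregate_stats is util_stats.aggregate_stats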