igerber
diff --git a/benchmarks/speed_review/README.md b/benchmarks/speed_review/README.md
Lines changed: 10 additions & 4 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_large_python.json b/benchmarks/speed_review/baselines/brand_awareness_survey_large_python.json
Lines changed: 59 additions & 0 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_large_rust.json b/benchmarks/speed_review/baselines/brand_awareness_survey_large_rust.json
Lines changed: 59 additions & 0 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_medium_python.json b/benchmarks/speed_review/baselines/brand_awareness_survey_medium_python.json
Lines changed: 59 additions & 0 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_medium_rust.json b/benchmarks/speed_review/baselines/brand_awareness_survey_medium_rust.json
Lines changed: 59 additions & 0 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_python.json b/benchmarks/speed_review/baselines/brand_awareness_survey_small_python.json
rename from benchmarks/speed_review/baselines/brand_awareness_survey_python.json
rename to benchmarks/speed_review/baselines/brand_awareness_survey_small_python.json
Lines changed: 10 additions & 9 deletions
diff --git a/benchmarks/speed_review/baselines/brand_awareness_survey_rust.json b/benchmarks/speed_review/baselines/brand_awareness_survey_small_rust.json
rename from benchmarks/speed_review/baselines/brand_awareness_survey_rust.json
rename to benchmarks/speed_review/baselines/brand_awareness_survey_small_rust.json
Lines changed: 10 additions & 9 deletions
@@ -1,4 +1,4 @@
-# Speed Review — Practitioner Workflow Benchmarks
+# Speed Review - Practitioner Workflow Benchmarks
 
 Scenario-driven performance measurement for end-to-end practitioner chains,
 as distinct from `benchmarks/run_benchmarks.py` which measures R-parity on
@@ -47,19 +47,25 @@ to regenerate the full flame when needed.
 # One-time install
 pip install pyinstrument
 
-# All scenarios, both backends
+# All scenarios, both backends, all scales
 python benchmarks/speed_review/run_all.py
 
-# One scenario, one backend
+# One scenario, one backend (the script runs its full scale sweep internally)
 DIFF_DIFF_BACKEND=rust python benchmarks/speed_review/bench_campaign_staggered.py
 
 # Subset
 python benchmarks/speed_review/run_all.py --scenarios brfss_panel geo_few_markets
 ```
 
+Multi-scale scenarios write one output file per scale
+(e.g. `campaign_staggered_small_rust.json`, `..._medium_rust.json`,
+`..._large_rust.json`). Single-scale scenarios write a single file with no
+scale suffix (e.g. `dose_response_rust.json`). Full runtime for all scales ×
+both backends is ~90 seconds on Apple Silicon M4.
+
 ## Where to look for findings
 
-[`docs/performance-plan.md`](../../docs/performance-plan.md) — "Practitioner
+[`docs/performance-plan.md`](../../docs/performance-plan.md) - "Practitioner
 Workflow Baseline (v3.1.3)" section holds per-scenario hot-phase rankings
 and action recommendations. The scenarios here are the measurement surface;
 the findings doc is the decision output.
 
@@ -0,0 +1,59 @@
+{
+  "scenario": "brand_awareness_survey_large",
+  "backend": "python",
+  "has_rust_backend": false,
+  "total_seconds": 0.7940070000000001,
+  "phases": {
+    "1_naive_fit_no_survey_design": {
+      "seconds": 0.013499665999999966,
+      "ok": true,
+      "error": null
+    },
+    "2_tsl_strata_psu_fpc": {
+      "seconds": 0.03187458300000001,
+      "ok": true,
+      "error": null
+    },
+    "3_replicate_weights_brr": {
+      "seconds": 0.3442796670000001,
+      "ok": true,
+      "error": null
+    },
+    "4_multi_outcome_loop_3_metrics": {
+      "seconds": 0.19682533299999982,
+      "ok": true,
+      "error": null
+    },
+    "5_check_parallel_trends": {
+      "seconds": 0.030179500000000026,
+      "ok": true,
+      "error": null
+    },
+    "6_placebo_refit_pre_period": {
+      "seconds": 0.043751333999999975,
+      "ok": true,
+      "error": null
+    },
+    "7_event_study_plus_honest_did": {
+      "seconds": 0.13358487500000016,
+      "ok": true,
+      "error": null
+    }
+  },
+  "metadata": {
+    "scale": "large",
+    "n_units": 1000,
+    "n_periods": 12,
+    "n_obs": 12000,
+    "n_strata": 20,
+    "n_psu_per_stratum": 8,
+    "n_replicate_weights": 160,
+    "outcomes": [
+      "outcome",
+      "consideration",
+      "purchase_intent"
+    ]
+  },
+  "diff_diff_version": "3.1.3",
+  "numpy_version": "2.0.2"
+}
@@ -0,0 +1,59 @@
+{
+  "scenario": "brand_awareness_survey_large",
+  "backend": "rust",
+  "has_rust_backend": true,
+  "total_seconds": 0.828119375,
+  "phases": {
+    "1_naive_fit_no_survey_design": {
+      "seconds": 0.014049749999999861,
+      "ok": true,
+      "error": null
+    },
+    "2_tsl_strata_psu_fpc": {
+      "seconds": 0.029422499999999907,
+      "ok": true,
+      "error": null
+    },
+    "3_replicate_weights_brr": {
+      "seconds": 0.36754912500000003,
+      "ok": true,
+      "error": null
+    },
+    "4_multi_outcome_loop_3_metrics": {
+      "seconds": 0.16490987499999998,
+      "ok": true,
+      "error": null
+    },
+    "5_check_parallel_trends": {
+      "seconds": 0.03375229199999996,
+      "ok": true,
+      "error": null
+    },
+    "6_placebo_refit_pre_period": {
+      "seconds": 0.06475750000000025,
+      "ok": true,
+      "error": null
+    },
+    "7_event_study_plus_honest_did": {
+      "seconds": 0.15367104200000004,
+      "ok": true,
+      "error": null
+    }
+  },
+  "metadata": {
+    "scale": "large",
+    "n_units": 1000,
+    "n_periods": 12,
+    "n_obs": 12000,
+    "n_strata": 20,
+    "n_psu_per_stratum": 8,
+    "n_replicate_weights": 160,
+    "outcomes": [
+      "outcome",
+      "consideration",
+      "purchase_intent"
+    ]
+  },
+  "diff_diff_version": "3.1.3",
+  "numpy_version": "2.0.2"
+}
@@ -0,0 +1,59 @@
+{
+  "scenario": "brand_awareness_survey_medium",
+  "backend": "python",
+  "has_rust_backend": false,
+  "total_seconds": 0.48956791599999994,
+  "phases": {
+    "1_naive_fit_no_survey_design": {
+      "seconds": 0.01289191699999992,
+      "ok": true,
+      "error": null
+    },
+    "2_tsl_strata_psu_fpc": {
+      "seconds": 0.035409875000000035,
+      "ok": true,
+      "error": null
+    },
+    "3_replicate_weights_brr": {
+      "seconds": 0.12633833299999997,
+      "ok": true,
+      "error": null
+    },
+    "4_multi_outcome_loop_3_metrics": {
+      "seconds": 0.17774295900000003,
+      "ok": true,
+      "error": null
+    },
+    "5_check_parallel_trends": {
+      "seconds": 0.018629792000000034,
+      "ok": true,
+      "error": null
+    },
+    "6_placebo_refit_pre_period": {
+      "seconds": 0.0519646250000001,
+      "ok": true,
+      "error": null
+    },
+    "7_event_study_plus_honest_did": {
+      "seconds": 0.06657341699999986,
+      "ok": true,
+      "error": null
+    }
+  },
+  "metadata": {
+    "scale": "medium",
+    "n_units": 500,
+    "n_periods": 12,
+    "n_obs": 6000,
+    "n_strata": 15,
+    "n_psu_per_stratum": 6,
+    "n_replicate_weights": 90,
+    "outcomes": [
+      "outcome",
+      "consideration",
+      "purchase_intent"
+    ]
+  },
+  "diff_diff_version": "3.1.3",
+  "numpy_version": "2.0.2"
+}
@@ -0,0 +1,59 @@
+{
+  "scenario": "brand_awareness_survey_medium",
+  "backend": "rust",
+  "has_rust_backend": true,
+  "total_seconds": 0.535454792,
+  "phases": {
+    "1_naive_fit_no_survey_design": {
+      "seconds": 0.011897708999999979,
+      "ok": true,
+      "error": null
+    },
+    "2_tsl_strata_psu_fpc": {
+      "seconds": 0.03526237499999996,
+      "ok": true,
+      "error": null
+    },
+    "3_replicate_weights_brr": {
+      "seconds": 0.185435083,
+      "ok": true,
+      "error": null
+    },
+    "4_multi_outcome_loop_3_metrics": {
+      "seconds": 0.14044966699999994,
+      "ok": true,
+      "error": null
+    },
+    "5_check_parallel_trends": {
+      "seconds": 0.019051875000000162,
+      "ok": true,
+      "error": null
+    },
+    "6_placebo_refit_pre_period": {
+      "seconds": 0.05337804200000007,
+      "ok": true,
+      "error": null
+    },
+    "7_event_study_plus_honest_did": {
+      "seconds": 0.08997387500000009,
+      "ok": true,
+      "error": null
+    }
+  },
+  "metadata": {
+    "scale": "medium",
+    "n_units": 500,
+    "n_periods": 12,
+    "n_obs": 6000,
+    "n_strata": 15,
+    "n_psu_per_stratum": 6,
+    "n_replicate_weights": 90,
+    "outcomes": [
+      "outcome",
+      "consideration",
+      "purchase_intent"
+    ]
+  },
+  "diff_diff_version": "3.1.3",
+  "numpy_version": "2.0.2"
+}
@@ -1,46 +1,47 @@
 {
-  "scenario": "brand_awareness_survey",
+  "scenario": "brand_awareness_survey_small",
   "backend": "python",
   "has_rust_backend": false,
-  "total_seconds": 0.18850491600000008,
+  "total_seconds": 0.15087129199999993,
   "phases": {
     "1_naive_fit_no_survey_design": {
-      "seconds": 0.0016701670000000002,
+      "seconds": 0.0017902499999999932,
       "ok": true,
       "error": null
     },
     "2_tsl_strata_psu_fpc": {
-      "seconds": 0.006741541999999989,
+      "seconds": 0.00610949999999999,
       "ok": true,
       "error": null
     },
     "3_replicate_weights_brr": {
-      "seconds": 0.014424250000000027,
+      "seconds": 0.02120725000000001,
       "ok": true,
       "error": null
     },
     "4_multi_outcome_loop_3_metrics": {
-      "seconds": 0.043619666,
+      "seconds": 0.011621500000000062,
       "ok": true,
       "error": null
     },
     "5_check_parallel_trends": {
-      "seconds": 0.00915220799999994,
+      "seconds": 0.001833375000000026,
       "ok": true,
       "error": null
     },
     "6_placebo_refit_pre_period": {
-      "seconds": 0.029268290999999946,
+      "seconds": 0.027076792000000016,
       "ok": true,
       "error": null
     },
     "7_event_study_plus_honest_did": {
-      "seconds": 0.08362433400000002,
+      "seconds": 0.081212583,
       "ok": true,
       "error": null
     }
   },
   "metadata": {
+    "scale": "small",
     "n_units": 200,
     "n_periods": 12,
     "n_obs": 2400,
 
@@ -1,46 +1,47 @@
 {
-  "scenario": "brand_awareness_survey",
+  "scenario": "brand_awareness_survey_small",
   "backend": "rust",
   "has_rust_backend": true,
-  "total_seconds": 0.16800324999999994,
+  "total_seconds": 0.200881125,
   "phases": {
     "1_naive_fit_no_survey_design": {
-      "seconds": 0.0018907079999999077,
+      "seconds": 0.0018462080000000158,
       "ok": true,
       "error": null
     },
     "2_tsl_strata_psu_fpc": {
-      "seconds": 0.006109541999999912,
+      "seconds": 0.005704333000000061,
       "ok": true,
       "error": null
     },
     "3_replicate_weights_brr": {
-      "seconds": 0.01849195799999992,
+      "seconds": 0.015561500000000006,
       "ok": true,
       "error": null
     },
     "4_multi_outcome_loop_3_metrics": {
-      "seconds": 0.02723191700000005,
+      "seconds": 0.05937758399999993,
       "ok": true,
       "error": null
     },
     "5_check_parallel_trends": {
-      "seconds": 0.009134625000000063,
+      "seconds": 0.00939004099999996,
       "ok": true,
       "error": null
     },
     "6_placebo_refit_pre_period": {
-      "seconds": 0.024182666999999936,
+      "seconds": 0.025794415999999987,
       "ok": true,
       "error": null
     },
     "7_event_study_plus_honest_did": {
-      "seconds": 0.08095333299999996,
+      "seconds": 0.08319054199999998,
       "ok": true,
       "error": null
     }
   },
   "metadata": {
+    "scale": "small",
     "n_units": 200,
     "n_periods": 12,
     "n_obs": 2400,