cppalliance · leostar0412 · May 19, 2026 · May 20, 2026 · coderabbitai · May 20, 2026
diff --git a/.github/workflows/benchmarks.yml b/.github/workflows/benchmarks.yml
@@ -0,0 +1,87 @@
+# Benchmarks workflow (manual dispatch only). Runs the pytest suite under
+# benchmarks/ against a PostgreSQL 16 service container, compares the results
+# with benchmarks/baselines.json, and uploads bench.json as an artifact.
+name: Benchmarks
+
+on:
+  workflow_dispatch:
+
+# Least privilege: nothing here writes to the repo, so read access is enough.
+permissions:
+  contents: read
+
+# A new dispatch on the same ref cancels the run that is still in progress.
+concurrency:
+  group: ${{ github.workflow }}-${{ github.ref }}
+  cancel-in-progress: true
+
+jobs:
+  benchmark:
+    runs-on: ubuntu-latest
+    timeout-minutes: 30
+
+    services:
+      postgres:
+        image: postgres:16
+        env:
+          POSTGRES_USER: postgres
+          POSTGRES_PASSWORD: postgres
+          POSTGRES_DB: postgres
+        ports:
+          - "5432:5432"
+        # Health check: the service counts as ready once pg_isready succeeds.
+        options: >-
+          --health-cmd pg_isready
+          --health-interval 10s
+          --health-timeout 5s
+          --health-retries 5
+          --shm-size=256mb
+
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      # setup-uv restores/saves the uv cache itself (and sets uv's cache
+      # directory), so a separate actions/cache step on ~/.cache/uv is not
+      # needed. The cache key is derived from the lock file below.
+      - name: Install uv
+        uses: astral-sh/setup-uv@v7
+        with:
+          python-version: "3.13"
+          enable-cache: true
+          cache-dependency-glob: requirements-dev.lock
+
+      - name: Install dependencies
+        env:
+          SETUPTOOLS_SCM_WRITE_TO_SOURCE: "1"
+        run: |
+          uv venv
+          uv pip install -r requirements-dev.lock
+          uv pip install -e .
+
+      - name: Run benchmarks
+        env:
+          # Credentials match the throwaway postgres service defined above.
+          DATABASE_URL: postgres://postgres:postgres@127.0.0.1:5432/postgres
+          SECRET_KEY: for-testing-only
+          DJANGO_SETTINGS_MODULE: config.test_settings
+          RUN_BENCHMARKS: "1"
+        run: |
+          uv run pytest benchmarks/ -m benchmark --benchmark-only \
+            --benchmark-json=bench.json -v \
+            --benchmark-disable-gc
+
+      # Runs only when every earlier step succeeded.
+      - name: Compare to baselines
+        if: success()
+        run: |
+          uv run python benchmarks/compare_to_baseline.py bench.json benchmarks/baselines.json
+
+      # always(): keep the results even if a benchmark or the comparison failed.
+      - name: Upload benchmark JSON
+        if: always()
+        uses: actions/upload-artifact@v4
+        with:
+          name: benchmark-json
+          path: bench.json
+          retention-days: 30
diff --git a/docs/Contributing.md → CONTRIBUTING.md b/docs/Contributing.md → CONTRIBUTING.md
@@ -34,11 +34,11 @@ Each Django app that has **models** provides a **`services.py`** module. This is
 | `cppa_slack_tracker` | `cppa_slack_tracker/services.py` | Slack teams, channels, messages, membership. |
 | `wg21_paper_tracker` | `wg21_paper_tracker/services.py` | WG21 papers, authors, mailings. |
 
-For a full list of functions, parameter/return types, and validation (e.g. empty `name` raises `ValueError`), see **[Service_API.md](Service_API.md)** and the per-app docs in **[service_api/](service_api/)** (index: [service_api/README.md](service_api/README.md)). DTO protocols shared across trackers are documented in **[service_api/core_protocols.md](service_api/core_protocols.md)** (generated from `core/protocols.py`).
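+For a full list of functions, parameter/return types, and validation (e.g. empty `name` raises `ValueError`), see **[docs/Service_API.md](docs/Service_API.md)** and the per-app docs in **[docs/service_api/](docs/service_api/)** (index: [docs/service_api/README.md](docs/service_api/README.md)). DTO protocols shared across trackers are documented in **[docs/service_api/core_protocols.md](docs/service_api/core_protocols.md)** (generated from `core/protocols.py`).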
 
 ### Regenerating service API docs
 
-Reference tables in `docs/service_api/*.md` are produced by **[`scripts/generate_service_docs.py`](../scripts/generate_service_docs.py)** from each app’s `services.py` and from `core/protocols.py`.
+Reference tables in `docs/service_api/*.md` are produced by **[`scripts/generate_service_docs.py`](scripts/generate_service_docs.py)** from each app’s `services.py` and from `core/protocols.py`.
 
 - **Markers:** Each file contains `<!-- SERVICE_API:GENERATED:START -->` … `<!-- SERVICE_API:GENERATED:END -->`. The script replaces **only** that region. Put hand-written notes (usage, cross-app warnings, command help) **below** the `END` marker.
 - **Regenerate locally:** `python scripts/generate_service_docs.py` (optional: `--app <django_app_label>` for one module).
@@ -65,22 +65,47 @@ Reference tables in `docs/service_api/*.md` are produced by **[`scripts/generate
 
 ### Testing
 
-- **Running tests:** From the project root, install dev deps (`pip install -r requirements-dev.lock` or `uv pip install -r requirements-dev.lock`), start the test database (`docker compose -f docker-compose.test.yml up -d`), set `DATABASE_URL` (and `SECRET_KEY` for the process) as in [README.md](../README.md#running-tests), then run `python -m pytest`. Tests **always use PostgreSQL** (`config.test_settings`); there is no SQLite fallback.
-- See [README.md](../README.md#running-tests) and [Development_guideline.md](Development_guideline.md#testing-workflow) for full commands and options.
+- **Running tests:** From the project root, install dev deps (`pip install -r requirements-dev.lock` or `uv pip install -r requirements-dev.lock`), start the test database (`docker compose -f docker-compose.test.yml up -d`), set `DATABASE_URL` (and `SECRET_KEY` for the process) as in [README.md](README.md#running-tests), then run `python -m pytest`. Tests **always use PostgreSQL** (`config.test_settings`); there is no SQLite fallback.
+- See [README.md](README.md#running-tests) and [docs/Development_guideline.md](docs/Development_guideline.md#testing-workflow) for full commands and options.
 - **Unit tests for `services.py`:** Call the service functions and assert on the database (or mocks) as needed.
 - **Other tests:** Prefer service functions when setting up data. If you must create models directly for tests, keep it in test code (e.g. fixtures or test helpers) and avoid doing the same in production code.
 
+### Performance benchmarks
+
+Throughput checks live under [`benchmarks/`](benchmarks/) and use **`pytest-benchmark`**. They are **not** collected during normal `pytest` runs: set **`RUN_BENCHMARKS=1`** so the root [`conftest.py`](conftest.py) stops ignoring that directory (see `collect_ignore`). Tests are marked with **`@pytest.mark.benchmark`**.
+
+**Prerequisites:** Same as unit tests: PostgreSQL, `DATABASE_URL`, `SECRET_KEY`, `DJANGO_SETTINGS_MODULE=config.test_settings` (see [README.md](README.md#running-tests)).
+
+**Run locally** (from repo root, with Postgres up):
+
+```bash
+export RUN_BENCHMARKS=1
+export DATABASE_URL=postgres://postgres:postgres@127.0.0.1:5433/postgres
+export SECRET_KEY=for-local-only
+export DJANGO_SETTINGS_MODULE=config.test_settings
+# Optional: batch size (default 50; match benchmarks/baselines.json "n")
+export BENCHMARK_COMMIT_N=50
+
+uv run pytest benchmarks/ -m benchmark --benchmark-only --benchmark-disable-gc \
+  --benchmark-json=bench.json -v
+uv run python benchmarks/compare_to_baseline.py bench.json benchmarks/baselines.json
+```
+
+**Baselines:** [`benchmarks/baselines.json`](benchmarks/baselines.json) stores the reference **median** wall time in seconds per scenario (for the configured `n`). The compare script fails if any measured median exceeds `baseline_median × 1.25`, i.e. is more than 25% slower than the reference. After a deliberate performance change or a CI image upgrade, update `median_seconds` (and `n` if you change `BENCHMARK_COMMIT_N`) with the `stats.median` values from the generated JSON. Take those medians from a run on the same hardware the comparison runs on (for CI, the uploaded artifact); wall times measured on a different machine are not comparable.
+
+**CI:** The [`.github/workflows/benchmarks.yml`](.github/workflows/benchmarks.yml) workflow runs on **`workflow_dispatch`** only (manual trigger). It runs the benchmarks, runs the compare step only if the preceding steps succeeded, and uploads `bench.json` as an artifact even when a step fails.
+
 ## Other guidelines
 
-- **Branching:** Create feature branches from `develop`. Open pull requests against `develop`. See [Development_guideline.md](Development_guideline.md).
+- **Branching:** Create feature branches from `develop`. Open pull requests against `develop`. See [docs/Development_guideline.md](docs/Development_guideline.md).
 - **Code style:** Use Python 3.11+ and follow Django and project conventions. Use the project’s logging (`logging.getLogger(__name__)`). Before pushing, run **`uv run pyright`** (with dev deps) for the paths covered by **`pyrightconfig.json`**, and ensure CI’s **lint** / **pyright** / **test** jobs would pass.
 - **Database:** Use the Django ORM and migrations. Writes only through the service layer as above.
-- **Docs:** Update this doc (and app `services.py` docstrings) when adding new apps or changing the write rules. After changing `services.py` or `core/protocols.py`, run `python scripts/generate_service_docs.py` and commit the updated `docs/service_api/` files.
+- **Docs:** Update this file (and app `services.py` docstrings) when adding new apps or changing the write rules. After changing `services.py` or `core/protocols.py`, run `python scripts/generate_service_docs.py` and commit the updated `docs/service_api/` files.
 
 ## Related documentation
 
-- [Service_API.md](Service_API.md) – API reference for all service layer functions.
-- [Development_guideline.md](Development_guideline.md) – Setup, workflow, adding apps.
-- [Workflow.md](Workflow.md) – Execution order and collectors.
-- [Schema.md](Schema.md) – Database schema.
-- [cross-app-dependencies.md](cross-app-dependencies.md) – Complete map of every cross-app FK, MTI, ORM read, and Python import dependency, plus `import-linter` recommendations.
+- [docs/Service_API.md](docs/Service_API.md) – API reference for all service layer functions.
+- [docs/Development_guideline.md](docs/Development_guideline.md) – Setup, workflow, adding apps.
+- [docs/Workflow.md](docs/Workflow.md) – Execution order and collectors.
+- [docs/Schema.md](docs/Schema.md) – Database schema.
+- [docs/cross-app-dependencies.md](docs/cross-app-dependencies.md) – Complete map of every cross-app FK, MTI, ORM read, and Python import dependency, plus `import-linter` recommendations.
diff --git a/README.md b/README.md
@@ -215,7 +215,7 @@ Docs are organized **by topic** (one doc per concern: workflow, workspace, servi
 - [Workspace.md](docs/Workspace.md) – Workspace layout and usage for file processing.
 - [Schema.md](docs/Schema.md) – Database schema and table relationships.
 - [Development_guideline.md](docs/Development_guideline.md) – Development setup, app requirements, and step-by-step workflow.
-- [Contributing.md](docs/Contributing.md) – Service layer (single place for writes), **regenerating service API docs** (`scripts/generate_service_docs.py`), and contributor guidelines.
+- [CONTRIBUTING.md](CONTRIBUTING.md) – Service layer (single place for writes), **regenerating service API docs** (`scripts/generate_service_docs.py`), and contributor guidelines.
 - [Service_API.md](docs/Service_API.md) – API reference and index for all service layer functions.
 - [service_api/](docs/service_api/) – Per-app service API docs (name, description, parameters, return types, validation).
 

diff --git a/bench.json b/bench.json
@@ -0,0 +1,132 @@
+{
+    "machine_info": {
+        "node": "Leos-Mac-mini.local",
+        "processor": "arm",
+        "machine": "arm64",
+        "python_compiler": "Clang 21.1.4 ",
+        "python_implementation": "CPython",
+        "python_implementation_version": "3.13.12",
+        "python_version": "3.13.12",
+        "python_build": [
+            "main",
+            "Mar 10 2026 18:26:32"
+        ],
+        "release": "25.4.0",
+        "system": "Darwin",
+        "cpu": {
+            "python_version": "3.13.12.final.0 (64 bit)",
+            "cpuinfo_version": [
+                9,
+                0,
+                0
+            ],
+            "cpuinfo_version_string": "9.0.0",
+            "arch": "ARM_8",
+            "bits": 64,
+            "count": 10,
+            "arch_string_raw": "arm64",
+            "brand_raw": "Apple M4"
+        }
+    },
+    "commit_info": {
+        "id": "7bf1b7ea6657990eef44fdb362b762abb16e41ba",
+        "time": "2026-05-18T20:05:08-04:00",
+        "author_time": "2026-05-18T20:05:08-04:00",
+        "dirty": true,
+        "project": "boost-data-collector",
+        "branch": "develop"
+    },
+    "benchmarks": [
+        {
+            "group": null,
+            "name": "test_process_commit_data_batch",
+            "fullname": "benchmarks/test_github_commits_throughput.py::test_process_commit_data_batch",
+            "params": null,
+            "param": null,
+            "extra_info": {
+                "n": 50
+            },
+            "options": {
+                "disable_gc": false,
+                "timer": "perf_counter",
+                "min_rounds": 5,
+                "max_time": 1.0,
+                "min_time": 5e-06,
+                "warmup": false
+            },
+            "stats": {
+                "min": 0.13009395799599588,
+                "max": 0.16657558304723352,
+                "mean": 0.14227045823354273,
+                "stddev": 0.01457181655810832,
+                "rounds": 5,
+                "median": 0.13689958304166794,
+                "iqr": 0.01724434396601282,
+                "q1": 0.1326302083034534,
+                "q3": 0.14987455226946622,
+                "iqr_outliers": 0,
+                "stddev_outliers": 1,
+                "outliers": "1;0",
+                "ld15iqr": 0.13009395799599588,
+                "hd15iqr": 0.16657558304723352,
+                "ops": 7.0288660936092535,
+                "total": 0.7113522911677137,
+                "data": [
+                    0.16657558304723352,
+                    0.1334756250726059,
+                    0.13009395799599588,
+                    0.13689958304166794,
+                    0.14430754201021045
+                ],
+                "iterations": 1
+            }
+        },
+        {
+            "group": null,
+            "name": "test_service_bulk_commits_and_file_changes",
+            "fullname": "benchmarks/test_service_bulk_insert.py::test_service_bulk_commits_and_file_changes",
+            "params": null,
+            "param": null,
+            "extra_info": {
+                "n": 50
+            },
+            "options": {
+                "disable_gc": false,
+                "timer": "perf_counter",
+                "min_rounds": 5,
+                "max_time": 1.0,
+                "min_time": 5e-06,
+                "warmup": false
+            },
+            "stats": {
+                "min": 0.10591337503865361,
+                "max": 0.1513816670048982,
+                "mean": 0.13538706267718226,
+                "stddev": 0.01819949434483927,
+                "rounds": 6,
+                "median": 0.14058843749808148,
+                "iqr": 0.02617037494201213,
+                "q1": 0.12384004204068333,
+                "q3": 0.15001041698269546,
+                "iqr_outliers": 0,
+                "stddev_outliers": 1,
+                "outliers": "1;0",
+                "ld15iqr": 0.10591337503865361,
+                "hd15iqr": 0.1513816670048982,
+                "ops": 7.386230118489284,
+                "total": 0.8123223760630935,
+                "data": [
+                    0.1513816670048982,
+                    0.15001041698269546,
+                    0.13251695793587714,
+                    0.12384004204068333,
+                    0.1486599170602858,
+                    0.10591337503865361
+                ],
+                "iterations": 1
+            }
+        }
+    ],
+    "datetime": "2026-05-19T18:09:23.360634+00:00",
+    "version": "5.2.3"
+}
diff --git a/benchmarks/baselines.json b/benchmarks/baselines.json
@@ -0,0 +1,13 @@
+{
+  "description": "Maximum acceptable median wall time (seconds) per scenario at BENCHMARK_COMMIT_N. Update median_seconds after intentional perf work or when CI hardware changes; copy medians from --benchmark-json stats.median.",
+  "benchmarks": {
+    "benchmarks/test_github_commits_throughput.py::test_process_commit_data_batch": {
+      "median_seconds": 0.137,
+      "n": 50
+    },
+    "benchmarks/test_service_bulk_insert.py::test_service_bulk_commits_and_file_changes": {
+      "median_seconds": 0.141,
+      "n": 50
+    }
+  }
+}