From 3bbff8c9b8fc2519151c6081c0b953f8cef4a2bd Mon Sep 17 00:00:00 2001 From: Workflow OS Date: Sun, 5 Apr 2026 22:15:59 +0000 Subject: [PATCH 1/2] repo_refactor: Repair mainline benchmark hygiene and make benchmark/report --- .gitignore | 46 +++++++++++++++- README.md | 54 +++++++++++-------- report/benchmark_report.md | 104 +++++++++++++++---------------------- 3 files changed, 120 insertions(+), 84 deletions(-) diff --git a/.gitignore b/.gitignore index e0d63ba..ba99364 100644 --- a/.gitignore +++ b/.gitignore @@ -3,6 +3,48 @@ __pycache__/ .venv/ venv/ *.pyc + +# CMake and out-of-source build trees /build/ -.cmake-test-build/ -reports/ +/build-*/ +/build_*/ +/.cmake-test-build/ +/cmake-build-*/ +/out/ +/CMakeCache.txt +/CMakeFiles/ +/CTestTestfile.cmake +/CTestCostData.txt +/DartConfiguration.tcl +/Testing/ +/Makefile +/build.ninja +/.ninja_deps +/.ninja_log +/rules.ninja +/cmake_install.cmake +/compile_commands.json +/lob_engine +/lob_engine.exe +/lob_benchmark +/lob_benchmark.exe +/test_parser +/test_parser.exe +/test_order_book +/test_order_book.exe +/test_analytics +/test_analytics.exe + +# Generated benchmark, analytics, and report artifacts +/benchmark/*.csv +/benchmark/*.json +/benchmark/*.log +/benchmark/*.out +/benchmark/*.txt +/report/*.csv +/report/*.json +/report/*.log +/report/*.out +/report/*.txt +/report/generated/ +/reports/ diff --git a/README.md b/README.md index a9488d4..3db5760 100644 --- a/README.md +++ b/README.md @@ -1,6 +1,6 @@ # Real-Time Limit Order Book Engine in C++ -This repository implements a small, deterministic C++ limit-order-book engine for LOBSTER-style message data. It includes: +This repository implements a small, deterministic C++ limit-order-book engine for LOBSTER-style message data. The parser and replay code operate on the LOBSTER six-column message schema, but the checked-in CSVs are tiny synthetic/reduced fixtures for reproducibility, not full proprietary LOBSTER distributions. The repo includes: - typed CSV ingestion for LOBSTER message rows - order lifecycle processing for add, cancel, and execute events @@ -8,7 +8,7 @@ This repository implements a small, deterministic C++ limit-order-book engine fo - two price-level backends: `std::map` and flat sorted `std::vector` - rolling analytics and CSV export after every processed message - deterministic C++ and Python integration tests -- replay benchmark tooling and a checked-in benchmark report +- replay benchmark tooling and a hand-maintained benchmark reproducibility note ## Repository layout @@ -19,29 +19,42 @@ This repository implements a small, deterministic C++ limit-order-book engine fo - `data/`: checked-in small sample datasets used for deterministic tests and reproducible benchmark captures - `report/`: benchmark and methodology notes -## Build +## Reproducible build + +From a fresh clone, run the build, verifier, and benchmark commands below in order. Start with a clean temporary build directory instead of an in-repo build tree: + +```bash +build_dir="$(mktemp -d "${TMPDIR:-/tmp}/lob-engine-build.XXXXXX")" +cmake -S . -B "$build_dir" -DCMAKE_BUILD_TYPE=Release +cmake --build "$build_dir" --config Release +``` + +## Correctness verification + +Run the CMake/CTest verifier from that build directory, then run the existing Python test suite from the repo root: ```bash -cmake -S . 
-B build -DCMAKE_BUILD_TYPE=Release -cmake --build build -ctest --test-dir build --output-on-failure +ctest --test-dir "$build_dir" --output-on-failure -C Release +python -m pytest tests -q --tb=short ``` +`ctest` runs the three C++ test executables plus the `lob_benchmark_smoke` path. `python -m pytest tests -q --tb=short` configures and reuses a separate `.cmake-test-build/` directory under the repo root; that directory and the analytics CSVs produced there are ignored local test artifacts. + ## CLI usage Replay a dataset and print final top-of-book state: ```bash -./build/lob_engine data/AAPL_sample_messages.csv --backend both --depth 10 --repeat 5 +"$build_dir/lob_engine" data/AAPL_sample_messages.csv --backend both --depth 10 --repeat 5 ``` Export analytics rows after every processed message: ```bash -./build/lob_engine \ +"$build_dir/lob_engine" \ data/AAPL_sample_messages.csv \ --backend both \ - --analytics-out build/analytics.csv \ + --analytics-out "$build_dir/analytics.csv" \ --trade-window-messages 1000 \ --realized-vol-window-seconds 300 ``` @@ -81,15 +94,13 @@ Deterministic parity tests assert that both backends produce identical book snap ## Benchmarking -The benchmark harness focuses on replay throughput and simple preallocation effects: +The benchmark harness focuses on replay throughput and simple preallocation effects on the checked-in reduced fixtures. These four commands are the final step in the fresh-clone verification sequence documented above: ```bash -./build/lob_benchmark \ - --dataset data/AAPL_sample_messages.csv \ - --backend both \ - --reserve both \ - --depth 5 \ - --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/AAPL_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/MSFT_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/NVDA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/TSLA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 ``` What the benchmark compares: @@ -102,20 +113,21 @@ What the benchmark compares: - `unordered_map::reserve()` for order lookup - vector capacity reservation for the flat backend -This is the bounded hot-path allocation reduction implemented in the repo. The benchmark report records the measured effect on the checked-in sample datasets. - -On a fresh build of this repository on a 4-core AMD EPYC-Rome VM, the fastest AAPL replay configuration processed `60.1 million messages/second` with the flat-vector backend and reserve disabled. +This is the bounded hot-path allocation reduction implemented in the repo. Throughput numbers are host-dependent and should be treated as local measurements on the checked-in reduced fixtures, not as publishable claims about full vendor datasets. See `report/benchmark_report.md` for the exact datasets and commands used for reproducible reruns. ## Dataset note -The repo ships small checked-in reproducibility datasets: +The repo ships five checked-in reproducibility fixtures: - `AAPL_sample_messages.csv` - `MSFT_sample_messages.csv` - `NVDA_sample_messages.csv` - `TSLA_sample_messages.csv` +- `sample_messages.csv` + +The four ticker-named files are 25-line reduced fixtures with 20 valid messages plus 5 intentionally malformed rows each. 
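
As a quick shape check on any of these fixtures, a one-line `awk` pass (a sketch, not a repo-provided tool) can approximate the valid/malformed split by counting comma-separated fields against the six-column LOBSTER-style layout (`time,type,order_id,size,price,direction`). Field count alone is only an approximation: a row can carry six fields and still fail typed parsing, so the C++ parser's own counts remain authoritative.

```bash
# Sketch: approximate the parsed/malformed split by field count alone.
# A six-field row can still be rejected by typed ingestion, so treat this
# as a rough check against the documented 20/5 split, not ground truth.
awk -F',' 'NF == 6 { ok++ } NF != 6 { bad++ } END { printf "six-field=%d other=%d\n", ok, bad }' \
  data/AAPL_sample_messages.csv
```
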
`sample_messages.csv` is a legacy generic fixture with the same contents as `AAPL_sample_messages.csv`, kept because the parser and Python integration tests reference it directly. -They are intentionally tiny and deterministic so the build, tests, and benchmark report can run in CI or on a fresh clone without external data dependencies. They are suitable for correctness checks and relative replay comparisons, not production-grade market simulation. +These files are intentionally tiny and deterministic so the build, tests, and benchmark workflow can run on a fresh clone without external data dependencies. They are suitable for correctness checks and relative replay comparisons, not production-grade market simulation or claims about full vendor data. ## Why this is useful for quant / HFT workflows diff --git a/report/benchmark_report.md b/report/benchmark_report.md index b0f25c5..743b834 100644 --- a/report/benchmark_report.md +++ b/report/benchmark_report.md @@ -1,78 +1,60 @@ # Benchmark Report -This report captures reproducible replay benchmarks from a clean checkout of the repository after the analytics/export and preallocation work landed. +This document is a hand-maintained reproducibility note for the replay benchmark harness. The repository does not track generated benchmark outputs, build trees, or machine-specific report artifacts. -## Reproduction +## Fixture scope -```bash -cmake -S . -B build -DCMAKE_BUILD_TYPE=Release -cmake --build build -ctest --test-dir build --output-on-failure -./build/lob_benchmark --dataset data/AAPL_sample_messages.csv --backend both --reserve both --depth 5 --repeat 200000 -./build/lob_benchmark --dataset data/MSFT_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 -./build/lob_benchmark --dataset data/NVDA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 -./build/lob_benchmark --dataset data/TSLA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 -``` - -## Scope - -- timed section: replay-only -- analytics/export: available in `lob_engine`, but excluded from the replay throughput timer -- backends compared: `std::map` and flat sorted `std::vector` -- allocation mode compared: reserve/preallocation `off` vs `on` - -## Results - -### AAPL sample +The checked-in CSV files are reduced reproducibility fixtures that match the LOBSTER message schema, not full proprietary LOBSTER distributions. -| Backend | Reserve | Throughput msgs/s | Avg ns/msg | -| --- | --- | ---: | ---: | -| map | off | 55,621,183 | 17.979 | -| flat | off | 59,151,913 | 16.906 | -| map | on | 57,645,505 | 17.347 | -| flat | on | 56,307,627 | 17.760 | +| Dataset | Purpose | Rows on disk | Parsed rows | Malformed rows | +| --- | --- | ---: | ---: | ---: | +| `data/AAPL_sample_messages.csv` | Reduced AAPL-like benchmark fixture | 25 | 20 | 5 | +| `data/MSFT_sample_messages.csv` | Reduced MSFT-like benchmark fixture | 25 | 20 | 5 | +| `data/NVDA_sample_messages.csv` | Reduced NVDA-like benchmark fixture | 25 | 20 | 5 | +| `data/TSLA_sample_messages.csv` | Reduced TSLA-like benchmark fixture | 25 | 20 | 5 | +| `data/sample_messages.csv` | Legacy parser/integration-test alias of the AAPL fixture | 25 | 20 | 5 | -Takeaway: on the checked-in AAPL sample, `flat` wins without reserve, while `map` slightly benefits from preallocation. +The fixtures intentionally include malformed rows so parser error accounting is exercised during correctness checks. 
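
As a minimal local cross-check of the "Rows on disk" column above (a sketch assuming the fixtures carry no header row and end with a trailing newline, since `wc -l` counts newline characters), each file should report 25:

```bash
# Count physical lines per checked-in fixture; all five should print 25.
for f in data/{AAPL,MSFT,NVDA,TSLA}_sample_messages.csv data/sample_messages.csv; do
  printf '%-34s %s\n' "$f" "$(wc -l < "$f")"
done
```
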
They also include obviously synthetic values, so benchmark output should be interpreted only as a local engineering signal for this repository, not as a publishable claim about full proprietary datasets. -### MSFT sample +## Fresh-clone sequence -| Backend | Reserve | Throughput msgs/s | Avg ns/msg | -| --- | --- | ---: | ---: | -| map | off | 29,049,272 | 34.424 | -| flat | off | 55,216,799 | 18.110 | -| map | on | 51,246,182 | 19.514 | -| flat | on | 49,013,940 | 20.402 | - -Takeaway: the reserve hint materially improves the `map` path on this sample and narrows the gap to the flat-vector backend. - -### NVDA sample +```bash +build_dir="$(mktemp -d "${TMPDIR:-/tmp}/lob-engine-build.XXXXXX")" +cmake -S . -B "$build_dir" -DCMAKE_BUILD_TYPE=Release +cmake --build "$build_dir" --config Release +ctest --test-dir "$build_dir" --output-on-failure -C Release +python -m pytest tests -q --tb=short +"$build_dir/lob_benchmark" --dataset data/AAPL_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/MSFT_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/NVDA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/TSLA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +``` -| Backend | Reserve | Throughput msgs/s | Avg ns/msg | -| --- | --- | ---: | ---: | -| map | off | 46,925,367 | 21.310 | -| flat | off | 54,675,249 | 18.290 | -| map | on | 53,910,207 | 18.549 | -| flat | on | 45,742,321 | 21.862 | +`ctest` covers the C++ test executables plus a smoke run of `lob_benchmark`. `python -m pytest tests -q --tb=short` reruns the existing Python integration suite, which configures and reuses a separate `.cmake-test-build/` directory under the repo root and emits local analytics CSV byproducts there. -Takeaway: preallocation helps the `map` backend more than the flat-vector backend on this sample. +## Benchmark commands -### TSLA sample +```bash +"$build_dir/lob_benchmark" --dataset data/AAPL_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/MSFT_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/NVDA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +"$build_dir/lob_benchmark" --dataset data/TSLA_sample_messages.csv --backend both --reserve both --depth 5 --repeat 100000 +``` -| Backend | Reserve | Throughput msgs/s | Avg ns/msg | -| --- | --- | ---: | ---: | -| map | off | 55,859,805 | 17.902 | -| flat | off | 57,432,210 | 17.412 | -| map | on | 55,976,073 | 17.865 | -| flat | on | 52,862,960 | 18.917 | +Each command prints: -Takeaway: the two container choices are close on the TSLA sample, with flat-vector slightly ahead without reserve. +- parsed and malformed row counts +- throughput for `map` and `flat_vector` +- reserve `off` and `on` +- final top-of-book snapshot for a quick sanity check -## Interpretation +## Scope -- The flat-vector backend can outperform `std::map` on these shallow sample books because the active level count stays low and the contiguous representation is cache-friendly. -- Reserve/preallocation mainly helps the order-ID `unordered_map` and removes some rehash churn on the replay path. -- The effect is workload-dependent. 
There is no single winner across every sample dataset, which is exactly why both container choices are kept in the repo and exposed through the same interface. +- timed section: replay-only +- analytics/export: available in `lob_engine`, but excluded from the replay throughput timer +- backends compared: `std::map` and flat sorted `std::vector` +- allocation mode compared: reserve/preallocation `off` vs `on` -## Important note +## Report regeneration -The checked-in datasets are intentionally tiny reproducibility samples, not large production LOBSTER files. These numbers should be treated as relative engineering signals for this repo, not as final claims about live-market performance. +There is no checked-in script that rewrites this file. To refresh the report, rerun the build, verifier, and benchmark commands above, then update this markdown manually with any observations you want to preserve. From 20b1f1f9f013e2c3f0415b5004f3a1f59ecb377b Mon Sep 17 00:00:00 2001 From: Alexander Roesler Date: Sun, 5 Apr 2026 22:34:36 +0000 Subject: [PATCH 2/2] Add project CI and secret scan merge gate --- .github/workflows/project-ci.yml | 88 +++++++++++++++++++++++++++++++ .github/workflows/secret-scan.yml | 27 ++++++++++ .gitleaks.toml | 11 ++++ .pre-commit-config.yaml | 12 +++++ 4 files changed, 138 insertions(+) create mode 100644 .github/workflows/project-ci.yml create mode 100644 .github/workflows/secret-scan.yml create mode 100644 .gitleaks.toml create mode 100644 .pre-commit-config.yaml diff --git a/.github/workflows/project-ci.yml b/.github/workflows/project-ci.yml new file mode 100644 index 0000000..14d7ac1 --- /dev/null +++ b/.github/workflows/project-ci.yml @@ -0,0 +1,88 @@ +# managed by workflow os: project-ci +name: project-ci + +on: + pull_request: + merge_group: + workflow_dispatch: + +permissions: + contents: read + +jobs: + project-ci: + runs-on: ubuntu-latest + timeout-minutes: 25 + steps: + - name: Check out repo + uses: actions/checkout@v4 + + - name: Set up Python + uses: actions/setup-python@v5 + with: + python-version: "3.11" + + - name: Set up Node + if: ${{ hashFiles('package.json') != '' }} + uses: actions/setup-node@v4 + with: + node-version: "20" + + - name: Set up Go + if: ${{ hashFiles('go.mod') != '' }} + uses: actions/setup-go@v5 + with: + go-version: stable + + - name: Set up Rust + if: ${{ hashFiles('Cargo.toml') != '' }} + uses: dtolnay/rust-toolchain@stable + + - name: Run project CI + shell: bash + run: | + set -euo pipefail + ran_any=0 + + if [[ -f pyproject.toml || -f setup.py || -f requirements.txt || -d tests ]]; then + python -m pip install --upgrade pip + if [[ -f requirements.txt ]]; then python -m pip install -r requirements.txt; fi + if [[ -f requirements-dev.txt ]]; then python -m pip install -r requirements-dev.txt; fi + python -m pip install pytest + if [[ -f pyproject.toml || -f setup.py ]]; then python -m pip install -e . || true; fi + if [[ -d tests ]]; then + python -m pytest tests -q --tb=short + ran_any=1 + fi + fi + + if [[ -f package.json ]]; then + if [[ -f package-lock.json ]]; then npm ci; else npm install; fi + if npm run | grep -qE '(^|[[:space:]])test([[:space:]]|$)'; then + npm test -- --runInBand || npm test + ran_any=1 + fi + fi + + if [[ -f go.mod ]]; then + go test ./... + ran_any=1 + fi + + if [[ -f Cargo.toml ]]; then + cargo test --all-targets --all-features + ran_any=1 + fi + + if [[ -f CMakeLists.txt ]]; then + sudo apt-get update + sudo apt-get install -y cmake ninja-build + cmake -S . 
-B build -G Ninja + cmake --build build + ctest --test-dir build --output-on-failure + ran_any=1 + fi + + if [[ "$ran_any" -eq 0 ]]; then + echo "No recognized project CI harness found; passing as metadata-only repo." + fi diff --git a/.github/workflows/secret-scan.yml b/.github/workflows/secret-scan.yml new file mode 100644 index 0000000..00a3092 --- /dev/null +++ b/.github/workflows/secret-scan.yml @@ -0,0 +1,27 @@ +# managed by workflow os: secret-scan +name: secret-scan + +on: + pull_request: + push: + merge_group: + workflow_dispatch: + +permissions: + contents: read + +jobs: + secret-scan: + runs-on: ubuntu-latest + timeout-minutes: 10 + steps: + - name: Check out repo + uses: actions/checkout@v4 + with: + fetch-depth: 0 + + - name: Run gitleaks + uses: gitleaks/gitleaks-action@v2 + env: + GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }} + GITLEAKS_CONFIG: .gitleaks.toml diff --git a/.gitleaks.toml b/.gitleaks.toml new file mode 100644 index 0000000..3b15916 --- /dev/null +++ b/.gitleaks.toml @@ -0,0 +1,11 @@ +# managed by workflow os: gitleaks-config +title = "workflow managed secret scan configuration" + +[extend] +useDefault = true + +[[rules]] +id = "openclaw-auth-token" +description = "OpenClaw auth or gateway token" +regex = '''(?i)(?:OPENCLAW_(?:AUTH|GATEWAY|API)_TOKEN|openclaw(?:[_-]?(?:auth|gateway|api))?[_-]?token)[^\n]{0,32}[=:][^\S\r\n]*["']?[A-Za-z0-9._\-]{12,}["']?''' +keywords = ["openclaw", "OPENCLAW_"] diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml new file mode 100644 index 0000000..745ff41 --- /dev/null +++ b/.pre-commit-config.yaml @@ -0,0 +1,12 @@ +# managed by workflow os: pre-commit +default_install_hook_types: + - pre-commit + - pre-push + +repos: + - repo: https://github.com/gitleaks/gitleaks + rev: v8.30.1 + hooks: + - id: gitleaks + stages: [pre-commit, pre-push, manual] + args: ["--config=.gitleaks.toml"]
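# Local usage sketch (assumes pre-commit >= 2.18, where `pre-commit install`
# honors default_install_hook_types above; these are standard pre-commit CLI
# commands, not repo-specific tooling):
#   pip install pre-commit
#   pre-commit install                            # registers pre-commit and pre-push hooks
#   pre-commit run --all-files                    # one-off gitleaks pass over the tree
#   pre-commit run --hook-stage manual gitleaks   # exercises the `manual` stage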