# March 23, 2026 benchmark scripts

This directory is the reproducible entry point for the March 23, 2026
GoModel vs LiteLLM benchmark refresh.

It is built around the benchmark workspace in
`docs/2026-03-23_benchmark_scripts/gateway-comparison/`, then adds:

- a tested normalization step for the raw `hey` and streaming outputs,
- chart generation for the blog assets,
- a stable wrapper command for rerunning the benchmark and rebuilding the
  article artifacts.

## What this benchmark measures

This run uses the same localhost mock backend for both gateways, so the numbers
measure gateway overhead rather than upstream model latency.

Workloads covered:

- `/v1/chat/completions` non-streaming
- `/v1/chat/completions` streaming
- `/v1/responses` non-streaming
- `/v1/responses` streaming

The raw benchmark runner also records a direct baseline for chat traffic with no
gateway in the middle.

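For a concrete sense of the load shape, the sketch below hand-rolls a `hey` call
against the non-streaming chat endpoint. The port, request count, concurrency,
and payload are illustrative assumptions, not the values the runner uses; see
`run-benchmark.sh` for the real parameters.

```bash
# Illustrative only: the port and load shape are assumptions, not the
# settings run-benchmark.sh actually uses.
hey -n 2000 -c 50 -m POST \
  -T "application/json" \
  -d '{"model": "mock", "messages": [{"role": "user", "content": "ping"}]}' \
  http://localhost:8080/v1/chat/completions
```
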
## Prerequisites

- Go 1.26+
- Python 3.10+
- `hey`
- `litellm`
- Python packages: `matplotlib`, `numpy`

Install Python packages if needed:

```bash
python3 -m pip install matplotlib numpy
```

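A quick sanity check that everything is on `PATH` before running anything (not
required by the wrapper, just a convenience):

```bash
# Report tool versions and confirm the Python dependencies import cleanly.
go version
python3 --version
command -v hey || echo "hey not found"
command -v litellm || echo "litellm not found"
python3 -c "import matplotlib, numpy" && echo "python deps OK"
```
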
## Quick start

Run the raw benchmark and generate normalized artifacts:

```bash
RUN_BENCHMARK=1 bash docs/2026-03-23_benchmark_scripts/run.sh
```

If you already have a benchmark result directory, point the wrapper at it:

```bash
RESULTS_DIR=/path/to/results bash docs/2026-03-23_benchmark_scripts/run.sh
```

Copy the generated chart assets into the sibling Enterpilot blog repo:

```bash
BLOG_PUBLIC_DIR=../enterpilot.io/blog/public/charts \
  bash docs/2026-03-23_benchmark_scripts/run.sh
```

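A fresh run that also refreshes the blog assets can plausibly be done in one
invocation (assuming `run.sh` reads both variables together; check the script
if unsure):

```bash
RUN_BENCHMARK=1 \
  BLOG_PUBLIC_DIR=../enterpilot.io/blog/public/charts \
  bash docs/2026-03-23_benchmark_scripts/run.sh
```
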
## Outputs

By default, generated artifacts land in `docs/2026-03-23_benchmark_scripts/output/`:

- `benchmark_summary.json`: normalized machine-readable metrics
- `charts/gomodel-vs-litellm-march-2026-dashboard.png`
- `charts/gomodel-vs-litellm-march-2026-throughput.png`
- `charts/gomodel-vs-litellm-march-2026-latency.png`
- `charts/gomodel-vs-litellm-march-2026-memory.png`
- `charts/gomodel-vs-litellm-march-2026-speedup.png`

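To spot-check the normalized metrics without opening the file, list the
top-level keys with `jq` (the summary schema is not documented here, so the
keys are whatever the normalizer emits):

```bash
jq 'keys' docs/2026-03-23_benchmark_scripts/output/benchmark_summary.json
```
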
## Notes

- The raw benchmark runner lives in `docs/2026-03-23_benchmark_scripts/gateway-comparison/run-benchmark.sh`.
- The normalization step exists because raw shell summaries are prone to drift
  and easy to misparse; the parser in this directory is covered by unit tests
  with inline sample fixtures, so the repo does not need to carry benchmark
  result dumps.
- These results are a point-in-time localhost benchmark, not a universal claim
  about every deployment shape.

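For a sense of what the tested parser replaces, ad-hoc extraction from `hey`'s
text summary is typically a one-liner like the sketch below, which breaks
silently the moment the output format shifts (the file name is hypothetical):

```bash
# Fragile ad-hoc extraction: grab the throughput figure from hey's
# default text summary.
awk '$1 == "Requests/sec:" { print $2 }' hey_chat_nonstreaming.txt
```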