
Commit 07900ae

Merge pull request #104 from ENTERPILOT/me/gom-47-embedding-endpoints-anthropic-and-openai
feat(gom-47): implement embeddings
2 parents 110d746 + 56de25f commit 07900ae

32 files changed

Lines changed: 1256 additions & 162 deletions

DEVELOPMENT.md

Lines changed: 19 additions & 8 deletions

````diff
@@ -1,5 +1,23 @@
 # Development
 
+## Prerequisites
+
+Install all required development tools in one step:
+
+```bash
+make install-tools
+```
+
+This installs:
+- [golangci-lint v2](https://golangci-lint.run/welcome/install/) — required for `make lint`
+- [pre-commit](https://pre-commit.com/) — required for git hook setup
+
+After installing tools, set up the pre-commit hooks:
+
+```bash
+pre-commit install
+```
+
 ## Testing
 
 ```bash
@@ -10,7 +28,7 @@ make test-all # All tests
 
 ## Linting
 
-Requires [golangci-lint](https://golangci-lint.run/welcome/install/).
+Requires [golangci-lint v2](https://golangci-lint.run/welcome/install/)
 
 ```bash
 make lint # Check code quality
@@ -42,10 +60,3 @@ Override the auto-detection with `LOG_FORMAT`:
 LOG_FORMAT=text make run # force text output
 LOG_FORMAT=json make run # force JSON output
 ```
-
-## Pre-commit
-
-```bash
-pip install pre-commit
-pre-commit install
-```
````

GETTING_STARTED.md

Lines changed: 89 additions & 34 deletions

```diff
@@ -114,11 +114,13 @@ providers:
 
 **Effective resilience per provider:**
 
-| Provider | max_retries | failure_threshold | cb timeout |
-|-----------|-------------|-------------------|------------|
-| openai | 2 (global) | 3 (global) | 15s (global) |
-| anthropic | **5** (override) | 3 (global) | 15s (global) |
-| ollama | 2 (global) | **10** (override) | **5s** (override) |
+
+| Provider  | max_retries      | failure_threshold | cb timeout        |
+| --------- | ---------------- | ----------------- | ----------------- |
+| openai    | 2 (global)       | 3 (global)        | 15s (global)      |
+| anthropic | **5** (override) | 3 (global)        | 15s (global)      |
+| ollama    | 2 (global)       | **10** (override) | **5s** (override) |
+
 
 Only fields that are explicitly listed under a provider's `resilience:` block are overridden. Everything else silently inherits from the global section.
```
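The override semantics in this hunk can be pictured in config form. A minimal sketch with illustrative key names (only the `resilience:` block itself is confirmed by the text; the exact field names in the real YAML may differ):

```yaml
# Hypothetical sketch: global defaults plus per-provider overrides.
resilience:                  # global section
  max_retries: 2
  circuit_breaker:
    failure_threshold: 3
    timeout: 15s

providers:
  anthropic:
    resilience:
      max_retries: 5         # overrides the global 2; thresholds still inherit
  ollama:
    resilience:
      circuit_breaker:
        failure_threshold: 10
        timeout: 5s          # openai lists nothing, so it inherits everything
```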

```diff
@@ -161,33 +163,37 @@ GROQ_API_KEY=gsk_...
 
 All resilience settings can be overridden at runtime via env vars. Env vars always beat both code defaults and YAML values.
 
-| Variable | Type | Default | Description |
-|---|---|---|---|
-| `RETRY_MAX_RETRIES` | int | `3` | Maximum retry attempts per request |
-| `RETRY_INITIAL_BACKOFF` | duration | `1s` | First retry wait (e.g. `500ms`, `2s`) |
-| `RETRY_MAX_BACKOFF` | duration | `30s` | Upper cap on retry wait |
-| `RETRY_BACKOFF_FACTOR` | float | `2.0` | Exponential multiplier between retries |
-| `RETRY_JITTER_FACTOR` | float | `0.1` | Random jitter as a fraction of the backoff |
-| `CIRCUIT_BREAKER_FAILURE_THRESHOLD` | int | `5` | Consecutive failures before opening |
-| `CIRCUIT_BREAKER_SUCCESS_THRESHOLD` | int | `2` | Consecutive successes to close again |
-| `CIRCUIT_BREAKER_TIMEOUT` | duration | `30s` | How long the circuit stays open |
-| `LOG_FORMAT` | string | _(unset)_ | Auto-detects based on environment: colorized text on a TTY, JSON otherwise. Set to `text` to force human-readable output (no colors if not a TTY), or `json` to force structured JSON even on a TTY (recommended for production, CloudWatch, Datadog, GCP). |
+
+| Variable | Type | Default | Description |
+| --- | --- | --- | --- |
+| `RETRY_MAX_RETRIES` | int | `3` | Maximum retry attempts per request |
+| `RETRY_INITIAL_BACKOFF` | duration | `1s` | First retry wait (e.g. `500ms`, `2s`) |
+| `RETRY_MAX_BACKOFF` | duration | `30s` | Upper cap on retry wait |
+| `RETRY_BACKOFF_FACTOR` | float | `2.0` | Exponential multiplier between retries |
+| `RETRY_JITTER_FACTOR` | float | `0.1` | Random jitter as a fraction of the backoff |
+| `CIRCUIT_BREAKER_FAILURE_THRESHOLD` | int | `5` | Consecutive failures before opening |
+| `CIRCUIT_BREAKER_SUCCESS_THRESHOLD` | int | `2` | Consecutive successes to close again |
+| `CIRCUIT_BREAKER_TIMEOUT` | duration | `30s` | How long the circuit stays open |
+| `LOG_FORMAT` | string | *(unset)* | Auto-detects based on environment: colorized text on a TTY, JSON otherwise. Set to `text` to force human-readable output (no colors if not a TTY), or `json` to force structured JSON even on a TTY (recommended for production, CloudWatch, Datadog, GCP). |
+
 
 Provider credentials:
 
-| Variable | Provider |
-|---|---|
-| `OPENAI_API_KEY` | OpenAI |
-| `OPENAI_BASE_URL` | OpenAI (custom endpoint) |
-| `ANTHROPIC_API_KEY` | Anthropic |
-| `ANTHROPIC_BASE_URL` | Anthropic (custom endpoint) |
-| `GEMINI_API_KEY` | Google Gemini |
-| `GEMINI_BASE_URL` | Gemini (custom endpoint) |
-| `XAI_API_KEY` | xAI / Grok |
-| `XAI_BASE_URL` | xAI (custom endpoint) |
-| `GROQ_API_KEY` | Groq |
-| `GROQ_BASE_URL` | Groq (custom endpoint) |
-| `OLLAMA_BASE_URL` | Ollama (default: `http://localhost:11434/v1`) |
+
+| Variable | Provider |
+| --- | --- |
+| `OPENAI_API_KEY` | OpenAI |
+| `OPENAI_BASE_URL` | OpenAI (custom endpoint) |
+| `ANTHROPIC_API_KEY` | Anthropic |
+| `ANTHROPIC_BASE_URL` | Anthropic (custom endpoint) |
+| `GEMINI_API_KEY` | Google Gemini |
+| `GEMINI_BASE_URL` | Gemini (custom endpoint) |
+| `XAI_API_KEY` | xAI / Grok |
+| `XAI_BASE_URL` | xAI (custom endpoint) |
+| `GROQ_API_KEY` | Groq |
+| `GROQ_BASE_URL` | Groq (custom endpoint) |
+| `OLLAMA_BASE_URL` | Ollama (default: `http://localhost:11434/v1`) |
+
 
 See `.env.template` for the full list of all configurable environment variables.
```

````diff
@@ -409,6 +415,44 @@ curl http://localhost:8080/v1/responses \
   }'
 ```
 
+### Embeddings
+
+#### Basic Embedding
+
+```bash
+curl http://localhost:8080/v1/embeddings \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "text-embedding-3-small",
+    "input": "The quick brown fox jumps over the lazy dog."
+  }'
+```
+
+#### Batch Embedding (multiple inputs)
+
+```bash
+curl http://localhost:8080/v1/embeddings \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "text-embedding-3-small",
+    "input": ["First sentence", "Second sentence", "Third sentence"]
+  }'
+```
+
+#### With Custom Dimensions
+
+```bash
+curl http://localhost:8080/v1/embeddings \
+  -H "Content-Type: application/json" \
+  -d '{
+    "model": "text-embedding-3-large",
+    "input": "Hello world",
+    "dimensions": 512
+  }'
+```
+
+Supported by: OpenAI, Gemini, Groq, xAI, Ollama. Anthropic does not support embeddings natively.
+
 ### List Available Models
 
 ```bash
````
````diff
@@ -480,6 +524,13 @@ stream = client.chat.completions.create(
 for chunk in stream:
     if chunk.choices[0].delta.content:
         print(chunk.choices[0].delta.content, end="")
+
+# Embeddings
+embedding = client.embeddings.create(
+    model="text-embedding-3-small",
+    input="Hello world"
+)
+print(embedding.data[0].embedding[:5])  # first 5 dimensions
 ```
 
 ### Node.js
@@ -510,6 +561,13 @@ for await (const chunk of stream) {
     process.stdout.write(chunk.choices[0].delta.content);
   }
 }
+
+// Embeddings
+const embedding = await client.embeddings.create({
+  model: "text-embedding-3-small",
+  input: "Hello world",
+});
+console.log(embedding.data[0].embedding.slice(0, 5)); // first 5 dimensions
 ```
 
 ---
````
```diff
@@ -554,13 +612,10 @@ for await (const chunk of stream) {
 ## Tips
 
 1. **Model routing**: The gateway automatically routes requests to the correct provider based on the model name — no configuration needed. Just use any model name from the list above.
-
 2. **API compatibility**: The gateway exposes an OpenAI-compatible API. Existing OpenAI client libraries work unchanged for all providers.
-
 3. **Streaming**: All providers support streaming. The gateway normalises provider-specific formats to OpenAI's SSE format.
-
 4. **System messages**: Anthropic's system message format is handled automatically. Gemini uses Google's OpenAI-compatible endpoint, which also handles system messages natively.
-
 5. **Max tokens**: Anthropic requires `max_tokens` to be set. If not provided, the gateway defaults to 4096. OpenAI and Gemini treat it as optional.
-
 6. **Responses API**: The `/v1/responses` endpoint provides a unified interface across all providers. Providers that do not natively support the Responses API convert requests internally.
+7. **Embeddings**: The `/v1/embeddings` endpoint is supported by OpenAI, Gemini, Groq, xAI, and Ollama. Anthropic does not offer embeddings natively.
+
```

Makefile

Lines changed: 8 additions & 1 deletion

```diff
@@ -1,4 +1,6 @@
-.PHONY: build run clean tidy test test-e2e test-integration test-contract test-all lint lint-fix record-api swagger
+.PHONY: all build run clean tidy test test-e2e test-integration test-contract test-all lint lint-fix record-api swagger install-tools
+
+all: build
 
 # Get version info
 VERSION ?= $(shell git describe --tags --always --dirty)
@@ -10,6 +12,11 @@ LDFLAGS := -X "gomodel/internal/version.Version=$(VERSION)" \
 	-X "gomodel/internal/version.Commit=$(COMMIT)" \
 	-X "gomodel/internal/version.Date=$(DATE)"
 
+install-tools:
+	@command -v golangci-lint > /dev/null 2>&1 || (echo "Installing golangci-lint..." && go install github.com/golangci/golangci-lint/v2/cmd/golangci-lint@v2.10.1)
+	@command -v pre-commit > /dev/null 2>&1 || (echo "Installing pre-commit..." && pip install pre-commit==4.5.1)
+	@echo "All tools are ready"
+
 build:
 	go build -ldflags '$(LDFLAGS)' -o bin/gomodel ./cmd/gomodel
 # Run the application
```
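The `install-tools` target relies on a common shell idiom: probe for the binary with `command -v` and run the installer only when it is missing, which makes the target safe to re-run. A standalone sketch of the same guard (the `maybe_install` helper is hypothetical and echoes instead of installing):

```shell
# Run the "installer" only when the tool is missing; re-running is a no-op.
maybe_install() {
  if command -v "$1" > /dev/null 2>&1; then
    echo "$1 already installed"
  else
    echo "would install $1"
  fi
}

maybe_install sh                     # present on any POSIX system
maybe_install no-such-tool-123456    # triggers the install branch
```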

README.md

Lines changed: 8 additions & 7 deletions

```diff
@@ -70,41 +70,41 @@ Example model identifiers are illustrative and subject to change; consult provid
 <td>OpenAI</td>
 <td><code>OPENAI_API_KEY</code></td>
 <td><code>gpt&#8209;4o&#8209;mini</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 <tr>
 <td>Anthropic</td>
 <td><code>ANTHROPIC_API_KEY</code></td>
 <td><code>claude&#8209;sonnet&#8209;4&#8209;20250514</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 <tr>
 <td>Google&nbsp;Gemini</td>
 <td><code>GEMINI_API_KEY</code></td>
 <td><code>gemini&#8209;2.5&#8209;flash</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 <tr>
 <td>Groq</td>
 <td><code>GROQ_API_KEY</code></td>
 <td><code>llama&#8209;3.3&#8209;70b&#8209;versatile</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 <tr>
 <td>xAI&nbsp;(Grok)</td>
 <td><code>XAI_API_KEY</code></td>
 <td><code>grok&#8209;2</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 <tr>
 <td>Ollama</td>
 <td><code>OLLAMA_BASE_URL</code></td>
 <td><code>llama3.2</code></td>
-<td>✅</td><td>🚧</td><td>🚧</td><td></td><td></td><td>🚧</td><td>🚧</td><td>🚧</td>
+<td>✅</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td>🚧</td><td></td><td>🚧</td>
 </tr>
 </table>
 
-✅ Supported 🚧 Coming soon — Not applicable
+✅ Supported 🚧 Coming soon ❌ Unsupported
 
 ---
 
@@ -159,6 +159,7 @@ docker run --rm -p 8080:8080 --env-file .env gomodel
 |----------|--------|-------------|
 | `/v1/chat/completions` | POST | Chat completions (streaming supported) |
 | `/v1/responses` | POST | OpenAI Responses API |
+| `/v1/embeddings` | POST | Text embeddings |
 | `/v1/models` | GET | List available models |
 | `/health` | GET | Health check |
 | `/metrics` | GET | Prometheus metrics (when enabled) |
```

internal/admin/handler_test.go

Lines changed: 4 additions & 0 deletions

```diff
@@ -78,6 +78,10 @@ func (m *handlerMockProvider) StreamResponses(_ context.Context, _ *core.Respons
 	return nil, nil
 }
 
+func (m *handlerMockProvider) Embeddings(_ context.Context, _ *core.EmbeddingRequest) (*core.EmbeddingResponse, error) {
+	return nil, core.NewInvalidRequestError("not supported", nil)
+}
+
 func newHandlerContext(path string) (echo.Context, *httptest.ResponseRecorder) {
 	e := echo.New()
 	req := httptest.NewRequest(http.MethodGet, path, nil)
```

internal/auditlog/stream_wrapper.go

Lines changed: 1 addition & 0 deletions

```diff
@@ -426,6 +426,7 @@ func IsModelInteractionPath(path string) bool {
 	modelPaths := []string{
 		"/v1/chat/completions",
 		"/v1/responses",
+		"/v1/embeddings",
 	}
 	for _, p := range modelPaths {
 		if strings.HasPrefix(path, p) {
```
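The prefix matching in this hunk is easy to verify in isolation. A standalone sketch that copies the same logic locally (same path list, same `strings.HasPrefix` loop):

```go
package main

import (
	"fmt"
	"strings"
)

// isModelInteractionPath mirrors the function above: a request path counts
// as a model interaction when it starts with one of the known API prefixes.
func isModelInteractionPath(path string) bool {
	modelPaths := []string{
		"/v1/chat/completions",
		"/v1/responses",
		"/v1/embeddings",
	}
	for _, p := range modelPaths {
		if strings.HasPrefix(path, p) {
			return true
		}
	}
	return false
}

func main() {
	fmt.Println(isModelInteractionPath("/v1/embeddings")) // true
	fmt.Println(isModelInteractionPath("/v1/models"))     // false
}
```

Because this is prefix matching, sub-paths such as `/v1/embeddings/anything` also count as model interactions.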

internal/core/interfaces.go

Lines changed: 3 additions & 4 deletions

```diff
@@ -22,6 +22,9 @@ type Provider interface {
 
 	// StreamResponses returns a raw SSE stream for Responses API (caller must close)
 	StreamResponses(ctx context.Context, req *ResponsesRequest) (io.ReadCloser, error)
+
+	// Embeddings sends an embeddings request to the provider
+	Embeddings(ctx context.Context, req *EmbeddingRequest) (*EmbeddingResponse, error)
 }
 
 // RoutableProvider extends Provider with routing capability.
@@ -30,11 +33,7 @@ type Provider interface {
 type RoutableProvider interface {
 	Provider
 
-	// Supports returns true if the provider can handle the given model
 	Supports(model string) bool
-
-	// GetProviderType returns the provider type string for the given model.
-	// Returns empty string if the model is not found.
 	GetProviderType(model string) string
 }
 
```

internal/core/types.go

Lines changed: 33 additions & 0 deletions

```diff
@@ -1,5 +1,7 @@
 package core
 
+import "encoding/json"
+
 // StreamOptions controls streaming behavior options.
 // This is used to request usage data in streaming responses.
 type StreamOptions struct {
@@ -212,3 +214,34 @@ type ModelsResponse struct {
 	Object string  `json:"object"`
 	Data   []Model `json:"data"`
 }
+
+// EmbeddingRequest represents the incoming embeddings request (OpenAI-compatible).
+type EmbeddingRequest struct {
+	Model          string `json:"model"`
+	Input          any    `json:"input"`
+	EncodingFormat string `json:"encoding_format,omitempty"`
+	Dimensions     *int   `json:"dimensions,omitempty"`
+}
+
+// EmbeddingResponse represents the embeddings response (OpenAI-compatible).
+type EmbeddingResponse struct {
+	Object   string          `json:"object"`
+	Data     []EmbeddingData `json:"data"`
+	Model    string          `json:"model"`
+	Provider string          `json:"provider"`
+	Usage    EmbeddingUsage  `json:"usage"`
+}
+
+// EmbeddingData represents a single embedding data point.
+// Embedding is json.RawMessage to support both float arrays and base64-encoded strings.
+type EmbeddingData struct {
+	Object    string          `json:"object"`
+	Embedding json.RawMessage `json:"embedding"`
+	Index     int             `json:"index"`
+}
+
+// EmbeddingUsage represents token usage information for embeddings.
+type EmbeddingUsage struct {
+	PromptTokens int `json:"prompt_tokens"`
+	TotalTokens  int `json:"total_tokens"`
+}
```

internal/guardrails/provider.go

Lines changed: 5 additions & 0 deletions

```diff
@@ -59,6 +59,11 @@ func (g *GuardedProvider) ListModels(ctx context.Context) (*core.ModelsResponse,
 	return g.inner.ListModels(ctx)
 }
 
+// Embeddings delegates directly to the inner provider (no guardrails needed for embeddings).
+func (g *GuardedProvider) Embeddings(ctx context.Context, req *core.EmbeddingRequest) (*core.EmbeddingResponse, error) {
+	return g.inner.Embeddings(ctx, req)
+}
+
 // Responses extracts messages, applies guardrails, then routes the request.
 func (g *GuardedProvider) Responses(ctx context.Context, req *core.ResponsesRequest) (*core.ResponsesResponse, error) {
 	modified, err := g.processResponses(ctx, req)
```
