@@ -374,58 +374,76 @@ data:
374374Here's a comprehensive example for configuring Inference Gateway in a production environment:
375375
376376```bash
377+
377378# General settings
378379ENVIRONMENT=production
379- ENABLE_VISION=true
380- TELEMETRY_ENABLE=true
381- AUTH_ENABLE=true
382-
380+ ALLOWED_MODELS=
381+ ENABLE_VISION=false
382+ DEBUG_CONTENT_TRUNCATE_WORDS=10
383+ DEBUG_MAX_MESSAGES=100
384+ # Telemetry
385+ TELEMETRY_ENABLE=false
386+ TELEMETRY_METRICS_PORT=9464
387+ # Model Context Protocol (MCP)
388+ MCP_ENABLE=false
389+ MCP_EXPOSE=false
390+ MCP_SERVERS=
391+ MCP_CLIENT_TIMEOUT=5s
392+ MCP_DIAL_TIMEOUT=3s
393+ MCP_TLS_HANDSHAKE_TIMEOUT=3s
394+ MCP_RESPONSE_HEADER_TIMEOUT=3s
395+ MCP_EXPECT_CONTINUE_TIMEOUT=1s
396+ MCP_REQUEST_TIMEOUT=5s
397+ MCP_MAX_RETRIES=3
398+ MCP_RETRY_INTERVAL=5s
399+ MCP_INITIAL_BACKOFF=1s
400+ MCP_ENABLE_RECONNECT=true
401+ MCP_RECONNECT_INTERVAL=30s
402+ MCP_POLLING_ENABLE=true
403+ MCP_POLLING_INTERVAL=30s
404+ MCP_POLLING_TIMEOUT=5s
405+ MCP_DISABLE_HEALTHCHECK_LOGS=true
383406# Authentication
384- OIDC_ISSUER_URL=https://auth.example.com/realms/inference-gateway
385- OIDC_CLIENT_ID=inference-gateway
386- OIDC_CLIENT_SECRET=your-client-secret
387-
407+ AUTH_ENABLE=false
408+ AUTH_OIDC_ISSUER=http://keycloak:8080/realms/inference-gateway-realm
409+ AUTH_OIDC_CLIENT_ID=inference-gateway-client
410+ AUTH_OIDC_CLIENT_SECRET=
388411# Server settings
389412SERVER_HOST=0.0.0.0
390413SERVER_PORT=8080
391414SERVER_READ_TIMEOUT=30s
392415SERVER_WRITE_TIMEOUT=30s
393416SERVER_IDLE_TIMEOUT=120s
394- SERVER_TLS_CERT_PATH=/certs/tls.crt
395- SERVER_TLS_KEY_PATH=/certs/tls.key
396-
417+ SERVER_TLS_CERT_PATH=
418+ SERVER_TLS_KEY_PATH=
397419# Client settings
398- CLIENT_TIMEOUT=45s
399- CLIENT_MAX_IDLE_CONNS=100
400- CLIENT_MAX_IDLE_CONNS_PER_HOST=50
401- CLIENT_IDLE_CONN_TIMEOUT=60s
420+ CLIENT_TIMEOUT=30s
421+ CLIENT_MAX_IDLE_CONNS=20
422+ CLIENT_MAX_IDLE_CONNS_PER_HOST=20
423+ CLIENT_IDLE_CONN_TIMEOUT=30s
402424CLIENT_TLS_MIN_VERSION=TLS12
403-
404- # Provider settings
405- OPENAI_API_KEY=your-openai-api-key
406- ANTHROPIC_API_KEY=your-anthropic-api-key
407- GROQ_API_KEY=your-groq-api-key
408- DEEPSEEK_API_KEY=your-deepseek-api-key
409- GOOGLE_API_KEY=your-google-api-key
410-
411- # Model Context Protocol (MCP) - for external tool integration
412- MCP_ENABLE=true
413- MCP_EXPOSE=false # Set to true for debugging
414- MCP_SERVERS=http://time-server:8081/mcp,http://search-server:8082/mcp
415- MCP_CLIENT_TIMEOUT=10s
416- MCP_REQUEST_TIMEOUT=10s
417-
418- # Agent-to-Agent (A2A) - for agent coordination
419- A2A_ENABLE=true
420- A2A_EXPOSE=false # Set to true for debugging
421- A2A_AGENTS=http://google-calendar-agent:8084
422- A2A_CLIENT_TIMEOUT=30s
423-
424- # UI settings (if using UI)
425- INFERENCE_GATEWAY_URL=https://api.example.com/v1
426-
427- # Logging
428- LOG_LEVEL=info # Use 'debug' for troubleshooting
425+ CLIENT_DISABLE_COMPRESSION=true
426+ CLIENT_RESPONSE_HEADER_TIMEOUT=10s
427+ CLIENT_EXPECT_CONTINUE_TIMEOUT=1s
428+ # Providers
429+ ANTHROPIC_API_URL=https://api.anthropic.com/v1
430+ ANTHROPIC_API_KEY=
431+ CLOUDFLARE_API_URL=https://api.cloudflare.com/client/v4/accounts/{ACCOUNT_ID}/ai
432+ CLOUDFLARE_API_KEY=
433+ COHERE_API_URL=https://api.cohere.ai
434+ COHERE_API_KEY=
435+ GROQ_API_URL=https://api.groq.com/openai/v1
436+ GROQ_API_KEY=
437+ OLLAMA_API_URL=http://ollama:8080/v1
438+ OLLAMA_API_KEY=
439+ OPENAI_API_URL=https://api.openai.com/v1
440+ OPENAI_API_KEY=
441+ DEEPSEEK_API_URL=https://api.deepseek.com
442+ DEEPSEEK_API_KEY=
443+ GOOGLE_API_URL=https://generativelanguage.googleapis.com/v1beta/openai
444+ GOOGLE_API_KEY=
445+ MISTRAL_API_URL=https://api.mistral.ai/v1
446+ MISTRAL_API_KEY=
429447```
430448
431449## Configuration Best Practices
0 commit comments