Skip to content

Commit 0399d3c

Browse files
[Search][Playground] Fix loading context limit for EIS model (#225360)
## Summary Updates the playground to properly load the right context token limit when using the EIS model as well as sending the model to the chat endpoint. Additionally updated the backend to load the correct chat parameters for the EIS model. Fixes an issue where a too-large-context error was received from the connector instead of being caught by the playground. Before: ![image](https://github.com/user-attachments/assets/578f841c-3ef7-4ec7-a2b3-d3c03fd8387f) After: ![image](https://github.com/user-attachments/assets/52a6fa9f-d1d6-42ab-acc1-83171bb2eb25) ### Checklist - [ ] Any text added follows [EUI's writing guidelines](https://elastic.github.io/eui/#/guidelines/writing), uses sentence case text and includes [i18n support](https://github.com/elastic/kibana/blob/main/src/platform/packages/shared/kbn-i18n/README.md) - [ ] [Documentation](https://www.elastic.co/guide/en/kibana/master/development-documentation.html) was added for features that require explanation or tutorials - [x] [Unit or functional tests](https://www.elastic.co/guide/en/kibana/master/development-tests.html) were updated or added to match the most common scenarios - [ ] If a plugin configuration key changed, check if it needs to be allowlisted in the cloud and added to the [docker list](https://github.com/elastic/kibana/blob/main/src/dev/build/tasks/os_packages/docker_generator/resources/base/bin/kibana-docker) - [ ] This was checked for breaking HTTP API changes, and any breaking changes have been approved by the breaking-change committee. The `release_note:breaking` label should be applied in these situations. 
- [ ] [Flaky Test Runner](https://ci-stats.kibana.dev/trigger_flaky_test_runner/1) was used on any tests changed - [x] The PR description includes the appropriate Release Notes section, and the correct `release_note:*` label is applied per the [guidelines](https://www.elastic.co/guide/en/kibana/master/contributing.html#kibana-release-notes-process) ## Release note Fixes issue in Search Playground where context limit errors were not handled well when using the Elastic Managed LLM. (cherry picked from commit 34dfd62) # Conflicts: # x-pack/platform/plugins/private/translations/translations/fr-FR.json # x-pack/platform/plugins/private/translations/translations/ja-JP.json # x-pack/platform/plugins/private/translations/translations/zh-CN.json # x-pack/solutions/search/plugins/search_playground/public/hooks/use_llms_models.ts # x-pack/solutions/search/plugins/search_playground/server/lib/get_chat_params.test.ts # x-pack/solutions/search/plugins/search_playground/server/lib/get_chat_params.ts # x-pack/solutions/search/plugins/search_playground/server/routes.ts
1 parent c0a42a2 commit 0399d3c

11 files changed

Lines changed: 140 additions & 25 deletions

File tree

x-pack/platform/plugins/private/translations/translations/fr-FR.json

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -34850,8 +34850,7 @@
3485034850
"xpack.searchPlayground.geminiConnectorTitle": "Gemini",
3485134851
"xpack.searchPlayground.header.view.chat": "Chat",
3485234852
"xpack.searchPlayground.header.view.preview": "Aperçu",
34853-
"xpack.searchPlayground.header.view.query": "Recherche",
34854-
"xpack.searchPlayground.inferenceModel": "{name} (connecteur IA)",
34853+
"xpack.searchPlayground.header.view.query": "Requête",
3485534854
"xpack.searchPlayground.loadConnectorsError": "Erreur lors du chargement des connecteurs. Veuillez vérifier votre configuration et réessayer.",
3485634855
"xpack.searchPlayground.openAIAzureConnectorTitle": "OpenAI Azure",
3485734856
"xpack.searchPlayground.openAIAzureModel": "{name} (Azure OpenAI)",

x-pack/platform/plugins/private/translations/translations/ja-JP.json

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34826,7 +34826,6 @@
3482634826
"xpack.searchPlayground.header.view.chat": "チャット",
3482734827
"xpack.searchPlayground.header.view.preview": "プレビュー",
3482834828
"xpack.searchPlayground.header.view.query": "クエリー",
34829-
"xpack.searchPlayground.inferenceModel": "{name}(AIコネクター)",
3483034829
"xpack.searchPlayground.loadConnectorsError": "コネクターの読み込みエラーです。構成を確認して、再試行してください。",
3483134830
"xpack.searchPlayground.openAIAzureConnectorTitle": "OpenAI Azure",
3483234831
"xpack.searchPlayground.openAIAzureModel": "{name} (Azure OpenAI)",

x-pack/platform/plugins/private/translations/translations/zh-CN.json

Lines changed: 0 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -34885,7 +34885,6 @@
3488534885
"xpack.searchPlayground.header.view.chat": "聊天",
3488634886
"xpack.searchPlayground.header.view.preview": "预览",
3488734887
"xpack.searchPlayground.header.view.query": "查询",
34888-
"xpack.searchPlayground.inferenceModel": "{name}(AI 连接器)",
3488934888
"xpack.searchPlayground.loadConnectorsError": "加载连接器进出错。请检查您的配置,然后重试。",
3489034889
"xpack.searchPlayground.openAIAzureConnectorTitle": "OpenAI Azure",
3489134890
"xpack.searchPlayground.openAIAzureModel": "{name} (Azure OpenAI)",

x-pack/solutions/search/plugins/search_playground/common/models.ts

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -5,6 +5,7 @@
55
* 2.0.
66
*/
77

8+
import { elasticModelIds } from '@kbn/inference-common';
89
import { ModelProvider, LLMs } from './types';
910

1011
export const MODELS: ModelProvider[] = [
@@ -50,4 +51,10 @@ export const MODELS: ModelProvider[] = [
5051
promptTokenLimit: 2097152,
5152
provider: LLMs.gemini,
5253
},
54+
{
55+
name: 'Elastic Managed LLM',
56+
model: elasticModelIds.RainbowSprinkles,
57+
promptTokenLimit: 200000,
58+
provider: LLMs.inference,
59+
},
5360
];

x-pack/solutions/search/plugins/search_playground/public/hooks/use_llms_models.ts

Lines changed: 13 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,8 @@ const mapLlmToModels: Record<
2626
icon: string | ((connector: PlaygroundConnector) => string);
2727
getModels: (
2828
connectorName: string,
29-
includeName: boolean
29+
includeName: boolean,
30+
modelId?: string
3031
) => Array<{ label: string; value?: string; promptTokenLimit?: number }>;
3132
}
3233
> = {
@@ -85,12 +86,11 @@ const mapLlmToModels: Record<
8586
? SERVICE_PROVIDERS[connector.config.provider].icon
8687
: '';
8788
},
88-
getModels: (connectorName) => [
89+
getModels: (connectorName, _, modelId) => [
8990
{
90-
label: i18n.translate('xpack.searchPlayground.inferenceModel', {
91-
defaultMessage: '{name}',
92-
values: { name: connectorName },
93-
}),
91+
label: connectorName,
92+
value: modelId,
93+
promptTokenLimit: MODELS.find((m) => m.model === modelId)?.promptTokenLimit,
9494
},
9595
],
9696
},
@@ -126,7 +126,13 @@ export const useLLMsModels = (): LLMModel[] => {
126126
return [
127127
...result,
128128
...llmParams
129-
.getModels(connector.name, false)
129+
.getModels(
130+
connector.name,
131+
false,
132+
isInferenceActionConnector(connector)
133+
? connector.config?.providerConfig?.model_id
134+
: undefined
135+
)
130136
.map(({ label, value, promptTokenLimit }) => ({
131137
id: connector?.id + label,
132138
name: label,

x-pack/solutions/search/plugins/search_playground/public/providers/form_provider.tsx

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -84,6 +84,7 @@ export const FormProvider: React.FC<React.PropsWithChildren<FormProviderProps>>
8484
}, [form, storage]);
8585

8686
useEffect(() => {
87+
if (models.length === 0) return; // don't continue if there are no models
8788
const defaultModel = models.find((model) => !model.disabled);
8889
const currentModel = form.getValues(ChatFormFields.summarizationModel);
8990

x-pack/solutions/search/plugins/search_playground/public/types.ts

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -231,6 +231,12 @@ export interface LLMModel {
231231

232232
export type { ActionConnector, UserConfiguredActionConnector };
233233
export type InferenceActionConnector = ActionConnector & {
234-
config: { provider: ServiceProviderKeys; inferenceId: string };
234+
config: {
235+
providerConfig?: {
236+
model_id?: string;
237+
};
238+
provider: ServiceProviderKeys;
239+
inferenceId: string;
240+
};
235241
};
236242
export type PlaygroundConnector = ActionConnector & { title: string; type: LLMs };

x-pack/solutions/search/plugins/search_playground/server/lib/get_chat_params.test.ts

Lines changed: 64 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -20,6 +20,7 @@ import {
2020
import { Prompt, QuestionRewritePrompt } from '../../common/prompt';
2121
import { KibanaRequest, Logger } from '@kbn/core/server';
2222
import { PluginStartContract as ActionsPluginStartContract } from '@kbn/actions-plugin/server';
23+
import { elasticModelIds } from '@kbn/inference-common';
2324

2425
jest.mock('@kbn/langchain/server', () => {
2526
const original = jest.requireActual('@kbn/langchain/server');
@@ -230,4 +231,67 @@ describe('getChatParams', () => {
230231
});
231232
expect(result.chatPrompt).toContain('How does it work?');
232233
});
234+
235+
it('returns the correct params for the EIS connector', async () => {
236+
const mockConnector = {
237+
id: 'elastic-llm',
238+
actionTypeId: INFERENCE_CONNECTOR_ID,
239+
config: {
240+
providerConfig: {
241+
model_id: elasticModelIds.RainbowSprinkles,
242+
},
243+
},
244+
};
245+
mockActionsClient.get.mockResolvedValue(mockConnector);
246+
247+
const result = await getChatParams(
248+
{
249+
connectorId: 'elastic-llm',
250+
prompt: 'How does it work?',
251+
citations: false,
252+
},
253+
{ actions, request, logger }
254+
);
255+
256+
expect(result).toMatchObject({
257+
connector: mockConnector,
258+
summarizationModel: elasticModelIds.RainbowSprinkles,
259+
});
260+
261+
expect(Prompt).toHaveBeenCalledWith('How does it work?', {
262+
citations: false,
263+
context: true,
264+
type: 'openai',
265+
});
266+
expect(QuestionRewritePrompt).toHaveBeenCalledWith({
267+
type: 'openai',
268+
});
269+
});
270+
271+
it('it returns provided model with EIS connector', async () => {
272+
const mockConnector = {
273+
id: 'elastic-llm',
274+
actionTypeId: INFERENCE_CONNECTOR_ID,
275+
config: {
276+
providerConfig: {
277+
model_id: elasticModelIds.RainbowSprinkles,
278+
},
279+
},
280+
};
281+
mockActionsClient.get.mockResolvedValue(mockConnector);
282+
283+
const result = await getChatParams(
284+
{
285+
connectorId: 'elastic-llm',
286+
model: 'foo-bar',
287+
prompt: 'How does it work?',
288+
citations: false,
289+
},
290+
{ actions, request, logger }
291+
);
292+
293+
expect(result).toMatchObject({
294+
summarizationModel: 'foo-bar',
295+
});
296+
});
233297
});

x-pack/solutions/search/plugins/search_playground/server/lib/get_chat_params.ts

Lines changed: 16 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -21,6 +21,7 @@ import {
2121
import { GEMINI_CONNECTOR_ID } from '@kbn/stack-connectors-plugin/common/gemini/constants';
2222
import { INFERENCE_CONNECTOR_ID } from '@kbn/stack-connectors-plugin/common/inference/constants';
2323
import { Prompt, QuestionRewritePrompt } from '../../common/prompt';
24+
import { isEISConnector } from '../utils/eis';
2425

2526
export const getChatParams = async (
2627
{
@@ -43,9 +44,11 @@ export const getChatParams = async (
4344
chatPrompt: string;
4445
questionRewritePrompt: string;
4546
connector: Connector;
47+
summarizationModel?: string;
4648
}> => {
4749
const abortController = new AbortController();
4850
const abortSignal = abortController.signal;
51+
let summarizationModel = model;
4952
const actionsClient = await actions.getActionsClientWithRequest(request);
5053
const connector = await actionsClient.get({ id: connectorId });
5154
let chatModel;
@@ -55,12 +58,17 @@ export const getChatParams = async (
5558

5659
switch (connector.actionTypeId) {
5760
case INFERENCE_CONNECTOR_ID:
61+
if (isEISConnector(connector)) {
62+
if (!summarizationModel && connector.config?.providerConfig?.model_id) {
63+
summarizationModel = connector.config?.providerConfig?.model_id;
64+
}
65+
}
5866
llmType = 'inference';
5967
chatModel = new ActionsClientChatOpenAI({
6068
actionsClient,
6169
logger,
6270
connectorId,
63-
model: connector?.config?.defaultModel,
71+
model: summarizationModel || connector?.config?.defaultModel,
6472
llmType,
6573
temperature: getDefaultArguments(llmType).temperature,
6674
// prevents the agent from retrying on failure
@@ -146,5 +154,11 @@ export const getChatParams = async (
146154
throw new Error('Invalid connector id');
147155
}
148156

149-
return { chatModel, chatPrompt, questionRewritePrompt, connector };
157+
return {
158+
chatModel,
159+
chatPrompt,
160+
questionRewritePrompt,
161+
connector,
162+
summarizationModel: summarizationModel || connector?.config?.defaultModel,
163+
};
150164
};

x-pack/solutions/search/plugins/search_playground/server/routes.ts

Lines changed: 12 additions & 11 deletions
Original file line numberDiff line numberDiff line change
@@ -115,15 +115,16 @@ export function defineRoutes({
115115
es_client: client.asCurrentUser,
116116
} as AssistClientOptionsWithClient);
117117
const { messages, data } = request.body;
118-
const { chatModel, chatPrompt, questionRewritePrompt, connector } = await getChatParams(
119-
{
120-
connectorId: data.connector_id,
121-
model: data.summarization_model,
122-
citations: data.citations,
123-
prompt: data.prompt,
124-
},
125-
{ actions, logger, request }
126-
);
118+
const { chatModel, chatPrompt, questionRewritePrompt, connector, summarizationModel } =
119+
await getChatParams(
120+
{
121+
connectorId: data.connector_id,
122+
model: data.summarization_model,
123+
citations: data.citations,
124+
prompt: data.prompt,
125+
},
126+
{ actions, logger, request }
127+
);
127128

128129
let sourceFields = {};
129130

@@ -139,7 +140,7 @@ export function defineRoutes({
139140
throw Error(e);
140141
}
141142

142-
const model = MODELS.find((m) => m.model === data.summarization_model);
143+
const model = MODELS.find((m) => m.model === summarizationModel);
143144
const modelPromptLimit = model?.promptTokenLimit;
144145

145146
const chain = ConversationalChain({
@@ -162,7 +163,7 @@ export function defineRoutes({
162163
connectorType:
163164
connector.actionTypeId +
164165
(connector.config?.apiProvider ? `-${connector.config.apiProvider}` : ''),
165-
model: data.summarization_model ?? '',
166+
model: summarizationModel ?? '',
166167
isCitationsEnabled: data.citations,
167168
});
168169

0 commit comments

Comments
 (0)