Commit 768a9d6

Backport: feat (provider/gateway): add get-generation support (#13870)

This is an automated backport of #13842 to the release-v6.0 branch. FYI @shaper

Co-authored-by: Walter Korman <shaper@vercel.com>

1 parent f07a378 · commit 768a9d6

File tree: 7 files changed, +566 -0 lines

.changeset/brown-coats-obey.md

Lines changed: 5 additions & 0 deletions

---
"@ai-sdk/gateway": patch
---

feat (provider/gateway): add get-generation support

content/providers/01-ai-sdk-providers/00-ai-gateway.mdx

Lines changed: 80 additions & 0 deletions

@@ -238,6 +238,86 @@ The `getCredits()` method returns your team's credit information based on the au

- **balance** _number_ - Your team's current available credit balance
- **total_used** _number_ - Total credits consumed by your team

## Generation Lookup

Look up detailed information about a specific generation by its ID, including cost, token usage, latency, and provider details. Generation IDs are available in `providerMetadata.gateway.generationId` on both `generateText` and `streamText` responses.

When streaming, the generation ID is injected on the first content chunk, so you can capture it early in the stream without waiting for completion. This is especially useful when a network interruption or mid-stream error could prevent you from receiving the final response: since the gateway records the final status server-side, you can use the generation ID to look up the results (including cost, token usage, and finish reason) later via `getGenerationInfo()`.
```ts
import { gateway, generateText } from 'ai';

// Make a request
const result = await generateText({
  model: gateway('anthropic/claude-sonnet-4'),
  prompt: 'Explain quantum entanglement briefly',
});

// Get the generation ID from provider metadata
const generationId = result.providerMetadata?.gateway?.generationId;

// Look up detailed generation info
const generation = await gateway.getGenerationInfo({ id: generationId });

console.log(`Model: ${generation.model}`);
console.log(`Cost: $${generation.totalCost.toFixed(6)}`);
console.log(`Latency: ${generation.latency}ms`);
console.log(`Prompt tokens: ${generation.promptTokens}`);
console.log(`Completion tokens: ${generation.completionTokens}`);
```
With `streamText`, you can capture the generation ID from the first chunk via `fullStream`:

```ts
import { gateway, streamText } from 'ai';

const result = streamText({
  model: gateway('anthropic/claude-sonnet-4'),
  prompt: 'Explain quantum entanglement briefly',
});

let generationId: string | undefined;

for await (const part of result.fullStream) {
  if (!generationId && part.providerMetadata?.gateway?.generationId) {
    generationId = part.providerMetadata.gateway.generationId as string;
    console.log(`Generation ID (early): ${generationId}`);
  }
}

// Look up cost and usage after the stream completes
if (generationId) {
  const generation = await gateway.getGenerationInfo({ id: generationId });
  console.log(`Cost: $${generation.totalCost.toFixed(6)}`);
  console.log(`Finish reason: ${generation.finishReason}`);
}
```
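The capture-then-survive-an-interruption pattern can be factored into a small helper. This is a hypothetical sketch, not part of the SDK: it consumes any `fullStream`-like async iterable, records the first generation ID it sees, and keeps that ID even if the stream errors mid-way, so the lookup can still happen later.

```typescript
// Hypothetical helper (not part of the AI SDK): capture the generation ID
// from the earliest chunk that carries it, tolerating mid-stream failures.
type StreamPart = {
  providerMetadata?: { gateway?: { generationId?: string } };
};

async function captureGenerationId(
  stream: AsyncIterable<StreamPart>,
): Promise<{ generationId?: string; streamError?: unknown }> {
  let generationId: string | undefined;
  try {
    for await (const part of stream) {
      // The gateway injects the ID on the first content chunk.
      generationId ??= part.providerMetadata?.gateway?.generationId;
    }
  } catch (streamError) {
    // Mid-stream failure: the gateway records the final status
    // server-side, so the captured ID remains usable for a later lookup.
    return { generationId, streamError };
  }
  return { generationId };
}
```

Even when `streamError` is set, the returned `generationId` can be passed to `getGenerationInfo()` to recover cost, usage, and finish reason.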
The `getGenerationInfo()` method accepts:

- **id** _string_ - The generation ID to look up (format: `gen_<ulid>`, required)

It returns a `GatewayGenerationInfo` object with the following fields:

- **id** _string_ - The generation ID
- **totalCost** _number_ - Total cost in USD
- **upstreamInferenceCost** _number_ - Upstream inference cost in USD (relevant for BYOK)
- **usage** _number_ - Usage cost in USD (same as totalCost)
- **createdAt** _string_ - ISO 8601 timestamp when the generation was created
- **model** _string_ - Model identifier used
- **isByok** _boolean_ - Whether Bring Your Own Key credentials were used
- **providerName** _string_ - The provider that served this generation
- **streamed** _boolean_ - Whether streaming was used
- **finishReason** _string_ - Finish reason (e.g. `'stop'`)
- **latency** _number_ - Time to first token in milliseconds
- **generationTime** _number_ - Total generation time in milliseconds
- **promptTokens** _number_ - Number of prompt tokens
- **completionTokens** _number_ - Number of completion tokens
- **reasoningTokens** _number_ - Reasoning tokens used (if applicable)
- **cachedTokens** _number_ - Cached tokens used (if applicable)
- **cacheCreationTokens** _number_ - Cache creation input tokens
- **billableWebSearchCalls** _number_ - Number of billable web search calls
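For reference, the field list above can be collected into a TypeScript interface. This is a sketch inferred from the documented fields, not the SDK's actual exported declaration, but it is useful for typing your own wrappers around the lookup:

```typescript
// Sketch of the documented return shape (inferred, not the SDK's own type).
interface GatewayGenerationInfo {
  id: string;
  totalCost: number;
  upstreamInferenceCost: number;
  usage: number;
  createdAt: string; // ISO 8601 timestamp
  model: string;
  isByok: boolean;
  providerName: string;
  streamed: boolean;
  finishReason: string;
  latency: number; // time to first token, ms
  generationTime: number; // total generation time, ms
  promptTokens: number;
  completionTokens: number;
  reasoningTokens: number;
  cachedTokens: number;
  cacheCreationTokens: number;
  billableWebSearchCalls: number;
}
```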
## Examples

### Basic Text Generation
Lines changed: 33 additions & 0 deletions

import { gateway, streamText } from 'ai';
import { run } from '../lib/run';

run(async () => {
  const result = streamText({
    model: gateway('anthropic/claude-haiku-4.5'),
    prompt: 'What animals are relatives of the tenrec?',
  });

  result.consumeStream();
  console.log('Response:', await result.text);
  console.log('Token usage:', await result.usage);
  const providerMetadata = await result.providerMetadata;
  console.log('Provider metadata:', JSON.stringify(providerMetadata, null, 2));

  const generationId = (
    providerMetadata?.gateway as { generationId?: string } | undefined
  )?.generationId;

  if (!generationId) {
    console.log('No generation ID found in provider metadata.');
    return;
  }

  console.log(`\nGeneration ID: ${generationId}`);

  console.log('\nWaiting briefly for generation data to become available...');
  await new Promise(resolve => setTimeout(resolve, 30_000));

  console.log('\n--- Generation Details ---\n');
  const generation = await gateway.getGenerationInfo({ id: generationId });
  console.log(JSON.stringify(generation, null, 2));
});
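The fixed 30-second sleep above is simple but either over- or under-waits. A hypothetical retry helper (not part of the SDK; it assumes the lookup rejects until the generation record becomes queryable) could poll with bounded attempts instead:

```typescript
// Hypothetical helper: retry an async lookup until it succeeds or the
// attempt budget is exhausted, instead of sleeping a fixed interval.
async function pollUntilAvailable<T>(
  lookup: () => Promise<T>,
  { attempts = 10, delayMs = 3_000 }: { attempts?: number; delayMs?: number } = {},
): Promise<T> {
  let lastError: unknown;
  for (let i = 0; i < attempts; i++) {
    try {
      return await lookup();
    } catch (error) {
      lastError = error;
      // Wait before retrying; the record may not be queryable immediately.
      await new Promise(resolve => setTimeout(resolve, delayMs));
    }
  }
  throw lastError;
}
```

Usage would look like `await pollUntilAvailable(() => gateway.getGenerationInfo({ id: generationId }))`, returning as soon as the record is available.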
Lines changed: 268 additions & 0 deletions

import { createTestServer } from '@ai-sdk/test-server/with-vitest';
import { describe, expect, it, vi } from 'vitest';
import { GatewayGenerationInfoFetcher } from './gateway-generation-info';
import type { FetchFunction } from '@ai-sdk/provider-utils';
import {
  GatewayAuthenticationError,
  GatewayInternalServerError,
  GatewayResponseError,
} from './errors';

function createFetcher({
  headers,
  fetch,
}: {
  headers?: () => Record<string, string>;
  fetch?: FetchFunction;
} = {}) {
  return new GatewayGenerationInfoFetcher({
    baseURL: 'https://api.example.com',
    headers: headers ?? (() => ({ Authorization: 'Bearer test-token' })),
    fetch,
  });
}

const mockGenerationResponse = {
  data: {
    id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
    total_cost: 0.00123,
    upstream_inference_cost: 0.0011,
    usage: 0.00123,
    created_at: '2024-01-01T00:00:00.000Z',
    model: 'gpt-4',
    is_byok: false,
    provider_name: 'openai',
    streamed: true,
    finish_reason: 'stop',
    latency: 200,
    generation_time: 1500,
    native_tokens_prompt: 100,
    native_tokens_completion: 50,
    native_tokens_reasoning: 0,
    native_tokens_cached: 0,
    native_tokens_cache_creation: 0,
    billable_web_search_calls: 0,
  },
};

describe('GatewayGenerationInfoFetcher', () => {
  const server = createTestServer({
    'https://api.example.com/*': {
      response: {
        type: 'json-value',
        body: mockGenerationResponse,
      },
    },
  });

  describe('getGenerationInfo', () => {
    it('should fetch from the correct endpoint with generation ID', async () => {
      const fetcher = createFetcher();

      await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect(server.calls[0].requestMethod).toBe('GET');
      const url = new URL(server.calls[0].requestUrl);
      expect(url.pathname).toBe('/v1/generation');
      expect(url.searchParams.get('id')).toBe('gen_01ARZ3NDEKTSV4RRFFQ69G5FAV');
    });

    it('should transform snake_case response fields to camelCase', async () => {
      const fetcher = createFetcher();

      const result = await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect(result).toEqual({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
        totalCost: 0.00123,
        upstreamInferenceCost: 0.0011,
        usage: 0.00123,
        createdAt: '2024-01-01T00:00:00.000Z',
        model: 'gpt-4',
        isByok: false,
        providerName: 'openai',
        streamed: true,
        finishReason: 'stop',
        latency: 200,
        generationTime: 1500,
        promptTokens: 100,
        completionTokens: 50,
        reasoningTokens: 0,
        cachedTokens: 0,
        cacheCreationTokens: 0,
        billableWebSearchCalls: 0,
      });
    });

    it('should unwrap the data envelope', async () => {
      const fetcher = createFetcher();

      const result = await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      // Result should be the data object directly, not { data: ... }
      expect('data' in result).toBe(false);
      expect(result.id).toBe('gen_01ARZ3NDEKTSV4RRFFQ69G5FAV');
    });

    it('should not have snake_case fields in result', async () => {
      const fetcher = createFetcher();

      const result = await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect('total_cost' in result).toBe(false);
      expect('is_byok' in result).toBe(false);
      expect('provider_name' in result).toBe(false);
      expect('created_at' in result).toBe(false);
      expect('generation_time' in result).toBe(false);
      expect('finish_reason' in result).toBe(false);
    });

    it('should pass headers correctly', async () => {
      const fetcher = createFetcher({
        headers: () => ({
          Authorization: 'Bearer custom-token',
          'Custom-Header': 'custom-value',
        }),
      });

      await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect(server.calls[0].requestHeaders).toEqual({
        authorization: 'Bearer custom-token',
        'custom-header': 'custom-value',
      });
    });

    it('should handle 401 authentication errors', async () => {
      server.urls['https://api.example.com/*'].response = {
        type: 'error',
        status: 401,
        body: JSON.stringify({
          error: {
            message: 'Unauthorized',
            type: 'authentication_error',
          },
        }),
      };

      const fetcher = createFetcher();

      try {
        await fetcher.getGenerationInfo({
          id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
        });
        expect.fail('Should have thrown an error');
      } catch (error) {
        expect(GatewayAuthenticationError.isInstance(error)).toBe(true);
        const authError = error as GatewayAuthenticationError;
        expect(authError.statusCode).toBe(401);
      }
    });

    it('should handle 500 internal server errors', async () => {
      server.urls['https://api.example.com/*'].response = {
        type: 'error',
        status: 500,
        body: JSON.stringify({
          error: {
            message: 'Failed to retrieve usage data',
            type: 'internal_server_error',
          },
        }),
      };

      const fetcher = createFetcher();

      await expect(
        fetcher.getGenerationInfo({
          id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
        }),
      ).rejects.toThrow(GatewayInternalServerError);
    });

    it('should handle malformed JSON error responses', async () => {
      server.urls['https://api.example.com/*'].response = {
        type: 'error',
        status: 500,
        body: '{ invalid json',
      };

      const fetcher = createFetcher();

      try {
        await fetcher.getGenerationInfo({
          id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
        });
        expect.fail('Should have thrown an error');
      } catch (error) {
        expect(GatewayResponseError.isInstance(error)).toBe(true);
        const responseError = error as GatewayResponseError;
        expect(responseError.statusCode).toBe(500);
      }
    });

    it('should use custom fetch function when provided', async () => {
      const mockFetch = vi.fn().mockResolvedValue(
        new Response(JSON.stringify(mockGenerationResponse), {
          status: 200,
          headers: { 'Content-Type': 'application/json' },
        }),
      );

      const fetcher = createFetcher({ fetch: mockFetch });

      const result = await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect(mockFetch).toHaveBeenCalled();
      expect(result.totalCost).toBe(0.00123);
      expect(result.model).toBe('gpt-4');
    });

    it('should encode special characters in generation ID', async () => {
      const fetcher = createFetcher();

      await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      const url = new URL(server.calls[0].requestUrl);
      expect(url.searchParams.get('id')).toBe('gen_01ARZ3NDEKTSV4RRFFQ69G5FAV');
    });

    it('should handle BYOK generation response', async () => {
      server.urls['https://api.example.com/*'].response = {
        type: 'json-value',
        body: {
          data: {
            ...mockGenerationResponse.data,
            is_byok: true,
            upstream_inference_cost: 0.0009,
            provider_name: 'anthropic',
            model: 'claude-sonnet-4',
          },
        },
      };

      const fetcher = createFetcher();
      const result = await fetcher.getGenerationInfo({
        id: 'gen_01ARZ3NDEKTSV4RRFFQ69G5FAV',
      });

      expect(result.isByok).toBe(true);
      expect(result.upstreamInferenceCost).toBe(0.0009);
      expect(result.providerName).toBe('anthropic');
    });
  });
});
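Note that the transformation these tests verify is not a mechanical snake_case-to-camelCase rename: `native_tokens_prompt` becomes `promptTokens`, not `nativeTokensPrompt`, so the fetcher presumably maps fields explicitly. A minimal sketch of such a mapping, with hypothetical names and only a few fields shown:

```typescript
// Hypothetical sketch (names are illustrative, not the SDK's internals):
// an explicit field-by-field mapping from the wire format to the
// camelCase result shape the tests above assert on.
type RawGeneration = {
  id: string;
  total_cost: number;
  finish_reason: string;
  native_tokens_prompt: number;
  native_tokens_completion: number;
  // ...remaining snake_case fields omitted for brevity
};

function transformGeneration(raw: RawGeneration) {
  return {
    id: raw.id,
    totalCost: raw.total_cost,
    finishReason: raw.finish_reason,
    // Token fields are renamed outright, not just re-cased:
    promptTokens: raw.native_tokens_prompt,
    completionTokens: raw.native_tokens_completion,
  };
}
```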
