From f41f32e5aac0c22137f5c1f90a1757125aa18bd9 Mon Sep 17 00:00:00 2001
From: Photon101 <123910806+Photon101@users.noreply.github.com>
Date: Wed, 13 May 2026 06:50:42 +0100
Subject: [PATCH] feat(ai): integrate Fireworks adapter

---
 packages/ai/fireworks/src/index.test.ts | 76 +++++++++++++++++++++++++
 packages/ai/fireworks/src/index.ts      | 50 ++++++++++++++--
 2 files changed, 120 insertions(+), 6 deletions(-)
diff --git a/packages/ai/fireworks/src/index.test.ts b/packages/ai/fireworks/src/index.test.ts
index f43ad207..329a621e 100644
--- a/packages/ai/fireworks/src/index.test.ts
+++ b/packages/ai/fireworks/src/index.test.ts
@@ -1,4 +1,80 @@
 import { smokeTest } from '@profullstack/sh1pt-core/testing';
+import { afterEach, describe, expect, it, vi } from 'vitest';
 import adapter from './index.js';
 
 smokeTest(adapter, { idPrefix: 'ai' });
+
+const ctx = (secrets: Record<string, string> = { FIREWORKS_API_KEY: 'test-key' }, dryRun = false) => ({
+  secret: (key: string) => secrets[key],
+  log: () => {},
+  dryRun,
+});
+
+describe('Fireworks AI OpenAI-compatible generation', () => {
+  afterEach(() => {
+    vi.unstubAllGlobals();
+  });
+
+  it('short-circuits dry-run before network calls', async () => {
+    const fetchMock = vi.fn();
+    vi.stubGlobal('fetch', fetchMock);
+
+    const result = await adapter.generate(ctx({ FIREWORKS_API_KEY: 'test-key' }, true), 'hello', {}, {});
+
+    expect(result).toEqual({ text: '[dry-run]', model: 'accounts/fireworks/models/deepseek-v3p2' });
+    expect(fetchMock).not.toHaveBeenCalled();
+  });
+
+  it('posts chat completions requests and maps usage tokens', async () => {
+    const fetchMock = vi.fn().mockResolvedValue({
+      ok: true,
+      json: async () => ({
+        choices: [{ message: { content: 'hi from fireworks' } }],
+        model: 'accounts/fireworks/models/llama-v3p3-70b-instruct',
+        usage: { prompt_tokens: 10, completion_tokens: 4 },
+      }),
+    });
+    vi.stubGlobal('fetch', fetchMock);
+
+    const result = await adapter.generate(ctx(), 'hello', {
+      model: 'accounts/fireworks/models/llama-v3p3-70b-instruct',
+      system: 'be brief',
+      maxTokens: 20,
+      temperature: 0.2,
+      extra: { response_format: { type: 'json_object' } },
+    }, {});
+
+    expect(fetchMock).toHaveBeenCalledOnce();
+    const call = fetchMock.mock.calls[0];
+    expect(call).toBeDefined();
+    const [url, request] = call!;
+    expect(url).toBe('https://api.fireworks.ai/inference/v1/chat/completions');
+    expect(request.headers.authorization).toBe('Bearer test-key');
+    expect(JSON.parse(request.body)).toEqual({
+      model: 'accounts/fireworks/models/llama-v3p3-70b-instruct',
+      messages: [
+        { role: 'system', content: 'be brief' },
+        { role: 'user', content: 'hello' },
+      ],
+      max_tokens: 20,
+      temperature: 0.2,
+      response_format: { type: 'json_object' },
+    });
+    expect(result).toEqual({
+      text: 'hi from fireworks',
+      model: 'accounts/fireworks/models/llama-v3p3-70b-instruct',
+      inputTokens: 10,
+      outputTokens: 4,
+    });
+  });
+
+  it('includes status and response body excerpt on errors', async () => {
+    vi.stubGlobal('fetch', vi.fn().mockResolvedValue({
+      ok: false,
+      status: 429,
+      text: async () => 'rate limited'.repeat(30),
+    }));
+
+    await expect(adapter.generate(ctx(), 'hello', {}, {})).rejects.toThrow(/Fireworks AI 429: rate limited/);
+  });
+});
diff --git a/packages/ai/fireworks/src/index.ts b/packages/ai/fireworks/src/index.ts
index 636abf12..36afc6df 100644
--- a/packages/ai/fireworks/src/index.ts
+++ b/packages/ai/fireworks/src/index.ts
@@ -4,17 +4,55 @@ interface Config {
   baseUrl?: string;
 }
 
+const DEFAULT_BASE = 'https://api.fireworks.ai/inference/v1';
+
 export default defineAi<Config>({
   id: 'ai-fireworks',
   label: 'Fireworks AI',
-  defaultModel: 'accounts/fireworks/models/llama-v3p3-70b-instruct',
-  models: ['accounts/fireworks/models/llama-v3p3-70b-instruct'],
+  defaultModel: 'accounts/fireworks/models/deepseek-v3p2',
+  models: [
+    'accounts/fireworks/models/deepseek-v3p2',
+    'accounts/fireworks/models/deepseek-r1',
+    'accounts/fireworks/models/llama-v3p3-70b-instruct',
+  ],
 
-  async generate(ctx, prompt, _opts, _config) {
+  async generate(ctx, prompt, opts, config) {
     const apiKey = ctx.secret('FIREWORKS_API_KEY');
-    if (!apiKey) throw new Error('FIREWORKS_API_KEY not in vault — run `sh1pt promote ai setup`');
-    ctx.log(`[stub] ai-fireworks · ${prompt.length} chars in — integration pending`);
-    return { text: '[stub — ai-fireworks integration not yet implemented]', model: 'accounts/fireworks/models/llama-v3p3-70b-instruct' };
+    if (!apiKey) throw new Error('FIREWORKS_API_KEY not in vault');
+    const model = opts.model ?? 'accounts/fireworks/models/deepseek-v3p2';
+    ctx.log(`fireworks · model=${model} · ${prompt.length} chars in`);
+    if (ctx.dryRun) return { text: '[dry-run]', model };
+
+    const messages: Array<{ role: string; content: string }> = [];
+    if (opts.system) messages.push({ role: 'system', content: opts.system });
+    messages.push({ role: 'user', content: prompt });
+
+    const res = await fetch(`${config.baseUrl ?? DEFAULT_BASE}/chat/completions`, {
+      method: 'POST',
+      headers: {
+        authorization: `Bearer ${apiKey}`,
+        'content-type': 'application/json',
+      },
+      body: JSON.stringify({
+        model,
+        messages,
+        ...(opts.maxTokens !== undefined ? { max_tokens: opts.maxTokens } : {}),
+        ...(opts.temperature !== undefined ? { temperature: opts.temperature } : {}),
+        ...opts.extra,
+      }),
+    });
+    if (!res.ok) throw new Error(`Fireworks AI ${res.status}: ${(await res.text()).slice(0, 200)}`);
+    const data = (await res.json()) as {
+      choices: Array<{ message?: { content?: string } }>;
+      model: string;
+      usage?: { prompt_tokens?: number; completion_tokens?: number };
+    };
+    return {
+      text: data.choices[0]?.message?.content ?? '',
+      model: data.model,
+      inputTokens: data.usage?.prompt_tokens,
+      outputTokens: data.usage?.completion_tokens,
+    };
   },
 
   setup: tokenSetup<Config>({