Add Together AI model discovery with dynamic API key support

2026-01-26 16:07:09 +01:00 · 2026-01-26 16:07:09 +01:00 · 7d4d53366e
commit 7d4d53366e
parent 39cd9102c1
4 changed files with 221 additions and 117 deletions
--- a/src/agents/models-config.providers.ts
+++ b/src/agents/models-config.providers.ts
@ -13,6 +13,7 @@ import {
  SYNTHETIC_MODEL_CATALOG,
 } from "./synthetic-models.js";
 import { discoverVeniceModels, VENICE_BASE_URL } from "./venice-models.js";
+import { discoverTogetherModels, TOGETHER_BASE_URL } from "./together-models.js";

 type ModelsConfig = NonNullable<ClawdbotConfig["models"]>;
 export type ProviderConfig = NonNullable<ModelsConfig["providers"]>[string];
@ -359,110 +360,16 @@ async function buildOllamaProvider(): Promise<ProviderConfig> {
  };
 }

-function buildTogetherProvider(): ProviderConfig {
+async function buildTogetherProvider(apiKey?: string): Promise<ProviderConfig> {
+  // Only query the Together API when an API key is available; without one the model list is empty.
+  const models = apiKey ? await discoverTogetherModels(apiKey) : [];
+
+  // discoverTogetherModels() reports failure as an empty array, so `models` may be empty here too.
+  // NOTE(review): no static catalog is applied in this function — confirm a caller supplies one.
  return {
-    baseUrl: "https://api.together.xyz/v1",
+    baseUrl: TOGETHER_BASE_URL,
    api: "openai-completions",
-    models: [
-      {
-        id: "meta-llama/Llama-3.3-70B-Instruct-Turbo",
-        name: "Llama 3.3 70B Instruct Turbo",
-        reasoning: false,
-        input: ["text"],
-        contextWindow: 131072,
-        maxTokens: 8192,
-        cost: {
-          input: 0.88,
-          output: 0.88,
-          cacheRead: 0.88,
-          cacheWrite: 0.88,
-        },
-      },
-      {
-        id: "meta-llama/Llama-4-Scout-17B-16E-Instruct",
-        name: "Llama 4 Scout 17B 16E Instruct",
-        reasoning: false,
-        input: ["text", "image"],
-        contextWindow: 10000000,
-        maxTokens: 32768,
-        cost: {
-          input: 0.18,
-          output: 0.59,
-          cacheRead: 0.18,
-          cacheWrite: 0.18,
-        },
-      },
-      {
-        id: "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
-        name: "Llama 4 Maverick 17B 128E Instruct FP8",
-        reasoning: false,
-        input: ["text", "image"],
-        contextWindow: 20000000,
-        maxTokens: 32768,
-        cost: {
-          input: 0.27,
-          output: 0.85,
-          cacheRead: 0.27,
-          cacheWrite: 0.27,
-        },
-      },
-      {
-        id: "deepseek-ai/DeepSeek-V3.1",
-        name: "DeepSeek V3.1",
-        reasoning: false,
-        input: ["text"],
-        contextWindow: 131072,
-        maxTokens: 8192,
-        cost: {
-          input: 0.6,
-          output: 1.25,
-          cacheRead: 0.6,
-          cacheWrite: 0.6,
-        },
-      },
-      {
-        id: "deepseek-ai/DeepSeek-R1",
-        name: "DeepSeek R1",
-        reasoning: true,
-        input: ["text"],
-        contextWindow: 131072,
-        maxTokens: 8192,
-        cost: {
-          input: 3.0,
-          output: 7.0,
-          cacheRead: 3.0,
-          cacheWrite: 3.0,
-        },
-      },
-      {
-        id: "Qwen/Qwen2.5-72B-Instruct-Turbo",
-        name: "Qwen 2.5 72B Instruct Turbo",
-        reasoning: false,
-        input: ["text"],
-        contextWindow: 131072,
-        maxTokens: 8192,
-        cost: {
-          input: 0.35,
-          output: 0.8,
-          cacheRead: 0.35,
-          cacheWrite: 0.35,
-        },
-      },
-      {
-        id: "mistralai/Mixtral-8x7B-Instruct-v0.1",
-        name: "Mixtral 8x7B Instruct v0.1",
-        reasoning: false,
-        input: ["text"],
-        contextWindow: 32768,
-        maxTokens: 8192,
-        cost: {
-          input: 0.6,
-          output: 0.6,
-          cacheRead: 0.6,
-          cacheWrite: 0.6,
-        },
-      },
-    ],
+    models,
  };
 }

@ -529,7 +436,7 @@ export async function resolveImplicitProviders(params: {
    resolveEnvApiKeyVarName("together") ??
    resolveApiKeyFromProfiles({ provider: "together", store: authStore });
  if (togetherKey) {
-    providers.together = { ...buildTogetherProvider(), apiKey: togetherKey };
+    providers.together = { ...(await buildTogetherProvider(togetherKey)), apiKey: togetherKey };
  }

  return providers;
--- a/src/agents/together-models.ts
+++ b/src/agents/together-models.ts
@ -0,0 +1,178 @@
+import type { ModelDefinitionConfig } from "../config/types.models.js";
+
+export const TOGETHER_BASE_URL = "https://api.together.xyz/v1"; // discovery requests `<base>/models`
+
+// Together AI uses token-based pricing.
+// Fallback cost values used when a model's API entry carries no usable pricing.
+export const TOGETHER_DEFAULT_COST = {
+  input: 0.5,
+  output: 0.5,
+  cacheRead: 0.5,
+  cacheWrite: 0.5,
+};
+
+// Shape of one entry in the Together AI /models response, as consumed by discoverTogetherModels.
+interface TogetherModel {
+  id: string;
+  name?: string; // display fallback when display_name is absent
+  display_name?: string; // preferred display name
+  description?: string; // searched for "reasoning" / "vision" keywords
+  context_length?: number; // becomes contextWindow; 131072 is used when missing
+  tokenizer?: string;
+  type?: string; // only entries with type "chat" are kept
+  capabilities?: {
+    vision?: boolean; // enables "image" input
+    function_calling?: boolean;
+    tool_use?: boolean;
+  };
+  pricing?: {
+    input?: number; // also used as the cacheRead cost
+    output?: number; // also used as the cacheWrite cost
+  };
+}
+
+/**
+ * Discover chat models from the Together AI `/models` endpoint.
+ *
+ * The endpoint requires authentication, so pass an API key.
+ *
+ * This function never throws. A test environment, an HTTP error, a timeout,
+ * or a malformed payload are all reported as an empty array, so callers that
+ * want a fallback catalog must check for an empty result; a surrounding
+ * try/catch will not fire.
+ *
+ * @param apiKey - Together AI API key, sent as a Bearer token when provided.
+ * @returns The discovered chat models, or `[]` when discovery is skipped or fails.
+ */
+export async function discoverTogetherModels(apiKey?: string): Promise<ModelDefinitionConfig[]> {
+  // Skip API discovery in test environment
+  if (process.env.NODE_ENV === "test" || process.env.VITEST) {
+    return [];
+  }
+
+  try {
+    // Together AI requires authentication for /models endpoint
+    const headers: Record<string, string> = {
+      "Content-Type": "application/json",
+    };
+    if (apiKey) {
+      headers["Authorization"] = `Bearer ${apiKey}`;
+    }
+
+    const response = await fetch(`${TOGETHER_BASE_URL}/models`, {
+      signal: AbortSignal.timeout(5000),
+      headers,
+    });
+
+    if (!response.ok) {
+      // Best effort: attach a bounded slice of the error body for diagnosis.
+      const errorBody = (await response.text().catch(() => "")).slice(0, 500);
+      console.warn(
+        `[together-models] Failed to discover models: HTTP ${response.status} ${errorBody}`,
+      );
+      return [];
+    }
+
+    const models = extractTogetherModels(await response.json());
+    if (models.length === 0) {
+      console.warn("[together-models] No models found from API");
+      return [];
+    }
+
+    // Filter for chat models only and map to ModelDefinitionConfig
+    const chatModels = models.filter((model) => model.type === "chat");
+    console.log(
+      `[together-models] Found ${models.length} total models, ${chatModels.length} chat models`,
+    );
+    return chatModels.map((model) => toTogetherModelDefinition(model));
+  } catch (error) {
+    // Covers network failures, timeouts and invalid JSON alike.
+    console.warn(`[together-models] Discovery failed: ${String(error)}`);
+    return [];
+  }
+}
+
+/**
+ * Normalize the `/models` payload into a list of usable entries.
+ *
+ * Accepts either a bare array or an object with a `data` array. Entries
+ * without a string `id` are dropped so that one malformed entry cannot abort
+ * the whole discovery.
+ *
+ * @param payload - Parsed JSON body of the `/models` response.
+ * @returns The entries that carry a string `id`; `[]` for any other shape.
+ */
+function extractTogetherModels(payload: unknown): TogetherModel[] {
+  let entries: unknown[] = [];
+  if (Array.isArray(payload)) {
+    entries = payload;
+  } else if (typeof payload === "object" && payload !== null) {
+    const data = (payload as { data?: unknown }).data;
+    if (Array.isArray(data)) {
+      entries = data;
+    }
+  }
+
+  return entries.filter(
+    (entry): entry is TogetherModel =>
+      typeof entry === "object" &&
+      entry !== null &&
+      typeof (entry as { id?: unknown }).id === "string",
+  );
+}
+
+/** Return `value` when it is a finite, non-negative number, otherwise `fallback`. */
+function togetherPriceOrDefault(value: unknown, fallback: number): number {
+  return typeof value === "number" && Number.isFinite(value) && value >= 0 ? value : fallback;
+}
+
+/**
+ * Map one Together AI model entry to a `ModelDefinitionConfig`.
+ *
+ * Reasoning and vision support are guessed from substrings of the model id and
+ * description (plus `capabilities.vision`); these are heuristics, not API facts.
+ *
+ * @param model - An entry that has already been checked to have a string `id`.
+ * @returns The model definition with defaults filled in for missing fields.
+ */
+function toTogetherModelDefinition(model: TogetherModel): ModelDefinitionConfig {
+  const lowerId = model.id.toLowerCase();
+  // The payload is untyped JSON, so `description` may not actually be a string.
+  const description = typeof model.description === "string" ? model.description.toLowerCase() : "";
+
+  const isReasoning =
+    lowerId.includes("reason") ||
+    lowerId.includes("r1") ||
+    lowerId.includes("thinking") ||
+    description.includes("reasoning");
+
+  const hasVision =
+    Boolean(model.capabilities?.vision) ||
+    lowerId.includes("vision") ||
+    lowerId.includes("vl") ||
+    description.includes("vision");
+
+  // Build a fresh cost object per model instead of sharing TOGETHER_DEFAULT_COST,
+  // and keep a reported price of 0 rather than replacing it with the default.
+  const cost = {
+    input: togetherPriceOrDefault(model.pricing?.input, TOGETHER_DEFAULT_COST.input),
+    output: togetherPriceOrDefault(model.pricing?.output, TOGETHER_DEFAULT_COST.output),
+    cacheRead: togetherPriceOrDefault(model.pricing?.input, TOGETHER_DEFAULT_COST.cacheRead),
+    cacheWrite: togetherPriceOrDefault(model.pricing?.output, TOGETHER_DEFAULT_COST.cacheWrite),
+  };
+
+  // Fall back to 131072 when the API omits a usable context length.
+  const contextLength = model.context_length;
+  const contextWindow =
+    typeof contextLength === "number" && contextLength > 0 ? contextLength : 131072;
+
+  return {
+    id: model.id,
+    name: model.display_name || model.name || model.id,
+    reasoning: isReasoning,
+    input: hasVision ? ["text", "image"] : ["text"],
+    cost,
+    contextWindow,
+    maxTokens: 8192, // Default max tokens for most models
+  };
+}
--- a/src/commands/auth-choice.default-model.ts
+++ b/src/commands/auth-choice.default-model.ts
@ -5,21 +5,21 @@ export async function applyDefaultModelChoice(params: {
  config: ClawdbotConfig;
  setDefaultModel: boolean;
  defaultModel: string;
-  applyDefaultConfig: (config: ClawdbotConfig) => ClawdbotConfig;
-  applyProviderConfig: (config: ClawdbotConfig) => ClawdbotConfig;
+  applyDefaultConfig: (config: ClawdbotConfig) => ClawdbotConfig | Promise<ClawdbotConfig>;
+  applyProviderConfig: (config: ClawdbotConfig) => ClawdbotConfig | Promise<ClawdbotConfig>;
  noteDefault?: string;
  noteAgentModel: (model: string) => Promise<void>;
  prompter: WizardPrompter;
 }): Promise<{ config: ClawdbotConfig; agentModelOverride?: string }> {
  if (params.setDefaultModel) {
-    const next = params.applyDefaultConfig(params.config);
+    const next = await params.applyDefaultConfig(params.config);
    if (params.noteDefault) {
      await params.prompter.note(`Default model set to ${params.noteDefault}`, "Model configured");
    }
    return { config: next };
  }

-  const next = params.applyProviderConfig(params.config);
+  const next = await params.applyProviderConfig(params.config);
  await params.noteAgentModel(params.defaultModel);
  return { config: next, agentModelOverride: params.defaultModel };
 }
--- a/src/commands/onboard-auth.config-core.ts
+++ b/src/commands/onboard-auth.config-core.ts
@ -4,6 +4,7 @@ import {
  SYNTHETIC_DEFAULT_MODEL_REF,
  SYNTHETIC_MODEL_CATALOG,
 } from "../agents/synthetic-models.js";
+import { discoverTogetherModels } from "../agents/together-models.js";

 // Together AI constants and models - inline to avoid separate models file
 const TOGETHER_BASE_URL = "https://api.together.xyz/v1";
@ -518,7 +519,7 @@ export function applyVeniceConfig(cfg: ClawdbotConfig): ClawdbotConfig {
  };
 }

-export function applyTogetherProviderConfig(cfg: ClawdbotConfig): ClawdbotConfig {
+export async function applyTogetherProviderConfig(cfg: ClawdbotConfig): Promise<ClawdbotConfig> {
  const models = { ...cfg.agents?.defaults?.models };
  models[TOGETHER_DEFAULT_MODEL_REF] = {
    ...models[TOGETHER_DEFAULT_MODEL_REF],
@ -528,19 +529,37 @@ export function applyTogetherProviderConfig(cfg: ClawdbotConfig): ClawdbotConfig
  const providers = { ...cfg.models?.providers };
  const existingProvider = providers.together;
  const existingModels = Array.isArray(existingProvider?.models) ? existingProvider.models : [];
-  const togetherModels = TOGETHER_MODEL_CATALOG.map(buildTogetherModelDefinition);
-  const mergedModels = [
-    ...existingModels,
-    ...togetherModels.filter(
-      (model) => !existingModels.some((existing) => existing.id === model.id),
-    ),
-  ];
+
+  // Try dynamic discovery if API key is available, otherwise fall back to static catalog
  const { apiKey: existingApiKey, ...existingProviderRest } = (existingProvider ?? {}) as Record<
    string,
    unknown
  > as { apiKey?: string };
  const resolvedApiKey = typeof existingApiKey === "string" ? existingApiKey : undefined;
  const normalizedApiKey = resolvedApiKey?.trim();
+
+  let togetherModels;
+  if (normalizedApiKey) {
+    // Try dynamic discovery with API key
+    try {
+      togetherModels = await discoverTogetherModels(normalizedApiKey);
+      console.log(`[together-models] Dynamic discovery found ${togetherModels.length} models`);
+    } catch (error) {
+      console.warn(`[together-models] Dynamic discovery failed, using static catalog: ${error}`);
+      togetherModels = TOGETHER_MODEL_CATALOG.map(buildTogetherModelDefinition);
+    }
+  } else {
+    // No API key, use static catalog
+    togetherModels = TOGETHER_MODEL_CATALOG.map(buildTogetherModelDefinition);
+  }
+
+  const mergedModels = [
+    ...existingModels,
+    ...togetherModels.filter(
+      (model) => !existingModels.some((existing) => existing.id === model.id),
+    ),
+  ];
+
  providers.together = {
    ...existingProviderRest,
    baseUrl: TOGETHER_BASE_URL,
@ -565,8 +584,8 @@ export function applyTogetherProviderConfig(cfg: ClawdbotConfig): ClawdbotConfig
  };
 }

-export function applyTogetherConfig(cfg: ClawdbotConfig): ClawdbotConfig {
-  const next = applyTogetherProviderConfig(cfg);
+export async function applyTogetherConfig(cfg: ClawdbotConfig): Promise<ClawdbotConfig> {
+  const next = await applyTogetherProviderConfig(cfg);
  const existingModel = next.agents?.defaults?.model;
  return {
    ...next,