Skip to content

Commit 22ec8cd

Browse files
authored
💄 style: update cohere model list
1 parent 7c44823 commit 22ec8cd

File tree

3 files changed

+260
-5
lines changed

3 files changed

+260
-5
lines changed

src/config/aiModels/cohere.ts

+218-4
Original file line number · Diff line number · Diff line change
@@ -5,14 +5,228 @@ const cohereChatModels: AIChatModelCard[] = [
55
abilities: {
66
functionCall: true,
77
},
8-
contextWindowTokens: 16_000,
9-
description: '',
8+
contextWindowTokens: 256_000,
9+
description: 'Command A is our most performant model to date, excelling at tool use, agents, retrieval augmented generation (RAG), and multilingual use cases. Command A has a context length of 256K, only requires two GPUs to run, and has 150% higher throughput compared to Command R+ 08-2024.',
10+
displayName: 'Command A',
11+
enabled: true,
12+
id: 'command-a-03-2025',
13+
maxOutput: 8000,
14+
pricing: {
15+
input: 2.5,
16+
output: 10
17+
},
18+
type: 'chat'
19+
},
20+
{
21+
abilities: {
22+
functionCall: true,
23+
},
24+
contextWindowTokens: 128_000,
25+
description: 'command-r-plus is an alias for command-r-plus-04-2024, so if you use command-r-plus in the API, that’s the model you’re pointing to.',
26+
displayName: 'Command R+',
27+
enabled: true,
28+
id: 'command-r-plus',
29+
maxOutput: 4000,
30+
pricing: {
31+
input: 2.5,
32+
output: 10
33+
},
34+
type: 'chat'
35+
},
36+
{
37+
abilities: {
38+
functionCall: true,
39+
},
40+
contextWindowTokens: 128_000,
41+
description: 'Command R+ is an instruction-following conversational model that performs language tasks at a higher quality, more reliably, and with a longer context than previous models. It is best suited for complex RAG workflows and multi-step tool use.',
42+
displayName: 'Command R+ 04-2024',
43+
id: 'command-r-plus-04-2024',
44+
maxOutput: 4000,
45+
pricing: {
46+
input: 3,
47+
output: 15
48+
},
49+
type: 'chat'
50+
},
51+
{
52+
abilities: {
53+
functionCall: true,
54+
},
55+
contextWindowTokens: 128_000,
56+
description: 'command-r is an alias for command-r-03-2024, so if you use command-r in the API, that’s the model you’re pointing to.',
57+
displayName: 'Command R',
58+
enabled: true,
59+
id: 'command-r',
60+
maxOutput: 4000,
61+
pricing: {
62+
input: 0.15,
63+
output: 0.6
64+
},
65+
type: 'chat'
66+
},
67+
{
68+
abilities: {
69+
functionCall: true,
70+
},
71+
contextWindowTokens: 128_000,
72+
description: 'command-r-08-2024 is an update of the Command R model, delivered in August 2024.',
73+
displayName: 'Command R 08-2024',
74+
id: 'command-r-08-2024',
75+
maxOutput: 4000,
76+
pricing: {
77+
input: 0.15,
78+
output: 0.6
79+
},
80+
type: 'chat'
81+
},
82+
{
83+
abilities: {
84+
functionCall: true,
85+
},
86+
contextWindowTokens: 128_000,
87+
description: 'Command R is an instruction-following conversational model that performs language tasks at a higher quality, more reliably, and with a longer context than previous models. It can be used for complex workflows like code generation, retrieval augmented generation (RAG), tool use, and agents.',
88+
displayName: 'Command R 03-2024',
89+
id: 'command-r-03-2024',
90+
maxOutput: 4000,
91+
pricing: {
92+
input: 0.5,
93+
output: 1.5
94+
},
95+
type: 'chat'
96+
},
97+
{
98+
abilities: {
99+
functionCall: true,
100+
},
101+
contextWindowTokens: 128_000,
102+
description: 'command-r7b-12-2024 is a small, fast update delivered in December 2024. It excels at RAG, tool use, agents, and similar tasks requiring complex reasoning and multiple steps.',
103+
displayName: 'Command R7B 12-2024',
104+
enabled: true,
105+
id: 'command-r7b-12-2024',
106+
maxOutput: 4000,
107+
pricing: {
108+
input: 0.0375,
109+
output: 0.15
110+
},
111+
type: 'chat'
112+
},
113+
{
114+
abilities: {
115+
functionCall: true,
116+
},
117+
contextWindowTokens: 4000,
118+
description: 'An instruction-following conversational model that performs language tasks with high quality, more reliably and with a longer context than our base generative models.',
10119
displayName: 'Command',
11120
enabled: true,
12121
id: 'command',
122+
maxOutput: 4000,
123+
pricing: {
124+
input: 1,
125+
output: 2
126+
},
127+
type: 'chat'
128+
},
129+
{
130+
abilities: {
131+
functionCall: true,
132+
},
133+
contextWindowTokens: 128_000,
134+
description: 'To reduce the time between major releases, we put out nightly versions of command models. For command, that is command-nightly. Be advised that command-nightly is the latest, most experimental, and (possibly) unstable version of its default counterpart. Nightly releases are updated regularly, without warning, and are not recommended for production use.',
135+
displayName: 'Command Nightly',
136+
id: 'command-nightly',
137+
maxOutput: 4000,
138+
pricing: {
139+
input: 1,
140+
output: 2
141+
},
142+
type: 'chat'
143+
},
144+
{
145+
abilities: {
146+
functionCall: true,
147+
},
148+
contextWindowTokens: 4000,
149+
description: 'A smaller, faster version of command. Almost as capable, but a lot faster.',
150+
displayName: 'Command Light',
151+
enabled: true,
152+
id: 'command-light',
153+
maxOutput: 4000,
154+
pricing: {
155+
input: 0.3,
156+
output: 0.6
157+
},
158+
type: 'chat'
159+
},
160+
{
161+
abilities: {
162+
functionCall: true,
163+
},
164+
contextWindowTokens: 4000,
165+
description: 'To reduce the time between major releases, we put out nightly versions of command models. For command-light, that is command-light-nightly. Be advised that command-light-nightly is the latest, most experimental, and (possibly) unstable version of its default counterpart. Nightly releases are updated regularly, without warning, and are not recommended for production use.',
166+
displayName: 'Command Light Nightly',
167+
id: 'command-light-nightly',
168+
maxOutput: 4000,
169+
pricing: {
170+
input: 0.3,
171+
output: 0.6
172+
},
173+
type: 'chat'
174+
},
175+
{
176+
contextWindowTokens: 128_000,
177+
description: 'Aya Expanse is a highly performant 32B multilingual model, designed to rival monolingual performance through innovations in instruction tuning with data arbitrage, preference training, and model merging. Serves 23 languages.',
178+
displayName: 'Aya Expanse 32B',
179+
enabled: true,
180+
id: 'c4ai-aya-expanse-32b',
181+
maxOutput: 4000,
182+
pricing: {
183+
input: 0.5,
184+
output: 1.5
185+
},
186+
type: 'chat'
187+
},
188+
{
189+
contextWindowTokens: 8000,
190+
description: 'Aya Expanse is a highly performant 8B multilingual model, designed to rival monolingual performance through innovations in instruction tuning with data arbitrage, preference training, and model merging. Serves 23 languages.',
191+
displayName: 'Aya Expanse 8B',
192+
enabled: true,
193+
id: 'c4ai-aya-expanse-8b',
194+
maxOutput: 4000,
195+
pricing: {
196+
input: 0.5,
197+
output: 1.5
198+
},
199+
type: 'chat'
200+
},
201+
{
202+
abilities: {
203+
vision: true,
204+
},
205+
contextWindowTokens: 16_000,
206+
description: 'Aya Vision is a state-of-the-art multimodal model excelling at a variety of critical benchmarks for language, text, and image capabilities. Serves 23 languages. This 32 billion parameter variant is focused on state-of-art multilingual performance.',
207+
displayName: 'Aya Vision 32B',
208+
enabled: true,
209+
id: 'c4ai-aya-vision-32b',
210+
maxOutput: 4000,
211+
pricing: {
212+
input: 0.5,
213+
output: 1.5
214+
},
215+
type: 'chat'
216+
},
217+
{
218+
abilities: {
219+
vision: true,
220+
},
221+
contextWindowTokens: 16_000,
222+
description: 'Aya Vision is a state-of-the-art multimodal model excelling at a variety of critical benchmarks for language, text, and image capabilities. This 8 billion parameter variant is focused on low latency and best-in-class performance.',
223+
displayName: 'Aya Vision 8B',
224+
enabled: true,
225+
id: 'c4ai-aya-vision-8b',
226+
maxOutput: 4000,
13227
pricing: {
14-
input: 0.6,
15-
output: 1.2
228+
input: 0.5,
229+
output: 1.5
16230
},
17231
type: 'chat'
18232
},

src/config/modelProviders/cohere.ts

+4-1
Original file line number · Diff line number · Diff line change
@@ -2,14 +2,17 @@ import { ModelProviderCard } from '@/types/llm';
22

33
const Cohere: ModelProviderCard = {
44
chatModels: [],
5-
checkModel: 'command',
5+
checkModel: 'command-r7b-12-2024',
66
description: 'Cohere',
77
//disableBrowserRequest: true,
88
id: 'cohere',
99
modelsUrl: 'https://docs.cohere.com/v2/docs/models',
1010
name: 'Cohere',
1111
settings: {
1212
//disableBrowserRequest: true,
13+
proxyUrl: {
14+
placeholder: 'https://api.cohere.ai/compatibility/v1',
15+
},
1316
sdkType: 'openai',
1417
},
1518
url: 'https://cohere.com',
+38
Original file line number · Diff line number · Diff line change
@@ -1,10 +1,48 @@
11
import { ModelProvider } from '../types';
22
import { LobeOpenAICompatibleFactory } from '../utils/openaiCompatibleFactory';
33

4+
import type { ChatModelCard } from '@/types/llm';
5+
6+
/**
 * Shape of one model entry returned by Cohere's native v1 models endpoint
 * (the `models` resolver below points the client at https://api.cohere.com/v1
 * and reads `modelsPage.models`).
 */
export interface CohereModelCard {
  // Maximum context window size, in tokens.
  context_length: number;
  // Capability flags reported by the API; the resolver checks for 'tools'.
  // NOTE(review): assumed always present as an array — confirm against the API.
  features: string[];
  // Model identifier as used in API calls, e.g. 'command-r-plus'.
  name: string;
  // Whether the model accepts image input.
  supports_vision: boolean;
}
12+
413
export const LobeCohereAI = LobeOpenAICompatibleFactory({
514
baseURL: 'https://api.cohere.ai/compatibility/v1',
615
debug: {
716
chatCompletion: () => process.env.DEBUG_COHERE_CHAT_COMPLETION === '1',
817
},
18+
models: async ({ client }) => {
19+
const { LOBE_DEFAULT_MODEL_LIST } = await import('@/config/aiModels');
20+
21+
client.baseURL = 'https://api.cohere.com/v1';
22+
23+
const modelsPage = await client.models.list() as any;
24+
const modelList: CohereModelCard[] = modelsPage.models;
25+
26+
return modelList
27+
.map((model) => {
28+
const knownModel = LOBE_DEFAULT_MODEL_LIST.find((m) => model.name.toLowerCase() === m.id.toLowerCase());
29+
30+
return {
31+
contextWindowTokens: model.context_length,
32+
displayName: knownModel?.displayName ?? undefined,
33+
enabled: knownModel?.enabled || false,
34+
functionCall:
35+
model.features.includes("tools")
36+
|| knownModel?.abilities?.functionCall
37+
|| false,
38+
id: model.name,
39+
vision:
40+
model.supports_vision
41+
|| knownModel?.abilities?.vision
42+
|| false,
43+
};
44+
})
45+
.filter(Boolean) as ChatModelCard[];
46+
},
947
provider: ModelProvider.Cohere,
1048
});

0 commit comments

Comments (0)