-
-
Notifications
You must be signed in to change notification settings - Fork 10.7k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
13 changed files
with
332 additions
and
14 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,38 @@ | ||
import { readFileSync } from 'node:fs'; | ||
import { resolve } from 'node:path'; | ||
|
||
import { getLLMConfig } from '@/config/llm'; | ||
import { AgentRuntime, ModelProvider } from '@/libs/agent-runtime'; | ||
import { LobeVertexAI } from '@/libs/agent-runtime/vertexai'; | ||
import { safeParseJSON } from '@/utils/safeParseJSON'; | ||
|
||
import { POST as UniverseRoute } from '../[provider]/route'; | ||
|
||
export const POST = async (req: Request) => | ||
UniverseRoute(req, { | ||
createRuntime: () => { | ||
const { | ||
VERTEXAI_PROJECT, | ||
VERTEXAI_LOCATION, | ||
VERTEXAI_CREDENTIALS, | ||
VERTEXAI_CREDENTIALS_PATH, | ||
} = getLLMConfig(); | ||
|
||
const credentialsContent = | ||
VERTEXAI_CREDENTIALS ?? | ||
(VERTEXAI_CREDENTIALS_PATH | ||
? readFileSync(resolve(process.cwd(), VERTEXAI_CREDENTIALS_PATH), 'utf8') | ||
: undefined); | ||
|
||
const googleAuthOptions = credentialsContent ? safeParseJSON(credentialsContent) : undefined; | ||
|
||
const instance = LobeVertexAI.initFromVertexAI({ | ||
googleAuthOptions: googleAuthOptions, | ||
location: VERTEXAI_LOCATION, | ||
project: VERTEXAI_PROJECT, | ||
}); | ||
|
||
return new AgentRuntime(instance); | ||
}, | ||
params: { provider: ModelProvider.VertexAI }, | ||
}); |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,217 @@ | ||
import { ModelProviderCard } from '@/types/llm'; | ||
|
||
// ref: https://ai.google.dev/gemini-api/docs/models/gemini | ||
const VertexAI: ModelProviderCard = { | ||
chatModels: [ | ||
{ | ||
description: | ||
'Gemini 1.5 Flash 是Google最新的多模态AI模型,具备快速处理能力,支持文本、图像和视频输入,适用于多种任务的高效扩展。', | ||
displayName: 'Gemini 1.5 Flash', | ||
enabled: true, | ||
functionCall: true, | ||
id: 'gemini-1.5-flash-latest', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.018_75, | ||
input: 0.075, | ||
output: 0.3, | ||
}, | ||
tokens: 1_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Flash 002 是一款高效的多模态模型,支持广泛应用的扩展。', | ||
displayName: 'Gemini 1.5 Flash 002', | ||
enabled: true, | ||
functionCall: true, | ||
id: 'gemini-1.5-flash-002', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.018_75, | ||
input: 0.075, | ||
output: 0.3, | ||
}, | ||
releasedAt: '2024-09-25', | ||
tokens: 1_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Flash 001 是一款高效的多模态模型,支持广泛应用的扩展。', | ||
displayName: 'Gemini 1.5 Flash 001', | ||
functionCall: true, | ||
id: 'gemini-1.5-flash-001', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.018_75, | ||
input: 0.075, | ||
output: 0.3, | ||
}, | ||
tokens: 1_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Flash 0827 提供了优化后的多模态处理能力,适用多种复杂任务场景。', | ||
displayName: 'Gemini 1.5 Flash 0827', | ||
functionCall: true, | ||
id: 'gemini-1.5-flash-exp-0827', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.018_75, | ||
input: 0.075, | ||
output: 0.3, | ||
}, | ||
releasedAt: '2024-08-27', | ||
tokens: 1_000_000 + 8192, | ||
vision: true, | ||
}, | ||
|
||
{ | ||
description: | ||
'Gemini 1.5 Flash 8B 0924 是最新的实验性模型,在文本和多模态用例中都有显著的性能提升。', | ||
displayName: 'Gemini 1.5 Flash 8B 0924', | ||
functionCall: true, | ||
id: 'gemini-1.5-flash-8b-exp-0924', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.018_75, | ||
input: 0.075, | ||
output: 0.3, | ||
}, | ||
releasedAt: '2024-09-24', | ||
tokens: 1_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: | ||
'Gemini 1.5 Pro 支持高达200万个tokens,是中型多模态模型的理想选择,适用于复杂任务的多方面支持。', | ||
displayName: 'Gemini 1.5 Pro', | ||
enabled: true, | ||
functionCall: true, | ||
id: 'gemini-1.5-pro-latest', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.875, | ||
input: 3.5, | ||
output: 10.5, | ||
}, | ||
releasedAt: '2024-02-15', | ||
tokens: 2_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: | ||
'Gemini 1.5 Pro 002 是最新的生产就绪模型,提供更高质量的输出,特别在数学、长上下文和视觉任务方面有显著提升。', | ||
displayName: 'Gemini 1.5 Pro 002', | ||
enabled: true, | ||
functionCall: true, | ||
id: 'gemini-1.5-pro-002', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.315, | ||
input: 1.25, | ||
output: 2.5, | ||
}, | ||
releasedAt: '2024-09-24', | ||
tokens: 2_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Pro 001 是可扩展的多模态AI解决方案,支持广泛的复杂任务。', | ||
displayName: 'Gemini 1.5 Pro 001', | ||
functionCall: true, | ||
id: 'gemini-1.5-pro-001', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.875, | ||
input: 3.5, | ||
output: 10.5, | ||
}, | ||
releasedAt: '2024-02-15', | ||
tokens: 2_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Pro 0827 结合最新优化技术,带来更高效的多模态数据处理能力。', | ||
displayName: 'Gemini 1.5 Pro 0827', | ||
functionCall: true, | ||
id: 'gemini-1.5-pro-exp-0827', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.875, | ||
input: 3.5, | ||
output: 10.5, | ||
}, | ||
releasedAt: '2024-08-27', | ||
tokens: 2_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.5 Pro 0801 提供出色的多模态处理能力,为应用开发带来更大灵活性。', | ||
displayName: 'Gemini 1.5 Pro 0801', | ||
functionCall: true, | ||
id: 'gemini-1.5-pro-exp-0801', | ||
maxOutput: 8192, | ||
pricing: { | ||
cachedInput: 0.875, | ||
input: 3.5, | ||
output: 10.5, | ||
}, | ||
releasedAt: '2024-08-01', | ||
tokens: 2_000_000 + 8192, | ||
vision: true, | ||
}, | ||
{ | ||
description: 'Gemini 1.0 Pro 是Google的高性能AI模型,专为广泛任务扩展而设计。', | ||
displayName: 'Gemini 1.0 Pro', | ||
id: 'gemini-1.0-pro-latest', | ||
maxOutput: 2048, | ||
pricing: { | ||
input: 0.5, | ||
output: 1.5, | ||
}, | ||
releasedAt: '2023-12-06', | ||
tokens: 30_720 + 2048, | ||
}, | ||
{ | ||
description: | ||
'Gemini 1.0 Pro 001 (Tuning) 提供稳定并可调优的性能,是复杂任务解决方案的理想选择。', | ||
displayName: 'Gemini 1.0 Pro 001 (Tuning)', | ||
functionCall: true, | ||
id: 'gemini-1.0-pro-001', | ||
maxOutput: 2048, | ||
pricing: { | ||
input: 0.5, | ||
output: 1.5, | ||
}, | ||
releasedAt: '2023-12-06', | ||
tokens: 30_720 + 2048, | ||
}, | ||
{ | ||
description: 'Gemini 1.0 Pro 002 (Tuning) 提供出色的多模态支持,专注于复杂任务的有效解决。', | ||
displayName: 'Gemini 1.0 Pro 002 (Tuning)', | ||
id: 'gemini-1.0-pro-002', | ||
maxOutput: 2048, | ||
pricing: { | ||
input: 0.5, | ||
output: 1.5, | ||
}, | ||
releasedAt: '2023-12-06', | ||
tokens: 30_720 + 2048, | ||
}, | ||
], | ||
checkModel: 'gemini-1.5-flash-latest', | ||
description: | ||
'Google 的 Gemini 系列是其最先进、通用的 AI模型,由 Google DeepMind 打造,专为多模态设计,支持文本、代码、图像、音频和视频的无缝理解与处理。适用于从数据中心到移动设备的多种环境,极大提升了AI模型的效率与应用广泛性。', | ||
id: 'vertexai', | ||
modelsUrl: 'https://cloud.google.com/vertex-ai/generative-ai/docs/learn/model-versioning', | ||
name: 'VertexAI', | ||
showApiKey: false, | ||
showChecker: false, | ||
smoothing: { | ||
speed: 2, | ||
text: true, | ||
}, | ||
url: 'https://cloud.google.com/vertex-ai', | ||
}; | ||
|
||
export default VertexAI; |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.