v0.2.1 model names config-driven
This commit is contained in:
@@ -3,9 +3,10 @@ import { configFile } from '../file-models/config.json'
|
||||
|
||||
const { InputSpec, Value } = sdk
|
||||
|
||||
// Optional Gemma/Ollama endpoint for the operator-hardware analysis
|
||||
// fallback. Counterpart to setParakeetUrl — Parakeet handles transcribe
|
||||
// overflow, this handles analyze overflow.
|
||||
// Operator's Gemma (or any OpenAI-compatible chat-completions) endpoint
|
||||
// + which model to request. Both fields live-reload so the operator
|
||||
// can pull a different Gemma SKU on Ollama and update the model name
|
||||
// here without restarting the relay.
|
||||
const inputSpec = InputSpec.of({
|
||||
relay_gemma_base_url: Value.text({
|
||||
name: 'Gemma Base URL',
|
||||
@@ -22,6 +23,15 @@ const inputSpec = InputSpec.of({
|
||||
},
|
||||
],
|
||||
}),
|
||||
relay_gemma_model: Value.text({
|
||||
name: 'Gemma Model Name',
|
||||
description:
|
||||
'The model identifier sent in upstream chat-completions requests. Match whatever name your Ollama / vLLM / llama.cpp deployment exposes (run `ollama list` to see what you have pulled). Example: gemma3:27b, gemma2:9b, llama3.1:70b',
|
||||
required: true,
|
||||
default: 'gemma3:27b',
|
||||
minLength: 1,
|
||||
maxLength: 128,
|
||||
}),
|
||||
})
|
||||
|
||||
export const setGemmaUrl = sdk.Action.withInput(
|
||||
@@ -30,7 +40,7 @@ export const setGemmaUrl = sdk.Action.withInput(
|
||||
async ({ effects }) => ({
|
||||
name: 'Set Gemma URL',
|
||||
description:
|
||||
'Optional. Where the relay forwards analysis requests once a user exceeds their monthly Gemini cap. Leave empty to disable the fallback.',
|
||||
'Optional. Where the relay forwards analysis requests once a user exceeds their monthly Gemini cap. Leave URL empty to disable the fallback.',
|
||||
warning: null,
|
||||
allowedStatuses: 'any',
|
||||
group: null,
|
||||
@@ -43,12 +53,14 @@ export const setGemmaUrl = sdk.Action.withInput(
|
||||
const config = await configFile.read().once()
|
||||
return {
|
||||
relay_gemma_base_url: config?.relay_gemma_base_url || '',
|
||||
relay_gemma_model: config?.relay_gemma_model || 'gemma3:27b',
|
||||
}
|
||||
},
|
||||
|
||||
async ({ effects, input }) => {
|
||||
await configFile.merge(effects, {
|
||||
relay_gemma_base_url: (input.relay_gemma_base_url || '').trim(),
|
||||
relay_gemma_model: (input.relay_gemma_model || 'gemma3:27b').trim(),
|
||||
})
|
||||
return null
|
||||
},
|
||||
|
||||
Reference in New Issue
Block a user