about | summary | refs | log | tree | commit | diff | stats
diff options
context:
space:
mode:
author ben 2025-01-16 21:07:47 +0100
committer ben 2025-01-16 21:07:47 +0100
commit 38ab78f649773a2a623595b4025811e9e500b4c8 (patch)
tree f07e8074161d30ea6a6350b221ef7c3f0381b22a
parent e2561fe3e08e0d73d299a913f534344bb219811c (diff)
download ai_env-38ab78f649773a2a623595b4025811e9e500b4c8.tar.gz
ai_env-38ab78f649773a2a623595b4025811e9e500b4c8.tar.bz2
ai_env-38ab78f649773a2a623595b4025811e9e500b4c8.tar.xz
Improve configuration with model details.
-rw-r--r-- src/aichat/config.yaml 14
1 files changed, 14 insertions, 0 deletions
diff --git a/src/aichat/config.yaml b/src/aichat/config.yaml
index b2809b1..7a6fef7 100644
--- a/src/aichat/config.yaml
+++ b/src/aichat/config.yaml
@@ -4,8 +4,22 @@ rag_embedding_model: ollama:nomic-embed-text
rag_chunk_size: 8192
rag_chunk_overlap: 409
model: ollama:qwen2.5
+temperature: 0
clients:
- type: openai-compatible
name: ollama
api_base: http://localhost:11434/v1
api_key: __LLM_API_KEY__
+ models:
+ - name: qwen2.5
+ supports_function_calling: true
+ max_input_tokens: 128000
+ - name: qwen2.5-coder:32b
+ supports_function_calling: true
+ max_input_tokens: 128000
+ - name: nomic-embed-text
+ type: embedding
+ max_input_tokens: 200000
+ max_tokens_per_chunk: 2000
+ default_chunk_size: 8192
+ max_batch_size: 100