diff options
| author | S. Solomon Darnell | 2025-03-28 21:52:21 -0500 |
|---|---|---|
| committer | S. Solomon Darnell | 2025-03-28 21:52:21 -0500 |
| commit | 4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch) | |
| tree | ee3dc5af3b6313e921cd920906356f5d4febc4ed /.venv/lib/python3.12/site-packages/core/configs/ollama.toml | |
| parent | cc961e04ba734dd72309fb548a2f97d67d578813 (diff) | |
| download | gn-ai-master.tar.gz | |
Diffstat (limited to '.venv/lib/python3.12/site-packages/core/configs/ollama.toml')
| -rw-r--r-- | .venv/lib/python3.12/site-packages/core/configs/ollama.toml | 48 |
1 files changed, 48 insertions, 0 deletions
# Reconstructed from the patch that adds
# .venv/lib/python3.12/site-packages/core/configs/ollama.toml
# (new file, mode 100644, blob 5226eebf, 48 lines).
#
# Every model below is addressed through the `openai/` prefix and the
# completion requests are pointed at a local endpoint on port 11434.

[app]
# NOTE: using `openai` with `api_base = "http://localhost:11434/v1"` is
# recommended for best results; otherwise `ollama` with `litellm` is
# acceptable.

# LLM used for internal operations, like deriving conversation names
fast_llm = "openai/llama3.1"

# LLM used for user-facing output, like RAG replies
quality_llm = "openai/llama3.1"

# LLM used for ingesting visual inputs
vlm = "openai/llama3.1" # TODO - Replace with viable candidate

# LLM used for transcription
audio_lm = "openai/llama3.1" # TODO - Replace with viable candidate

# Reasoning model, used for `research` agent
reasoning_llm = "openai/llama3.1"

# Planning model, used for `research` agent
planning_llm = "openai/llama3.1"

[embedding]
provider = "ollama"
base_model = "mxbai-embed-large"
base_dimension = 1_024
batch_size = 128
add_title_as_prefix = true
concurrent_request_limit = 2

# Same settings as [embedding]; keep the two tables in sync when changing
# the model or its dimension.
[completion_embedding]
provider = "ollama"
base_model = "mxbai-embed-large"
base_dimension = 1_024
batch_size = 128
add_title_as_prefix = true
concurrent_request_limit = 2

[agent]
tools = ["search_file_knowledge"]

[completion]
provider = "litellm"
concurrent_request_limit = 1

[completion.generation_config]
temperature = 0.1
top_p = 1
max_tokens_to_sample = 1_024
stream = false
# Matches the endpoint recommended in the [app] note.
api_base = "http://localhost:11434/v1"
