about summary refs log tree commit diff
path: root/.venv/lib/python3.12/site-packages/core/configs/ollama.toml
diff options
context:
space:
mode:
author: S. Solomon Darnell, 2025-03-28 21:52:21 -0500
committer: S. Solomon Darnell, 2025-03-28 21:52:21 -0500
commit: 4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch)
tree: ee3dc5af3b6313e921cd920906356f5d4febc4ed /.venv/lib/python3.12/site-packages/core/configs/ollama.toml
parent: cc961e04ba734dd72309fb548a2f97d67d578813 (diff)
download: gn-ai-master.tar.gz
two version of R2R are here HEAD master
Diffstat (limited to '.venv/lib/python3.12/site-packages/core/configs/ollama.toml')
-rw-r--r-- .venv/lib/python3.12/site-packages/core/configs/ollama.toml 48
1 files changed, 48 insertions, 0 deletions
diff --git a/.venv/lib/python3.12/site-packages/core/configs/ollama.toml b/.venv/lib/python3.12/site-packages/core/configs/ollama.toml
new file mode 100644
index 00000000..5226eebf
--- /dev/null
+++ b/.venv/lib/python3.12/site-packages/core/configs/ollama.toml
@@ -0,0 +1,48 @@
+[app] # Model selection per role; every role below currently points at the same model
+# LLM used for internal operations, like deriving conversation names
+fast_llm = "openai/llama3.1" # NOTE: the `openai` prefix together with `api_base = "http://localhost:11434/v1"` (see [completion.generation_config]) is recommended for best results; `ollama` via `litellm` is also acceptable
+
+# LLM used for user-facing output, like RAG replies
+quality_llm = "openai/llama3.1"
+
+# LLM used for ingesting visual inputs
+vlm = "openai/llama3.1" # TODO: placeholder; replace with a viable candidate
+
+# LLM used for transcription
+audio_lm = "openai/llama3.1" # TODO: placeholder; replace with a viable candidate
+
+
+# Reasoning model, used for the `research` agent
+reasoning_llm = "openai/llama3.1"
+# Planning model, used for the `research` agent
+planning_llm = "openai/llama3.1"
+
+[embedding] # Embedding settings; unlike [completion], this section uses the `ollama` provider
+provider = "ollama"
+base_model = "mxbai-embed-large"
+base_dimension = 1_024 # i.e. 1024; presumably the vector size produced by base_model (TODO confirm)
+batch_size = 128 # presumably the number of texts sent per embedding request (TODO confirm)
+add_title_as_prefix = true
+concurrent_request_limit = 2
+
+[completion_embedding] # Values are identical to [embedding]; presumably the two should be kept in sync (TODO confirm)
+provider = "ollama"
+base_model = "mxbai-embed-large"
+base_dimension = 1_024 # i.e. 1024, same as [embedding].base_dimension
+batch_size = 128
+add_title_as_prefix = true
+concurrent_request_limit = 2
+
+[agent] # Agent settings
+tools = ["search_file_knowledge"] # the only tool listed in this config
+
+[completion] # Completion (text generation) settings, routed through the `litellm` provider
+provider = "litellm"
+concurrent_request_limit = 1 # lower than the limit of 2 used by the embedding sections
+
+  [completion.generation_config] # Sub-table of [completion]; the indentation is cosmetic only
+  temperature = 0.1
+  top_p = 1
+  max_tokens_to_sample = 1_024 # i.e. 1024
+  stream = false
+  api_base = "http://localhost:11434/v1" # local endpoint that the NOTE on [app].fast_llm recommends pairing with the `openai/` model prefix