about summary refs log tree commit diff
path: root/.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml
diff options
context:
space:
mode:
author: S. Solomon Darnell, 2025-03-28 21:52:21 -0500
committer: S. Solomon Darnell, 2025-03-28 21:52:21 -0500
commit: 4a52a71956a8d46fcb7294ac71734504bb09bcc2 (patch)
tree: ee3dc5af3b6313e921cd920906356f5d4febc4ed /.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml
parent: cc961e04ba734dd72309fb548a2f97d67d578813 (diff)
download: gn-ai-master.tar.gz
two versions of R2R are here (HEAD, master)
Diffstat (limited to '.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml')
-rw-r--r-- .venv/lib/python3.12/site-packages/core/configs/full_ollama.toml 63
1 files changed, 63 insertions, 0 deletions
diff --git a/.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml b/.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml
new file mode 100644
index 00000000..8ec2fc77
--- /dev/null
+++ b/.venv/lib/python3.12/site-packages/core/configs/full_ollama.toml
@@ -0,0 +1,63 @@
+[app]  # NOTE(review): every model key in this table is set to the same value, "openai/llama3.1"
+# LLM used for internal operations, like deriving conversation names
+fast_llm = "openai/llama3.1"
+
+# LLM used for user-facing output, like RAG replies
+quality_llm = "openai/llama3.1"
+
+# LLM used for ingesting visual inputs
+vlm = "openai/llama3.1" # TODO - Replace with a viable vision-capable candidate
+
+# LLM used for transcription
+audio_lm = "openai/llama3.1" # TODO - Replace with a viable transcription-capable candidate
+
+
+# Reasoning model, used for the `research` agent
+reasoning_llm = "openai/llama3.1"
+# Planning model, used for the `research` agent
+planning_llm = "openai/llama3.1"
+
+[embedding]
+provider = "ollama"
+base_model = "mxbai-embed-large"
+base_dimension = 1_024  # NOTE(review): presumably must equal the vector size produced by base_model - confirm
+batch_size = 128
+add_title_as_prefix = true
+concurrent_request_limit = 2
+
+[completion_embedding]  # same keys and values as [embedding]; NOTE(review): presumably meant to stay in sync - confirm
+provider = "ollama"
+base_model = "mxbai-embed-large"
+base_dimension = 1_024
+batch_size = 128
+add_title_as_prefix = true
+concurrent_request_limit = 2
+
+[agent]
+tools = ["search_file_knowledge"]  # NOTE(review): presumably the tools the agent is allowed to call - confirm
+
+[completion]
+provider = "litellm"
+concurrent_request_limit = 1
+
+  [completion.generation_config]  # sub-table of [completion]; the indentation is cosmetic in TOML
+  temperature = 0.1
+  top_p = 1
+  max_tokens_to_sample = 1_024
+  stream = false
+  api_base = "http://localhost:11434/v1"  # NOTE(review): looks like a local OpenAI-compatible endpoint - confirm the server and port
+
+[ingestion]
+provider = "unstructured_local"
+strategy = "auto"
+chunking_strategy = "by_title"
+new_after_n_chars = 512
+max_characters = 1_024
+combine_under_n_chars = 128
+overlap = 20
+chunks_for_document_summary = 16
+document_summary_model = "ollama/llama3.1"  # NOTE(review): "ollama/" prefix here vs "openai/" on the [app] models - confirm this is intentional
+automatic_extraction = false
+
+[orchestration]
+provider = "hatchet"  # NOTE(review): presumably requires the named orchestration backend to be available at runtime - confirm