This commit is contained in:
Nicole Dresselhaus
2025-06-04 10:13:16 +02:00
parent 8e7058f4b2
commit 9ab97a7867
6 changed files with 166 additions and 11 deletions

View File

@ -6,6 +6,9 @@ return {
-- add any opts here
-- for example
provider = "ollama",
-- Behaviour toggles passed to the plugin as part of its options.
behaviour = {
-- Switches the plugin's "cursor planning mode" on; what the mode does is
-- defined by the plugin, not by this file.
enable_cursor_planning_mode = true, -- enable cursor planning mode!
},
ollama = {
endpoint = "http://gpu.dighist.geschichte.hu-berlin.de:11434",
model = "cogito:14b", -- your desired model (or use gpt-4o, etc.)
@ -15,7 +18,23 @@ return {
stream = true,
thinking = true,
system_prompt = "Enable deep thinking subroutine.",
--reasoning_effort = "medium", -- low|medium|high, only used for reasoning models
-- reasoning_effort = "high", -- low|medium|high, only used for reasoning models
},
-- RAG service settings. The service is enabled, uses the "ollama" provider,
-- and points at the same endpoint URL as the `ollama` provider block.
rag_service = {
enabled = true, -- Enables the RAG service
-- NOTE(review): os.getenv returns nil when HOME is not set in the
-- environment; confirm the plugin tolerates a nil host_mount.
host_mount = os.getenv("HOME"), -- Host mount path for the rag service
provider = "ollama", -- The provider to use for RAG service (e.g. openai or ollama)
llm_model = "qwen3:32b", -- The LLM model to use for RAG service
embed_model = "nomic-embed-text", -- The embedding model to use for RAG service
endpoint = "http://gpu.dighist.geschichte.hu-berlin.de:11434", -- The API endpoint for RAG service
},
-- Additional named provider entries. Only one is defined here: `deepthink`.
vendors = {
deepthink = {
-- Presumably makes this entry reuse the settings of the `ollama` provider
-- and override only the fields listed below; verify against the plugin's
-- provider documentation.
__inherited_from = "ollama",
model = "qwen3:32b",
-- NOTE(review): the two options below look like OpenAI-style request
-- parameters; confirm they are honoured when the backend is ollama.
max_completion_tokens = 40000,
reasoning_effort = "high",
},
},
},
-- if you want to build from source then do `make BUILD_FROM_SOURCE=true`