diff --git a/lua/avante/config.lua b/lua/avante/config.lua
index 0bdb463..2c22754 100644
--- a/lua/avante/config.lua
+++ b/lua/avante/config.lua
@@ -58,6 +58,8 @@ M._defaults = {
     enabled = false, -- Enables the RAG service
     host_mount = os.getenv("HOME"), -- Host mount path for the RAG service (Docker will mount this path)
     runner = "docker", -- The runner for the RAG service (can use docker or nix)
+    -- The image to use to run the rag service if runner is docker
+    image = "quay.io/yetoneful/avante-rag-service:0.0.11",
     llm = { -- Configuration for the Language Model (LLM) used by the RAG service
       provider = "openai", -- The LLM provider
       endpoint = "https://api.openai.com/v1", -- The LLM API endpoint
diff --git a/lua/avante/rag_service.lua b/lua/avante/rag_service.lua
index f22fba2..2d544dc 100644
--- a/lua/avante/rag_service.lua
+++ b/lua/avante/rag_service.lua
@@ -8,7 +8,13 @@ local M = {}
 local container_name = "avante-rag-service"
 local service_path = "/tmp/" .. container_name
 
-function M.get_rag_service_image() return "quay.io/yetoneful/avante-rag-service:0.0.11" end
+function M.get_rag_service_image()
+  if Config.rag_service and Config.rag_service.image then
+    return Config.rag_service.image
+  else
+    return "quay.io/yetoneful/avante-rag-service:0.0.11"
+  end
+end
 
 function M.get_rag_service_port() return 20250 end
 
diff --git a/py/rag-service/requirements.txt b/py/rag-service/requirements.txt
index 44d6abf..8f82333 100644
--- a/py/rag-service/requirements.txt
+++ b/py/rag-service/requirements.txt
@@ -9,6 +9,7 @@ attrs==25.1.0
 backoff==2.2.1
 bcrypt==4.2.1
 beautifulsoup4==4.13.3
+bleach==6.3.0
 build==1.2.2.post1
 cachetools==5.5.1
 certifi==2024.12.14
@@ -20,6 +21,7 @@ coloredlogs==15.0.1
 dashscope==1.22.2
 dataclasses-json==0.6.7
 decorator==5.1.1
+defusedxml==0.7.1
 deprecated==1.2.18
 dirtyjson==1.0.8
 distro==1.9.0
@@ -31,6 +33,7 @@ et-xmlfile==2.0.0
 executing==2.2.0
 fastapi==0.115.8
 fastapi-cli==0.0.7
+fastjsonschema==2.21.2
 filelock==3.17.0
 filetype==1.2.0
 flatbuffers==25.1.24
@@ -55,6 +58,11 @@ jedi==0.19.2
 jinja2==3.1.5
 jiter==0.8.2
 joblib==1.4.2
+jsonschema==4.25.1
+jsonschema-specifications==2025.9.1
+jupyter-client==8.7.0
+jupyter-core==5.9.1
+jupyterlab-pygments==0.3.0
 kubernetes==32.0.0
 llama-cloud==0.1.11
 llama-cloud-services==0.6.0
@@ -84,11 +92,15 @@ markupsafe==3.0.2
 marshmallow==3.26.1
 matplotlib-inline==0.1.7
 mdurl==0.1.2
+mistune==3.1.4
 mmh3==5.1.0
 monotonic==1.6
 mpmath==1.3.0
 multidict==6.1.0
 mypy-extensions==1.0.0
+nbclient==0.10.2
+nbconvert==7.16.6
+nbformat==5.10.4
 nest-asyncio==1.6.0
 networkx==3.4.2
 nltk==3.9.1
@@ -112,10 +124,12 @@ orjson==3.10.15
 overrides==7.7.0
 packaging==24.2
 pandas==2.2.3
+pandocfilters==1.5.1
 parso==0.8.4
 pathspec==0.12.1
 pexpect==4.9.0
 pillow==11.1.0
+platformdirs==4.5.1
 posthog==3.11.0
 prompt-toolkit==3.0.50
 propcache==0.2.1
@@ -135,11 +149,14 @@ python-dotenv==1.0.1
 python-multipart==0.0.20
 pytz==2025.1
 pyyaml==6.0.2
+pyzmq==27.1.0
+referencing==0.37.0
 regex==2024.11.6
 requests==2.32.3
 requests-oauthlib==2.0.0
 rich==13.9.4
 rich-toolkit==0.13.2
+rpds-py==0.30.0
 rsa==4.9
 safetensors==0.5.3
 shellingham==1.5.4
@@ -153,7 +170,9 @@ striprtf==0.0.26
 sympy==1.13.3
 tenacity==9.0.0
 tiktoken==0.8.0
+tinycss2==1.4.0
 tokenizers==0.21.0
+tornado==6.5.3
 tqdm==4.67.1
 traitlets==5.14.3
 transformers==4.51.3
@@ -172,9 +191,9 @@ uvloop==0.21.0
 watchdog==6.0.0
 watchfiles==1.0.4
 wcwidth==0.2.13
+webencodings==0.5.1
 websocket-client==1.8.0
 websockets==14.2
 wrapt==1.17.2
 yarl==1.18.3
 zipp==3.21.0
-nbconvert==7.16.6