refactor(llm): cleanup providers for future ops (closes #134) (#147)

support allow_insecure and proxy ops

Signed-off-by: Aaron Pham <contact@aarnphm.xyz>
This commit is contained in:
Aaron Pham
2024-08-22 01:48:40 -04:00
committed by GitHub
parent 380a7254ae
commit 8d52229f16
15 changed files with 1007 additions and 874 deletions

View File

@@ -4,209 +4,21 @@ local curl = require("plenary.curl")
local Utils = require("avante.utils")
local Config = require("avante.config")
local Tiktoken = require("avante.tiktoken")
local Dressing = require("avante.ui.dressing")
local P = require("avante.providers")
---@class avante.LLM
local M = {}
M.CANCEL_PATTERN = "AvanteLLMEscape"
---@class CopilotToken
---@field annotations_enabled boolean
---@field chat_enabled boolean
---@field chat_jetbrains_enabled boolean
---@field code_quote_enabled boolean
---@field codesearch boolean
---@field copilotignore_enabled boolean
---@field endpoints {api: string, ["origin-tracker"]: string, proxy: string, telemetry: string}
---@field expires_at integer
---@field individual boolean
---@field nes_enabled boolean
---@field prompt_8k boolean
---@field public_suggestions string
---@field refresh_in integer
---@field sku string
---@field snippy_load_test_enabled boolean
---@field telemetry string
---@field token string
---@field tracking_id string
---@field vsc_electron_fetcher boolean
---@field xcode boolean
---@field xcode_chat boolean
---
---@private
---@class AvanteCopilot: table<string, any>
---@field proxy string
---@field allow_insecure boolean
---@field token? CopilotToken
---@field github_token? string
---@field sessionid? string
---@field machineid? string
M.copilot = nil
---@class EnvironmentHandler: table<[Provider], string>
local E = {
---@type table<Provider, string | fun(): boolean>
env = {
openai = "OPENAI_API_KEY",
claude = "ANTHROPIC_API_KEY",
azure = "AZURE_OPENAI_API_KEY",
deepseek = "DEEPSEEK_API_KEY",
groq = "GROQ_API_KEY",
gemini = "GEMINI_API_KEY",
copilot = function()
if Utils.has("copilot.lua") or Utils.has("copilot.vim") or Utils.copilot.find_config_path() then
return true
end
Utils.warn("copilot is not setup correctly. Please use copilot.lua or copilot.vim for authentication.")
return false
end,
},
}
setmetatable(E, {
---@param k Provider
__index = function(_, k)
if E.is_local(k) then
return true
end
local builtins = E.env[k]
if builtins then
if type(builtins) == "function" then
return builtins()
end
return os.getenv(builtins) and true or false
end
---@type AvanteProvider | nil
local external = Config.vendors[k]
if external then
return os.getenv(external.api_key_name) and true or false
end
end,
})
---@private
E._once = false
---@param provider Provider
E.is_default = function(provider)
return E.env[provider] and true or false
end
local AVANTE_INTERNAL_KEY = "__avante_internal"
--- return the environment variable name for the given provider
---@param provider? Provider
---@return string the envvar key
E.key = function(provider)
provider = provider or Config.provider
if E.is_default(provider) then
local result = E.env[provider]
return type(result) == "function" and AVANTE_INTERNAL_KEY or result
end
---@type AvanteProvider | nil
local external = Config.vendors[provider]
if external then
return external.api_key_name
end
error("Failed to find provider: " .. provider, 2)
end
---@param provider Provider
E.is_local = function(provider)
if Config.options[provider] then
return Config.options[provider]["local"]
elseif Config.vendors[provider] then
return Config.vendors[provider]["local"]
else
return false
end
end
---@param provider? Provider
E.value = function(provider)
if E.is_local(provider or Config.provider) then
return "__avante_dummy"
end
return os.getenv(E.key(provider or Config.provider))
end
--- intialize the environment variable for current neovim session.
--- This will only run once and spawn a UI for users to input the envvar.
---@param var string supported providers
---@param refresh? boolean
---@private
E.setup = function(var, refresh)
if var == AVANTE_INTERNAL_KEY then
return
end
refresh = refresh or false
---@param value string
---@return nil
local function on_confirm(value)
if value then
vim.fn.setenv(var, value)
else
if not E[Config.provider] then
Utils.warn("Failed to set " .. var .. ". Avante won't work as expected", { once = true, title = "Avante" })
end
end
end
if refresh then
vim.defer_fn(function()
Dressing.initialize_input_buffer({ opts = { prompt = "Enter " .. var .. ": " }, on_confirm = on_confirm })
end, 200)
elseif not E._once then
E._once = true
api.nvim_create_autocmd({ "BufEnter", "BufWinEnter" }, {
pattern = "*",
once = true,
callback = function()
vim.defer_fn(function()
-- only mount if given buffer is not of buftype ministarter, dashboard, alpha, qf
local exclude_buftypes = { "dashboard", "alpha", "qf", "nofile" }
local exclude_filetypes = {
"NvimTree",
"Outline",
"help",
"dashboard",
"alpha",
"qf",
"ministarter",
"TelescopePrompt",
"gitcommit",
"gitrebase",
"DressingInput",
}
if
not vim.tbl_contains(exclude_buftypes, vim.bo.buftype)
and not vim.tbl_contains(exclude_filetypes, vim.bo.filetype)
then
Dressing.initialize_input_buffer({
opts = { prompt = "Enter " .. var .. ": " },
on_confirm = on_confirm,
})
end
end, 200)
end,
})
end
end
------------------------------Prompt and type------------------------------
---@alias AvanteSystemPrompt string
local system_prompt = [[
You are an excellent programming expert.
]]
---@alias AvanteBasePrompt string
local base_user_prompt = [[
Your primary task is to suggest code modifications with precise line number ranges. Follow these instructions meticulously:
@@ -251,490 +63,6 @@ Replace lines: {{start_line}}-{{end_line}}
Remember: Accurate line numbers are CRITICAL. The range start_line to end_line must include ALL lines to be replaced, from the very first to the very last. Double-check every range before finalizing your response, paying special attention to the start_line to ensure it hasn't shifted down. Ensure that your line numbers perfectly match the original code structure without any overall shift.
]]
---@class AvanteHandlerOptions: table<[string], string>
---@field on_chunk AvanteChunkParser
---@field on_complete AvanteCompleteParser
---
---@class AvantePromptOptions: table<[string], string>
---@field question string
---@field code_lang string
---@field code_content string
---@field selected_code_content? string
---
---@class AvanteBaseMessage
---@field role "user" | "system"
---@field content string
---
---@class AvanteClaudeMessage: AvanteBaseMessage
---@field role "user"
---@field content {type: "text", text: string, cache_control?: {type: "ephemeral"}}[]
---
---@alias AvanteOpenAIMessage AvanteBaseMessage
---
---@class AvanteGeminiMessage
---@field role "user"
---@field parts { text: string }[]
---
---@alias AvanteChatMessage AvanteClaudeMessage | AvanteOpenAIMessage | AvanteGeminiMessage
---
---@alias AvanteAiMessageBuilder fun(opts: AvantePromptOptions): AvanteChatMessage[]
---
---@class AvanteCurlOutput: {url: string, body: table<string, any> | string, headers: table<string, string>}
---@alias AvanteCurlArgsBuilder fun(code_opts: AvantePromptOptions): AvanteCurlOutput
---
---@class ResponseParser
---@field on_chunk fun(chunk: string): any
---@field on_complete fun(err: string|nil): any
---@alias AvanteResponseParser fun(data_stream: string, event_state: string, opts: ResponseParser): nil
---
---@class AvanteDefaultBaseProvider
---@field endpoint string
---@field local? boolean
---
---@class AvanteSupportedProvider: AvanteDefaultBaseProvider
---@field model string
---@field temperature number
---@field max_tokens number
---
---@class AvanteAzureProvider: AvanteDefaultBaseProvider
---@field deployment string
---@field api_version string
---@field temperature number
---@field max_tokens number
---
---@class AvanteCopilotProvider: AvanteSupportedProvider
---@field proxy string | nil
---@field allow_insecure boolean
---@field timeout number
---
---@class AvanteGeminiProvider: AvanteDefaultBaseProvider
---@field model string
---@field type string
---@field options table
---
---@class AvanteProvider: AvanteDefaultBaseProvider
---@field model? string
---@field api_key_name string
---@field parse_response_data AvanteResponseParser
---@field parse_curl_args fun(opts: AvanteProvider, code_opts: AvantePromptOptions): AvanteCurlOutput
---@field parse_stream_data? fun(line: string, handler_opts: AvanteHandlerOptions): nil
---
---@alias AvanteChunkParser fun(chunk: string): any
---@alias AvanteCompleteParser fun(err: string|nil): nil
------------------------------Anthropic------------------------------
---@param opts AvantePromptOptions
---@return AvanteClaudeMessage[]
M.make_claude_message = function(opts)
local code_prompt_obj = {
type = "text",
text = string.format("<code>```%s\n%s```</code>", opts.code_lang, opts.code_content),
}
if Tiktoken.count(code_prompt_obj.text) > 1024 then
code_prompt_obj.cache_control = { type = "ephemeral" }
end
if opts.selected_code_content then
code_prompt_obj.text = string.format("<code_context>```%s\n%s```</code_context>", opts.code_lang, opts.code_content)
end
local message_content = {
code_prompt_obj,
}
if opts.selected_code_content then
local selected_code_obj = {
type = "text",
text = string.format("<code>```%s\n%s```</code>", opts.code_lang, opts.selected_code_content),
}
if Tiktoken.count(selected_code_obj.text) > 1024 then
selected_code_obj.cache_control = { type = "ephemeral" }
end
table.insert(message_content, selected_code_obj)
end
table.insert(message_content, {
type = "text",
text = string.format("<question>%s</question>", opts.question),
})
local user_prompt = base_user_prompt
local user_prompt_obj = {
type = "text",
text = user_prompt,
}
if Tiktoken.count(user_prompt_obj.text) > 1024 then
user_prompt_obj.cache_control = { type = "ephemeral" }
end
table.insert(message_content, user_prompt_obj)
return {
{
role = "user",
content = message_content,
},
}
end
---@type AvanteResponseParser
M.parse_claude_response = function(data_stream, event_state, opts)
if event_state == "content_block_delta" then
local ok, json = pcall(vim.json.decode, data_stream)
if not ok then
return
end
opts.on_chunk(json.delta.text)
elseif event_state == "message_stop" then
opts.on_complete(nil)
return
elseif event_state == "error" then
opts.on_complete(vim.json.decode(data_stream))
end
end
---@type AvanteCurlArgsBuilder
M.make_claude_curl_args = function(code_opts)
return {
url = Utils.trim(Config.claude.endpoint, { suffix = "/" }) .. "/v1/messages",
headers = {
["Content-Type"] = "application/json",
["x-api-key"] = E.value("claude"),
["anthropic-version"] = "2023-06-01",
["anthropic-beta"] = "prompt-caching-2024-07-31",
},
body = {
model = Config.claude.model,
system = system_prompt,
stream = true,
messages = M.make_claude_message(code_opts),
temperature = Config.claude.temperature,
max_tokens = Config.claude.max_tokens,
},
}
end
------------------------------OpenAI------------------------------
---@param opts AvantePromptOptions
---@return AvanteOpenAIMessage[]
M.make_openai_message = function(opts)
local user_prompt = base_user_prompt
.. "\n\nCODE:\n"
.. "```"
.. opts.code_lang
.. "\n"
.. opts.code_content
.. "\n```"
.. "\n\nQUESTION:\n"
.. opts.question
if opts.selected_code_content ~= nil then
user_prompt = base_user_prompt
.. "\n\nCODE CONTEXT:\n"
.. "```"
.. opts.code_lang
.. "\n"
.. opts.code_content
.. "\n```"
.. "\n\nCODE:\n"
.. "```"
.. opts.code_lang
.. "\n"
.. opts.selected_code_content
.. "\n```"
.. "\n\nQUESTION:\n"
.. opts.question
end
return {
{ role = "system", content = system_prompt },
{ role = "user", content = user_prompt },
}
end
---@type AvanteResponseParser
M.parse_openai_response = function(data_stream, _, opts)
if data_stream:match('"%[DONE%]":') then
opts.on_complete(nil)
return
end
if data_stream:match('"delta":') then
local json = vim.json.decode(data_stream)
if json.choices and json.choices[1] then
local choice = json.choices[1]
if choice.finish_reason == "stop" then
opts.on_complete(nil)
elseif choice.delta.content then
opts.on_chunk(choice.delta.content)
end
end
end
end
---@type AvanteCurlArgsBuilder
M.make_openai_curl_args = function(code_opts)
return {
url = Utils.trim(Config.openai.endpoint, { suffix = "/" }) .. "/v1/chat/completions",
headers = {
["Content-Type"] = "application/json",
["Authorization"] = "Bearer " .. E.value("openai"),
},
body = {
model = Config.openai.model,
messages = M.make_openai_message(code_opts),
temperature = Config.openai.temperature,
max_tokens = Config.openai.max_tokens,
stream = true,
},
}
end
------------------------------Copilot------------------------------
---@type AvanteAiMessageBuilder
M.make_copilot_message = M.make_openai_message
---@type AvanteResponseParser
M.parse_copilot_response = M.parse_openai_response
---@type AvanteCurlArgsBuilder
M.make_copilot_curl_args = function(code_opts)
local github_token = Utils.copilot.cached_token()
if not github_token then
error(
"No GitHub token found, please use `:Copilot auth` to setup with `copilot.lua` or `:Copilot setup` with `copilot.vim`"
)
end
local on_done = function()
return {
url = Utils.trim(Config.copilot.endpoint, { suffix = "/" }) .. "/chat/completions",
proxy = Config.copilot.proxy,
insecure = Config.copilot.allow_insecure,
headers = Utils.copilot.generate_headers(M.copilot.token.token, M.copilot.sessionid, M.copilot.machineid),
body = {
mode = Config.copilot.model,
n = 1,
top_p = 1,
stream = true,
temperature = Config.copilot.temperature,
max_tokens = Config.copilot.max_tokens,
messages = M.make_copilot_message(code_opts),
},
}
end
local result = nil
if not M.copilot.token or (M.copilot.token.expires_at and M.copilot.token.expires_at <= math.floor(os.time())) then
local sessionid = Utils.copilot.uuid() .. tostring(math.floor(os.time() * 1000))
local url = "https://api.github.com/copilot_internal/v2/token"
local headers = {
["Authorization"] = "token " .. github_token,
["Accept"] = "application/json",
}
for key, value in pairs(Utils.copilot.version_headers) do
headers[key] = value
end
local response = curl.get(url, {
timeout = Config.copilot.timeout,
headers = headers,
proxy = M.copilot.proxy,
insecure = M.copilot.allow_insecure,
on_error = function(err)
error("Failed to get response: " .. vim.inspect(err))
end,
})
M.copilot.sessionid = sessionid
M.copilot.token = vim.json.decode(response.body)
result = on_done()
else
result = on_done()
end
return result
end
------------------------------Azure------------------------------
---@type AvanteAiMessageBuilder
M.make_azure_message = M.make_openai_message
---@type AvanteResponseParser
M.parse_azure_response = M.parse_openai_response
---@type AvanteCurlArgsBuilder
M.make_azure_curl_args = function(code_opts)
return {
url = Config.azure.endpoint
.. "/openai/deployments/"
.. Config.azure.deployment
.. "/chat/completions?api-version="
.. Config.azure.api_version,
headers = {
["Content-Type"] = "application/json",
["api-key"] = E.value("azure"),
},
body = {
messages = M.make_openai_message(code_opts),
temperature = Config.azure.temperature,
max_tokens = Config.azure.max_tokens,
stream = true,
},
}
end
------------------------------Deepseek------------------------------
---@type AvanteAiMessageBuilder
M.make_deepseek_message = M.make_openai_message
---@type AvanteResponseParser
M.parse_deepseek_response = M.parse_openai_response
---@type AvanteCurlArgsBuilder
M.make_deepseek_curl_args = function(code_opts)
return {
url = Utils.trim(Config.deepseek.endpoint, { suffix = "/" }) .. "/chat/completions",
headers = {
["Content-Type"] = "application/json",
["Authorization"] = "Bearer " .. E.value("deepseek"),
},
body = {
model = Config.deepseek.model,
messages = M.make_openai_message(code_opts),
temperature = Config.deepseek.temperature,
max_tokens = Config.deepseek.max_tokens,
stream = true,
},
}
end
------------------------------Grok------------------------------
---@type AvanteAiMessageBuilder
M.make_groq_message = M.make_openai_message
---@type AvanteResponseParser
M.parse_groq_response = M.parse_openai_response
---@type AvanteCurlArgsBuilder
M.make_groq_curl_args = function(code_opts)
return {
url = Utils.trim(Config.groq.endpoint, { suffix = "/" }) .. "/openai/v1/chat/completions",
headers = {
["Content-Type"] = "application/json",
["Authorization"] = "Bearer " .. E.value("groq"),
},
body = {
model = Config.groq.model,
messages = M.make_openai_message(code_opts),
temperature = Config.groq.temperature,
max_tokens = Config.groq.max_tokens,
stream = true,
},
}
end
------------------------------Gemini------------------------------
---@param opts AvantePromptOptions
---@return AvanteGeminiMessage[]
M.make_gemini_message = function(opts)
local code_prompt_obj = {
text = string.format("<code>```%s\n%s```</code>", opts.code_lang, opts.code_content),
}
if opts.selected_code_content then
code_prompt_obj.text = string.format("<code_context>```%s\n%s```</code_context>", opts.code_lang, opts.code_content)
end
-- parts ready
local message_content = {
code_prompt_obj,
}
if opts.selected_code_content then
local selected_code_obj = {
text = string.format("<code>```%s\n%s```</code>", opts.code_lang, opts.selected_code_content),
}
table.insert(message_content, selected_code_obj)
end
-- insert a part into parts
table.insert(message_content, {
text = string.format("<question>%s</question>", opts.question),
})
-- local user_prompt_obj = {
-- text = base_user_prompt,
-- }
-- insert another part into parts
-- table.insert(message_content, user_prompt_obj)
return {
{
role = "user",
parts = message_content,
},
}
end
---@type AvanteResponseParser
M.parse_gemini_response = function(data_stream, event_state, opts)
local json = vim.json.decode(data_stream)
opts.on_chunk(json.candidates[1].content.parts[1].text)
end
---@type AvanteCurlArgsBuilder
M.make_gemini_curl_args = function(code_opts)
local endpoint = ""
if Config.gemini.endpoint == "" then
endpoint = "https://generativelanguage.googleapis.com/v1beta/models/"
.. Config.gemini.model
.. ":streamGenerateContent?alt=sse&key="
.. E.value("gemini")
end
-- Prepare the body with contents and options (only if options are not empty)
local body = {
systemInstruction = {
role = "user",
parts = {
{
text = system_prompt .. base_user_prompt,
},
},
},
contents = M.make_gemini_message(code_opts),
}
if next(Config.gemini.options) ~= nil then -- Check if options table is not empty
for k, v in pairs(Config.gemini.options) do
body[k] = v
end
end
return {
url = endpoint,
headers = {
["Content-Type"] = "application/json",
},
body = body,
}
end
------------------------------Logic------------------------------
local group = vim.api.nvim_create_augroup("AvanteLLM", { clear = true })
local active_job = nil
@@ -747,30 +75,29 @@ local active_job = nil
M.stream = function(question, code_lang, code_content, selected_content_content, on_chunk, on_complete)
local provider = Config.provider
---@type AvantePromptOptions
local code_opts = {
base_prompt = base_user_prompt,
system_prompt = system_prompt,
question = question,
code_lang = code_lang,
code_content = code_content,
selected_code_content = selected_content_content,
}
---@type string
local current_event_state = nil
---@type AvanteProviderFunctor
local Provider = P[provider]
---@type AvanteHandlerOptions
local handler_opts = { on_chunk = on_chunk, on_complete = on_complete }
---@type AvanteCurlOutput
local spec = nil
---@type AvanteProvider
local ProviderConfig = nil
if E.is_default(provider) then
spec = M["make_" .. provider .. "_curl_args"](code_opts)
else
ProviderConfig = Config.vendors[provider]
spec = ProviderConfig.parse_curl_args(ProviderConfig, code_opts)
end
local spec = Provider.parse_curl_args(Config.get_provider(provider), code_opts)
---@param line string
local function parse_and_call(line)
local function parse_stream_data(line)
local event = line:match("^event: (.+)$")
if event then
current_event_state = event
@@ -778,11 +105,7 @@ M.stream = function(question, code_lang, code_content, selected_content_content,
end
local data_match = line:match("^data: (.+)$")
if data_match then
if ProviderConfig ~= nil then
ProviderConfig.parse_response_data(data_match, current_event_state, handler_opts)
else
M["parse_" .. provider .. "_response"](data_match, current_event_state, handler_opts)
end
Provider.parse_response(data_match, current_event_state, handler_opts)
end
end
@@ -793,6 +116,8 @@ M.stream = function(question, code_lang, code_content, selected_content_content,
active_job = curl.post(spec.url, {
headers = spec.headers,
proxy = spec.proxy,
insecure = spec.insecure,
body = vim.json.encode(spec.body),
stream = function(err, data, _)
if err then
@@ -803,16 +128,16 @@ M.stream = function(question, code_lang, code_content, selected_content_content,
return
end
vim.schedule(function()
if ProviderConfig ~= nil and ProviderConfig.parse_stream_data ~= nil then
if ProviderConfig.parse_response_data ~= nil then
if Config.options[provider] == nil and Provider.parse_stream_data ~= nil then
if Provider.parse_response ~= nil then
Utils.warn(
"parse_stream_data and parse_response_data are mutually exclusive, and thus parse_response_data will be ignored. Make sure that you handle the incoming data correctly.",
{ once = true }
)
end
ProviderConfig.parse_stream_data(data, handler_opts)
Provider.parse_stream_data(data, handler_opts)
else
parse_and_call(data)
parse_stream_data(data)
end
end)
end,
@@ -839,61 +164,4 @@ M.stream = function(question, code_lang, code_content, selected_content_content,
return active_job
end
---@public
function M.setup()
if Config.provider == "copilot" and not M.copilot then
M.copilot = {
proxy = Config.copilot.proxy,
allow_insecure = Config.copilot.allow_insecure,
github_token = Utils.copilot.cached_token(),
sessionid = nil,
token = nil,
machineid = Utils.copilot.machine_id(),
}
end
local has = E[Config.provider]
if not has then
E.setup(E.key())
end
M.commands()
end
---@param provider Provider
function M.refresh(provider)
local has = E[provider]
if not has then
E.setup(E.key(provider), true)
else
Utils.info("Switch to provider: " .. provider, { once = true, title = "Avante" })
end
require("avante.config").override({ provider = provider })
end
---@private
M.commands = function()
api.nvim_create_user_command("AvanteSwitchProvider", function(args)
local cmd = vim.trim(args.args or "")
M.refresh(cmd)
end, {
nargs = 1,
desc = "avante: switch provider",
complete = function(_, line)
if line:match("^%s*AvanteSwitchProvider %w") then
return {}
end
local prefix = line:match("^%s*AvanteSwitchProvider (%w*)") or ""
-- join two tables
local Keys = vim.list_extend(vim.tbl_keys(E.env), vim.tbl_keys(Config.vendors))
return vim.tbl_filter(function(key)
return key:find(prefix) == 1
end, Keys)
end,
})
end
M.SYSTEM_PROMPT = system_prompt
M.BASE_PROMPT = base_user_prompt
return M