From a09ee0ab738c0bbcbaa6cf0aec6c4aa74474358c Mon Sep 17 00:00:00 2001 From: "RingOfStorms (Joshua Bell)" Date: Wed, 3 Dec 2025 21:31:33 +0000 Subject: [PATCH] update llm stuff --- hosts/h001/flake.lock | 12 ++++++------ hosts/h001/mods/litellm.nix | 18 +++++++++--------- hosts/h001/mods/openwebui.nix | 4 ++++ 3 files changed, 19 insertions(+), 15 deletions(-) diff --git a/hosts/h001/flake.lock b/hosts/h001/flake.lock index 2ca1683e..0f0ad6fc 100644 --- a/hosts/h001/flake.lock +++ b/hosts/h001/flake.lock @@ -195,11 +195,11 @@ }, "litellm-nixpkgs": { "locked": { - "lastModified": 1764517877, - "narHash": "sha256-pp3uT4hHijIC8JUK5MEqeAWmParJrgBVzHLNfJDZxg4=", + "lastModified": 1764667669, + "narHash": "sha256-7WUCZfmqLAssbDqwg9cUDAXrSoXN79eEEq17qhTNM/Y=", "owner": "nixos", "repo": "nixpkgs", - "rev": "2d293cbfa5a793b4c50d17c05ef9e385b90edf6c", + "rev": "418468ac9527e799809c900eda37cbff999199b6", "type": "github" }, "original": { @@ -1190,11 +1190,11 @@ }, "open-webui-nixpkgs": { "locked": { - "lastModified": 1764517877, - "narHash": "sha256-pp3uT4hHijIC8JUK5MEqeAWmParJrgBVzHLNfJDZxg4=", + "lastModified": 1764667669, + "narHash": "sha256-7WUCZfmqLAssbDqwg9cUDAXrSoXN79eEEq17qhTNM/Y=", "owner": "nixos", "repo": "nixpkgs", - "rev": "2d293cbfa5a793b4c50d17c05ef9e385b90edf6c", + "rev": "418468ac9527e799809c900eda37cbff999199b6", "type": "github" }, "original": { diff --git a/hosts/h001/mods/litellm.nix b/hosts/h001/mods/litellm.nix index b81109f0..dbf2a6f4 100644 --- a/hosts/h001/mods/litellm.nix +++ b/hosts/h001/mods/litellm.nix @@ -33,10 +33,9 @@ in GITHUB_COPILOT_TOKEN_DIR = "/var/lib/litellm/github_copilot"; XDG_CONFIG_HOME = "/var/lib/litellm/.config"; }; - settings = { + settings = { environment_variables = { LITELLM_PROXY_API_KEY = "na"; - LITELLM_PROXY_API_BASE = "http://100.64.0.8:9010/air_key"; }; litellm_settings = { check_provider_endpoints = true; @@ -81,14 +80,15 @@ in api_key = "na"; }; }) + # curl -L "http://100.64.0.8:9010/azure/openai/models?api-version=2025-04-01-preview" | jq '.data.[].id' [ + "gpt-5.1-2025-11-13" "gpt-4o-2024-05-13" "gpt-4.1-2025-04-14" "gpt-4.1-mini-2025-04-14" "gpt-5-nano-2025-08-07" "gpt-5-mini-2025-08-07" "gpt-5-2025-08-07" - # "gpt-5-codex-2025-09-15" ] ) # 宙 Proxy @@ -98,16 +98,19 @@ in litellm_params = { model = "litellm_proxy/${m}"; api_base = "http://100.64.0.8:9010/air_prd"; - api_key = "os.environ/LITELLM_PROXY_API_KEY"; + api_key = "na"; }; }) - # curl -L t.net.joshuabell.xyz:9010/air_key/models | jq '.data.[].id' + # curl -L t.net.joshuabell.xyz:9010/air_prd/models | jq '.data.[].id' [ "gpt-5-mini" + "gpt-5-nano" + "gpt-5.1" "gpt-5" "gpt-4.1" "gpt-4.1-mini" "gpt-4o" + "gpt-4o-applied-ai" "gpt-4o-mini" "o3-mini" "o4-mini" @@ -116,6 +119,7 @@ in "gemini-2.5-flash" "gemini-2.0-flash-lite" "gemini-2.5-flash-lite" + "gemini-2.5-flash-image" "claude-opus-4.1" "claude-opus-4" "claude-sonnet-4" @@ -125,10 +129,6 @@ in "text-embedding-ada-002" "text-embedding-large-exp-03-07" "text-embedding-005" - "llama7b" - "medgemma-4b" - "qwen3-instruct" - "bge-small-en-v1.5" ] ); }; diff --git a/hosts/h001/mods/openwebui.nix b/hosts/h001/mods/openwebui.nix index f19f77e4..d6c0e5a4 100644 --- a/hosts/h001/mods/openwebui.nix +++ b/hosts/h001/mods/openwebui.nix @@ -77,6 +77,10 @@ in # OAUTH_UPDATE_PICTURE_ON_LOGIN = "True"; BYPASS_MODEL_ACCESS_CONTROL="True"; + + # Other settings + CHAT_STREAM_RESPONSE_CHUNK_MAX_BUFFER_SIZE="10485760"; + REPLACE_IMAGE_URLS_IN_CHAT_RESPONSE="True"; }; }; };