diff --git a/backend/onyx/llm/chat_llm.py b/backend/onyx/llm/chat_llm.py index 32f8684b4..66e65415b 100644 --- a/backend/onyx/llm/chat_llm.py +++ b/backend/onyx/llm/chat_llm.py @@ -453,7 +453,9 @@ class DefaultMultiLLM(LLM): if LOG_DANSWER_MODEL_INTERACTIONS: self.log_model_configs() - if DISABLE_LITELLM_STREAMING: + if ( + DISABLE_LITELLM_STREAMING or self.config.model_name == "o1-2024-12-17" + ): # TODO: remove once litellm supports streaming yield self.invoke(prompt, tools, tool_choice, structured_response_format) return diff --git a/backend/onyx/llm/llm_provider_options.py b/backend/onyx/llm/llm_provider_options.py index cf562ee5a..d42ff3a5e 100644 --- a/backend/onyx/llm/llm_provider_options.py +++ b/backend/onyx/llm/llm_provider_options.py @@ -29,6 +29,7 @@ OPENAI_PROVIDER_NAME = "openai" OPEN_AI_MODEL_NAMES = [ "o1-mini", "o1-preview", + "o1-2024-12-17", "gpt-4", "gpt-4o", "gpt-4o-mini", diff --git a/backend/requirements/default.txt b/backend/requirements/default.txt index 3a4996d90..7a88fc01c 100644 --- a/backend/requirements/default.txt +++ b/backend/requirements/default.txt @@ -29,7 +29,7 @@ trafilatura==1.12.2 langchain==0.1.17 langchain-core==0.1.50 langchain-text-splitters==0.0.1 -litellm==1.54.1 +litellm==1.55.4 lxml==5.3.0 lxml_html_clean==0.2.2 llama-index==0.9.45 diff --git a/backend/requirements/model_server.txt b/backend/requirements/model_server.txt index 531382cb4..ac97e64ae 100644 --- a/backend/requirements/model_server.txt +++ b/backend/requirements/model_server.txt @@ -12,5 +12,5 @@ torch==2.2.0 transformers==4.39.2 uvicorn==0.21.1 voyageai==0.2.3 -litellm==1.54.1 +litellm==1.55.4 sentry-sdk[fastapi,celery,starlette]==2.14.0 \ No newline at end of file diff --git a/web/src/lib/hooks.ts b/web/src/lib/hooks.ts index 214ecb6a8..c9d91d619 100644 --- a/web/src/lib/hooks.ts +++ b/web/src/lib/hooks.ts @@ -299,6 +299,7 @@ const MODEL_DISPLAY_NAMES: { [key: string]: string } = { // OpenAI models "o1-mini": "O1 Mini", "o1-preview": "O1 Preview", + "o1-2024-12-17": "O1", "gpt-4": "GPT 4", "gpt-4o": "GPT 4o", "gpt-4o-2024-08-06": "GPT 4o (Structured Outputs)",