From 030f0bbb58c6fee291c778bd12a5758049981863 Mon Sep 17 00:00:00 2001 From: Milutin-S Date: Fri, 17 May 2024 22:13:28 +0200 Subject: [PATCH 1/3] Change llm model and set router model explicitly. --- app.py | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/app.py b/app.py index 4209d57..236a642 100644 --- a/app.py +++ b/app.py @@ -56,6 +56,7 @@ def response_generator(query: str): # Rout query collections = semantic_query_router( client=openai_client, + model=config["openai"]["gpt_model"]["router"], query=query, prompt=ROUTER_PROMPT, temperature=config["openai"]["gpt_model"]["temperature"], @@ -82,7 +83,7 @@ def response_generator(query: str): stream = get_answer( client=openai_client, - model=config["openai"]["gpt_model"]["name"], + model=config["openai"]["gpt_model"]["llm"], temperature=config["openai"]["gpt_model"]["temperature"], messages=get_messages( context=context, query=query, conversation=st.session_state.messages From c5a69a1d74eacd4568f20a65b758849080b5fed1 Mon Sep 17 00:00:00 2001 From: Milutin-S Date: Fri, 17 May 2024 22:13:45 +0200 Subject: [PATCH 2/3] Update router model name. --- chat-dev.ipynb | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/chat-dev.ipynb b/chat-dev.ipynb index a97a568..9d43204 100644 --- a/chat-dev.ipynb +++ b/chat-dev.ipynb @@ -225,7 +225,7 @@ "outputs": [], "source": [ "response = openai_client.chat.completions.create(\n", - " model=config[\"openai\"][\"gpt_model\"][\"name_light\"],\n", + " model=config[\"openai\"][\"gpt_model\"][\"router\"],\n", " temperature=config[\"openai\"][\"gpt_model\"][\"temperature\"],\n", " messages=messages,\n", ")" From d7294e92a75089f807ef9543cea5cbd0a3b5a3a3 Mon Sep 17 00:00:00 2001 From: Milutin-S Date: Fri, 17 May 2024 22:14:12 +0200 Subject: [PATCH 3/3] Update router and llm keys, and update llm model. --- config.yaml | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/config.yaml b/config.yaml index 1249f5a..562ebd0 100644 --- a/config.yaml +++ b/config.yaml @@ -3,8 +3,8 @@ openai: name: "text-embedding-3-small" dimensions: 1536 gpt_model: - name: "gpt-4-turbo-preview" - name_light: "gpt-3.5-turbo" + llm: "gpt-4o" + router: "gpt-3.5-turbo" temperature: 0 max_conversation: 100 collection: