From c26460e7b600b9f4350cd0d6756944ead4f08c78 Mon Sep 17 00:00:00 2001 From: Yohan Lasorsa Date: Mon, 6 May 2024 16:54:02 +0200 Subject: [PATCH] feat: switch chat model to gpt-4-turbo (#65) * feat: switch chat model to gpt-4-turbo * docs: update cost estimate --- docs/cost.md | 2 +- infra/main.bicep | 2 +- infra/main.parameters.json | 4 ++-- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/docs/cost.md b/docs/cost.md index 98e5de8..27093e0 100644 --- a/docs/cost.md +++ b/docs/cost.md @@ -1,7 +1,7 @@ ## Cost estimation Pricing varies per region and usage, so it isn't possible to predict exact costs for your usage. -However, you can use the [Azure pricing calculator](https://azure.com/e/a5769032546440dc98285eaba6bd5423) for the resources below to get an estimate. +However, you can use the [Azure pricing calculator](https://azure.com/e/c504007c9f024699a37f5d947dbb1e79) for the resources below to get an estimate. - Azure Functions: Consumption plan, Free for the first 1M executions. Pricing per execution and memory used. [Pricing](https://azure.microsoft.com/pricing/details/functions/) - Azure Static Web Apps: Free tier, 100GB bandwidth. Pricing per GB served. 
[Pricing](https://azure.microsoft.com/pricing/details/app-service/static/) diff --git a/infra/main.bicep b/infra/main.bicep index bdf2aae..ba14dc9 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -45,7 +45,7 @@ param webappLocation string // Set in main.parameters.json param chatModelName string // Set in main.parameters.json param chatDeploymentName string = chatModelName param chatModelVersion string // Set in main.parameters.json -param chatDeploymentCapacity int = 30 +param chatDeploymentCapacity int = 15 param embeddingsModelName string // Set in main.parameters.json param embeddingsModelVersion string // Set in main.parameters.json param embeddingsDeploymentName string = embeddingsModelName diff --git a/infra/main.parameters.json b/infra/main.parameters.json index d015798..51b580e 100644 --- a/infra/main.parameters.json +++ b/infra/main.parameters.json @@ -18,10 +18,10 @@ "value": "${AZURE_OPENAI_LOCATION=eastus2}" }, "chatModelName": { - "value": "${AZURE_OPENAI_API_MODEL=gpt-35-turbo}" + "value": "${AZURE_OPENAI_API_MODEL=gpt-4}" }, "chatModelVersion": { - "value": "${AZURE_OPENAI_API_MODEL_VERSION=0613}" + "value": "${AZURE_OPENAI_API_MODEL_VERSION=turbo-2024-04-09}" }, "embeddingsModelName": { "value": "${AZURE_OPENAI_API_EMBEDDINGS_MODEL=text-embedding-ada-002}"