From 50576111c585157d81705ec2c3ef4ddc62e429a1 Mon Sep 17 00:00:00 2001 From: Shreyas-Microsoft Date: Mon, 16 Mar 2026 17:29:33 +0530 Subject: [PATCH 1/5] update ai model name --- infra/main.bicep | 8 ++++---- infra/main_custom.bicep | 8 ++++---- 2 files changed, 8 insertions(+), 8 deletions(-) diff --git a/infra/main.bicep b/infra/main.bicep index 16a2440..f2e4a78 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -32,7 +32,7 @@ var solutionLocation = empty(location) ? resourceGroup().location : location azd: { type: 'location' usageName: [ - 'OpenAI.GlobalStandard.GPT5.1, 500' + 'OpenAI.GlobalStandard.gpt-5.1, 500' ] } }) @@ -69,11 +69,11 @@ param aiDeploymentType string = 'GlobalStandard' @minLength(1) @description('Optional. Name of the AI model to deploy. Recommend using GPT5.1. Defaults to GPT5.1.') -param aiModelName string = 'GPT5.1' +param aiModelName string = 'gpt-5.1' @minLength(1) @description('Optional. Version of AI model. Review available version numbers per model before setting. Defaults to 2025-04-16.') -param aiModelVersion string = '2025-04-16' +param aiModelVersion string = '2025-11-13' @description('Optional. AI model deployment token capacity. Lower this if initial provisioning fails due to capacity. Defaults to 50K tokens per minute to improve regional success rate.') param aiModelCapacity int = 500 @@ -86,7 +86,7 @@ param aiEmbeddingModelName string = 'text-embedding-3-large' param aiEmbeddingModelVersion string = '1' @description('Optional. Embedding model deployment token capacity. Defaults to 500.') -param aiEmbeddingModelCapacity int = 500 +param aiEmbeddingModelCapacity int = 350 @description('Optional. The tags to apply to all deployed Azure resources.') param tags resourceInput<'Microsoft.Resources/resourceGroups@2025-04-01'>.tags = {} diff --git a/infra/main_custom.bicep b/infra/main_custom.bicep index ee99c5b..3802b9e 100644 --- a/infra/main_custom.bicep +++ b/infra/main_custom.bicep @@ -32,7 +32,7 @@ var solutionLocation = empty(location) ? resourceGroup().location : location azd: { type: 'location' usageName: [ - 'OpenAI.GlobalStandard.GPT5.1, 500' + 'OpenAI.GlobalStandard.gpt-5.1, 500' ] } }) @@ -62,11 +62,11 @@ param aiDeploymentType string = 'GlobalStandard' @minLength(1) @description('Optional. Name of the AI model to deploy. Recommend using GPT5.1. Defaults to GPT5.1.') -param aiModelName string = 'GPT5.1' +param aiModelName string = 'gpt-5.1' @minLength(1) -@description('Optional. Version of AI model. Review available version numbers per model before setting. Defaults to 2025-04-16.') -param aiModelVersion string = '2025-04-16' +@description('Optional. Version of AI model. Review available version numbers per model before setting. Defaults to 2025-11-13.') +param aiModelVersion string = '2025-11-13' @description('Optional. AI model deployment token capacity. Lower this if initial provisioning fails due to capacity. Defaults to 50K tokens per minute to improve regional success rate.') param aiModelCapacity int = 1 From a47d0d0306a04abfde89c911865f22ff6d318bb9 Mon Sep 17 00:00:00 2001 From: Shreyas-Microsoft Date: Wed, 18 Mar 2026 08:42:09 +0530 Subject: [PATCH 2/5] change sku from standard to globalstandard --- infra/main.bicep | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/infra/main.bicep b/infra/main.bicep index f2e4a78..198a117 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -887,7 +887,7 @@ module aiFoundry 'br/public:avm/ptn/ai-ml/ai-foundry:0.4.0' = if(!useExistingAiF version: aiEmbeddingModelVersion } sku: { - name: 'Standard' + name: 'GlobalStandard' capacity: aiEmbeddingModelCapacity } } From babfa84a01aa3cd9d0b5cbbeb7c23a7fa0ffe3e1 Mon Sep 17 00:00:00 2001 From: Shreyas-Microsoft Date: Wed, 18 Mar 2026 08:46:22 +0530 Subject: [PATCH 3/5] increase capacity back to 500 --- infra/main.bicep | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/infra/main.bicep b/infra/main.bicep index 198a117..abacb90 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -86,7 +86,7 @@ param aiEmbeddingModelName string = 'text-embedding-3-large' param aiEmbeddingModelVersion string = '1' @description('Optional. Embedding model deployment token capacity. Defaults to 500.') -param aiEmbeddingModelCapacity int = 350 +param aiEmbeddingModelCapacity int = 500 @description('Optional. The tags to apply to all deployed Azure resources.') param tags resourceInput<'Microsoft.Resources/resourceGroups@2025-04-01'>.tags = {} From 5647552a3d9a0bf101abac06c03bdc4fe19a2acc Mon Sep 17 00:00:00 2001 From: Shreyas-Microsoft Date: Wed, 18 Mar 2026 10:12:44 +0530 Subject: [PATCH 4/5] Add aiEmbeddingDeploymentType parameter for embedding model SKU configuration --- infra/main.bicep | 9 +++++++-- 1 file changed, 7 insertions(+), 2 deletions(-) diff --git a/infra/main.bicep b/infra/main.bicep index abacb90..f31ea27 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -85,6 +85,11 @@ param aiEmbeddingModelName string = 'text-embedding-3-large' @description('Optional. Version of the embedding model. Defaults to 1.') param aiEmbeddingModelVersion string = '1' +@minLength(1) +@allowed(['Standard', 'GlobalStandard']) +@description('Optional. Embedding model deployment type. Defaults to GlobalStandard.') +param aiEmbeddingDeploymentType string = 'GlobalStandard' + @description('Optional. Embedding model deployment token capacity. Defaults to 500.') param aiEmbeddingModelCapacity int = 500 @@ -779,7 +784,7 @@ module existingAiFoundryAiServicesDeployments 'modules/ai-services-deployments.b version: aiEmbeddingModelVersion } sku: { - name: 'Standard' + name: aiEmbeddingDeploymentType capacity: aiEmbeddingModelCapacity } } @@ -887,7 +892,7 @@ module aiFoundry 'br/public:avm/ptn/ai-ml/ai-foundry:0.4.0' = if(!useExistingAiF version: aiEmbeddingModelVersion } sku: { - name: 'GlobalStandard' + name: aiEmbeddingDeploymentType capacity: aiEmbeddingModelCapacity } } From abc2ce4e9c23eec7efeace49ad22a795d2ef1d4c Mon Sep 17 00:00:00 2001 From: Shreyas-Microsoft Date: Wed, 18 Mar 2026 11:35:29 +0530 Subject: [PATCH 5/5] Update descriptions Co-authored-by: Copilot Autofix powered by AI <175728472+Copilot@users.noreply.github.com> --- infra/main.bicep | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/infra/main.bicep b/infra/main.bicep index f31ea27..e124273 100644 --- a/infra/main.bicep +++ b/infra/main.bicep @@ -36,7 +36,7 @@ var solutionLocation = empty(location) ? resourceGroup().location : location ] } }) -@description('Required. Azure region for AI services (OpenAI/AI Foundry). Must be a region that supports GPT5.1 model deployment.') +@description('Required. Azure region for AI services (OpenAI/AI Foundry). Must be a region that supports gpt-5.1 model deployment.') param azureAiServiceLocation string @allowed([ @@ -68,11 +68,11 @@ param imageTag string = 'latest' param aiDeploymentType string = 'GlobalStandard' @minLength(1) -@description('Optional. Name of the AI model to deploy. Recommend using GPT5.1. Defaults to GPT5.1.') +@description('Optional. Name of the AI model to deploy. Recommend using gpt-5.1. Defaults to gpt-5.1.') param aiModelName string = 'gpt-5.1' @minLength(1) -@description('Optional. Version of AI model. Review available version numbers per model before setting. Defaults to 2025-04-16.') +@description('Optional. Version of AI model. Review available version numbers per model before setting. Defaults to 2025-11-13.') param aiModelVersion string = '2025-11-13' @description('Optional. AI model deployment token capacity. Lower this if initial provisioning fails due to capacity. Defaults to 50K tokens per minute to improve regional success rate.')