From 3f71c1f5dbd10665b2d728c555db2d3edb3d2212 Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 16:59:48 +0000 Subject: [PATCH 1/6] feat(terraform): update model deployments to use GPT-5 series models --- modules/ai_foundry/README.md | 2 +- modules/common_models/README.md | 37 +++-- modules/common_models/outputs.tf | 143 +++++++++++++----- reference_architectures/foundry_basic/main.tf | 4 +- .../foundry_basic_private/main.tf | 4 +- .../foundry_standard/main.tf | 4 +- .../foundry_standard_private/main.tf | 4 +- 7 files changed, 136 insertions(+), 62 deletions(-) diff --git a/modules/ai_foundry/README.md b/modules/ai_foundry/README.md index ab1144cf..9c98eab1 100644 --- a/modules/ai_foundry/README.md +++ b/modules/ai_foundry/README.md @@ -105,7 +105,7 @@ module "ai_foundry" { # Provide at least one model deployment model_deployments = [ - module.common_models.gpt_4_1, + module.common_models.gpt_5, module.common_models.text_embedding_3_large ] diff --git a/modules/common_models/README.md b/modules/common_models/README.md index 4bc7be54..b22d139c 100644 --- a/modules/common_models/README.md +++ b/modules/common_models/README.md @@ -35,8 +35,8 @@ module "ai_foundry" { # ... other required inputs ... model_deployments = [ - module.common_models.gpt_4_1, - module.common_models.o4_mini, + module.common_models.gpt_5, + module.common_models.o3, module.common_models.text_embedding_3_large ] } @@ -46,7 +46,7 @@ To override SKU per deployment: ```terraform model_deployments = [ - merge(module.common_models.gpt_4_1, { sku = { name = "GlobalStandard", capacity = 2 } }), + merge(module.common_models.gpt_5, { sku = { name = "GlobalStandard", capacity = 2 } }), module.common_models.text_embedding_3_large ] ``` @@ -60,17 +60,22 @@ model_deployments = [ ## Outputs -| Name | Description | -|----------------------------|-------------------------------| -| gpt\_4\_1 | GPT-4.1 model | -| gpt\_4\_1\_mini | GPT-4.1-mini model | -| gpt\_4\_1\_nano | GPT-4.1-nano model | -| gpt\_4o | GPT-4o model | -| gpt\_4o\_audio\_preview | GPT-4o audio preview model | -| gpt\_4o\_mini | GPT-4o-mini model | -| gpt\_4o\_realtime\_preview | GPT-4o realtime preview model | -| gpt\_4o\_transcribe | GPT-4o transcribe model | -| o4\_mini | O4-mini model | -| text\_embedding\_3\_large | Text embedding 3 large model | -| text\_embedding\_3\_small | Text embedding 3 small model | +| Name | Description | +|------------------------------|-----------------------------------------------------------------------| +| gpt\_5 | GPT-5 model - Latest flagship reasoning model | +| gpt\_5\_mini | GPT-5-mini model - Balanced performance and cost | +| gpt\_5\_nano | GPT-5-nano model - Lightweight high-throughput model | +| gpt\_5\_chat | GPT-5-chat model - Conversational AI with emotional intelligence | +| gpt\_5\_1 | GPT-5.1 model - Enhanced reasoning capabilities | +| gpt\_5\_1\_chat | GPT-5.1-chat model - Built-in reasoning for chat | +| gpt\_5\_1\_codex | GPT-5.1-codex model - Optimized for Codex CLI/VS Code | +| gpt\_5\_1\_codex\_mini | GPT-5.1-codex-mini model - Lightweight codex model | +| text\_embedding\_3\_small | Text embedding 3 small model | +| text\_embedding\_3\_large | Text embedding 3 large model - Most capable embedding | +| gpt\_realtime | GPT-realtime model (GA) - Real-time audio processing | +| gpt\_realtime\_mini | GPT-realtime-mini model - Lightweight real-time audio | +| gpt\_audio | GPT-audio model (GA) - Audio generation | +| gpt\_audio\_mini | GPT-audio-mini model - Lightweight audio generation | +| gpt\_4o\_mini\_transcribe | GPT-4o-mini-transcribe model - Improved transcription | +| gpt\_4o\_transcribe\_diarize | GPT-4o-transcribe-diarize model - Speech-to-text with diarization | diff --git a/modules/common_models/outputs.tf b/modules/common_models/outputs.tf index c07100ba..d75dbdba 100644 --- a/modules/common_models/outputs.tf +++ b/modules/common_models/outputs.tf @@ -2,60 +2,90 @@ # Copyright (c) Microsoft Corporation. Licensed under the MIT license. # --------------------------------------------------------------------- -output "gpt_4_1" { +# --------------------------------------------------------------------- +# GPT-5 Series Models (Latest generation) +# --------------------------------------------------------------------- + +output "gpt_5" { + value = { + format = "OpenAI" + name = "gpt-5" + version = "2025-08-07" + } + description = "GPT-5 model - Latest flagship reasoning model with advanced capabilities" +} + +output "gpt_5_mini" { + value = { + format = "OpenAI" + name = "gpt-5-mini" + version = "2025-08-07" + } + description = "GPT-5-mini model - Balanced performance and cost efficiency" +} + +output "gpt_5_nano" { value = { format = "OpenAI" - name = "gpt-4.1" - version = "2025-04-14" + name = "gpt-5-nano" + version = "2025-08-07" } - description = "GPT-4.1 model" + description = "GPT-5-nano model - Lightweight model for high-throughput scenarios" } -output "gpt_4_1_mini" { +output "gpt_5_chat" { value = { format = "OpenAI" - name = "gpt-4.1-mini" - version = "2025-04-14" + name = "gpt-5-chat" + version = "2025-10-03" } - description = "GPT-4.1-mini model" + description = "GPT-5-chat model - Optimized for conversational AI with emotional intelligence" } -output "gpt_4_1_nano" { +# --------------------------------------------------------------------- +# GPT-5.1 Series Models (Advanced generation) +# --------------------------------------------------------------------- + +output "gpt_5_1" { value = { format = "OpenAI" - name = "gpt-4.1-nano" - version = "2025-04-14" + name = "gpt-5.1" + version = "2025-11-13" } - description = "GPT-4.1-nano model" + description = "GPT-5.1 model - Enhanced reasoning with configurable reasoning_effort" } -output "gpt_4o" { +output "gpt_5_1_chat" { value = { format = "OpenAI" - name = "gpt-4o" - version = "2024-11-20" + name = "gpt-5.1-chat" + version = "2025-11-13" } - description = "GPT-4o model" + description = "GPT-5.1-chat model - Built-in reasoning capabilities for chat" } -output "gpt_4o_mini" { +output "gpt_5_1_codex" { value = { format = "OpenAI" - name = "gpt-4o-mini" - version = "2024-07-18" + name = "gpt-5.1-codex" + version = "2025-11-13" } - description = "GPT-4o-mini model" + description = "GPT-5.1-codex model - Optimized for Codex CLI and VS Code extension" } -output "o4_mini" { +output "gpt_5_1_codex_mini" { value = { format = "OpenAI" - name = "o4-mini" - version = "2025-04-16" + name = "gpt-5.1-codex-mini" + version = "2025-11-13" } - description = "O4-mini model" + description = "GPT-5.1-codex-mini model - Lightweight codex model" } +# --------------------------------------------------------------------- +# Embedding Models +# --------------------------------------------------------------------- + output "text_embedding_3_small" { value = { format = "OpenAI" @@ -71,32 +101,71 @@ output "text_embedding_3_large" { name = "text-embedding-3-large" version = "1" } - description = "Text embedding 3 large model" + description = "Text embedding 3 large model - Most capable embedding model" +} + +# --------------------------------------------------------------------- +# Real-time Audio Models (GA) +# --------------------------------------------------------------------- + +output "gpt_realtime" { + value = { + format = "OpenAI" + name = "gpt-realtime" + version = "2025-08-28" + } + description = "GPT-realtime model (GA) - Real-time audio processing" +} + +output "gpt_realtime_mini" { + value = { + format = "OpenAI" + name = "gpt-realtime-mini" + version = "2025-10-06" + } + description = "GPT-realtime-mini model - Lightweight real-time audio processing" +} + +# --------------------------------------------------------------------- +# Audio Generation Models (GA) +# --------------------------------------------------------------------- + +output "gpt_audio" { + value = { + format = "OpenAI" + name = "gpt-audio" + version = "2025-08-28" + } + description = "GPT-audio model (GA) - Audio generation capabilities" } -output "gpt_4o_realtime_preview" { +output "gpt_audio_mini" { value = { format = "OpenAI" - name = "gpt-4o-realtime-preview" - version = "2025-06-03" + name = "gpt-audio-mini" + version = "2025-10-06" } - description = "GPT-4o realtime preview model" + description = "GPT-audio-mini model - Lightweight audio generation" } -output "gpt_4o_audio_preview" { +# --------------------------------------------------------------------- +# Speech-to-Text Models +# --------------------------------------------------------------------- + +output "gpt_4o_mini_transcribe" { value = { format = "OpenAI" - name = "gpt-4o-audio-preview" - version = "2024-12-17" + name = "gpt-4o-mini-transcribe-2025-12-15" + version = "2025-12-15" } - description = "GPT-4o audio preview model" + description = "GPT-4o-mini-transcribe model - Improved transcription accuracy and robustness" } -output "gpt_4o_transcribe" { +output "gpt_4o_transcribe_diarize" { value = { format = "OpenAI" - name = "gpt-4o-transcribe" - version = "2025-03-20" + name = "gpt-4o-transcribe-diarize" + version = "1" } - description = "GPT-4o transcribe model" + description = "GPT-4o-transcribe-diarize model - Speech-to-text with speaker diarization" } diff --git a/reference_architectures/foundry_basic/main.tf b/reference_architectures/foundry_basic/main.tf index b4219ee5..5798fbed 100644 --- a/reference_architectures/foundry_basic/main.tf +++ b/reference_architectures/foundry_basic/main.tf @@ -58,8 +58,8 @@ module "ai_foundry" { # Model deployments to make available within Foundry # Add/remove models as needed for your workload requirements model_deployments = [ - module.common_models.gpt_4_1, - module.common_models.o4_mini, + module.common_models.gpt_5, + module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_basic_private/main.tf b/reference_architectures/foundry_basic_private/main.tf index d4743d18..edda15db 100644 --- a/reference_architectures/foundry_basic_private/main.tf +++ b/reference_architectures/foundry_basic_private/main.tf @@ -45,8 +45,8 @@ module "ai_foundry" { name = module.naming.cognitive_account.name_unique model_deployments = [ - module.common_models.gpt_4_1, - module.common_models.o4_mini, + module.common_models.gpt_5, + module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_standard/main.tf b/reference_architectures/foundry_standard/main.tf index 9f4fb964..0b86a10b 100644 --- a/reference_architectures/foundry_standard/main.tf +++ b/reference_architectures/foundry_standard/main.tf @@ -59,8 +59,8 @@ module "ai_foundry" { # Model deployments to make available within Foundry # Add/remove models as needed for your workload requirements model_deployments = [ - module.common_models.gpt_4_1, - module.common_models.o4_mini, + module.common_models.gpt_5, + module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_standard_private/main.tf b/reference_architectures/foundry_standard_private/main.tf index ab164f39..6be5d3b7 100644 --- a/reference_architectures/foundry_standard_private/main.tf +++ b/reference_architectures/foundry_standard_private/main.tf @@ -57,8 +57,8 @@ module "ai_foundry" { name = module.naming.cognitive_account.name_unique model_deployments = [ - module.common_models.gpt_4_1, - module.common_models.o4_mini, + module.common_models.gpt_5, + module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] From 6aaca35856d6fe4e7872b50c14f919a74e1fbc57 Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 17:30:15 +0000 Subject: [PATCH 2/6] feat(terraform): add GPT-5.2 models and update deployments in Foundry architecture --- modules/common_models/README.md | 2 + modules/common_models/outputs.tf | 40 ++++++++----------- reference_architectures/foundry_basic/main.tf | 2 +- .../foundry_basic_private/main.tf | 2 +- .../foundry_standard/main.tf | 2 +- .../foundry_standard_private/main.tf | 2 +- 6 files changed, 23 insertions(+), 27 deletions(-) diff --git a/modules/common_models/README.md b/modules/common_models/README.md index b22d139c..fa86b729 100644 --- a/modules/common_models/README.md +++ b/modules/common_models/README.md @@ -70,6 +70,8 @@ model_deployments = [ | gpt\_5\_1\_chat | GPT-5.1-chat model - Built-in reasoning for chat | | gpt\_5\_1\_codex | GPT-5.1-codex model - Optimized for Codex CLI/VS Code | | gpt\_5\_1\_codex\_mini | GPT-5.1-codex-mini model - Lightweight codex model | +| gpt\_5\_2 | GPT-5.2 model - Latest flagship reasoning model | +| gpt\_5\_2\_chat | GPT-5.2-chat model - Latest chat with advanced capabilities | | text\_embedding\_3\_small | Text embedding 3 small model | | text\_embedding\_3\_large | Text embedding 3 large model - Most capable embedding | | gpt\_realtime | GPT-realtime model (GA) - Real-time audio processing | diff --git a/modules/common_models/outputs.tf b/modules/common_models/outputs.tf index d75dbdba..5d03be68 100644 --- a/modules/common_models/outputs.tf +++ b/modules/common_models/outputs.tf @@ -2,10 +2,6 @@ # Copyright (c) Microsoft Corporation. Licensed under the MIT license. # --------------------------------------------------------------------- -# --------------------------------------------------------------------- -# GPT-5 Series Models (Latest generation) -# --------------------------------------------------------------------- - output "gpt_5" { value = { format = "OpenAI" @@ -42,10 +38,6 @@ output "gpt_5_chat" { description = "GPT-5-chat model - Optimized for conversational AI with emotional intelligence" } -# --------------------------------------------------------------------- -# GPT-5.1 Series Models (Advanced generation) -# --------------------------------------------------------------------- - output "gpt_5_1" { value = { format = "OpenAI" @@ -82,9 +74,23 @@ output "gpt_5_1_codex_mini" { description = "GPT-5.1-codex-mini model - Lightweight codex model" } -# --------------------------------------------------------------------- -# Embedding Models -# --------------------------------------------------------------------- +output "gpt_5_2" { + value = { + format = "OpenAI" + name = "gpt-5.2" + version = "2025-12-11" + } + description = "GPT-5.2 model - Latest flagship reasoning model" +} + +output "gpt_5_2_chat" { + value = { + format = "OpenAI" + name = "gpt-5.2-chat" + version = "2025-12-11" + } + description = "GPT-5.2-chat model - Latest chat model with advanced capabilities" +} output "text_embedding_3_small" { value = { @@ -104,10 +110,6 @@ output "text_embedding_3_large" { description = "Text embedding 3 large model - Most capable embedding model" } -# --------------------------------------------------------------------- -# Real-time Audio Models (GA) -# --------------------------------------------------------------------- - output "gpt_realtime" { value = { format = "OpenAI" @@ -126,10 +128,6 @@ output "gpt_realtime_mini" { description = "GPT-realtime-mini model - Lightweight real-time audio processing" } -# --------------------------------------------------------------------- -# Audio Generation Models (GA) -# --------------------------------------------------------------------- - output "gpt_audio" { value = { format = "OpenAI" @@ -148,10 +146,6 @@ output "gpt_audio_mini" { description = "GPT-audio-mini model - Lightweight audio generation" } -# --------------------------------------------------------------------- -# Speech-to-Text Models -# --------------------------------------------------------------------- - output "gpt_4o_mini_transcribe" { value = { format = "OpenAI" diff --git a/reference_architectures/foundry_basic/main.tf b/reference_architectures/foundry_basic/main.tf index 5798fbed..2ee09a8b 100644 --- a/reference_architectures/foundry_basic/main.tf +++ b/reference_architectures/foundry_basic/main.tf @@ -58,7 +58,7 @@ module "ai_foundry" { # Model deployments to make available within Foundry # Add/remove models as needed for your workload requirements model_deployments = [ - module.common_models.gpt_5, + module.common_models.gpt_5_2_chat, module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_basic_private/main.tf b/reference_architectures/foundry_basic_private/main.tf index edda15db..2ce5e4a8 100644 --- a/reference_architectures/foundry_basic_private/main.tf +++ b/reference_architectures/foundry_basic_private/main.tf @@ -45,7 +45,7 @@ module "ai_foundry" { name = module.naming.cognitive_account.name_unique model_deployments = [ - module.common_models.gpt_5, + module.common_models.gpt_5_2_chat, module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_standard/main.tf b/reference_architectures/foundry_standard/main.tf index 0b86a10b..57dee22d 100644 --- a/reference_architectures/foundry_standard/main.tf +++ b/reference_architectures/foundry_standard/main.tf @@ -59,7 +59,7 @@ module "ai_foundry" { # Model deployments to make available within Foundry # Add/remove models as needed for your workload requirements model_deployments = [ - module.common_models.gpt_5, + module.common_models.gpt_5_2_chat, module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] diff --git a/reference_architectures/foundry_standard_private/main.tf b/reference_architectures/foundry_standard_private/main.tf index 6be5d3b7..c7e27413 100644 --- a/reference_architectures/foundry_standard_private/main.tf +++ b/reference_architectures/foundry_standard_private/main.tf @@ -57,7 +57,7 @@ module "ai_foundry" { name = module.naming.cognitive_account.name_unique model_deployments = [ - module.common_models.gpt_5, + module.common_models.gpt_5_2_chat, module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] From c828742174287b46c03b7e0fa74267cd4152c66e Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 17:30:32 +0000 Subject: [PATCH 3/6] feat(terraform): update model outputs to include GPT-5.1 and GPT-5.2 models --- modules/common_models/README.md | 40 ++++++++++++++++----------------- 1 file changed, 20 insertions(+), 20 deletions(-) diff --git a/modules/common_models/README.md b/modules/common_models/README.md index fa86b729..472bed50 100644 --- a/modules/common_models/README.md +++ b/modules/common_models/README.md @@ -60,24 +60,24 @@ model_deployments = [ ## Outputs -| Name | Description | -|------------------------------|-----------------------------------------------------------------------| -| gpt\_5 | GPT-5 model - Latest flagship reasoning model | -| gpt\_5\_mini | GPT-5-mini model - Balanced performance and cost | -| gpt\_5\_nano | GPT-5-nano model - Lightweight high-throughput model | -| gpt\_5\_chat | GPT-5-chat model - Conversational AI with emotional intelligence | -| gpt\_5\_1 | GPT-5.1 model - Enhanced reasoning capabilities | -| gpt\_5\_1\_chat | GPT-5.1-chat model - Built-in reasoning for chat | -| gpt\_5\_1\_codex | GPT-5.1-codex model - Optimized for Codex CLI/VS Code | -| gpt\_5\_1\_codex\_mini | GPT-5.1-codex-mini model - Lightweight codex model | -| gpt\_5\_2 | GPT-5.2 model - Latest flagship reasoning model | -| gpt\_5\_2\_chat | GPT-5.2-chat model - Latest chat with advanced capabilities | -| text\_embedding\_3\_small | Text embedding 3 small model | -| text\_embedding\_3\_large | Text embedding 3 large model - Most capable embedding | -| gpt\_realtime | GPT-realtime model (GA) - Real-time audio processing | -| gpt\_realtime\_mini | GPT-realtime-mini model - Lightweight real-time audio | -| gpt\_audio | GPT-audio model (GA) - Audio generation | -| gpt\_audio\_mini | GPT-audio-mini model - Lightweight audio generation | -| gpt\_4o\_mini\_transcribe | GPT-4o-mini-transcribe model - Improved transcription | -| gpt\_4o\_transcribe\_diarize | GPT-4o-transcribe-diarize model - Speech-to-text with diarization | +| Name | Description | +|------------------------------|--------------------------------------------------------------------------------| +| gpt\_4o\_mini\_transcribe | GPT-4o-mini-transcribe model - Improved transcription accuracy and robustness | +| gpt\_4o\_transcribe\_diarize | GPT-4o-transcribe-diarize model - Speech-to-text with speaker diarization | +| gpt\_5 | GPT-5 model - Latest flagship reasoning model with advanced capabilities | +| gpt\_5\_1 | GPT-5.1 model - Enhanced reasoning with configurable reasoning\_effort | +| gpt\_5\_1\_chat | GPT-5.1-chat model - Built-in reasoning capabilities for chat | +| gpt\_5\_1\_codex | GPT-5.1-codex model - Optimized for Codex CLI and VS Code extension | +| gpt\_5\_1\_codex\_mini | GPT-5.1-codex-mini model - Lightweight codex model | +| gpt\_5\_2 | GPT-5.2 model - Latest flagship reasoning model | +| gpt\_5\_2\_chat | GPT-5.2-chat model - Latest chat model with advanced capabilities | +| gpt\_5\_chat | GPT-5-chat model - Optimized for conversational AI with emotional intelligence | +| gpt\_5\_mini | GPT-5-mini model - Balanced performance and cost efficiency | +| gpt\_5\_nano | GPT-5-nano model - Lightweight model for high-throughput scenarios | +| gpt\_audio | GPT-audio model (GA) - Audio generation capabilities | +| gpt\_audio\_mini | GPT-audio-mini model - Lightweight audio generation | +| gpt\_realtime | GPT-realtime model (GA) - Real-time audio processing | +| gpt\_realtime\_mini | GPT-realtime-mini model - Lightweight real-time audio processing | +| text\_embedding\_3\_large | Text embedding 3 large model - Most capable embedding model | +| text\_embedding\_3\_small | Text embedding 3 small model | From f9c70c453cc5b89eab5b028432b3260b0a5a8241 Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 20:40:09 +0000 Subject: [PATCH 4/6] fix(terraform): update model descriptions for clarity and accuracy --- modules/common_models/outputs.tf | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/modules/common_models/outputs.tf b/modules/common_models/outputs.tf index 5d03be68..4ff2dca3 100644 --- a/modules/common_models/outputs.tf +++ b/modules/common_models/outputs.tf @@ -8,7 +8,7 @@ output "gpt_5" { name = "gpt-5" version = "2025-08-07" } - description = "GPT-5 model - Latest flagship reasoning model with advanced capabilities" + description = "GPT-5 model - Reasoning model with advanced capabilities" } output "gpt_5_mini" { @@ -80,7 +80,7 @@ output "gpt_5_2" { name = "gpt-5.2" version = "2025-12-11" } - description = "GPT-5.2 model - Latest flagship reasoning model" + description = "GPT-5.2 model - Reasoning model" } output "gpt_5_2_chat" { @@ -89,7 +89,7 @@ output "gpt_5_2_chat" { name = "gpt-5.2-chat" version = "2025-12-11" } - description = "GPT-5.2-chat model - Latest chat model with advanced capabilities" + description = "GPT-5.2-chat model - Chat model with advanced capabilities" } output "text_embedding_3_small" { @@ -149,7 +149,7 @@ output "gpt_audio_mini" { output "gpt_4o_mini_transcribe" { value = { format = "OpenAI" - name = "gpt-4o-mini-transcribe-2025-12-15" + name = "gpt-4o-mini-transcribe" version = "2025-12-15" } description = "GPT-4o-mini-transcribe model - Improved transcription accuracy and robustness" From 274a0c218dd241f53df3731b896d4d0a16fc8a6c Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 20:42:21 +0000 Subject: [PATCH 5/6] feat(terraform): update model deployments to use GPT-5.2 chat and nano models --- modules/common_models/README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/modules/common_models/README.md b/modules/common_models/README.md index 472bed50..d6b59c9c 100644 --- a/modules/common_models/README.md +++ b/modules/common_models/README.md @@ -35,8 +35,8 @@ module "ai_foundry" { # ... other required inputs ... model_deployments = [ - module.common_models.gpt_5, - module.common_models.o3, + module.common_models.gpt_5_2_chat, + module.common_models.gpt_5_nano, module.common_models.text_embedding_3_large ] } @@ -46,7 +46,7 @@ To override SKU per deployment: ```terraform model_deployments = [ - merge(module.common_models.gpt_5, { sku = { name = "GlobalStandard", capacity = 2 } }), + merge(module.common_models.gpt_5_2_chat, { sku = { name = "GlobalStandard", capacity = 2 } }), module.common_models.text_embedding_3_large ] ``` From d3fb21c7d4046707cf4558ccd3105b225c3ef950 Mon Sep 17 00:00:00 2001 From: Pablo Zaidenvoren Date: Tue, 6 Jan 2026 20:45:22 +0000 Subject: [PATCH 6/6] fix(terraform): update GPT-5 model descriptions for clarity and consistency --- modules/common_models/README.md | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/modules/common_models/README.md b/modules/common_models/README.md index d6b59c9c..c5fc412e 100644 --- a/modules/common_models/README.md +++ b/modules/common_models/README.md @@ -64,13 +64,13 @@ model_deployments = [ |------------------------------|--------------------------------------------------------------------------------| | gpt\_4o\_mini\_transcribe | GPT-4o-mini-transcribe model - Improved transcription accuracy and robustness | | gpt\_4o\_transcribe\_diarize | GPT-4o-transcribe-diarize model - Speech-to-text with speaker diarization | -| gpt\_5 | GPT-5 model - Latest flagship reasoning model with advanced capabilities | +| gpt\_5 | GPT-5 model - Reasoning model with advanced capabilities | | gpt\_5\_1 | GPT-5.1 model - Enhanced reasoning with configurable reasoning\_effort | | gpt\_5\_1\_chat | GPT-5.1-chat model - Built-in reasoning capabilities for chat | | gpt\_5\_1\_codex | GPT-5.1-codex model - Optimized for Codex CLI and VS Code extension | | gpt\_5\_1\_codex\_mini | GPT-5.1-codex-mini model - Lightweight codex model | -| gpt\_5\_2 | GPT-5.2 model - Latest flagship reasoning model | -| gpt\_5\_2\_chat | GPT-5.2-chat model - Latest chat model with advanced capabilities | +| gpt\_5\_2 | GPT-5.2 model - Reasoning model | +| gpt\_5\_2\_chat | GPT-5.2-chat model - Chat model with advanced capabilities | | gpt\_5\_chat | GPT-5-chat model - Optimized for conversational AI with emotional intelligence | | gpt\_5\_mini | GPT-5-mini model - Balanced performance and cost efficiency | | gpt\_5\_nano | GPT-5-nano model - Lightweight model for high-throughput scenarios |