Skip to content

Commit ec42736

Browse files
authored
note about models
1 parent 1baaefb commit ec42736

1 file changed

Lines changed: 17 additions & 4 deletions

File tree

terraform-infrastructure/main.tf

Lines changed: 17 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -532,18 +532,31 @@ resource "azurerm_cognitive_deployment" "gpt4o" {
532532

533533
# Text Embedding Model for Semantic Search and Document Analysis
534534
resource "azurerm_cognitive_deployment" "text_embedding" {
535-
name = "text-embedding-ada-002"
535+
name = "text-embedding-ada-3-large"
536536
cognitive_account_id = azurerm_cognitive_account.openai.id
537537

538538
model {
539539
format = "OpenAI"
540-
name = "text-embedding-ada-002"
541-
version = "2"
540+
# Example: Use "text-embedding-3-large" as an embedding model
541+
# You can use one of the following models for text embedding:
542+
# - "text-embedding-3-small" (recommended for most use cases)
543+
# - "text-embedding-3-large" (higher accuracy, higher cost)
544+
# - "text-search-ada-doc-001" (legacy, for backward compatibility)
545+
# - "text-embedding-ada-002" (legacy, for backward compatibility)
546+
# - "text-search-babbage-doc-001" (legacy, for backward compatibility)
547+
# - "text-search-curie-doc-001" (legacy, for backward compatibility)
548+
# - "text-search-davinci-doc-001" (legacy, for backward compatibility)
549+
name = "text-embedding-3-large"
550+
version = "1" # This depends on the model
542551
}
543552

544553
sku {
545554
name = "Standard"
546-
capacity = 120 # High capacity for batch document processing
555+
# Capacity is the number of 1,000 tokens per minute (TPM) units.
556+
# Allowed values depend on your Azure OpenAI quota and region.
557+
# Common values: 1, 2, 5, 10, 20, 40, 80, 160, etc.
558+
# You can only set up to your available quota for this model.
559+
capacity = 1 # Example: set to 1 to fit within available quota
547560
}
548561

549562
depends_on = [azurerm_cognitive_account.openai]

0 commit comments

Comments
 (0)