@@ -532,18 +532,31 @@ resource "azurerm_cognitive_deployment" "gpt4o" {
532532
533533# Text Embedding Model for Semantic Search and Document Analysis
534534resource "azurerm_cognitive_deployment" "text_embedding" {
535- name = " text-embedding-ada-002 "
535+ name = " text-embedding-ada-3-large "
536536 cognitive_account_id = azurerm_cognitive_account. openai . id
537537
538538 model {
539539 format = " OpenAI"
540- name = " text-embedding-ada-002"
541- version = " 2"
540+ # Example: Use "text-embedding-3-large" as an embedding model
541+ # You can use one of the following models for text embedding:
542+ # - "text-embedding-3-small" (recommended for most use cases)
543+ # - "text-embedding-3-large" (higher accuracy, higher cost)
544+ # - "text-search-ada-doc-001" (legacy, for backward compatibility)
545+ # - "text-embedding-ada-002" (legacy, for backward compatibility)
546+ # - "text-search-babbage-doc-001" (legacy, for backward compatibility)
547+ # - "text-search-curie-doc-001" (legacy, for backward compatibility)
548+ # - "text-search-davinci-doc-001" (legacy, for backward compatibility)
549+ name = " text-embedding-3-large"
550+ version = " 1" # This depends on the model
542551 }
543552
544553 sku {
545554 name = " Standard"
546- capacity = 120 # High capacity for batch document processing
555+ # Capacity is the number of 1,000 tokens per minute (TPM) units.
556+ # Allowed values depend on your Azure OpenAI quota and region.
557+ # Common values: 1, 2, 5, 10, 20, 40, 80, 160, etc.
558+ # You can only set up to your available quota for this model.
559+ capacity = 1 # Example: set to 1 to fit within available quota
547560 }
548561
549562 depends_on = [azurerm_cognitive_account . openai ]
0 commit comments