// Azure OpenAI (Bicep): provisions an OpenAI account plus sequential
// LLM and text-embedding model deployments.
@description('Name of the Azure OpenAI instance')
param openAiName string = 'openai${uniqueString(resourceGroup().id)}'

@description('Location for the Azure OpenAI instance')
param location string = resourceGroup().location

@description('LLM model name')
param llmModelName string = 'gpt-4o'

@description('LLM Model API version')
param llmModelVersion string

@description('Embedding model name')
param embeddingModelName string = 'text-embedding-ada-002'

@description('Embedding Model API version')
param embeddingModelVersion string

// Quotas are expressed in units of 1,000 tokens-per-minute; a deployment
// with zero capacity is never valid, so guard against it at compile time.
@description('TPM quota for llm model deployment (x1000)')
@minValue(1)
param llmTpmQuota int = 1

@description('TPM quota for embedding model deployment (x1000)')
@minValue(1)
param embeddingTpmQuota int = 1
// Azure OpenAI account. Key-based (local) auth is disabled, so all access
// goes through Entra ID RBAC.
resource aoai 'Microsoft.CognitiveServices/accounts@2024-10-01' = {
  name: openAiName
  location: location
  sku: {
    name: 'S0'
  }
  kind: 'OpenAI'
  properties: {
    // Entra ID token authentication requires a custom-subdomain endpoint;
    // without one, disableLocalAuth would leave no usable auth path.
    customSubDomainName: openAiName
    publicNetworkAccess: 'Enabled'
    disableLocalAuth: true
  }
}
// LLM model deployment (e.g. gpt-4o). Deployment name mirrors the model name.
resource llmDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {
  parent: aoai
  name: llmModelName
  sku: {
    // Capacity is in units of 1,000 tokens-per-minute.
    name: 'GlobalStandard'
    capacity: llmTpmQuota
  }
  properties: {
    model: {
      format: 'OpenAI'
      name: llmModelName
      version: llmModelVersion
    }
    // NOTE(review): sku.capacity is the effective throughput setting;
    // confirm currentCapacity is honored here and not read-only in this API version.
    currentCapacity: llmTpmQuota
  }
}
// Embedding model deployment (e.g. text-embedding-ada-002).
resource embeddingDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {
  parent: aoai
  name: embeddingModelName
  // NOTE: simultaneous model deployments are not supported at this time. As a
  // workaround, use dependsOn to force the models to be deployed sequentially.
  dependsOn: [llmDeployment]
  sku: {
    // Capacity is in units of 1,000 tokens-per-minute.
    name: 'Standard'
    capacity: embeddingTpmQuota
  }
  properties: {
    model: {
      format: 'OpenAI'
      name: embeddingModelName
      version: embeddingModelVersion
    }
    // NOTE(review): sku.capacity is the effective throughput setting;
    // confirm currentCapacity is honored here and not read-only in this API version.
    currentCapacity: embeddingTpmQuota
  }
}
output openAiEndpoint string = aoai.properties.endpoint
output llmModel string = llmDeployment.properties.model.name
output llmModelDeploymentName string = llmDeployment.name
// NOTE(review): `.apiVersion` is the ARM resource API version (2024-10-01),
// not a model/inference API version — confirm consumers expect this value.
output llmModelApiVersion string = llmDeployment.apiVersion
output textEmbeddingModel string = embeddingDeployment.properties.model.name
output textEmbeddingModelDeploymentName string = embeddingDeployment.name
output textEmbeddingModelApiVersion string = embeddingDeployment.apiVersion