graphrag-accelerator/infra/core/aoai/aoai.bicep

@description('Name of the Azure OpenAI instance')
param openAiName string = 'openai${uniqueString(resourceGroup().id)}'

@description('Location for the Azure OpenAI instance')
param location string = resourceGroup().location

@description('LLM model deployment name')
param llmModelDeploymentName string = 'gpt-4o'

@description('Embedding model deployment name')
param embeddingModelDeploymentName string = 'text-embedding-ada-002'

@description('TPM quota for GPT-4o deployment')
param gpt4oTpm int = 10

@description('TPM quota for text-embedding-ada-002 deployment')
param textEmbeddingAdaTpm int = 10

@description('Array of objects with fields principalId, roleDefinitionId')
param roleAssignments array = []

resource aoai 'Microsoft.CognitiveServices/accounts@2024-10-01' = {
  name: openAiName
  location: location
  sku: {
    name: 'S0'
  }
  kind: 'OpenAI'
  properties: {
    publicNetworkAccess: 'Enabled'
    disableLocalAuth: true
  }
}

resource gpt4oDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {
  parent: aoai
  name: llmModelDeploymentName
  sku: {
    name: 'GlobalStandard'
    capacity: gpt4oTpm
  }
  properties: {
    model: {
      format: 'OpenAI'
      name: 'gpt-4o'
      version: '2024-05-13'
    }
    currentCapacity: gpt4oTpm
  }
}

resource textEmbeddingAdaDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {
  parent: aoai
  name: embeddingModelDeploymentName
  // NOTE: simultaneous model deployments are not supported at this time. As a workaround, use dependsOn to force the models to be deployed in a sequential manner.
  dependsOn: [gpt4oDeployment]
  sku: {
    name: 'Standard'
    capacity: textEmbeddingAdaTpm
  }
  properties: {
    model: {
      format: 'OpenAI'
      name: 'text-embedding-ada-002'
      version: '2'
    }
    currentCapacity: textEmbeddingAdaTpm
  }
}

resource roleAssignment 'Microsoft.Authorization/roleAssignments@2022-04-01' = [
  for role in roleAssignments: {
    name: guid('${role.principalId}-${role.roleDefinitionId}')
    scope: resourceGroup()
    properties: role
  }
]

output openAiEndpoint string = aoai.properties.endpoint
output llmModel string = gpt4oDeployment.properties.model.name
output llmModelDeploymentName string = gpt4oDeployment.name
output llmModelApiVersion string = gpt4oDeployment.apiVersion
output textEmbeddingModel string = textEmbeddingAdaDeployment.properties.model.name
output textEmbeddingModelDeploymentName string = textEmbeddingAdaDeployment.name
output textEmbeddingModelApiVersion string = textEmbeddingAdaDeployment.apiVersion
add aoai to bicep deployment 2025-01-06 00:53:29 -05:00			`@description('Name of the Azure OpenAI instance')`
			`param openAiName string = 'openai${uniqueString(resourceGroup().id)}'`

			`@description('Location for the Azure OpenAI instance')`
			`param location string = resourceGroup().location`

			`@description('LLM model deployment name')`
			`param llmModelDeploymentName string = 'gpt-4o'`

			`@description('Embedding model deployment name')`
			`param embeddingModelDeploymentName string = 'text-embedding-ada-002'`

			`@description('TPM quota for GPT-4o deployment')`
			`param gpt4oTpm int = 10`

			`@description('TPM quota for text-embedding-ada-002 deployment')`
			`param textEmbeddingAdaTpm int = 10`

			`@description('Array of objects with fields principalId, roleDefinitionId')`
			`param roleAssignments array = []`

			`resource aoai 'Microsoft.CognitiveServices/accounts@2024-10-01' = {`
			`name: openAiName`
			`location: location`
			`sku: {`
			`name: 'S0'`
			`}`
			`kind: 'OpenAI'`
			`properties: {`
			`publicNetworkAccess: 'Enabled'`
			`disableLocalAuth: true`
			`}`
			`}`

			`resource gpt4oDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {`
			`parent: aoai`
			`name: llmModelDeploymentName`
			`sku: {`
			`name: 'GlobalStandard'`
			`capacity: gpt4oTpm`
			`}`
			`properties: {`
			`model: {`
			`format: 'OpenAI'`
			`name: 'gpt-4o'`
			`version: '2024-05-13'`
			`}`
			`currentCapacity: gpt4oTpm`
			`}`
			`}`

			`resource textEmbeddingAdaDeployment 'Microsoft.CognitiveServices/accounts/deployments@2024-10-01' = {`
			`parent: aoai`
			`name: embeddingModelDeploymentName`
fix aoai deployment issue 2025-01-07 01:20:33 -05:00			`// NOTE: simultaneous model deployments are not supported at this time. As a workaround, use dependsOn to force the models to be deployed in a sequential manner.`
			`dependsOn: [gpt4oDeployment]`
add aoai to bicep deployment 2025-01-06 00:53:29 -05:00			`sku: {`
			`name: 'Standard'`
			`capacity: textEmbeddingAdaTpm`
			`}`
			`properties: {`
			`model: {`
			`format: 'OpenAI'`
			`name: 'text-embedding-ada-002'`
			`version: '2'`
			`}`
			`currentCapacity: textEmbeddingAdaTpm`
			`}`
			`}`

			`resource roleAssignment 'Microsoft.Authorization/roleAssignments@2022-04-01' = [`
			`for role in roleAssignments: {`
			`name: guid('${role.principalId}-${role.roleDefinitionId}')`
			`scope: resourceGroup()`
			`properties: role`
			`}`
			`]`

			`output openAiEndpoint string = aoai.properties.endpoint`
cleanup bicep variable names 2025-01-06 02:03:09 -05:00			`output llmModel string = gpt4oDeployment.properties.model.name`
			`output llmModelDeploymentName string = gpt4oDeployment.name`
			`output llmModelApiVersion string = gpt4oDeployment.apiVersion`
			`output textEmbeddingModel string = textEmbeddingAdaDeployment.properties.model.name`
			`output textEmbeddingModelDeploymentName string = textEmbeddingAdaDeployment.name`
			`output textEmbeddingModelApiVersion string = textEmbeddingAdaDeployment.apiVersion`