Commit 3470e68

Added image processing and converted to use azd for deployments

1 parent 5dcd5dd commit 3470e68
11 files changed: 878 additions & 171 deletions
File tree

AI-in-a-Box.sln

AI-in-a-Box.sln — Lines changed: 46 additions & 0 deletions
@@ -0,0 +1,46 @@
+
+Microsoft Visual Studio Solution File, Format Version 12.00
+# Visual Studio Version 17
+VisualStudioVersion = 17.5.002.0
+MinimumVisualStudioVersion = 10.0.40219.1
+Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "gen-ai", "gen-ai", "{5A9632E5-F638-42BF-BF07-3B35E2BE0605}"
+EndProject
+Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "semantic-kernel-bot-in-a-box", "semantic-kernel-bot-in-a-box", "{3E61D800-B120-46E9-B7EE-332ED8488CC9}"
+EndProject
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "SemanticKernelBot", "gen-ai\semantic-kernel-bot-in-a-box\src\SemanticKernelBot.csproj", "{189DDAAC-CE3B-4488-BD53-C71F802E3395}"
+EndProject
+Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "Assistants", "Assistants", "{176DEFFB-5FDF-4308-84B3-C685641CFA0B}"
+EndProject
+Project("{2150E333-8FDC-42A3-9474-1A3956D46DE8}") = "bot-in-a-box", "bot-in-a-box", "{83389DF2-DAC5-4172-A0DF-017F511DBD8A}"
+EndProject
+Project("{9A19103F-16F7-4668-BE54-9A1E7A4F7556}") = "AssistantBot", "gen-ai\Assistants\bot-in-a-box\src\AssistantBot.csproj", "{BD9D160A-49C7-4BD7-9559-7C0185C76122}"
+EndProject
+Global
+    GlobalSection(SolutionConfigurationPlatforms) = preSolution
+        Debug|Any CPU = Debug|Any CPU
+        Release|Any CPU = Release|Any CPU
+    EndGlobalSection
+    GlobalSection(ProjectConfigurationPlatforms) = postSolution
+        {189DDAAC-CE3B-4488-BD53-C71F802E3395}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
+        {189DDAAC-CE3B-4488-BD53-C71F802E3395}.Debug|Any CPU.Build.0 = Debug|Any CPU
+        {189DDAAC-CE3B-4488-BD53-C71F802E3395}.Release|Any CPU.ActiveCfg = Release|Any CPU
+        {189DDAAC-CE3B-4488-BD53-C71F802E3395}.Release|Any CPU.Build.0 = Release|Any CPU
+        {BD9D160A-49C7-4BD7-9559-7C0185C76122}.Debug|Any CPU.ActiveCfg = Debug|Any CPU
+        {BD9D160A-49C7-4BD7-9559-7C0185C76122}.Debug|Any CPU.Build.0 = Debug|Any CPU
+        {BD9D160A-49C7-4BD7-9559-7C0185C76122}.Release|Any CPU.ActiveCfg = Release|Any CPU
+        {BD9D160A-49C7-4BD7-9559-7C0185C76122}.Release|Any CPU.Build.0 = Release|Any CPU
+    EndGlobalSection
+    GlobalSection(SolutionProperties) = preSolution
+        HideSolutionNode = FALSE
+    EndGlobalSection
+    GlobalSection(NestedProjects) = preSolution
+        {3E61D800-B120-46E9-B7EE-332ED8488CC9} = {5A9632E5-F638-42BF-BF07-3B35E2BE0605}
+        {189DDAAC-CE3B-4488-BD53-C71F802E3395} = {3E61D800-B120-46E9-B7EE-332ED8488CC9}
+        {176DEFFB-5FDF-4308-84B3-C685641CFA0B} = {5A9632E5-F638-42BF-BF07-3B35E2BE0605}
+        {83389DF2-DAC5-4172-A0DF-017F511DBD8A} = {176DEFFB-5FDF-4308-84B3-C685641CFA0B}
+        {BD9D160A-49C7-4BD7-9559-7C0185C76122} = {83389DF2-DAC5-4172-A0DF-017F511DBD8A}
+    EndGlobalSection
+    GlobalSection(ExtensibilityGlobals) = postSolution
+        SolutionGuid = {DB39B9D2-8859-49C2-9636-C4E4D345C9A7}
+    EndGlobalSection
+EndGlobal
README.md — Lines changed: 41 additions & 68 deletions
@@ -1,86 +1,61 @@
-# Video Analysis-Azure Open AI in-a-box
+# Image and Video Analysis-Azure Open AI in-a-box
 ![banner](./readme-assets/banner-aoai-video-analysis-in-a-box.png)
-This solution examines vehicles for damage using Azure Open AI GPT-4 Turbo with Vision and Computer Vision Image Analysis 4.0. All orchestration is done with Azure Data Factory, allowing this solution to be easily customized for your own use cases.
+This solution examines videos and images of vehicles for damage using Azure Open AI GPT-4 Turbo with Vision and Azure AI Vision Image Analysis 4.0. All orchestration is done with Azure Data Factory, allowing this solution to be easily customized for your own use cases.

-Please note that as of this 1/31/2024, Azure Open AI GPT-4 Turbo with Vision and Computer Vision Image Analysis 4 are in Public Preview for limited regions.
+Please note that as of 4/4/2024, Azure Open AI GPT-4 Turbo with Vision and Azure AI Vision Image Analysis 4.0 are in Public Preview for limited regions.

-- [Check here for available regions for Computer Vision Image Analysis 4.0.](https://learn.microsoft.com/en-us/azure/ai-services/computer-vision/overview-image-analysis?tabs=4-0#image-analysis-versions)
+- [Check here for available regions for Azure AI Vision Image Analysis 4.0.](https://learn.microsoft.com/en-us/azure/ai-services/computer-vision/overview-image-analysis?tabs=4-0#image-analysis-versions)
 - [Check here for available regions for GPT-4 Turbo with Vision.](https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models#gpt-4-and-gpt-4-turbo-preview-model-availability)

 ## Solution Architecture

 ![solution-arch](./readme-assets/gpt4-adf-architecture.jpg)

-1. Land videos in Azure Blob storage with Azure Event Grid, Azure Logic Apps, Azure Functions, other ADF pipelines or other applications.
+1. Land images and/or videos in Azure Blob storage with Azure Event Grid, Azure Logic Apps, Azure Functions, other ADF pipelines or other applications.
 1. The ADF pipeline retrieves the Azure AI API endpoints, keys and other configurations from Key Vault.
-1. The blob storage URL for the video file is retrieved.
-1. With Azure Computer Vision, a video retrieval index is created for the file and the video is ingested. Depending on your use case, you could ingest multiple videos to the same index.
-1. Call GPT4-V deployment in Azure Open AI, passing in video URL and the video retrieval index, system message, system prompt and other inputs.
+1. The blob storage URL for the image or video file is retrieved.
+1. For videos, a video retrieval index is created for the file with Azure AI Vision and the video is ingested into the index (see the REST sketch after this list). Depending on your use case, you could ingest multiple videos into the same index. Image analysis does not require an index.
+1. Call the GPT4-V deployment in Azure Open AI, passing in the video or image URL, the video retrieval index (for videos), the system message, the user prompt and other inputs.
 1. Save the response to Azure Cosmos DB.
-1. If the video processes successfully, move the video to an archive folder.
+1. If the file processes successfully, move it to the appropriate archive folder.

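Step 4 corresponds to the Azure AI Vision Video Retrieval preview REST API. A minimal sketch of the two calls, assuming the 2023-05-01-preview api-version from the public docs; the endpoint, key, index and ingestion names here are placeholders:

```bash
# Create a video retrieval index (name is illustrative)
curl -X PUT "https://<your-vision-endpoint>/computervision/retrieval/indexes/vehicle-videos?api-version=2023-05-01-preview" \
  -H "Ocp-Apim-Subscription-Key: <your-vision-key>" \
  -H "Content-Type: application/json" \
  -d '{"features": [{"name": "vision", "domain": "surveillance"}]}'

# Ingest one video into the index via its blob SAS URL
curl -X PUT "https://<your-vision-endpoint>/computervision/retrieval/indexes/vehicle-videos/ingestions/vehicle-ingestion?api-version=2023-05-01-preview" \
  -H "Ocp-Apim-Subscription-Key: <your-vision-key>" \
  -H "Content-Type: application/json" \
  -d '{"videos": [{"mode": "add", "documentId": "video1", "documentUrl": "<blob-sas-url>"}]}'
```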
 ## Resources Deployed in this solution

 ![resources](./readme-assets/resources.jpg)

 - User Assigned Managed Identity which has access to all resources
-- Storage account and containers for input videos and processed videos. Additionally, a SAS key is created which is required at this time for Azure Computer Vision Image Analyis 4.0.
+- Storage account and containers for input and processed images and videos. Additionally, a SAS key is created, which is required at this time for Azure AI Vision Image Analysis 4.0.
 - Azure Key Vault for holding API keys, the storage SAS token, and deployment information.
-- Azure Computer Vision with Image Analysis 4.0 for video ingestion. Note that at this time Image Analysis 4.0 is in Preview and in limited regions. [Check here for available regions.](https://learn.microsoft.com/en-us/azure/ai-services/computer-vision/overview-image-analysis?tabs=4-0#image-analysis-versions)
+- Azure AI Vision with Image Analysis 4.0 for video ingestion and/or image analysis. Note that at this time Image Analysis 4.0 is in Preview and available in limited regions. [Check here for available regions.](https://learn.microsoft.com/en-us/azure/ai-services/computer-vision/overview-image-analysis?tabs=4-0#image-analysis-versions)
 - Azure Open AI resource with a GPT-4 Vision Preview Deployment. [Check here for available regions.](https://learn.microsoft.com/en-us/azure/ai-services/openai/concepts/models#gpt-4-and-gpt-4-turbo-preview-model-availability)

-## Prerequisites
+## Prerequisites for running locally

 1. Install the latest version of [Azure CLI](https://docs.microsoft.com/en-us/cli/azure/install-azure-cli-windows?view=azure-cli-latest)
 1. Install the latest version of [Bicep](https://docs.microsoft.com/en-us/azure/azure-resource-manager/bicep/install)
+1. Install the latest version of [Azure Developer CLI](https://learn.microsoft.com/en-us/azure/developer/azure-developer-cli/install-azd?tabs=winget-windows%2Cbrew-mac%2Cscript-linux&pivots=os-windows)
 1. Install the latest version of [Azure Functions Core Tools](https://learn.microsoft.com/en-us/azure/azure-functions/functions-run-local?tabs=windows%2Cisolated-process%2Cnode-v4%2Cpython-v2%2Chttp-trigger%2Ccontainer-apps&pivots=programming-language-python#v2)
-1. Clone this repo

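A quick way to confirm the prerequisites are installed and on PATH (a minimal sketch; exact output varies by tool and version):

```bash
az version        # Azure CLI
az bicep version  # Bicep, as installed through the Azure CLI
azd version       # Azure Developer CLI
func --version    # Azure Functions Core Tools
```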
-## Deploy Azure Resources
+## Deploy to Azure

-1. Navigate to the **infra** directory in your local repo
-1. Login to your Azure account:
+### Clone this repository locally

-```bash
-az login
-```
-
-1. Set your Azure subscription ID:
-
-```bash
-az account set --subscription <subscription id>
-```
-
-1. Create an Azure Resource group in the same region that is supported by Azure OpenAI GPT-4V:
-
-```bash
-az group create --name <your resource group name> --location <your resource group location>
-```
-
-1. Run command to get the object id for your email address. This is to give you access needed for deployed resources:
-
-```bash
-az ad user show --id 'your email' --query id
-```
-
-1. Copy the objectid value returned from the above command.
-1. Open file main.bicepparam
-1. For **spObjectId**, paste the id value from the previous command over 'your-object-id'.
-1. Add value for your **resourceGroupName**.
-1. For **resourceLocation**, specify a region where GPT-4 Turbo with Vision is available.
-1. For **resourceLocationCV**, specify a region where Computer Vision with Image Analysis 4.0 is available.
-1. Add 2 or 3 alpha characters for both **prefix**, and **suffix**. Some of the resources require unique names across Azure and cannot be the same as a soft-deleted resource.
-1. Save the main.bicepparam file.
+```bash
+git clone https://github.com/Azure/AI-in-a-Box
+```

-## Deploy resources to Azure
+### Deploy resources

-1. Navigate to the **infra** folder and run the following command:
+```bash
+cd gen-ai/a-services/gpt-video-analysis-in-a-box
+azd auth login
+azd up
+```

-```bash
-az deployment group create --resource-group <your resource group name> --template-file main.bicep --parameters main.bicepparam
-```
+You will be prompted for a subscription, a region for GPT-4V, a region for AI Vision, a resource group, a prefix and a suffix.

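If you'd rather not re-enter these values on every run, azd can pre-seed them in a named environment. A minimal sketch, assuming the standard azd environment variables; any solution-specific prefix/suffix parameter names should be checked against the infra templates:

```bash
azd env new gpt-video-dev                            # create and select a named environment
azd env set AZURE_SUBSCRIPTION_ID <subscription-id>
azd env set AZURE_LOCATION eastus                    # region for the GPT-4V resources
azd up                                               # values not pre-seeded are still prompted
```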
-1. Upload videos of vehicles to your new storage account's **videosin** container using [Azure Storage Explorer](https://learn.microsoft.com/en-us/azure/vs-azure-tools-storage-manage-with-storage-explorer), [AzCopy](https://learn.microsoft.com/en-us/azure/storage/common/storage-use-azcopy-files#upload-the-contents-of-a-directory) or within [the Azure portal](https://learn.microsoft.com/en-us/azure/storage/blobs/storage-quickstart-blobs-portal#upload-a-block-blob). You can find some sample videos at the bottom of this blog, [Analyze Videos with Azure Open AI GPT-4 Turbo with Vision and Azure Data Factory](https://techcommunity.microsoft.com/t5/fasttrack-for-azure/analyze-videos-with-azure-open-ai-gpt-4-turbo-with-vision-and/ba-p/4032778).
+### Post deployment
+Upload images and videos of vehicles to your new storage account's **videosin** container using [Azure Storage Explorer](https://learn.microsoft.com/en-us/azure/vs-azure-tools-storage-manage-with-storage-explorer), [AzCopy](https://learn.microsoft.com/en-us/azure/storage/common/storage-use-azcopy-files#upload-the-contents-of-a-directory) or [the Azure portal](https://learn.microsoft.com/en-us/azure/storage/blobs/storage-quickstart-blobs-portal#upload-a-block-blob). You can find some sample images and videos at the bottom of this blog, [Analyze Videos with Azure Open AI GPT-4 Turbo with Vision and Azure Data Factory](https://techcommunity.microsoft.com/t5/fasttrack-for-azure/analyze-videos-with-azure-open-ai-gpt-4-turbo-with-vision-and/ba-p/4032778).

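For example, a local folder of samples can be pushed in one command with the Azure CLI (a sketch — substitute your account name; assumes your login has a data-plane role such as Storage Blob Data Contributor):

```bash
# Upload everything in ./samples to the videosin container
az storage blob upload-batch \
  --account-name <your-storage-account> \
  --destination videosin \
  --source ./samples \
  --auth-mode login
```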
 ## Run the solution

@@ -93,41 +68,39 @@ Please note that as of this 1/31/2024, Azure Open AI GPT-4 Turbo with Vision and
 1. After it runs successfully, go to your Azure Cosmos DB resource and examine the results in Data Explorer:
 ![cosmos](./readme-assets/cosmos-data-explorer.png)

-1. Because the way the system message was instructed to format the results, we can run queries with expressions like the one below to easily see the probability of damage, the severity of any damage, and the kind of damage that occurred:
+1. At this time, GPT4-V does not support response_format={"type": "json_object"}. However, if we still instruct the chat completion to return the results as JSON, we can use a Cosmos query to convert the string to a JSON object:
 ![cosmos query](./readme-assets/cosmos-query.png)

 ```sql
-SELECT gptoutput.filename, gptoutput.fileurl, gptoutput.shortdate,
-SUBSTRING(gptoutput.content, INDEX_OF(gptoutput.content, "Location[") + 9, INDEX_OF(gptoutput.content, "]", INDEX_OF(gptoutput.content, "Location[") + 9) - INDEX_OF(gptoutput.content, "Location[") - 9) AS Location,
-SUBSTRING(gptoutput.content, INDEX_OF(gptoutput.content, "VehicleType[") + 12, INDEX_OF(gptoutput.content, "]", INDEX_OF(gptoutput.content, "VehicleType[") + 12) - INDEX_OF(gptoutput.content, "VehicleType[") - 12) AS VehicleType,
-SUBSTRING(gptoutput.content, INDEX_OF(gptoutput.content, "DamageProbability[") + 18, INDEX_OF(gptoutput.content, "]", INDEX_OF(gptoutput.content, "DamageProbability[") + 18) - INDEX_OF(gptoutput.content, "DamageProbability[") - 18) AS DamageProbability,
-SUBSTRING(gptoutput.content, INDEX_OF(gptoutput.content, "Damage[") + 7, INDEX_OF(gptoutput.content, "]", INDEX_OF(gptoutput.content, "Damage[") + 7) - INDEX_OF(gptoutput.content, "Damage[") - 7) AS DamageType,
-SUBSTRING(gptoutput.content, INDEX_OF(gptoutput.content, "Severity[") + 9, INDEX_OF(gptoutput.content, "]", INDEX_OF(gptoutput.content, "Severity[") + 9) - INDEX_OF(gptoutput.content, "Severity[") - 9) AS Severity,
-gptoutput.content
-FROM gptoutput
+SELECT gptoutput.filename, gptoutput.fileurl, gptoutput.shortdate,
+StringToObject(gptoutput.content) as results
+FROM gptoutput
 ```

 ## Enhance the solution in your environment for your own use cases

 This solution is highly customizable due to the parameterization capabilities in Azure Data Factory. Below are the features you can parameterize out-of-the-box, or should I say, out-of-the-AI-in-Box (insert-nerdy-laugh-here.)

-![parameters](./readme-assets/adf-parms.jpg)
-
 ### Test prompts and other settings

 When developing your solution, you can rerun it with different settings to get the best results from GPT-4V by tweaking the **sys_message**, **user_prompt**, **temperature**, and **top_p** values.

+![parameters](./readme-assets/adf-parms.jpg)
+
 ### Change from batch to real-time

-This solution is set to loop against a container of videos in batch, which is ideal for testing. However, when you move to production, you may want the video to be analyzed in real-time. To do this, you can set up a storage event trigger which will run when a file is landed in blob storage.
-![trigger](./readme-assets/blob-event-trigger.jpg)
-Then eliminate the Get Metadata and For Each activities and call the ChildAnalyzeVideo pipeline after the variables are set and the parameters are retrieved from Key Vault. You can get the file name from the trigger metadata. [Read more about ADF Storage Event triggers here](https://learn.microsoft.com/en-us/azure/data-factory/how-to-create-event-trigger?tabs=data-factory).
+This solution is set to loop over a container of videos and images in batch, which is ideal for testing. However, when you move to production, you may want each file to be analyzed in real time. To do this, you can set up a storage event trigger which will run when a file lands in blob storage.
+![trigger](./readme-assets/blob-event-trigger.jpg)
+Move the If activity inside the For Each loop to the main Orchestrator pipeline canvas and then eliminate the Get Metadata and For Each activities. Call the If activity after the variables are set and the parameters are retrieved from Key Vault. You can get the file name from the trigger metadata (see the CLI sketch after this section). [Read more about ADF Storage Event triggers here](https://learn.microsoft.com/en-us/azure/data-factory/how-to-create-event-trigger?tabs=data-factory).

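The trigger itself can also be scripted with the Azure CLI's datafactory extension. A hedged sketch — the trigger and pipeline names are hypothetical, and the JSON follows the BlobEventsTrigger ARM schema; adjust paths and scope to your deployment:

```bash
# One-time: az extension add --name datafactory
az datafactory trigger create \
  --resource-group <your-rg> \
  --factory-name <your-adf> \
  --name BlobCreatedTrigger \
  --properties '{
    "type": "BlobEventsTrigger",
    "typeProperties": {
      "blobPathBeginsWith": "/videosin/blobs/",
      "events": ["Microsoft.Storage.BlobCreated"],
      "scope": "/subscriptions/<sub-id>/resourceGroups/<your-rg>/providers/Microsoft.Storage/storageAccounts/<your-storage-account>"
    },
    "pipelines": [
      {"pipelineReference": {"referenceName": "Orchestrator", "type": "PipelineReference"}}
    ]
  }'

# Triggers are created stopped; start it when ready
az datafactory trigger start --resource-group <your-rg> --factory-name <your-adf> --name BlobCreatedTrigger
```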
### Use the same Data Factory for other video analysis use cases
96+
### Use the same Data Factory for other image and/or video analysis use cases
12797

12898
You can set up multiple triggers over your Azure Data Factory and pass different parameter values for whatever analysis you need to do:
12999
![triggers](./readme-assets/new-trigger-parm.png)
130100

131-
You can set up different storage accounts for landing videos, then adjust the **storageaccounturl** and **storageaccountcontainer** parameters to ingest and analyze those videos. You can have different prompts and other values sent to GPT-4V in the **sys_message**, **user_prompt**, **temperature**, and **top_p** values for different triggers. You can land the data in a different Cosmos Account, Database and/or Container when setting the **cosmosaccount**, and **cosmosdb**, and **cosmoscontainer** values.
101+
You can set up different storage accounts for landing the files, then adjust the **storageaccounturl** and **storageaccountcontainer** parameters to ingest and analyze the images and/or videos. You can have different prompts and other values sent to GPT-4V in the **sys_message**, **user_prompt**, **temperature**, and **top_p** values for different triggers. You can land the data in a different Cosmos Account, Database and/or Container when setting the **cosmosaccount**, and **cosmosdb**, and **cosmoscontainer** values.
102+
103+
### Only analyze images or videos
104+
If you are only analyzing images OR videos, you can delete the pipeline that is not needed (childAnalyzeImage or childAnalyzeVideo), eliminate the If activity inside the ForEach File activity and specify the Execute Pipeline activity for just the pipeline you need. However, it doesn't hurt to leave the unneeded pipeline there in case you want to use it in the future.
132105

133106
For more details on this solution, check out this blog: [Analyze Videos with Azure Open AI GPT-4 Turbo with Vision and Azure Data Factory](https://techcommunity.microsoft.com/t5/fasttrack-for-azure/analyze-videos-with-azure-open-ai-gpt-4-turbo-with-vision-and/ba-p/4032778)!
azure.yaml — Lines changed: 14 additions & 0 deletions
@@ -0,0 +1,14 @@
+# yaml-language-server: $schema=https://raw.githubusercontent.com/Azure/azure-dev/main/schemas/v1.0/azure.yaml.json
+
+name: gpt4v-image-and-video-analysis-in-a-box
+metadata:
+  template: azd-init@1.4.4
+hooks:
+  preprovision:
+    windows:
+      shell: pwsh
+      run: ./scripts/setSPObjectId.ps1
+      interactive: true
+      continueOnError: false
+
+
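With this hook in place, azd runs setSPObjectId.ps1 before provisioning. On recent azd versions the hook can also be exercised on its own, which is handy while debugging it (a sketch; flag support varies by azd version):

```bash
# Re-run just the preprovision hook, without provisioning anything
azd hooks run preprovision
```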