
Commit 22e5996

Merge pull request #53760 from MicrosoftDocs/NEW-image-content-understanding

New module - image content understanding

2 parents: 4d97782 + 7759ff2

13 files changed

Lines changed: 382 additions & 0 deletions
Lines changed: 13 additions & 0 deletions
@@ -0,0 +1,13 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.introduction
title: Introduction
metadata:
  title: Introduction
  description: "Get started with Content Understanding in Microsoft Foundry."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 1
content: |
  [!include[](includes/1-introduction.md)]
Lines changed: 13 additions & 0 deletions
@@ -0,0 +1,13 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.what-is-content-understanding
title: What is Content Understanding?
metadata:
  title: What is Content Understanding?
  description: "Learn about Azure Content Understanding and how it can analyze images to extract structured data."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 3
content: |
  [!include[](includes/2-what-is-content-understanding.md)]
Lines changed: 14 additions & 0 deletions
@@ -0,0 +1,14 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.analyze-images-with-content-understanding
title: Analyze images with Content Understanding
metadata:
  title: Analyze images with Content Understanding
  description: "Learn how to analyze images with Azure Content Understanding."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 5
content: |
  [!include[](includes/3-analyze-images-with-content-understanding.md)]
Lines changed: 13 additions & 0 deletions
@@ -0,0 +1,13 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.exercise
title: Exercise - Analyze images with Content Understanding
metadata:
  title: Exercise - Analyze images with Content Understanding
  description: "Get practical experience with analyzing images using Azure Content Understanding."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 30
content: |
  [!include[](includes/4-exercise.md)]
Lines changed: 48 additions & 0 deletions
@@ -0,0 +1,48 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.knowledge-check
title: Module assessment
metadata:
  title: Module assessment
  description: "Check your learning on analyzing images with Azure Content Understanding."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 3
content: |
quiz:
  questions:
  - content: "What is the purpose of grounding in Content Understanding?"
    choices:
    - content: "To connect Content Understanding to Azure storage"
      isCorrect: false
      explanation: "Incorrect. Grounding identifies where in the content each extracted value was found."
    - content: "To identify the specific regions in content where each value was extracted"
      isCorrect: true
      explanation: "Correct. Grounding allows users to trace extracted values back to their origin in the source content for verification."
    - content: "To filter out harmful content from images"
      isCorrect: false
      explanation: "Incorrect. Content filtering is handled separately by Azure AI Content Safety, not by grounding."
  - content: "What does a confidence score of 0.95 indicate for an extracted field?"
    choices:
    - content: "The extraction failed and needs manual review"
      isCorrect: false
      explanation: "Incorrect. A score of 0.95 is high confidence, indicating the value can be trusted."
    - content: "The value can be trusted for automated processing"
      isCorrect: true
      explanation: "Correct. High confidence scores (0.9+) indicate accurate data extraction that can be used in automated workflows."
    - content: "The field was classified rather than extracted"
      isCorrect: false
      explanation: "Incorrect. Confidence scores indicate reliability, not the extraction method used."
  - content: "Which prebuilt analyzer would you use to extract vendor names and item totals from a purchase receipt?"
    choices:
    - content: "prebuilt-image"
      isCorrect: false
      explanation: "Incorrect. While prebuilt-image provides general analysis, prebuilt-receipt is optimized for receipt extraction."
    - content: "prebuilt-invoice"
      isCorrect: false
      explanation: "Incorrect. prebuilt-invoice is designed for invoices, not receipts."
    - content: "prebuilt-receipt"
      isCorrect: true
      explanation: "Correct. The prebuilt-receipt analyzer is optimized to extract vendor names, items, totals, and dates from receipt images."
Lines changed: 13 additions & 0 deletions
@@ -0,0 +1,13 @@
### YamlMime:ModuleUnit
uid: learn.wwl.analyze-images-with-content-understanding.summary
title: Summary
metadata:
  title: Summary
  description: "Reflect on what you've learned about analyzing images with Azure Content Understanding."
  ms.date: 03/04/2026
  author: buzahid
  ms.author: buzahid
  ms.topic: unit
durationInMinutes: 1
content: |
  [!include[](includes/6-summary.md)]
Lines changed: 6 additions & 0 deletions
@@ -0,0 +1,6 @@
Images, documents, and other unstructured content often contain valuable information that's hard to extract automatically. Azure Content Understanding solves this problem by using generative AI to analyze content and return structured data.

With Content Understanding, you define a schema describing the data you want, and the service extracts it from your images and documents. The output is ready to use in automation workflows, analytics, and search applications.

In this module, you'll learn how to analyze images with Content Understanding using both prebuilt and custom analyzers.
Lines changed: 60 additions & 0 deletions
@@ -0,0 +1,60 @@
Azure Content Understanding is a Foundry Tool that uses generative AI to process and extract insights from many types of content, including documents, images, videos, and audio. It transforms unstructured data into structured, actionable output that you can integrate into automation and analytical workflows.

## Why use Content Understanding?

Content Understanding accelerates time to value by enabling straight-through processing of unstructured data. Key benefits include:

- **Simplified workflows**: Standardizes extraction and classification across various content types into a unified process
- **Easy field extraction**: Define a schema to extract, classify, or generate field values without complex prompt engineering
- **Enhanced accuracy**: Uses multiple AI models to analyze and cross-validate information simultaneously
- **Confidence scores and grounding**: Ensure accuracy of extracted values while minimizing the cost of human review
- **Content classification**: Categorize document types to streamline processing and route content to appropriate analyzers

## Content Understanding components

The Content Understanding framework processes unstructured content through multiple stages:

| Component | Description |
|-----------|-------------|
| **Inputs** | Source content including documents, images, video, and audio |
| **Analyzer** | Defines how content is processed, including extraction settings and field schema |
| **Content extraction** | Transforms unstructured input into normalized text and metadata using OCR, speech transcription, and layout detection |
| **Field extraction** | Generates structured key-value pairs based on your defined schema |
| **Confidence scores** | Provides reliability estimates from 0 to 1 for each extracted field value |
| **Grounding** | Identifies the specific regions in content where each value was extracted |
| **Structured output** | Final result as Markdown for search scenarios or JSON for automation workflows |

## Analyzers

Analyzers are the core component that defines how your content is processed. Content Understanding offers two types:

- **Prebuilt analyzers**: Ready-to-use analyzers designed for common scenarios like invoice processing, receipt extraction, and call center analytics
- **Custom analyzers**: Tailored analyzers you create with your own field schema for specific business needs

When you create an analyzer, you configure:

- The base analyzer type (document, image, audio, or video)
- The AI models to use for processing
- The field schema that defines what data to extract
- Options like confidence scoring and content segmentation

## Use cases

Content Understanding supports many business scenarios:

| Use case | Description |
|----------|-------------|
| **Intelligent document processing** | Convert unstructured documents into structured data for invoice processing, contract analysis, and claims management |
| **Search and RAG** | Ingest multimodal content into search indexes with figure descriptions and layout analysis |
| **Agentic applications** | Transform messy file inputs into predictable, standardized inputs for AI agents |
| **Analytics and reporting** | Extract field outputs to gain insights and make informed decisions |

## Content restrictions

Content Understanding includes built-in Responsible AI protections. The service integrates Azure AI Content Safety to detect and prevent harmful content. When processing content, be aware of these guidelines:

- Content is filtered for harmful material, including violence, hate speech, and exploitation
- Face description capabilities can identify facial attributes in video and image content
- Biometric data processing requires appropriate notice and consent from data subjects

With Content Understanding, you can build solutions that extract meaningful insights from diverse content types while maintaining data quality and compliance.
Lines changed: 137 additions & 0 deletions
@@ -0,0 +1,137 @@
Content Understanding can analyze images to extract structured data, identify visual elements, and generate descriptions. You can use prebuilt analyzers for common scenarios or create custom analyzers tailored to your specific needs.

## Supported image formats

Content Understanding supports the following image input types:

| Format | Description |
|--------|-------------|
| **JPEG** | Standard photographic images |
| **PNG** | Images with transparency support |
| **BMP** | Bitmap images |
| **TIFF** | High-quality scanned documents |
| **HEIF** | High-efficiency image format |
| **PDF** | Single or multi-page documents with embedded images |

## Prebuilt image analyzers

Content Understanding includes prebuilt analyzers optimized for common image analysis scenarios:

- **prebuilt-image**: General-purpose image analysis with content extraction and figure description
- **prebuilt-receipt**: Extract vendor names, items, totals, and dates from receipt images
- **prebuilt-invoice**: Extract invoice details including line items, amounts, and vendor information
- **prebuilt-idDocument**: Extract information from identity documents like driver's licenses and passports

## Define a field schema for images

To extract specific information from images, define a field schema that describes the data you want. Each field can use one of three extraction methods:

| Method | Description | Example |
|--------|-------------|---------|
| **extract** | Pull values directly as they appear in the image | Extract text from a label or sign |
| **classify** | Categorize content from predefined options | Classify an image as "damaged" or "undamaged" |
| **generate** | Create values based on image analysis | Generate a description of the scene |

Here's an example schema for analyzing product images:

```json
{
  "description": "Product image analyzer",
  "baseAnalyzerId": "prebuilt-image",
  "fieldSchema": {
    "fields": {
      "ProductName": {
        "type": "string",
        "method": "extract",
        "description": "Name of the product visible in the image"
      },
      "Condition": {
        "type": "string",
        "method": "classify",
        "description": "Condition of the product",
        "enum": ["new", "used", "damaged"]
      },
      "Description": {
        "type": "string",
        "method": "generate",
        "description": "Brief description of what the image shows"
      }
    }
  }
}
```

## Analyze an image

To analyze an image using Content Understanding, submit a POST request to the analyze endpoint with your analyzer ID and the image URL or file:

```bash
curl -X POST "{endpoint}/contentunderstanding/analyzers/{analyzerId}:analyze?api-version=2025-11-01" \
  -H "Ocp-Apim-Subscription-Key: {key}" \
  -H "Content-Type: application/json" \
  -d '{
    "inputs": [
      {
        "url": "https://example.url/product-image.jpg"
      }
    ]
  }'
```

The response includes a result ID that you use to retrieve the analysis results once processing completes.
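The same request can be assembled in Python. This sketch only builds the URL, headers, and JSON body shown in the curl example above; sending it with your HTTP client of choice is left out, and the endpoint value and analyzer ID in the usage example are hypothetical placeholders.

```python
import json

def build_analyze_request(endpoint, analyzer_id, key, image_url,
                          api_version="2025-11-01"):
    """Assemble the POST request for the Content Understanding analyze call.

    Mirrors the curl example above: the endpoint path, api-version, and
    Ocp-Apim-Subscription-Key header come directly from that example.
    """
    url = (f"{endpoint}/contentunderstanding/analyzers/"
           f"{analyzer_id}:analyze?api-version={api_version}")
    headers = {
        "Ocp-Apim-Subscription-Key": key,
        "Content-Type": "application/json",
    }
    body = json.dumps({"inputs": [{"url": image_url}]})
    return url, headers, body

# Hypothetical endpoint and analyzer ID, for illustration only.
url, headers, body = build_analyze_request(
    "https://example.cognitiveservices.azure.com",
    "my-product-analyzer",
    "<your-key>",
    "https://example.url/product-image.jpg",
)
```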

## Understand the response

When analysis completes, the response includes:

- **markdown**: A text representation of the image content, useful for search and RAG scenarios
- **fields**: Extracted field values matching your schema, each with a confidence score
- **source**: Grounding information showing where in the image each value was found

Example response for a product image:

```json
{
  "contents": [
    {
      "markdown": "Product label showing 'Contoso Widget Pro' with serial number...",
      "fields": {
        "ProductName": {
          "type": "string",
          "valueString": "Contoso Widget Pro",
          "confidence": 0.95,
          "source": "D(1,100,50,300,50,300,80,100,80)"
        },
        "Condition": {
          "type": "string",
          "valueString": "new",
          "confidence": 0.89
        },
        "Description": {
          "type": "string",
          "valueString": "A silver electronic device in retail packaging with product label visible"
        }
      }
    }
  ]
}
```
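In an application, you typically flatten this structure into the field names, values, and confidence scores. A minimal sketch, using an abbreviated copy of the sample response above (the `extracted_fields` helper name is ours, not part of the API):

```python
import json

# Abbreviated copy of the example response shown above.
response = json.loads("""
{
  "contents": [
    {
      "markdown": "Product label showing 'Contoso Widget Pro'...",
      "fields": {
        "ProductName": {
          "type": "string",
          "valueString": "Contoso Widget Pro",
          "confidence": 0.95,
          "source": "D(1,100,50,300,50,300,80,100,80)"
        },
        "Condition": {
          "type": "string",
          "valueString": "new",
          "confidence": 0.89
        }
      }
    }
  ]
}
""")

def extracted_fields(response):
    """Flatten each content item's fields into (name, value, confidence)."""
    rows = []
    for content in response["contents"]:
        for name, field in content.get("fields", {}).items():
            rows.append((name, field.get("valueString"),
                         field.get("confidence")))
    return rows

for name, value, confidence in extracted_fields(response):
    print(f"{name}: {value!r} (confidence: {confidence})")
```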

## Use confidence scores

Each extracted field includes a confidence score from 0 to 1:

- **High confidence (0.9+)**: The value can be trusted for automated processing
- **Medium confidence (0.7-0.9)**: Consider human review for critical applications
- **Low confidence (<0.7)**: Manual verification is recommended

Use confidence scores to build automation workflows that route low-confidence extractions to human reviewers while processing high-confidence results automatically.
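The three bands translate directly into a routing helper. A minimal sketch: the 0.9 and 0.7 thresholds come from the list above, while the queue names are made up for illustration.

```python
def route_field(name, confidence, auto_threshold=0.9, review_threshold=0.7):
    """Pick a processing queue for an extracted field by confidence band."""
    if confidence is None or confidence < review_threshold:
        return "manual-verification"   # low confidence (<0.7) or missing
    if confidence < auto_threshold:
        return "human-review"          # medium confidence (0.7-0.9)
    return "automated"                 # high confidence (0.9+)

# The ProductName (0.95) and Condition (0.89) scores from the sample
# response land in different queues.
assert route_field("ProductName", 0.95) == "automated"
assert route_field("Condition", 0.89) == "human-review"
assert route_field("SerialNumber", 0.42) == "manual-verification"
```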

## Tips for better image analysis

- **Image quality matters**: Higher resolution images produce more accurate extractions
- **Lighting and contrast**: Ensure text and visual elements are clearly visible
- **Single focus**: Images with one clear subject yield better results than cluttered scenes
- **Consistent orientation**: Upright images are processed more reliably than rotated ones

Content Understanding's image analysis capabilities enable you to transform visual content into structured, actionable data for document processing, inventory management, quality inspection, and many other business scenarios.
Lines changed: 8 additions & 0 deletions
@@ -0,0 +1,8 @@
In this exercise, you'll use Azure Content Understanding to analyze images. You start by exploring the prebuilt image analyzer in the Microsoft Foundry portal to see how Content Understanding extracts information from images. Then, you create a Python application that uses the Content Understanding API to analyze images programmatically and extract structured data.

> [!NOTE]
> To complete this exercise, you need an Azure subscription. If you don't have one, you can [sign up for a free account](https://azure.microsoft.com/pricing/purchase-options/azure-account?cid=msft_learn), which includes credits for the first 30 days.

Launch the exercise and follow the instructions.

[![Button to launch exercise.](../media/launch-exercise.png)](https://go.microsoft.com/fwlink/?linkid=2356120&azure-portal=true)
