Commit bb8875e

Merge pull request #53837 from GraemeMalcolm/main
Updated Voice live module
2 parents 9f3324b + 841dbbe commit bb8875e

13 files changed

Lines changed: 519 additions & 125 deletions

learn-pr/wwl-data-ai/develop-voice-live-agent/1-introduction.yml

Lines changed: 3 additions & 3 deletions
@@ -4,11 +4,11 @@ title: Introduction
 metadata:
   title: Introduction
   description: Introduction
-  ms.date: 10/9/2025
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
 azureSandbox: false
-durationInMinutes: 3
+durationInMinutes: 1
 content: |
-  [!include[](includes/1-introduction.md)]
+  [!include[](includes/1-introduction.md)]

learn-pr/wwl-data-ai/develop-voice-live-agent/2-voice-live-api.yml

Lines changed: 2 additions & 2 deletions
@@ -4,11 +4,11 @@ title: Explore the Azure Voice Live API
 metadata:
   title: Explore the Azure Voice Live API
   description: Explore the Azure Voice Live API
-  ms.date: 10/9/2025
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
 azureSandbox: false
 durationInMinutes: 5
 content: |
-  [!include[](includes/2-voice-live-api.md)]
+  [!include[](includes/2-voice-live-api.md)]

learn-pr/wwl-data-ai/develop-voice-live-agent/3-voice-live-sdk.yml

Lines changed: 2 additions & 2 deletions
@@ -4,11 +4,11 @@ title: Explore the AI Voice Live client library for Python
 metadata:
   title: Explore the AI Voice Live Client Library for Python
   description: Explore the AI Voice Live client library for Python
-  ms.date: 10/9/2025
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
 azureSandbox: false
 durationInMinutes: 5
 content: |
-  [!include[](includes/3-voice-live-sdk.md)]
+  [!include[](includes/3-voice-live-sdk.md)]
Lines changed: 14 additions & 0 deletions

@@ -0,0 +1,14 @@
+### YamlMime:ModuleUnit
+uid: learn.wwl.develop-voice-live-agent.voice-live-agent
+title: Create a Voice Live agent
+metadata:
+  title: Create a Voice Live agent
+  description: Create a Voice Live agent
+  ms.date: 03/12/2026
+  author: jeffkoms
+  ms.author: jeffko
+  ms.topic: unit
+azureSandbox: false
+durationInMinutes: 5
+content: |
+  [!include[](includes/3b-voice-live-agent.md)]
Lines changed: 5 additions & 5 deletions

@@ -1,14 +1,14 @@
 ### YamlMime:ModuleUnit
 uid: learn.wwl.develop-voice-live-agent.exercise-develop-agent
-title: Exercise - Develop an Azure AI Voice Live agent
+title: Exercise - Develop a Voice Live agent
 metadata:
-  title: Exercise - Develop an Azure AI Voice Live Agent
-  description: Exercise - Develop an Azure AI Voice Live agent
-  ms.date: 10/9/2025
+  title: Exercise - Develop a Voice Live Agent
+  description: Exercise - Develop a Voice Live agent
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
 azureSandbox: false
 durationInMinutes: 30
 content: |
-  [!include[](includes/4-exercise-develop-agent.md)]
+  [!include[](includes/4-exercise-develop-agent.md)]

learn-pr/wwl-data-ai/develop-voice-live-agent/5-knowledge-check.yml

Lines changed: 56 additions & 56 deletions
@@ -5,7 +5,7 @@ title: Module assessment
 metadata:
   title: Module Assessment
   description: Module assessment
-  ms.date: 10/9/2025
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
@@ -14,58 +14,58 @@ durationInMinutes: 5
 content: |
 quiz:
   questions:
-  - content: "What are the two authentication methods supported by the Voice Live API?"
-    choices:
-    - content: "OAuth 2.0 and JWT (JSON Web Tokens)"
-      isCorrect: false
-      explanation: "OAuth 2.0 and JWT tokens aren't supported authentication methods for the Voice Live API."
-    - content: "Basic authentication and API keys"
-      isCorrect: false
-      explanation: "API keys are supported, but basic authentication isn't a supported authentication method for the Voice Live API."
-    - content: "Microsoft Entra (keyless) and API key"
-      isCorrect: true
-      explanation: "Microsoft Entra (keyless) and API key are both supported authentication methods for the Voice Live API."
-  - content: "Which scope is required when generating a token for Microsoft Entra authentication?"
-    choices:
-    - content: "`https://cognitiveservices.azure.com/.default`"
-      isCorrect: true
-      explanation: "The scope `https://cognitiveservices.azure.com/.default`, or `https://ai.azure.com/.default`, is required for Microsoft Entra authentication."
-    - content: "`https://management.azure.com/.default`"
-      isCorrect: false
-      explanation: "This is the Azure Resource Manager scope, not for AI services"
-    - content: "`https://graph.microsoft.com/.default`"
-      isCorrect: false
-      explanation: "This is the Microsoft Graph API scope, not for AI services"
-  - content: "Which protocol is used for avatar streaming integration in Voice Live API?"
-    choices:
-    - content: "HTTP/2"
-      isCorrect: false
-      explanation: "HTTP/2 is used for standard web communication."
-    - content: "WebRTC"
-      isCorrect: true
-      explanation: "The Voice live API supports WebRTC-based avatar streaming for interactive applications"
-    - content: "gRPC"
-      isCorrect: false
-      explanation: "gRPC is used to enable communication between microservices by using HTTP/2."
-  - content: "Which event should be handled to stop audio playback when a user interrupts the voice agent?"
-    choices:
-    - content: "`ServerEventType.RESPONSE_AUDIO_DELTA`"
-      isCorrect: false
-      explanation: "This event is for receiving audio chunks to play, not for stopping playback"
-    - content: "`ServerEventType.INPUT_AUDIO_BUFFER_SPEECH_STARTED`"
-      isCorrect: true
-      explanation: "This event can be used to stop audio playback, and cancel any current response."
-    - content: "`ServerEventType.SESSION_UPDATED`"
-      isCorrect: false
-      explanation: "This event indicates session readiness, not user speech interruption."
-  - content: "What is the recommended authentication method for production applications using the SDK?"
-    choices:
-    - content: "API key authentication"
-      isCorrect: false
-      explanation: "API key authentication isn't recommended for production applications."
-    - content: "Microsoft Entra authentication with DefaultAzureCredential"
-      isCorrect: true
-      explanation: "Microsoft Entra authentication with DefaultAzureCredential is the recommended approach for production applications."
-    - content: "Basic username/password authentication"
-      isCorrect: false
-      explanation: "Basic username/password authentication isn't a supported authentication method."
+  - content: "What are the two authentication methods supported by the Voice Live API?"
+    choices:
+    - content: "OAuth 2.0 and JWT (JSON Web Tokens)"
+      isCorrect: false
+      explanation: "OAuth 2.0 and JWT tokens aren't supported authentication methods for the Voice Live API."
+    - content: "Basic authentication and API keys"
+      isCorrect: false
+      explanation: "API keys are supported, but basic authentication isn't a supported authentication method for the Voice Live API."
+    - content: "Microsoft Entra (keyless) and API key"
+      isCorrect: true
+      explanation: "Microsoft Entra (keyless) and API key are both supported authentication methods for the Voice Live API."
+  - content: "Which scope is required when generating a token for Microsoft Entra authentication?"
+    choices:
+    - content: "`https://cognitiveservices.azure.com/.default`"
+      isCorrect: true
+      explanation: "The scope `https://cognitiveservices.azure.com/.default`, or `https://ai.azure.com/.default`, is required for Microsoft Entra authentication."
+    - content: "`https://management.azure.com/.default`"
+      isCorrect: false
+      explanation: "This is the Azure Resource Manager scope, not for AI services"
+    - content: "`https://graph.microsoft.com/.default`"
+      isCorrect: false
+      explanation: "This is the Microsoft Graph API scope, not for AI services"
+  - content: "Which protocol is used for avatar streaming integration in Voice Live API?"
+    choices:
+    - content: "HTTP/2"
+      isCorrect: false
+      explanation: "HTTP/2 is used for standard web communication."
+    - content: "WebRTC"
+      isCorrect: true
+      explanation: "The Voice live API supports WebRTC-based avatar streaming for interactive applications"
+    - content: "gRPC"
+      isCorrect: false
+      explanation: "gRPC is used to enable communication between microservices by using HTTP/2."
+  - content: "Which event should be handled to stop audio playback when a user interrupts the voice agent?"
+    choices:
+    - content: "`ServerEventType.RESPONSE_AUDIO_DELTA`"
+      isCorrect: false
+      explanation: "This event is for receiving audio chunks to play, not for stopping playback"
+    - content: "`ServerEventType.INPUT_AUDIO_BUFFER_SPEECH_STARTED`"
+      isCorrect: true
+      explanation: "This event can be used to stop audio playback, and cancel any current response."
+    - content: "`ServerEventType.SESSION_UPDATED`"
+      isCorrect: false
+      explanation: "This event indicates session readiness, not user speech interruption."
+  - content: "What is the recommended authentication method for production applications using the SDK?"
+    choices:
+    - content: "API key authentication"
+      isCorrect: false
+      explanation: "API key authentication isn't recommended for production applications."
+    - content: "Microsoft Entra authentication with DefaultAzureCredential"
+      isCorrect: true
+      explanation: "Microsoft Entra authentication with DefaultAzureCredential is the recommended approach for production applications."
+    - content: "Basic username/password authentication"
+      isCorrect: false
+      explanation: "Basic username/password authentication isn't a supported authentication method."
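
As context for the interruption question in the quiz above, here is a minimal sketch of barge-in handling. The event names mirror the quiz's `ServerEventType` members as plain strings, and `Playback` and `Connection` are hypothetical stand-ins, not real SDK types.

```python
class Playback:
    """Stand-in for a local audio output stream."""
    def __init__(self):
        self.playing = True

    def stop(self):
        self.playing = False


class Connection:
    """Stand-in for the WebSocket session to the service."""
    def __init__(self):
        self.cancelled = False

    def cancel_response(self):
        self.cancelled = True


def handle_event(event_type, playback, connection):
    if event_type == "INPUT_AUDIO_BUFFER_SPEECH_STARTED":
        # The user started talking over the agent: stop playback immediately
        # and cancel the response the model is still generating.
        playback.stop()
        connection.cancel_response()
        return "interrupted"
    if event_type == "RESPONSE_AUDIO_DELTA":
        # Normal case: an audio chunk arrived; queue it for playback.
        return "play_chunk"
    return "ignore"
```

The key design point the quiz tests: `INPUT_AUDIO_BUFFER_SPEECH_STARTED` is the trigger for stopping playback, while `RESPONSE_AUDIO_DELTA` only delivers audio to play.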

learn-pr/wwl-data-ai/develop-voice-live-agent/6-summary.yml

Lines changed: 3 additions & 3 deletions
@@ -4,11 +4,11 @@ title: Summary
 metadata:
   title: Summary
   description: Summary
-  ms.date: 10/9/2025
+  ms.date: 03/12/2026
   author: jeffkoms
   ms.author: jeffko
   ms.topic: unit
 azureSandbox: false
-durationInMinutes: 3
+durationInMinutes: 1
 content: |
-  [!include[](includes/6-summary.md)]
+  [!include[](includes/6-summary.md)]
Lines changed: 3 additions & 3 deletions

@@ -1,8 +1,8 @@
-Voice-enabled applications are transforming how we interact with technology, and this module guides you through building a real-time, interactive voice solutions using advanced APIs and tools. The Azure AI Voice live API is a solution enabling low-latency, high-quality speech to speech interactions for voice agents. The API is designed for developers seeking scalable and efficient voice-driven experiences as it eliminates the need to manually orchestrate multiple components.
+Voice-enabled applications are transforming how we interact with technology, and this module guides you through building a real-time, interactive voice solutions using advanced APIs and tools. The Voice live API in Azure Speech in Foundry Tools is a solution enabling low-latency, high-quality speech to speech interactions for voice agents. The API is designed for developers seeking scalable and efficient voice-driven experiences as it eliminates the need to manually orchestrate multiple components.
 
 After completing this module, you'll be able to:
 
-- Implement the Azure AI Voice Live API to enable real-time, bidirectional communication.
+- Implement the Azure Speech Voice Live API to enable real-time, bidirectional communication.
 - Set up and configure the agent session.
 - Develop and manage event handlers to create dynamic and interactive user experiences.
-- Build and deploy a Python-based web app with real-time voice interaction capabilities to Azure.
+- Use Voice Live with a Foundry Agent.

learn-pr/wwl-data-ai/develop-voice-live-agent/includes/2-voice-live-api.md

Lines changed: 4 additions & 6 deletions
@@ -8,6 +8,7 @@ The Voice live API provides real-time communication using WebSocket connections.
 - Events are categorized into client events (sent from client to server) and server events (sent from server to client).
 
 Key features include:
+
 - Real-time audio processing with support for multiple formats like PCM16 and G.711.
 - Advanced voice options, including OpenAI voices and Azure custom voices.
 - Avatar integration using WebRTC for video and animation.
@@ -20,7 +21,7 @@ For a table of supported models and regions, visit the [Voice Live API overview]
 
 ## Connect to the Voice Live API
 
-The Voice live API supports two authentication methods: Microsoft Entra (keyless) and API key. Microsoft Entra uses token-based authentication for a Microsoft Foundry resource. You apply a retrieved authentication token using a `Bearer` token with the `Authorization` header.
+The Voice live API supports two authentication methods: Microsoft Entra (keyless) and API key. Microsoft Entra uses token-based authentication for a Microsoft Foundry resource. You apply a retrieved authentication token using a `Bearer` token with the `Authorization` header.
 
 For the recommended keyless authentication with Microsoft Entra ID, you need to assign the **Cognitive Services User** role to your user account or a managed identity. You generate a token using the Azure CLI or Azure SDKs. The token must be generated with the `https://ai.azure.com/.default` scope, or the legacy `https://cognitiveservices.azure.com/.default` scope. Use the token in the `Authorization` header of the WebSocket connection request, with the format `Bearer <token>`.
 
@@ -31,10 +32,10 @@ For key access, an API key can be provided in one of two ways. You can use an `a
 
 ### WebSocket endpoint
 
-The endpoint to use varies depending on how you want to access your resources. You can access resources through a connection to the AI Foundry project (Agent), or through a connection to the model.
+The endpoint to use varies depending on how you want to access your resources. You can access resources through a connection to the Foundry project when implementing an agent, or through a direct connection to a model.
 
 - **Project connection:** The endpoint is `wss://<your-ai-foundry-resource-name>.services.ai.azure.com/voice-live/realtime?api-version=2025-10-01`
-- **Model connection:** The endpoint is `wss://<your-ai-foundry-resource-name>.cognitiveservices.azure.com/voice-live/realtime?api-version=2025-10-01`.
+- **Model connection:** The endpoint is `wss://<your-ai-foundry-resource-name>.cognitiveservices.azure.com/voice-live/realtime?api-version=2025-10-01`.
 
 The endpoint is the same for all models. The only difference is the required `model` query parameter, or, when using the Agent service, the `agent_id` and `project_id` parameters.
 
@@ -137,6 +138,3 @@
 
 > [!TIP]
 > Use high-resolution video settings for enhanced visual quality in avatar interactions.
-
-
-
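
The endpoint and authentication text changed in this file can be sketched as follows. This is a minimal illustration under assumptions: the resource name, model, agent ID, and project ID are placeholders, and the helper names (`model_endpoint`, `project_endpoint`, `auth_header`) are hypothetical; only the URL shapes and the `Bearer` header format follow the documented text.

```python
from urllib.parse import urlencode

API_VERSION = "2025-10-01"

def model_endpoint(resource_name: str, model: str) -> str:
    # Direct model connection: *.cognitiveservices.azure.com with a `model` parameter.
    query = urlencode({"api-version": API_VERSION, "model": model})
    return f"wss://{resource_name}.cognitiveservices.azure.com/voice-live/realtime?{query}"

def project_endpoint(resource_name: str, agent_id: str, project_id: str) -> str:
    # Project (agent) connection: *.services.ai.azure.com with `agent_id` and `project_id`.
    query = urlencode({"api-version": API_VERSION, "agent_id": agent_id, "project_id": project_id})
    return f"wss://{resource_name}.services.ai.azure.com/voice-live/realtime?{query}"

def auth_header(token: str) -> dict:
    # A Microsoft Entra token (for example, obtained via DefaultAzureCredential
    # with the https://ai.azure.com/.default scope) applied as a Bearer token.
    return {"Authorization": f"Bearer {token}"}
```

Either endpoint is then opened as a WebSocket with the `Authorization` header attached to the connection request.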
