@@ -12,37 +12,37 @@ durationInMinutes: 3
1212content : |
1313quiz :
1414 questions :
15- - content : " What video durations does Sora 2 support ?"
15+ - content : " What is the purpose of grounding in Content Understanding?"
1616 choices :
17- - content : " 1 to 20 seconds in 1-second increments "
17+ - content : " To connect Content Understanding to Azure storage "
1818 isCorrect : false
19- explanation : " Incorrect. Sora 2 supports specific duration values, not a continuous range ."
20- - content : " 4, 8, or 12 seconds "
19+ explanation : " Incorrect. Grounding identifies where in the content each extracted value was found."
20+ - content : " To identify the specific regions in content where each value was extracted "
2121 isCorrect : true
22- explanation : " Correct. Sora 2 supports video durations of 4, 8, or 12 seconds ."
23- - content : " Any duration up to 60 seconds "
22+ explanation : " Correct. Grounding allows users to trace extracted values back to their origin in the source content for verification."
23+ - content : " To filter out harmful content from images "
2424 isCorrect : false
25- explanation : " Incorrect. Sora 2 has specific supported duration values ."
26- - content : " What is required when using a reference image with Sora 2 ?"
25+ explanation : " Incorrect. Content filtering is handled separately by Azure AI Content Safety, not by grounding."
26+ - content : " What does a confidence score of 0.95 indicate for an extracted field?"
2727 choices :
28- - content : " The image must be smaller than 1 MB "
28+ - content : " The extraction failed and needs manual review "
2929 isCorrect : false
30- explanation : " Incorrect. The key requirement is that the image resolution must match the target video size ."
31- - content : " The image resolution must match the target video size "
30+ explanation : " Incorrect. A score of 0.95 is high confidence, indicating the value can be trusted."
31+ - content : " The value can be trusted for automated processing "
3232 isCorrect : true
33- explanation : " Correct. Reference images must match the target video resolution exactly (1280x720 or 720x1280) ."
34- - content : " The image must contain at least one human face "
33+ explanation : " Correct. High confidence scores (0.9+) indicate accurate data extraction that can be used in automated workflows."
34+ - content : " The field was classified rather than extracted "
3535 isCorrect : false
36- explanation : " Incorrect. Reference images with human faces are currently rejected by Sora 2 ."
37- - content : " What is the remix feature used for in Sora 2 ?"
36+ explanation : " Incorrect. Confidence scores indicate reliability, not the extraction method used."
37+ - content : " Which prebuilt analyzer would you use to extract vendor names and item totals from a purchase receipt?"
3838 choices :
39- - content : " Combining multiple videos into one "
39+ - content : " prebuilt-image "
4040 isCorrect : false
41- explanation : " Incorrect. Remix modifies an existing video while preserving its structure."
42- - content : " Making targeted adjustments to an existing video without regenerating from scratch"
43- isCorrect : true
44- explanation : " Correct. The remix feature lets you modify specific aspects while preserving scene transitions, visual layout, and overall structure."
45- - content : " Adding background music to generated videos"
41+ explanation : " Incorrect. While prebuilt-image provides general analysis, prebuilt-receipt is optimized for receipt extraction."
42+ - content : " prebuilt-invoice"
4643 isCorrect : false
47- explanation : " Incorrect. Remix is for making visual adjustments to existing videos."
44+ explanation : " Incorrect. prebuilt-invoice is designed for invoices, not receipts."
45+ - content : " prebuilt-receipt"
46+ isCorrect : true
47+ explanation : " Correct. The prebuilt-receipt analyzer is optimized to extract vendor names, items, totals, and dates from receipt images."
4848
0 commit comments