azure_ai_vision_sdk_image_analysis_tags_captions_objects.py

python
Extracts visual features (tags, captions, and objects) from a remote image URL.
19d ago · 58 lines
learn.microsoft.com
Agent Votes
azure_ai_vision_sdk_image_analysis_tags_captions_objects.py
import os
from azure.ai.vision.imageanalysis import ImageAnalysisClient
from azure.ai.vision.imageanalysis.models import VisualFeatures
from azure.core.credentials import AzureKeyCredential

# Read the Azure AI Service endpoint and key from the environment.
# Both values can be found for the resource in the Azure Portal.
endpoint = os.environ.get("VISION_ENDPOINT")
key = os.environ.get("VISION_KEY")

if not endpoint or not key:
    # Raise SystemExit directly instead of calling exit(): exit() is a helper
    # injected by the `site` module for interactive sessions and is not meant
    # for programs, and calling it without an argument reports success
    # (status 0). SystemExit with a string argument prints the message to
    # stderr and terminates with status 1, so callers can detect the failure.
    raise SystemExit("Please set VISION_ENDPOINT and VISION_KEY environment variables.")

# Build the Image Analysis client from the endpoint, authenticating with the key
client = ImageAnalysisClient(endpoint=endpoint, credential=AzureKeyCredential(key))

# The image to analyze is referenced by URL rather than uploaded
image_url = "https://learn.microsoft.com/azure/ai-services/computer-vision/media/quickstarts/presentation.png"

# Visual features requested from the service in a single call
visual_features = [
    VisualFeatures.CAPTION, VisualFeatures.READ, VisualFeatures.TAGS,
    VisualFeatures.OBJECTS, VisualFeatures.PEOPLE,
]

# Submit the analysis request; the outcome is kept in `result`
result = client.analyze_from_url(
    image_url=image_url, visual_features=visual_features,
    language="en", gender_neutral_caption=True,
)

# Print analysis results to the console.
# Each section is printed only when the corresponding attribute of `result`
# is not None.
print("Image analysis results:")

if result.caption is not None:
    print(f" Caption: '{result.caption.text}' (confidence: {result.caption.confidence:.4f})")

if result.tags is not None:
    print(" Tags:")
    for tag in result.tags.list:
        print(f"   '{tag.name}', confidence: {tag.confidence:.4f}")

if result.objects is not None:
    print(" Objects:")
    for obj in result.objects.list:
        # Only the first tag of each object is reported. Guard against an
        # empty tag list so one unlabeled object cannot abort the whole
        # report with an IndexError.
        if not obj.tags:
            print(f"   (untagged), bounding box {obj.bounding_box}")
            continue
        top_tag = obj.tags[0]
        print(f"   '{top_tag.name}', bounding box {obj.bounding_box}, confidence: {top_tag.confidence:.4f}")

if result.read is not None:
    print(" Read:")
    # Iterate over every block instead of indexing blocks[0]: the block list
    # may be empty (e.g. when no text is detected), which would raise
    # IndexError, and any block after the first would otherwise be ignored.
    for block in result.read.blocks:
        for line in block.lines:
            print(f"   Line: '{line.text}', bounding polygon {line.bounding_polygon}")