add integration test for agent framework

Jimh333 · Jimh333 · commit a38e4b2c2289 · 2025-11-04T22:32:41.000-05:00
diff --git a/pyproject.toml b/pyproject.toml
@@ -38,6 +38,7 @@ dev-dependencies = [
     "ruff>=0.1.0",
     "python-dotenv>=1.0.0",
     "openai>=1.0.0",
+    "agent-framework-azure-ai >= 0.1.0",
     "azure-identity>=1.12.0",
     "openai-agents >= 0.2.6",
 ]
diff --git a/tests/integration/test_agentframework_trace_processor.py b/tests/integration/test_agentframework_trace_processor.py
@@ -0,0 +1,307 @@
+# Copyright (c) Microsoft Corporation.
+# Licensed under the MIT License.
+
+import time
+
+import pytest
+from microsoft_agents_a365.observability.core import configure, get_tracer_provider
+from microsoft_agents_a365.observability.core.constants import (
+    GEN_AI_AGENT_ID_KEY,
+    GEN_AI_INPUT_MESSAGES_KEY,
+    GEN_AI_OUTPUT_MESSAGES_KEY,
+    GEN_AI_REQUEST_MODEL_KEY,
+    GEN_AI_SYSTEM_KEY,
+    TENANT_ID_KEY,
+)
+from microsoft_agents_a365.observability.extensions.agentframework.trace_instrumentor import (
+    AgentFrameworkInstrumentor,
+)
+
+# AgentFramework SDK
+try:
+    from agent_framework.azure import AzureOpenAIChatClient
+    from agent_framework import ChatAgent, ai_function
+    from azure.identity import AzureCliCredential
+    from agent_framework.observability import setup_observability
+except ImportError:
+    pytest.skip(
+        "AgentFramework library and dependencies required for integration tests",
+        allow_module_level=True,
+    )
+
+
+@ai_function
+def add_numbers(a: float, b: float) -> float:
+    """Add two numbers together.
+
+    Args:
+        a: First number
+        b: Second number
+
+    Returns:
+        The sum of a and b
+    """
+    return a + b
+
+
+@pytest.mark.integration
+class TestAgentFrameworkTraceProcessorIntegration:
+    """Integration tests for AgentFramework trace processor with real Azure OpenAI."""
+
+    def setup_method(self):
+        """Set up test method with mock exporter."""
+        self.captured_spans = []
+        self.mock_exporter = MockAgent365Exporter(self.captured_spans)
+
+    def test_agentframework_trace_processor_integration(self, azure_openai_config, agent365_config):
+        """Test AgentFramework trace processor with real Azure OpenAI call."""
+
+
+        # Configure observability
+        configure(
+            service_name="integration-test-service",
+            service_namespace="agent365-tests",
+            logger_name="test-logger",
+        )
+
+        # Get the tracer provider and add our mock exporter
+        provider = get_tracer_provider()
+        provider.add_span_processor(self.mock_exporter)
+
+        setup_observability()
+
+        # Initialize the instrumentor
+        instrumentor = AgentFrameworkInstrumentor()
+        instrumentor.instrument()
+
+        try:
+            # Create Azure OpenAI ChatClient
+            chat_client = AzureOpenAIChatClient(
+                endpoint=azure_openai_config["endpoint"],
+                credential=AzureCliCredential(),
+                deployment_name=azure_openai_config["deployment"],
+                api_version=azure_openai_config["api_version"],
+            )
+
+            # Create agent framework agent
+            agent = ChatAgent(
+                chat_client=chat_client,
+                instructions="You are a helpful assistant.",
+                tools=[],
+            )
+
+            # Execute a simple prompt using async runner
+            import asyncio
+
+            async def run_agent():
+                result = await agent.run("What can you do with agent framework?")
+                return result
+
+            asyncio.run(setup_observability())
+            response = asyncio.run(run_agent())
+
+            # Give some time for spans to be processed
+            time.sleep(1)
+
+            # Verify that spans were captured
+            assert len(self.captured_spans) > 0, "No spans were captured"
+
+            # Verify we have the expected span types
+            span_names = [span.name for span in self.captured_spans]
+            print(f"Captured spans: {span_names}")
+
+            # Validate attributes on spans
+            self._validate_span_attributes(agent365_config)
+
+            # Verify the response content
+            assert response is not None
+            assert len(response) > 0
+            print(f"Agent response: {response}")
+
+        finally:
+            # Clean up
+            instrumentor.uninstrument()
+
+    def test_agentframework_trace_processor_with_tool_calls(self, azure_openai_config, agent365_config):
+        """Test AgentFramework trace processor with tool calls."""
+
+        # Configure observability
+        configure(
+            service_name="integration-test-service-tools",
+            service_namespace="agent365-tests",
+            logger_name="test-logger",
+        )
+
+        # Get the tracer provider and add our mock exporter
+        provider = get_tracer_provider()
+        provider.add_span_processor(self.mock_exporter)
+
+        setup_observability()
+
+        # Initialize the instrumentor
+        instrumentor = AgentFrameworkInstrumentor()
+        instrumentor.instrument()
+
+        try:
+            # Create Azure OpenAI ChatClient
+            chat_client = AzureOpenAIChatClient(
+                endpoint=azure_openai_config["endpoint"],
+                credential=AzureCliCredential(),
+                deployment_name=azure_openai_config["deployment"],
+                api_version=azure_openai_config["api_version"],
+            )
+
+            # Create agent framework agent
+            agent = ChatAgent(
+                chat_client=chat_client,
+                instructions="You are a helpful agent framework assistant.",
+                tools=[add_numbers],
+            )
+
+            # Execute a prompt that requires tool usage
+            import asyncio
+
+
+            async def run_agent_with_tool():
+                result = await agent.run("What is 15 + 27?")
+                return result
+
+            response = asyncio.run(run_agent_with_tool())
+
+            # Give some time for spans to be processed
+            time.sleep(1)
+
+            # Verify that spans were captured
+            assert len(self.captured_spans) > 0, "No spans were captured"
+
+            # Verify we have the expected span types
+            span_names = [span.name for span in self.captured_spans]
+            print(f"Captured spans with tools: {span_names}")
+
+            # Validate attributes on spans including tool calls
+            self._validate_tool_span_attributes(agent365_config)
+
+            # Verify the response content includes the calculation result
+            assert response is not None
+            assert len(response) > 0
+            assert "42" in response  # 15 + 27 = 42
+            print(f"Agent response with tool: {response}")
+
+        finally:
+            # Clean up
+            instrumentor.uninstrument()
+
+    def _validate_span_attributes(self, agent365_config):
+        """Validate that spans have the expected attributes."""
+        llm_spans_found = 0
+        agent_spans_found = 0
+
+        for span in self.captured_spans:
+            attributes = dict(span.attributes or {})
+            print(f"Span '{span.name}' attributes: {list(attributes.keys())}")
+
+            # Check common attributes
+            if TENANT_ID_KEY in attributes:
+                assert attributes[TENANT_ID_KEY] == agent365_config["tenant_id"]
+
+            if GEN_AI_AGENT_ID_KEY in attributes:
+                assert attributes[GEN_AI_AGENT_ID_KEY] == agent365_config["agent_id"]
+
+            # Check for LLM spans (generation spans)
+            if GEN_AI_SYSTEM_KEY in attributes and attributes[GEN_AI_SYSTEM_KEY] == "openai":
+                if GEN_AI_REQUEST_MODEL_KEY in attributes:
+                    llm_spans_found += 1
+                    # Validate LLM span attributes
+                    assert GEN_AI_REQUEST_MODEL_KEY in attributes
+                    assert attributes[GEN_AI_REQUEST_MODEL_KEY] is not None
+                    print(f"✓ Found LLM span with model: {attributes[GEN_AI_REQUEST_MODEL_KEY]}")
+
+                    # Check for input/output messages
+                    if GEN_AI_INPUT_MESSAGES_KEY in attributes:
+                        input_messages = attributes[GEN_AI_INPUT_MESSAGES_KEY]
+                        assert input_messages is not None
+                        print(f"✓ Input messages found: {input_messages[:100]}...")
+
+                    if GEN_AI_OUTPUT_MESSAGES_KEY in attributes:
+                        output_messages = attributes[GEN_AI_OUTPUT_MESSAGES_KEY]
+                        assert output_messages is not None
+                        print(f"✓ Output messages found: {output_messages[:100]}...")
+
+            # Check for agent spans
+            if "agent" in span.name.lower():
+                agent_spans_found += 1
+                print(f"✓ Found agent span: {span.name}")
+
+        # Ensure we found at least some spans with telemetry data
+        assert len(self.captured_spans) > 0, "No spans were captured"
+        print(f"✓ Captured {len(self.captured_spans)} spans total")
+        print(f"✓ Found {llm_spans_found} LLM spans and {agent_spans_found} agent spans")
+
+    def _validate_tool_span_attributes(self, agent365_config):
+        """Validate that spans have the expected attributes including tool calls."""
+        llm_spans_found = 0
+        agent_spans_found = 0
+        tool_spans_found = 0
+
+        for span in self.captured_spans:
+            attributes = dict(span.attributes or {})
+            print(f"Span '{span.name}' attributes: {list(attributes.keys())}")
+
+            # Check common attributes
+            if TENANT_ID_KEY in attributes:
+                assert attributes[TENANT_ID_KEY] == agent365_config["tenant_id"]
+
+            if GEN_AI_AGENT_ID_KEY in attributes:
+                assert attributes[GEN_AI_AGENT_ID_KEY] == agent365_config["agent_id"]
+
+            # Check for LLM spans (generation spans)
+            if GEN_AI_SYSTEM_KEY in attributes and attributes[GEN_AI_SYSTEM_KEY] == "openai":
+                if GEN_AI_REQUEST_MODEL_KEY in attributes:
+                    llm_spans_found += 1
+                    print(f"✓ Found LLM span with model: {attributes[GEN_AI_REQUEST_MODEL_KEY]}")
+
+                    # Check for tool calls in messages
+                    if GEN_AI_OUTPUT_MESSAGES_KEY in attributes:
+                        output_messages = attributes[GEN_AI_OUTPUT_MESSAGES_KEY]
+                        if "tool_calls" in output_messages:
+                            print("✓ Found tool calls in LLM output messages")
+
+            # Check for agent spans
+            if "agent" in span.name.lower():
+                agent_spans_found += 1
+                print(f"✓ Found agent span: {span.name}")
+
+            # Check for tool execution spans
+            if "execute_tool" in span.name.lower() or "calculator_tool" in span.name.lower():
+                tool_spans_found += 1
+                print(f"✓ Found tool execution span: {span.name}")
+
+        # Ensure we found the expected span types
+        assert len(self.captured_spans) > 0, "No spans were captured"
+        print(f"✓ Captured {len(self.captured_spans)} spans total")
+        print(
+            f"✓ Found {llm_spans_found} LLM spans, {agent_spans_found} agent spans, and {tool_spans_found} tool spans"
+        )
+
+
+class MockAgent365Exporter:
+    """Mock span processor that captures spans instead of sending them."""
+
+    def __init__(self, captured_spans):
+        self.captured_spans = captured_spans
+
+    def on_start(self, span, parent_context=None):
+        """Called when a span starts."""
+        pass
+
+    def on_end(self, span):
+        """Called when a span ends."""
+        self.captured_spans.append(span)
+
+    def shutdown(self):
+        """Mock shutdown."""
+        pass
+
+    def force_flush(self, timeout_millis: int = 30000) -> bool:
+        """Mock force flush."""
+        return True
diff --git a/uv.lock b/uv.lock

Original file line number	Diff line number	Diff line change
`@@ -38,6 +38,7 @@ dev-dependencies = [`
`38`	`38`	`"ruff>=0.1.0",`
`39`	`39`	`"python-dotenv>=1.0.0",`
`40`	`40`	`"openai>=1.0.0",`
	`41`	`+ "agent-framework-azure-ai >= 0.1.0",`
`41`	`42`	`"azure-identity>=1.12.0",`
`42`	`43`	`"openai-agents >= 0.2.6",`
`43`	`44`	`]`