Auto-commit pending changes before rebase - PR synchronize

cursoragent · cursoragent · commit 1e08fc2b7d25 · 2025-10-14T19:41:35.000Z
diff --git a/test_responses_integration.py b/test_responses_integration.py
@@ -0,0 +1,363 @@
+#!/usr/bin/env python3
+"""
+Test script for OpenAI Responses API integration with Openlayer.
+
+This script tests both Chat Completions API (backward compatibility) and 
+the new Responses API with real API calls to verify tracing functionality.
+"""
+
+import os
+import sys
+import time
+import asyncio
+
+# Set up environment variables
+os.environ["OPENLAYER_INFERENCE_PIPELINE_ID"] = "c3dc9ba7-19da-4779-a14f-252ebf69e1a5"
+os.environ["OPENLAYER_API_KEY"] = "sk-ol-2W6jJYWvo3Op4wfVqk9ah0QcZUnRHlEH"
+os.environ["OPENAI_API_KEY"] = "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"
+
+# Add src to path
+sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'src'))
+
+try:
+    import openai
+    from openlayer.lib import trace_openai, trace_async_openai
+    print("✓ Successfully imported OpenAI and Openlayer libraries")
+except ImportError as e:
+    print(f"✗ Import error: {e}")
+    print("Make sure to install openai: pip install openai")
+    sys.exit(1)
+
+def test_chat_completions_non_streaming():
+    """Test Chat Completions API (non-streaming) with tracing."""
+    print("\n=== Testing Chat Completions API (Non-Streaming) ===")
+    
+    try:
+        # Create and trace OpenAI client
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        
+        # Make a simple chat completion request
+        print("Making Chat Completions API call...")
+        response = traced_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[
+                {"role": "system", "content": "You are a helpful assistant."},
+                {"role": "user", "content": "What is 2 + 2? Give a brief answer."},
+            ],
+            temperature=0.1,
+            max_tokens=50,
+        )
+        
+        print(f"✓ Response: {response.choices[0].message.content}")
+        print(f"✓ Tokens used: {response.usage.total_tokens}")
+        print("✓ Chat Completions API (non-streaming) test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Chat Completions API (non-streaming) test FAILED: {e}")
+        return False
+
+def test_chat_completions_streaming():
+    """Test Chat Completions API (streaming) with tracing."""
+    print("\n=== Testing Chat Completions API (Streaming) ===")
+    
+    try:
+        # Create and trace OpenAI client
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        
+        # Make a streaming chat completion request
+        print("Making streaming Chat Completions API call...")
+        stream = traced_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[
+                {"role": "user", "content": "Count from 1 to 3 slowly."},
+            ],
+            stream=True,
+            temperature=0.1,
+        )
+        
+        print("Response: ", end="", flush=True)
+        for chunk in stream:
+            if chunk.choices[0].delta.content is not None:
+                print(chunk.choices[0].delta.content, end="", flush=True)
+        print()
+        
+        print("✓ Chat Completions API (streaming) test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Chat Completions API (streaming) test FAILED: {e}")
+        return False
+
+def test_responses_api_non_streaming():
+    """Test Responses API (non-streaming) with tracing."""
+    print("\n=== Testing Responses API (Non-Streaming) ===")
+    
+    try:
+        # Create and trace OpenAI client
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        
+        # Check if Responses API is available
+        if not hasattr(traced_client, 'responses'):
+            print("⚠️  Responses API not available in this OpenAI version")
+            return True  # Not a failure, just unavailable
+        
+        # Make a Responses API request
+        print("Making Responses API call...")
+        response = traced_client.responses.create(
+            model="gpt-4o-mini",
+            input="What is 3 + 3? Answer briefly.",
+            max_output_tokens=50,
+            temperature=0.1,
+        )
+        
+        print(f"✓ Response: {response}")
+        print("✓ Responses API (non-streaming) test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Responses API (non-streaming) test FAILED: {e}")
+        # Don't fail the test if Responses API is not available
+        if "not found" in str(e).lower() or "404" in str(e):
+            print("⚠️  Responses API might not be available yet")
+            return True
+        return False
+
+def test_responses_api_streaming():
+    """Test Responses API (streaming) with tracing."""
+    print("\n=== Testing Responses API (Streaming) ===")
+    
+    try:
+        # Create and trace OpenAI client
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        
+        # Check if Responses API is available
+        if not hasattr(traced_client, 'responses'):
+            print("⚠️  Responses API not available in this OpenAI version")
+            return True  # Not a failure, just unavailable
+        
+        # Make a streaming Responses API request
+        print("Making streaming Responses API call...")
+        stream = traced_client.responses.create(
+            model="gpt-4o-mini",
+            input="List numbers 1, 2, 3 with spaces between them.",
+            stream=True,
+            max_output_tokens=30,
+        )
+        
+        print("Response: ", end="", flush=True)
+        for event in stream:
+            # The actual streaming format may vary
+            print(".", end="", flush=True)
+        print()
+        
+        print("✓ Responses API (streaming) test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Responses API (streaming) test FAILED: {e}")
+        # Don't fail the test if Responses API is not available
+        if "not found" in str(e).lower() or "404" in str(e):
+            print("⚠️  Responses API might not be available yet")
+            return True
+        return False
+
+async def test_async_chat_completions():
+    """Test async Chat Completions API with tracing."""
+    print("\n=== Testing Async Chat Completions API ===")
+    
+    try:
+        # Create and trace async OpenAI client
+        client = openai.AsyncOpenAI()
+        traced_client = trace_async_openai(client)
+        
+        # Make async chat completion request
+        print("Making async Chat Completions API call...")
+        response = await traced_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[
+                {"role": "user", "content": "What is 5 + 5? Be brief."},
+            ],
+            temperature=0.1,
+            max_tokens=30,
+        )
+        
+        print(f"✓ Response: {response.choices[0].message.content}")
+        print("✓ Async Chat Completions API test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Async Chat Completions API test FAILED: {e}")
+        return False
+
+async def test_async_responses_api():
+    """Test async Responses API with tracing."""
+    print("\n=== Testing Async Responses API ===")
+    
+    try:
+        # Create and trace async OpenAI client
+        client = openai.AsyncOpenAI()
+        traced_client = trace_async_openai(client)
+        
+        # Check if Responses API is available
+        if not hasattr(traced_client, 'responses'):
+            print("⚠️  Async Responses API not available in this OpenAI version")
+            return True  # Not a failure, just unavailable
+        
+        # Make async Responses API request
+        print("Making async Responses API call...")
+        response = await traced_client.responses.create(
+            model="gpt-4o-mini",
+            input="What is 7 + 7? Answer briefly.",
+            max_output_tokens=30,
+            temperature=0.1,
+        )
+        
+        print(f"✓ Response: {response}")
+        print("✓ Async Responses API test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Async Responses API test FAILED: {e}")
+        # Don't fail the test if Responses API is not available
+        if "not found" in str(e).lower() or "404" in str(e):
+            print("⚠️  Async Responses API might not be available yet")
+            return True
+        return False
+
+def test_function_calling():
+    """Test function calling with Chat Completions API."""
+    print("\n=== Testing Function Calling ===")
+    
+    try:
+        # Create and trace OpenAI client
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        
+        # Define a simple function
+        tools = [{
+            "type": "function",
+            "function": {
+                "name": "calculate_sum",
+                "description": "Calculate the sum of two numbers",
+                "parameters": {
+                    "type": "object",
+                    "properties": {
+                        "a": {"type": "number", "description": "First number"},
+                        "b": {"type": "number", "description": "Second number"}
+                    },
+                    "required": ["a", "b"]
+                }
+            }
+        }]
+        
+        print("Making function call request...")
+        response = traced_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[
+                {"role": "user", "content": "Calculate 15 + 27 using the calculate_sum function."},
+            ],
+            tools=tools,
+            tool_choice="auto",
+        )
+        
+        message = response.choices[0].message
+        if message.tool_calls:
+            print(f"✓ Function called: {message.tool_calls[0].function.name}")
+            print(f"✓ Arguments: {message.tool_calls[0].function.arguments}")
+        else:
+            print(f"✓ Response: {message.content}")
+        
+        print("✓ Function calling test PASSED")
+        return True
+        
+    except Exception as e:
+        print(f"✗ Function calling test FAILED: {e}")
+        return False
+
+def verify_tracing_setup():
+    """Verify that tracing is properly configured."""
+    print("\n=== Verifying Tracing Setup ===")
+    
+    # Check environment variables
+    pipeline_id = os.environ.get("OPENLAYER_INFERENCE_PIPELINE_ID")
+    api_key = os.environ.get("OPENLAYER_API_KEY")
+    openai_key = os.environ.get("OPENAI_API_KEY")
+    
+    print(f"✓ Openlayer Pipeline ID: {pipeline_id[:20]}..." if pipeline_id else "✗ Missing Pipeline ID")
+    print(f"✓ Openlayer API Key: {api_key[:10]}..." if api_key else "✗ Missing API Key")
+    print(f"✓ OpenAI API Key: {openai_key[:10]}..." if openai_key else "✗ Missing OpenAI Key")
+    
+    # Test basic client creation
+    try:
+        client = openai.OpenAI()
+        traced_client = trace_openai(client)
+        print("✓ Successfully created traced OpenAI client")
+        
+        # Check if Responses API is available
+        has_responses = hasattr(traced_client, 'responses')
+        print(f"✓ Responses API available: {has_responses}")
+        
+        return True
+    except Exception as e:
+        print(f"✗ Failed to create traced client: {e}")
+        return False
+
+async def run_async_tests():
+    """Run all async tests."""
+    results = []
+    results.append(await test_async_chat_completions())
+    results.append(await test_async_responses_api())
+    return results
+
+def main():
+    """Run all integration tests."""
+    print("OpenAI Responses API Integration Test")
+    print("=" * 60)
+    
+    # Verify setup
+    if not verify_tracing_setup():
+        print("❌ Setup verification failed!")
+        return 1
+    
+    # Run sync tests
+    results = []
+    results.append(test_chat_completions_non_streaming())
+    results.append(test_chat_completions_streaming())
+    results.append(test_responses_api_non_streaming())
+    results.append(test_responses_api_streaming())
+    results.append(test_function_calling())
+    
+    # Run async tests
+    async_results = asyncio.run(run_async_tests())
+    results.extend(async_results)
+    
+    # Summary
+    passed = sum(results)
+    total = len(results)
+    
+    print(f"\n=== Test Results ===")
+    print(f"✓ Passed: {passed}/{total}")
+    print(f"✗ Failed: {total - passed}/{total}")
+    
+    if passed == total:
+        print("🎉 All tests PASSED!")
+        print("\n✅ Integration Status:")
+        print("✓ Chat Completions API backward compatibility maintained")
+        print("✓ Responses API integration working (when available)")
+        print("✓ Streaming functionality working for both APIs")
+        print("✓ Function calling working")
+        print("✓ Async support working")
+        print("✓ Traces should be visible in Openlayer dashboard")
+        return 0
+    else:
+        print("❌ Some tests failed!")
+        return 1
+
+if __name__ == "__main__":
+    exit_code = main()
+    sys.exit(exit_code)