moved tests

2026-01-27 17:28:07 +08:00
parent 3bb961d6c1
commit 01faaa66a8
3 changed files with 261 additions and 2 deletions
--- a/tests/test_concurrent_calculator.py
+++ b/tests/test_concurrent_calculator.py
@@ -0,0 +1,259 @@
+#!/usr/bin/env python3
+"""
+Concurrent calculator test for DashScope Application.call against server_dashscope.py
+
+Tests the agent's performance when handling multiple calculator requests concurrently
+with different session IDs.
+
+Instructions:
+- Start the DashScope-compatible server first:
+    uvicorn fastapi_server.server_dashscope:app --host 0.0.0.0 --port 8588 --reload
+- Run this script to test concurrent performance
+"""
+import os
+import uuid
+import time
+import asyncio
+from concurrent.futures import ThreadPoolExecutor, as_completed
+from dataclasses import dataclass
+from typing import Optional
+from dotenv import load_dotenv
+from loguru import logger
+from http import HTTPStatus
+
+# Load variables from a local .env file (if any) before reading the settings below.
+load_dotenv()
+
+# dashscope is a hard requirement. Only an import failure means "not installed",
+# so catch ImportError specifically, print an install hint, and re-raise to keep
+# the original traceback.
+try:
+    from dashscope import Application
+    import dashscope
+except ImportError:
+    print("dashscope package not found. Please install it: pip install dashscope")
+    raise
+
+# Base URL of the running FastAPI server; override with the DS_BASE_URL env var.
+BASE_URL = os.getenv("DS_BASE_URL", "http://127.0.0.1:8588/api/")
+
+# Credentials and application id forwarded to Application.call (env-overridable).
+API_KEY = os.getenv("ALI_API_KEY", "test-key")
+APP_ID = os.getenv("ALI_APP_ID", "test-app")
+
+# Arithmetic expressions sent to the agent, one per request.
+EQUATIONS = [
+    "1234 * 5641",
+    "9876 + 5432 * 2",
+    "100000 / 256",
+    "2 ** 20",
+    "123456 - 78901",
+    "999 * 999",
+    "314159 / 100",
+    "42 ** 3",
+]
+
+
+@dataclass
+class RequestResult:
+    """Outcome of a single calculator request, including its timing."""
+
+    session_id: str  # session id sent with the request
+    equation: str  # expression the agent was asked to calculate
+    response_text: str  # text returned by the agent; "" when the request failed
+    duration_seconds: float  # elapsed time measured with time.perf_counter()
+    success: bool  # False when an exception was caught while making the request
+    error: Optional[str] = None  # str() of the caught exception, if any
+
+
+def make_request(equation: str, session_id: str, stream: bool = True) -> RequestResult:
+    """Send one calculator request and time it.
+
+    Args:
+        equation: Expression inserted into the user prompt.
+        session_id: Session id forwarded to ``Application.call``.
+        stream: When True, iterate over the streamed responses; otherwise
+            treat the call result as a single response object.
+
+    Returns:
+        A ``RequestResult``. A non-OK status or any exception raised while
+        calling or reading the response is reported through ``success=False``
+        and ``error`` rather than raised, so one failing request does not
+        abort a concurrent run. ``response_text`` is always a ``str``.
+    """
+    call_params = {
+        "api_key": API_KEY,
+        "app_id": APP_ID,
+        "session_id": session_id,
+        "messages": [
+            {"role": "system", "content": "You are a helpful assistant."},
+            {"role": "user", "content": f"use calculator to calculate {equation}"},
+        ],
+        "stream": stream,
+    }
+
+    response_text = ""
+    error = None
+    succeeded = False
+    start_time = time.perf_counter()
+
+    try:
+        responses = Application.call(**call_params)
+
+        if stream:
+            # Each chunk is treated as a snapshot of the text so far (as the
+            # previous delta-based logic assumed); keep the latest non-empty
+            # one. Empty/None snapshots never overwrite text already received.
+            for resp in responses:
+                if resp.status_code != HTTPStatus.OK:
+                    raise RuntimeError(f"Error: code={resp.status_code}, message={resp.message}")
+                current_text = getattr(getattr(resp, "output", None), "text", None)
+                if current_text:
+                    response_text = current_text
+        else:
+            if responses.status_code != HTTPStatus.OK:
+                raise RuntimeError(f"Error: code={responses.status_code}, message={responses.message}")
+            # ``text`` may exist but be None; normalise so callers can use len().
+            response_text = getattr(getattr(responses, "output", None), "text", None) or ""
+
+        succeeded = True
+    except Exception as exc:
+        # Deliberately broad: this is a benchmark, failures are recorded, not raised.
+        response_text = ""
+        error = str(exc)
+
+    duration = time.perf_counter() - start_time
+    return RequestResult(
+        session_id=session_id,
+        equation=equation,
+        response_text=response_text,
+        duration_seconds=duration,
+        success=succeeded,
+        error=error,
+    )
+
+
+def run_concurrent_test(equations: list[str], max_workers: int) -> list[RequestResult]:
+    """Fan the equations out over a thread pool and gather every result.
+
+    Each equation is submitted to ``make_request`` with a freshly generated
+    UUID session id. Results are returned in completion order, not in
+    submission order.
+    """
+    with ThreadPoolExecutor(max_workers=max_workers) as pool:
+        pending = [
+            pool.submit(make_request, equation, str(uuid.uuid4()))
+            for equation in equations
+        ]
+        return [finished.result() for finished in as_completed(pending)]
+
+
+def print_results(results: list[RequestResult], concurrency: int):
+    """Print a summary table and per-request details for one test run.
+
+    Args:
+        results: Results of the run; may be empty.
+        concurrency: Number of workers used for the run. It is shown in the
+            header and used to estimate a lower bound on the wall time.
+
+    The wall-time line is an estimate derived from per-request durations:
+    the run cannot finish before its slowest request, nor before the summed
+    durations divided by the number of workers. Reporting only the slowest
+    request would understate runs where requests queue behind each other.
+    """
+    banner = "=" * 70
+    print(f"\n{banner}")
+    print(f"CONCURRENCY LEVEL: {concurrency}")
+    print(banner)
+
+    successful = [r for r in results if r.success]
+    failed = [r for r in results if not r.success]
+
+    durations = [r.duration_seconds for r in results]
+    total_duration = sum(durations)
+    avg_duration = total_duration / len(results) if results else 0
+    max_duration = max(durations, default=0)
+    min_duration = min(durations, default=0)
+    if concurrency > 0:
+        wall_lower_bound = max(max_duration, total_duration / concurrency)
+    else:
+        wall_lower_bound = max_duration
+
+    print("\nSummary:")
+    print(f"  Total requests:    {len(results)}")
+    print(f"  Successful:        {len(successful)}")
+    print(f"  Failed:            {len(failed)}")
+    print(f"  Avg duration:      {avg_duration:.3f}s")
+    print(f"  Min duration:      {min_duration:.3f}s")
+    print(f"  Max duration:      {max_duration:.3f}s")
+    print(f"  Est. wall time:    >= {wall_lower_bound:.3f}s (lower bound from request durations)")
+
+    print("\nDetailed Results:")
+    print(f"  {'Equation':<25} {'Duration':<12} {'Status':<10} {'Session ID (first 8)'}")
+    print(f"  {'-'*25} {'-'*12} {'-'*10} {'-'*20}")
+
+    # Fastest first, so slow outliers end up at the bottom of the table.
+    for r in sorted(results, key=lambda x: x.duration_seconds):
+        status = "✓ OK" if r.success else "✗ FAIL"
+        print(f"  {r.equation:<25} {r.duration_seconds:>8.3f}s   {status:<10} {r.session_id[:8]}")
+        if not r.success:
+            print(f"    Error: {r.error}")
+
+    if successful:
+        print("\nSample Response (first successful):")
+        sample = successful[0]
+        # Guard against a None response text so the preview never crashes.
+        text = sample.response_text or ""
+        response_preview = text[:200] + "..." if len(text) > 200 else text
+        print(f"  Equation: {sample.equation}")
+        print(f"  Response: {response_preview}")
+
+
+def main():
+    """Run the calculator benchmark at several concurrency levels and compare them.
+
+    For each level the run is timed with ``time.perf_counter``, its results
+    are printed via ``print_results``, and a final table reports requests,
+    wall time and throughput per level.
+    """
+    # Point the SDK to our FastAPI implementation
+    if BASE_URL and ("/api/" in BASE_URL):
+        dashscope.base_http_api_url = BASE_URL
+    print(f"Using base_http_api_url = {dashscope.base_http_api_url}")
+
+    # One request per worker, but never fewer than two, so the sequential run
+    # (concurrency=1) handles the same two equations as the concurrency=2 run.
+    concurrency_levels = [1, 2, 4, 8]
+    test_configs = [
+        (level, EQUATIONS[:max(level, 2)]) for level in concurrency_levels
+    ]
+
+    all_results = {}
+    overall_start = time.perf_counter()
+
+    for concurrency, equations in test_configs:
+        print(f"\n>>> Running test with concurrency={concurrency}, equations={len(equations)}")
+        test_start = time.perf_counter()
+        results = run_concurrent_test(equations, max_workers=concurrency)
+        test_duration = time.perf_counter() - test_start
+        all_results[concurrency] = {
+            "results": results,
+            "wall_time": test_duration,
+        }
+        print_results(results, concurrency)
+        print(f"\n  Wall clock time for this test: {test_duration:.3f}s")
+
+    overall_duration = time.perf_counter() - overall_start
+
+    # Final comparison
+    print(f"\n{'='*70}")
+    print("CONCURRENCY COMPARISON")
+    print(f"{'='*70}")
+    print(f"  {'Concurrency':<15} {'Requests':<12} {'Wall Time':<15} {'Throughput'}")
+    print(f"  {'-'*15} {'-'*12} {'-'*15} {'-'*20}")
+
+    for concurrency, data in all_results.items():
+        num_requests = len(data["results"])
+        wall_time = data["wall_time"]
+        # Avoid dividing by zero if a run somehow reports zero elapsed time.
+        throughput = num_requests / wall_time if wall_time > 0 else 0
+        print(f"  {concurrency:<15} {num_requests:<12} {wall_time:<15.3f} {throughput:.2f} req/s")
+
+    print(f"\nTotal test duration: {overall_duration:.3f}s")
+
+
+# Run the benchmark only when this file is executed as a script, not on import.
+if __name__ == "__main__":
+    main()
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
--- a/tests/test_dashscope_client.py
+++ b/tests/test_dashscope_client.py
@@ -0,0 +1,107 @@
+#!/usr/bin/env python3
+"""
+Minimal test for DashScope Application.call against server_dashscope.py
+
+Instructions:
+- Start the DashScope-compatible server first, e.g.:
+    uvicorn fastapi_server.server_dashscope:app --host 0.0.0.0 --port 8588 --reload
+- Set the DS_BASE_URL environment variable (or edit BASE_URL below) to the base URL of the server you started.
+- Optionally set the environment variables FAST_AUTH_KEYS (used as the API key) and ALI_APP_ID.
+"""
+import os
+import uuid
+from dotenv import load_dotenv
+from loguru import logger
+from http import HTTPStatus
+
+# Tag bound onto loguru records emitted by this script.
+TAG = __name__
+
+# Load variables from a local .env file (if any) before reading the settings below.
+load_dotenv()
+
+# Only an import failure means "not installed": catch ImportError specifically,
+# print an install hint, and re-raise to keep the original traceback.
+try:
+    from dashscope import Application
+    import dashscope
+except ImportError:
+    print("dashscope package not found. Please install it: pip install dashscope")
+    raise
+
+
+# Base URL of the running FastAPI server; override with the DS_BASE_URL env var.
+BASE_URL = os.getenv("DS_BASE_URL", "http://127.0.0.1:8588/api/")
+
+# Params
+API_KEY = os.getenv("FAST_AUTH_KEYS", "test-key")
+APP_ID = os.getenv("ALI_APP_ID", "test-app")
+# Fresh session per run so earlier runs cannot influence this conversation.
+SESSION_ID = str(uuid.uuid4())
+
+dialogue = [
+    {"role": "system", "content": "You are a helpful assistant."},
+    {"role": "user", "content": "Say 'the world is awesome and beautiful'."},
+]
+
+# Use the configured APP_ID / SESSION_ID instead of hard-coded literals, so the
+# environment settings above actually take effect.
+call_params = {
+    "api_key": API_KEY,
+    "app_id": APP_ID,
+    "session_id": SESSION_ID,
+    "messages": dialogue,
+    "stream": True,
+}
+
+
+def main():
+    """Call ``Application.call`` with the module-level params and log the output.
+
+    The streamed responses are iterated and each newly received piece of text
+    is logged. If the call result is not iterable (a ``TypeError`` is raised
+    while iterating), it is handled as a single non-streaming response. Any
+    other exception raised while reading the response is logged, not raised.
+    """
+    # Point the SDK to our FastAPI implementation
+    if BASE_URL and ("/api/" in BASE_URL):
+        dashscope.base_http_api_url = BASE_URL
+    print(f"Using base_http_api_url = {dashscope.base_http_api_url}")
+
+    print("\nCalling Application.call(stream=True)...\n")
+    responses = Application.call(**call_params)
+
+    try:
+        last_text = ""
+        for resp in responses:
+            if resp.status_code != HTTPStatus.OK:
+                logger.bind(tag=TAG).error(
+                    f"code={resp.status_code}, message={resp.message}, 请参考文档：https://help.aliyun.com/zh/model-studio/developer-reference/error-code"
+                )
+                continue
+            current_text = getattr(getattr(resp, "output", None), "text", None)
+            if current_text is None:
+                continue
+            # The SDK stream delivers the text so far on each chunk; compute
+            # the newly added part relative to the previous chunk.
+            if len(current_text) >= len(last_text):
+                delta = current_text[len(last_text):]
+            else:
+                # Guard against an occasional rollback to a shorter text.
+                delta = current_text
+            last_text = current_text
+
+            # Log only when this chunk actually added text, so a stale delta
+            # is not repeated for chunks that carry nothing new.
+            if delta:
+                logger.info(f"from stream: {delta}")
+    except TypeError:
+        # Non-streaming fallback (the whole response is returned at once).
+        if responses.status_code != HTTPStatus.OK:
+            logger.bind(tag=TAG).error(
+                f"code={responses.status_code}, message={responses.message}, 请参考文档：https://help.aliyun.com/zh/model-studio/developer-reference/error-code"
+            )
+        else:
+            # ``text`` may exist but be None; normalise before calling len().
+            full_text = getattr(getattr(responses, "output", None), "text", None) or ""
+            logger.bind(tag=TAG).info(
+                f"【阿里百练API服务】完整响应长度: {len(full_text)}"
+            )
+            print("from non-stream: ", full_text)
+    except Exception as e:
+        # Best-effort smoke test: report the failure instead of crashing.
+        logger.bind(tag=TAG).error(f"Error: {e}")
+            
+
+
+# Run the client check only when this file is executed as a script, not on import.
+if __name__ == "__main__":
+    main()
+
+
--- a/tests/test_openai_client.py
+++ b/tests/test_openai_client.py
@@ -0,0 +1,147 @@
+#!/usr/bin/env python3
+"""
+Test for OpenAI-compatible API against server_openai.py
+
+Instructions:
+- Start the OpenAI-compatible server first, e.g.:
+    python fastapi_server/server_openai.py --llm_name qwen-plus --llm_provider openai --base_url https://dashscope.aliyuncs.com/compatible-mode/v1
+- Or with uvicorn:
+    uvicorn fastapi_server.server_openai:app --host 0.0.0.0 --port 8589 --reload
+- Set the OPENAI_BASE_URL and FAST_AUTH_KEYS environment variables (or put them in a .env file):
+    OPENAI_BASE_URL=http://127.0.0.1:8589/v1
+    FAST_AUTH_KEYS=sk-your-api-key-here
+- Make sure the key matches one of the keys in the server's API_KEYS environment variable
+"""
+import os
+from dotenv import load_dotenv
+from loguru import logger
+
+# Module name, kept as a logging tag.
+TAG = __name__
+
+# Load variables from a local .env file (if any) before reading the settings below.
+load_dotenv()
+
+# Only an import failure means "not installed": catch ImportError specifically,
+# print an install hint, and re-raise to keep the original traceback.
+try:
+    from openai import OpenAI
+except ImportError:
+    print("openai package not found. Please install it: pip install openai")
+    raise
+
+
+# Default to a server on localhost so the API key is never sent to a remote
+# host unless OPENAI_BASE_URL is set explicitly.
+BASE_URL = os.getenv("OPENAI_BASE_URL", "http://127.0.0.1:8589/v1")
+# Read FAST_AUTH_KEYS first, falling back to API_KEY; None when neither is set.
+API_KEY = os.getenv("FAST_AUTH_KEYS") or os.getenv("API_KEY")
+
+# Test configuration matching the server setup
+# llm_name: "qwen-plus"
+# llm_provider: "openai"
+# base_url: "https://dashscope.aliyuncs.com/compatible-mode/v1"
+
+# Test messages
+messages = [
+    {"role": "system", "content": "You are a helpful assistant."},
+    {"role": "user", "content": "use calculator to calculate 1234*5641"},
+]
+
+
+def test_streaming():
+    """Test streaming chat completion.
+
+    Streams a completion for the module-level ``messages``, echoing each
+    content fragment as it arrives.
+
+    Returns:
+        The concatenated streamed content.
+
+    Raises:
+        ValueError: If no API key is configured.
+        Exception: Any error raised by the client is logged and re-raised.
+    """
+    print("\n" + "="*60)
+    print("Testing STREAMING chat completion...")
+    print("="*60 + "\n")
+
+    if not API_KEY:
+        logger.warning("API_KEY not set. Set it in environment variable or .env file.")
+        raise ValueError("API_KEY environment variable is required for authentication")
+
+    client = OpenAI(
+        base_url=BASE_URL,
+        api_key=API_KEY
+    )
+
+    try:
+        stream = client.chat.completions.create(
+            model="qwen-plus",  # Using qwen-plus as configured
+            messages=messages,
+            stream=True,
+            extra_body={"thread_id":"2000"}
+        )
+
+        fragments = []
+        for chunk in stream:
+            # A chunk may carry no choices at all (e.g. a usage-only chunk);
+            # skip it instead of failing on choices[0].
+            if not chunk.choices:
+                continue
+            content = chunk.choices[0].delta.content
+            if content is not None:
+                fragments.append(content)
+                print(content, end="", flush=True)
+        full_response = "".join(fragments)
+
+        print("\n\n" + "-"*60)
+        print(f"Full streaming response length: {len(full_response)}")
+        print("-"*60)
+
+        return full_response
+
+    except Exception as e:
+        logger.error(f"Streaming test error: {e}")
+        raise
+
+
+def test_non_streaming():
+    """Test non-streaming chat completion.
+
+    Requests a single completion for the module-level ``messages`` and prints
+    the content, its length and the finish reason.
+
+    Returns:
+        The message content as a string ("" when the response has no content).
+
+    Raises:
+        ValueError: If no API key is configured.
+        Exception: Any error raised by the client is logged and re-raised.
+    """
+    print("\n" + "="*60)
+    print("Testing NON-STREAMING chat completion...")
+    print("="*60 + "\n")
+
+    if not API_KEY:
+        logger.warning("API_KEY not set. Set it in environment variable or .env file.")
+        raise ValueError("API_KEY environment variable is required for authentication")
+
+    client = OpenAI(
+        base_url=BASE_URL,
+        api_key=API_KEY
+    )
+
+    try:
+        response = client.chat.completions.create(
+            model="qwen-plus",  # Using qwen-plus as configured
+            messages=messages,
+            stream=False,
+            extra_body={"thread_id":"2000"}
+        )
+
+        # message.content can be None (e.g. a tool-call-only reply); normalise
+        # it so the length report below and the caller's len() cannot fail.
+        content = response.choices[0].message.content or ""
+        print(f"Response: {content}")
+        print("\n" + "-"*60)
+        print(f"Full non-streaming response length: {len(content)}")
+        print(f"Finish reason: {response.choices[0].finish_reason}")
+        print("-"*60)
+
+        return content
+
+    except Exception as e:
+        logger.error(f"Non-streaming test error: {e}")
+        raise
+
+
+def main(run_streaming: bool = False):
+    """Run the OpenAI-compatible client checks and print a summary.
+
+    Args:
+        run_streaming: Also run ``test_streaming``. Defaults to False, which
+            matches the previous behaviour where that call was disabled. The
+            summary now states that the streaming test was skipped instead
+            of reporting a length of 0 and claiming both tests passed.
+    """
+    print(f"\nUsing base_url = {BASE_URL}")
+    if API_KEY:
+        # Show at most the first 8 chars; a key that short would otherwise be
+        # printed in full, so hide it completely.
+        masked_key = API_KEY[:8] + "..." if len(API_KEY) > 8 else "***"
+        print(f"Using API_KEY = {masked_key}")
+    else:
+        print("WARNING: API_KEY not set!")
+    print()
+
+    streaming_result = test_streaming() if run_streaming else None
+    non_streaming_result = test_non_streaming()
+
+    print("\n" + "="*60)
+    print("SUMMARY")
+    print("="*60)
+    if streaming_result is None:
+        print("Streaming response length: skipped")
+    else:
+        print(f"Streaming response length: {len(streaming_result)}")
+    print(f"Non-streaming response length: {len(non_streaming_result or '')}")
+    if run_streaming:
+        print("\nBoth tests completed successfully!")
+    else:
+        print("\nNon-streaming test completed successfully (streaming test skipped).")
+
+
+# Run the client checks only when this file is executed as a script, not on import.
+if __name__ == "__main__":
+    main()