Rapid-MLX/tests/integrations/test_pydantic_ai_full.py at main · raullenchai/Rapid-MLX · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
"""Thorough PydanticAI test suite against local rapid-mlx server."""

import asyncio
import os

import httpx as _httpx
from pydantic import BaseModel
from pydantic_ai import Agent
from pydantic_ai.models.openai import OpenAIChatModel
from pydantic_ai.providers.openai import OpenAIProvider

_BASE = os.environ.get("RAPID_MLX_BASE_URL", "http://localhost:8000/v1")
try:
    MODEL_ID = _httpx.get(f"{_BASE}/models", timeout=5).json()["data"][0]["id"]
except Exception:
    MODEL_ID = "default"

model = OpenAIChatModel(
    model_name=MODEL_ID,
    provider=OpenAIProvider(
        base_url=_BASE,
        api_key="not-needed",
    ),
)

results = {}

# === 1. Plain completion ===
print("=== Test 1: Plain completion ===")
try:
    agent = Agent(model)
    r = agent.run_sync("What is 2+2? Reply with just the number.")
    assert "4" in r.output, r.output
    print(f"PASS: {r.output[:80]}")
    results["1_plain"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["1_plain"] = f"FAIL: {e}"

# === 2. Streaming ===
print("\n=== Test 2: Streaming ===")
try:

    async def stream_test():
        agent = Agent(model)
        chunks = []
        async with agent.run_stream(
            "Count from 1 to 5, separated by commas."
        ) as result:
            async for delta in result.stream_text(delta=True):
                chunks.append(delta)
        return "".join(chunks)

    out = asyncio.run(stream_test())
    assert len(out) > 5, f"Too short: {out}"
    assert any(d in out for d in ["1", "2", "3"]), out
    print(f"PASS: chunks={len(out)} chars, output={out[:80]}")
    results["2_stream"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["2_stream"] = f"FAIL: {e}"

# === 3. Structured output (BaseModel) ===
print("\n=== Test 3: Structured output ===")
try:

    class Person(BaseModel):
        name: str
        age: int

    agent = Agent(model, output_type=Person)
    r = agent.run_sync("Extract: 'Alice is 30 years old'")
    assert isinstance(r.output, Person), type(r.output)
    assert r.output.name.lower() == "alice", r.output.name
    assert r.output.age == 30, r.output.age
    print(f"PASS: {r.output}")
    results["3_structured"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["3_structured"] = f"FAIL: {e}"

# === 4. Tool calling (single) ===
print("\n=== Test 4: Single tool call ===")
try:
    agent = Agent(model)

    @agent.tool_plain
    def get_weather(city: str) -> str:
        """Get the weather for a city."""
        return f"sunny, 22C in {city}"

    r = agent.run_sync("What's the weather in Paris?")
    assert "Paris" in r.output or "22" in r.output, r.output
    called = any("get_weather" in str(m) for m in r.all_messages())
    assert called, "tool not called"
    print(f"PASS: {r.output[:80]}")
    results["4_tool_single"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["4_tool_single"] = f"FAIL: {e}"

# === 5. Multi-turn conversation ===
print("\n=== Test 5: Multi-turn ===")
try:
    agent = Agent(model)
    r1 = agent.run_sync("My name is Bob. Remember this.")
    r2 = agent.run_sync("What is my name?", message_history=r1.all_messages())
    assert "bob" in r2.output.lower(), r2.output
    print(f"PASS: turn2 = {r2.output[:80]}")
    results["5_multi_turn"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["5_multi_turn"] = f"FAIL: {e}"

# === 6. Multiple tools, sequential ===
print("\n=== Test 6: Multiple tools ===")
try:
    agent = Agent(model)

    @agent.tool_plain
    def add(a: int, b: int) -> int:
        """Add two numbers."""
        return a + b

    @agent.tool_plain
    def multiply(a: int, b: int) -> int:
        """Multiply two numbers."""
        return a * b

    r = agent.run_sync("Compute (3+4)*5 using the tools. Show the result.")
    assert "35" in r.output, r.output
    called_tools = [str(m) for m in r.all_messages()]
    add_called = any("add" in t for t in called_tools)
    mul_called = any("multiply" in t for t in called_tools)
    assert add_called and mul_called, f"add={add_called} mul={mul_called}"
    print(f"PASS: {r.output[:80]}")
    results["6_multi_tool"] = "PASS"
except Exception as e:
    print(f"FAIL: {e}")
    results["6_multi_tool"] = f"FAIL: {e}"

# === Summary ===
print("\n" + "=" * 50)
passed = sum(1 for v in results.values() if v == "PASS")
total = len(results)
print(f"PydanticAI: {passed}/{total} passed")
for k, v in results.items():
    print(f"  {k}: {v[:120]}")
exit(0 if passed == total else 1)