|
|
"""OpenRouter API client for making LLM requests.""" |
|
|
|
|
|
import httpx |
|
|
from typing import List, Dict, Any, Optional |
|
|
from .config import OPENROUTER_API_KEY, OPENROUTER_API_URL |
|
|
|
|
|
|
|
|
async def query_model( |
|
|
model: str, messages: List[Dict[str, str]], timeout: float = 120.0 |
|
|
) -> Optional[Dict[str, Any]]: |
|
|
""" |
|
|
Query a single model via OpenRouter API. |
|
|
|
|
|
Args: |
|
|
model: OpenRouter model identifier (e.g., "openai/gpt-4o") |
|
|
messages: List of message dicts with 'role' and 'content' |
|
|
timeout: Request timeout in seconds |
|
|
|
|
|
Returns: |
|
|
Response dict with 'content' and optional 'reasoning_details', or None if failed |
|
|
""" |
|
|
headers = { |
|
|
"Authorization": f"Bearer {OPENROUTER_API_KEY}", |
|
|
"Content-Type": "application/json", |
|
|
} |
|
|
|
|
|
payload = { |
|
|
"model": model, |
|
|
"messages": messages, |
|
|
} |
|
|
|
|
|
try: |
|
|
async with httpx.AsyncClient(timeout=timeout) as client: |
|
|
response = await client.post(OPENROUTER_API_URL, headers=headers, json=payload) |
|
|
response.raise_for_status() |
|
|
|
|
|
data = response.json() |
|
|
message = data["choices"][0]["message"] |
|
|
|
|
|
return {"content": message.get("content"), "reasoning_details": message.get("reasoning_details")} |
|
|
|
|
|
except Exception as e: |
|
|
print(f"Error querying model {model}: {e}") |
|
|
return None |
|
|
|
|
|
|
|
|
async def query_model_stream(model: str, messages: List[Dict[str, str]], timeout: float = 120.0): |
|
|
""" |
|
|
Query a model via OpenRouter API and stream the response. |
|
|
Yields content chunks as they arrive. |
|
|
""" |
|
|
headers = { |
|
|
"Authorization": f"Bearer {OPENROUTER_API_KEY}", |
|
|
"Content-Type": "application/json", |
|
|
} |
|
|
|
|
|
payload = {"model": model, "messages": messages, "stream": True} |
|
|
|
|
|
import json |
|
|
|
|
|
try: |
|
|
async with httpx.AsyncClient(timeout=timeout) as client: |
|
|
async with client.stream("POST", OPENROUTER_API_URL, headers=headers, json=payload) as response: |
|
|
response.raise_for_status() |
|
|
async for line in response.aiter_lines(): |
|
|
if line.startswith("data: "): |
|
|
data_str = line[6:] |
|
|
if data_str.strip() == "[DONE]": |
|
|
break |
|
|
try: |
|
|
data = json.loads(data_str) |
|
|
delta = data["choices"][0]["delta"] |
|
|
content = delta.get("content") |
|
|
if content: |
|
|
yield content |
|
|
except json.JSONDecodeError: |
|
|
pass |
|
|
except Exception as e: |
|
|
print(f"Error streaming model {model}: {e}") |
|
|
yield f"[Error: {str(e)}]" |
|
|
|
|
|
|
|
|
async def query_models_parallel( |
|
|
models: List[str], messages: List[Dict[str, str]] |
|
|
) -> Dict[str, Optional[Dict[str, Any]]]: |
|
|
""" |
|
|
Query multiple models in parallel. |
|
|
|
|
|
Args: |
|
|
models: List of OpenRouter model identifiers |
|
|
messages: List of message dicts to send to each model |
|
|
|
|
|
Returns: |
|
|
Dict mapping model identifier to response dict (or None if failed) |
|
|
""" |
|
|
import asyncio |
|
|
|
|
|
|
|
|
tasks = [query_model(model, messages) for model in models] |
|
|
|
|
|
|
|
|
responses = await asyncio.gather(*tasks) |
|
|
|
|
|
|
|
|
return {model: response for model, response in zip(models, responses)} |
|
|
|