- These are my routing options:
"models" => ["openai/gpt-oss-20b", "google/gemini-2.5-flash-lite", "openai/o4-mini"], "provider" => %{"only" => ["fireworks", "google-ai-studio", "google-vertex", "groq", "hyperbolic", "inference-net", "ncompass", "novita", "openai", "phala", "together"], "quantizations" => [], "require_parameters" => true}
- Request (generation) metadata:
{
"id": 25736918293,
"generation_id": "gen-1760374167-B0UFhQdqF2L0QKPLSbhw",
"provider_name": "Google",
"model": "openai/gpt-oss-20b",
"app_id": null,
"external_user": redacted,
"streamed": true,
"cancelled": false,
"generation_time": 599378,
"latency": 413,
"moderation_latency": null,
"created_at": "2025-10-13T16:59:27.63713+00:00",
"tokens_prompt": 173,
"tokens_completion": 10795,
"native_tokens_prompt": 232,
"native_tokens_completion": 26827,
"native_tokens_completion_images": null,
"native_tokens_reasoning": 26827,
"native_tokens_cached": 0,
"num_media_prompt": null,
"num_media_completion": 0,
"num_search_results": null,
"origin": "",
"usage": 0,
"finish_reason": null,
"usage_cache": null,
"usage_data": null,
"usage_web": null,
"usage_file": 0,
"byok_usage_inference": 0.0080655,
"provider_responses": [
{
"id": "ly3taPPAGvinnvgPxqnq4Q4",
"endpoint_id": "d14eeefb-d9fc-4732-b0d7-db609aad8308",
"provider_name": "Google",
"status": 200,
"latency": 413,
"is_byok": true
}
],
"provider_api_key_id": 271544,
"api_type": "completions",
"is_byok": true,
"native_finish_reason": null
}
- The request body includes a requirement for JSON schema output, plus the routing options provided above.