{
    "models": [
        {
            "slug": "black-forest-labs/flux.2-klein-4b",
            "hf_slug": "",
            "updated_at": "2026-01-16T04:32:32.594442+00:00",
            "created_at": "2026-01-14T22:20:28.450361+00:00",
            "hf_updated_at": null,
            "name": "Black Forest Labs: FLUX.2 Klein 4B",
            "short_name": "FLUX.2 Klein 4B",
            "author": "black-forest-labs",
            "description": "FLUX.2 [klein] 4B is the fastest and most cost-effective model in the FLUX.2 family, optimized for high-throughput use cases while maintaining excellent image quality.\n\nPricing is based on the output image. The first generated megapixel is charged $0.014. Each subsequent megapixel is charged $0.001.",
            "model_version_group_id": null,
            "context_length": 40960,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "black-forest-labs/flux.2-klein-4b",
            "supports_reasoning": false,
            "reasoning_config": {},
            "features": {
                "reasoning_config": {},
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9e2e48d5-2016-4e18-976a-c463146c7f9c",
                "name": "Black Forest Labs | black-forest-labs/flux.2-klein-4b",
                "context_length": 40960,
                "model": {
                    "slug": "black-forest-labs/flux.2-klein-4b",
                    "hf_slug": "",
                    "updated_at": "2026-01-16T04:32:32.594442+00:00",
                    "created_at": "2026-01-14T22:20:28.450361+00:00",
                    "hf_updated_at": null,
                    "name": "Black Forest Labs: FLUX.2 Klein 4B",
                    "short_name": "FLUX.2 Klein 4B",
                    "author": "black-forest-labs",
                    "description": "FLUX.2 [klein] 4B is the fastest and most cost-effective model in the FLUX.2 family, optimized for high-throughput use cases while maintaining excellent image quality.\n\nPricing is based on the output image. The first generated megapixel is charged $0.014. Each subsequent megapixel is charged $0.001.",
                    "model_version_group_id": null,
                    "context_length": 40960,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "black-forest-labs/flux.2-klein-4b",
                    "supports_reasoning": false,
                    "reasoning_config": {},
                    "features": {
                        "reasoning_config": {},
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "black-forest-labs/flux.2-klein-4b",
                "model_variant_permaslug": "black-forest-labs/flux.2-klein-4b",
                "adapter_name": "BlackForestLabsAdapter",
                "provider_name": "Black Forest Labs",
                "provider_info": {
                    "name": "Black Forest Labs",
                    "displayName": "Black Forest Labs",
                    "slug": "black-forest-labs",
                    "baseUrl": "https://api.bfl.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "BlackForestLabsAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://bfl.ai&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "bfl"
                },
                "provider_display_name": "Black Forest Labs",
                "provider_slug": "black-forest-labs",
                "provider_model_id": "flux-2-klein-4b",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_output": "0.00000341796875",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "bfl:upstream_cost_cents": "1",
                    "bfl:informational_output_megapixels": 0.014
                },
                "pricing_version_id": "2fe2f4f4-cec3-4788-9f83-47f3be988f17",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.2-codex",
            "hf_slug": "",
            "updated_at": "2026-01-14T18:06:58.161562+00:00",
            "created_at": "2026-01-14T16:48:35.067026+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.2-Codex",
            "short_name": "GPT-5.2-Codex",
            "author": "openai",
            "description": "GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5.1-Codex, 5.2-Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "openai/gpt-5.2-codex-20260114",
            "supports_reasoning": true,
            "reasoning_config": {
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": true,
                "supported_reasoning_efforts": [
                    "low",
                    "medium",
                    "high",
                    "xhigh"
                ],
                "default_reasoning_effort": "medium"
            },
            "features": {
                "reasoning_config": {
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": true,
                    "supported_reasoning_efforts": [
                        "low",
                        "medium",
                        "high",
                        "xhigh"
                    ],
                    "default_reasoning_effort": "medium"
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "dff70494-a1eb-4be2-b61f-9b2277db56c9",
                "name": "OpenAI | openai/gpt-5.2-codex-20260114",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.2-codex",
                    "hf_slug": "",
                    "updated_at": "2026-01-14T18:06:58.161562+00:00",
                    "created_at": "2026-01-14T16:48:35.067026+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.2-Codex",
                    "short_name": "GPT-5.2-Codex",
                    "author": "openai",
                    "description": "GPT-5.2-Codex is an upgraded version of GPT-5.1-Codex optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5.1-Codex, 5.2-Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "openai/gpt-5.2-codex-20260114",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": true,
                        "supported_reasoning_efforts": [
                            "low",
                            "medium",
                            "high",
                            "xhigh"
                        ],
                        "default_reasoning_effort": "medium"
                    },
                    "features": {
                        "reasoning_config": {
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": true,
                            "supported_reasoning_efforts": [
                                "low",
                                "medium",
                                "high",
                                "xhigh"
                            ],
                            "default_reasoning_effort": "medium"
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.2-codex",
                "model_variant_permaslug": "openai/gpt-5.2-codex-20260114",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.2-codex",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000175",
                    "completion": "0.000014",
                    "input_cache_read": "0.000000175",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000175,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000014,
                    "openai_responses:cached_prompt_tokens": 1.75e-7
                },
                "pricing_version_id": "bdea8a94-f94d-4281-b6a6-da5ffdf163c5",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "allenai/molmo-2-8b",
            "hf_slug": "allenai/Molmo2-8B",
            "updated_at": "2026-01-09T22:20:28.970761+00:00",
            "created_at": "2026-01-09T22:11:12.589713+00:00",
            "hf_updated_at": null,
            "name": "AllenAI: Molmo2 8B (free)",
            "short_name": "Molmo2 8B (free)",
            "author": "allenai",
            "description": "Molmo2-8B is an open vision-language model developed by the Allen Institute for AI (Ai2) as part of the Molmo2 family, supporting image, video, and multi-image understanding and grounding. It is based on Qwen3-8B and uses SigLIP 2 as its vision backbone, outperforming other open-weight, open-data models on short videos, counting, and captioning, while remaining competitive on long-video tasks.",
            "model_version_group_id": null,
            "context_length": 36864,
            "input_modalities": [
                "text",
                "image",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "allenai/molmo-2-8b-20260109",
            "supports_reasoning": false,
            "reasoning_config": {},
            "features": {
                "reasoning_config": {},
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ed2677ef-e5a8-439e-8d23-0bc398915e61",
                "name": "Parasail | allenai/molmo-2-8b-20260109:free",
                "context_length": 36864,
                "model": {
                    "slug": "allenai/molmo-2-8b",
                    "hf_slug": "allenai/Molmo2-8B",
                    "updated_at": "2026-01-09T22:20:28.970761+00:00",
                    "created_at": "2026-01-09T22:11:12.589713+00:00",
                    "hf_updated_at": null,
                    "name": "AllenAI: Molmo2 8B",
                    "short_name": "Molmo2 8B",
                    "author": "allenai",
                    "description": "Molmo2-8B is an open vision-language model developed by the Allen Institute for AI (Ai2) as part of the Molmo2 family, supporting image, video, and multi-image understanding and grounding. It is based on Qwen3-8B and uses SigLIP 2 as its vision backbone, outperforming other open-weight, open-data models on short videos, counting, and captioning, while remaining competitive on long-video tasks.",
                    "model_version_group_id": null,
                    "context_length": 36864,
                    "input_modalities": [
                        "text",
                        "image",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "allenai/molmo-2-8b-20260109",
                    "supports_reasoning": false,
                    "reasoning_config": {},
                    "features": {
                        "reasoning_config": {},
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "allenai/molmo-2-8b:free",
                "model_variant_permaslug": "allenai/molmo-2-8b-20260109:free",
                "adapter_name": "ParasailAdapter",
                "provider_name": "Parasail",
                "provider_info": {
                    "name": "Parasail",
                    "displayName": "Parasail",
                    "slug": "parasail",
                    "baseUrl": "https://api.parasail.io/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.parasail.io/legal/terms",
                        "privacyPolicyURL": "https://www.parasail.io/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P5Ca01in28Ek1oxb5OtfZdEjQ",
                        "user_37qaJKhqfUEFgVF46sarwDHxE50"
                    ],
                    "adapterName": "ParasailAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.parasail.io/&size=256"
                    },
                    "ignoredProviderModels": [
                        "parasail-olmo-2-1124-7b-instruct",
                        "parasail-qwen3-omni-30b-a3b-thinking",
                        "parasail-qwen3-omni-30b-a3b-instruct",
                        "parasail-dots-ocr",
                        "parasail-auto-glm-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Parasail",
                "provider_slug": "parasail/bf16",
                "provider_model_id": "parasail-molmo2-8b",
                "quantization": "bf16",
                "variant": "free",
                "is_free": true,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 36864,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "seed",
                    "stop",
                    "top_k",
                    "logit_bias",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.parasail.io/legal/terms",
                    "privacyPolicyURL": "https://www.parasail.io/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0",
                    "openai:completion_tokens": "0"
                },
                "pricing_version_id": "cba2167e-8a12-41bb-9d8e-a39abd4907cc",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "bytedance-seed/seedream-4.5",
            "hf_slug": "",
            "updated_at": "2025-12-23T20:23:30.403+00:00",
            "created_at": "2025-12-23T19:51:46+00:00",
            "hf_updated_at": null,
            "name": "ByteDance Seed: Seedream 4.5",
            "short_name": "Seedream 4.5",
            "author": "bytedance-seed",
            "description": "Seedream 4.5 is the latest in-house image generation model developed by ByteDance. Compared with Seedream 4.0, it delivers comprehensive improvements, especially in editing consistency, including better preservation of subject details, lighting, and color tone. It also enhances portrait refinement and small-text rendering. The model’s multi-image composition capabilities have been significantly strengthened, and both reasoning performance and visual aesthetics continue to advance, enabling more accurate and artistically expressive image generation.\n\nPricing is $0.04 per output image, regardless of size.",
            "model_version_group_id": null,
            "context_length": 4096,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "bytedance-seed/seedream-4.5-20251203",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": null,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": null,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "2bc65671-3e31-4205-add1-10884b5cda4e",
                "name": "Seed | bytedance-seed/seedream-4.5-20251203",
                "context_length": 4096,
                "model": {
                    "slug": "bytedance-seed/seedream-4.5",
                    "hf_slug": "",
                    "updated_at": "2025-12-23T20:23:30.403+00:00",
                    "created_at": "2025-12-23T19:51:46+00:00",
                    "hf_updated_at": null,
                    "name": "ByteDance Seed: Seedream 4.5",
                    "short_name": "Seedream 4.5",
                    "author": "bytedance-seed",
                    "description": "Seedream 4.5 is the latest in-house image generation model developed by ByteDance. Compared with Seedream 4.0, it delivers comprehensive improvements, especially in editing consistency, including better preservation of subject details, lighting, and color tone. It also enhances portrait refinement and small-text rendering. The model’s multi-image composition capabilities have been significantly strengthened, and both reasoning performance and visual aesthetics continue to advance, enabling more accurate and artistically expressive image generation.\n\nPricing is $0.04 per output image, regardless of size.",
                    "model_version_group_id": null,
                    "context_length": 4096,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "bytedance-seed/seedream-4.5-20251203",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": null,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": null,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "bytedance-seed/seedream-4.5",
                "model_variant_permaslug": "bytedance-seed/seedream-4.5-20251203",
                "adapter_name": "SeedreamAdapter",
                "provider_name": "Seed",
                "provider_info": {
                    "name": "Seed",
                    "displayName": "Seed",
                    "slug": "seed",
                    "baseUrl": "https://ark.ap-southeast.bytepluses.com/api/v3",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                        "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "SeedreamAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://avatars.githubusercontent.com/u/4158466?v=4&size=256"
                    },
                    "ignoredProviderModels": [
                        "ep-20251223020539-6m7wz"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "seedream"
                },
                "provider_display_name": "Seed",
                "provider_slug": "seed",
                "provider_model_id": "ep-20251223020539-6m7wz",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "frequency_penalty",
                    "max_tokens",
                    "temperature",
                    "top_p"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                    "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_output": "0.04",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "seedream:cents_per_image_output": 4,
                    "seedream:informational_output_tokens": "0"
                },
                "pricing_version_id": "1aa3d4ce-6b6a-4cba-9585-5409c3359caf",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "bytedance-seed/seed-1.6-flash",
            "hf_slug": "",
            "updated_at": "2025-12-23T15:50:11.246001+00:00",
            "created_at": "2025-12-23T15:50:11+00:00",
            "hf_updated_at": null,
            "name": "ByteDance Seed: Seed 1.6 Flash",
            "short_name": "Seed 1.6 Flash",
            "author": "bytedance-seed",
            "description": "Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding. It features a 256k context window and can generate outputs of up to 16k tokens.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "image",
                "text",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "bytedance-seed/seed-1.6-flash-20250625",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "e01a1227-001b-44d4-a376-90850668fa84",
                "name": "Seed | bytedance-seed/seed-1.6-flash-20250625",
                "context_length": 262144,
                "model": {
                    "slug": "bytedance-seed/seed-1.6-flash",
                    "hf_slug": "",
                    "updated_at": "2025-12-23T15:50:11.246001+00:00",
                    "created_at": "2025-12-23T15:50:11+00:00",
                    "hf_updated_at": null,
                    "name": "ByteDance Seed: Seed 1.6 Flash",
                    "short_name": "Seed 1.6 Flash",
                    "author": "bytedance-seed",
                    "description": "Seed 1.6 Flash is an ultra-fast multimodal deep thinking model by ByteDance Seed, supporting both text and visual understanding. It features a 256k context window and can generate outputs of up to 16k tokens.",
                    "model_version_group_id": null,
                    "context_length": 262144,
                    "input_modalities": [
                        "image",
                        "text",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "bytedance-seed/seed-1.6-flash-20250625",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "bytedance-seed/seed-1.6-flash",
                "model_variant_permaslug": "bytedance-seed/seed-1.6-flash-20250625",
                "adapter_name": "BytePlusAdapter",
                "provider_name": "Seed",
                "provider_info": {
                    "name": "Seed",
                    "displayName": "Seed",
                    "slug": "seed",
                    "baseUrl": "https://ark.ap-southeast.bytepluses.com/api/v3",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                        "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "BytePlusAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://avatars.githubusercontent.com/u/4158466?v=4&size=256"
                    },
                    "ignoredProviderModels": [
                        "ep-20251223020539-6m7wz"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "byteplus"
                },
                "provider_display_name": "Seed",
                "provider_slug": "seed/fp8",
                "provider_model_id": "ep-20251022091553-b9gf5",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "frequency_penalty",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "tools",
                    "tool_choice",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                    "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000000075",
                    "completion": "0.0000003",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 128000,
                        "prompt": "0.0000001",
                        "completions": "0.0000008",
                        "input_cache_read": "0",
                        "input_cache_write": "0"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 7.5e-8,
                    "byteplus:prompt_tokens": "0.000000075",
                    "openai:completion_tokens": 3e-7,
                    "byteplus:completion_tokens": "0.0000003",
                    "byteplus:long_context_threshold": "128000",
                    "byteplus:prompt_tokens_long_context": "0.0000001",
                    "byteplus:completion_tokens_long_context": "0.0000008"
                },
                "pricing_version_id": "d70609e1-9841-4111-8962-b9967c58b5bb",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "bytedance-seed/seed-1.6",
            "hf_slug": "",
            "updated_at": "2025-12-23T15:49:57.589744+00:00",
            "created_at": "2025-12-23T15:49:57+00:00",
            "hf_updated_at": null,
            "name": "ByteDance Seed: Seed 1.6",
            "short_name": "Seed 1.6",
            "author": "bytedance-seed",
            "description": "Seed 1.6 is a general-purpose model released by the ByteDance Seed team. It incorporates multimodal capabilities and adaptive deep thinking with a 256K context window.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "image",
                "text",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "bytedance-seed/seed-1.6-20250625",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null,
                "is_mandatory_reasoning": null,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null,
                    "is_mandatory_reasoning": null,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d85c3862-4e0d-4f8d-955b-babc62f98124",
                "name": "Seed | bytedance-seed/seed-1.6-20250625",
                "context_length": 262144,
                "model": {
                    "slug": "bytedance-seed/seed-1.6",
                    "hf_slug": "",
                    "updated_at": "2025-12-23T15:49:57.589744+00:00",
                    "created_at": "2025-12-23T15:49:57+00:00",
                    "hf_updated_at": null,
                    "name": "ByteDance Seed: Seed 1.6",
                    "short_name": "Seed 1.6",
                    "author": "bytedance-seed",
                    "description": "Seed 1.6 is a general-purpose model released by the ByteDance Seed team. It incorporates multimodal capabilities and adaptive deep thinking with a 256K context window.",
                    "model_version_group_id": null,
                    "context_length": 262144,
                    "input_modalities": [
                        "image",
                        "text",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "bytedance-seed/seed-1.6-20250625",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null,
                        "is_mandatory_reasoning": null,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null,
                            "is_mandatory_reasoning": null,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "bytedance-seed/seed-1.6",
                "model_variant_permaslug": "bytedance-seed/seed-1.6-20250625",
                "adapter_name": "BytePlusAdapter",
                "provider_name": "Seed",
                "provider_info": {
                    "name": "Seed",
                    "displayName": "Seed",
                    "slug": "seed",
                    "baseUrl": "https://ark.ap-southeast.bytepluses.com/api/v3",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                        "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "BytePlusAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://avatars.githubusercontent.com/u/4158466?v=4&size=256"
                    },
                    "ignoredProviderModels": [
                        "ep-20251223020539-6m7wz"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "byteplus"
                },
                "provider_display_name": "Seed",
                "provider_slug": "seed/fp8",
                "provider_model_id": "ep-20251022091355-w7xt5",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "frequency_penalty",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "tools",
                    "tool_choice",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.byteplus.com/en/docs/legal/docs-terms-of-service",
                    "privacyPolicyURL": "https://docs.byteplus.com/en/docs/legal/docs-privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000025",
                    "completion": "0.000002",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 128000,
                        "prompt": "0.0000005",
                        "completions": "0.000004",
                        "input_cache_read": "0",
                        "input_cache_write": "0"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 2.5e-7,
                    "byteplus:prompt_tokens": "0.00000025",
                    "openai:completion_tokens": 0.000002,
                    "byteplus:completion_tokens": "0.000002",
                    "byteplus:long_context_threshold": "128000",
                    "byteplus:prompt_tokens_long_context": "0.0000005",
                    "byteplus:completion_tokens_long_context": "0.000004"
                },
                "pricing_version_id": "2d6fe62d-b1bd-49e8-a789-9612754d14b7",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-3-flash-preview",
            "hf_slug": "",
            "updated_at": "2025-12-17T16:17:44.159277+00:00",
            "created_at": "2025-12-17T15:57:58+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 3 Flash Preview",
            "short_name": "Gemini 3 Flash Preview",
            "author": "google",
            "description": "Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance. It delivers near Pro level reasoning and tool use performance with substantially lower latency than larger Gemini variants, making it well suited for interactive development, long running agent loops, and collaborative coding tasks. Compared to Gemini 2.5 Flash, it provides broad quality improvements across reasoning, multimodal understanding, and reliability.\n\nThe model supports a 1M token context window and multimodal inputs including text, images, audio, video, and PDFs, with text output. It includes configurable reasoning via thinking levels (minimal, low, medium, high), structured output, tool use, and automatic context caching. Gemini 3 Flash Preview is optimized for users who want strong reasoning and agentic behavior without the cost or latency of full scale frontier models.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "google/gemini-3-flash-preview-20251217",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": null,
                "supports_reasoning_effort": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": [
                    "low",
                    "medium",
                    "high",
                    "minimal"
                ],
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": null,
                    "supports_reasoning_effort": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": [
                        "low",
                        "medium",
                        "high",
                        "minimal"
                    ],
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "google-ai-studio"
            ],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d06bdb18-3cc2-46b0-bf23-922e485dc255",
                "name": "Google | google/gemini-3-flash-preview-20251217",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-3-flash-preview",
                    "hf_slug": "",
                    "updated_at": "2025-12-17T16:17:44.159277+00:00",
                    "created_at": "2025-12-17T15:57:58+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 3 Flash Preview",
                    "short_name": "Gemini 3 Flash Preview",
                    "author": "google",
                    "description": "Gemini 3 Flash Preview is a high speed, high value thinking model designed for agentic workflows, multi turn chat, and coding assistance. It delivers near Pro level reasoning and tool use performance with substantially lower latency than larger Gemini variants, making it well suited for interactive development, long running agent loops, and collaborative coding tasks. Compared to Gemini 2.5 Flash, it provides broad quality improvements across reasoning, multimodal understanding, and reliability.\n\nThe model supports a 1M token context window and multimodal inputs including text, images, audio, video, and PDFs, with text output. It includes configurable reasoning via thinking levels (minimal, low, medium, high), structured output, tool use, and automatic context caching. Gemini 3 Flash Preview is optimized for users who want strong reasoning and agentic behavior without the cost or latency of full scale frontier models.",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "google/gemini-3-flash-preview-20251217",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": null,
                        "supports_reasoning_effort": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": [
                            "low",
                            "medium",
                            "high",
                            "minimal"
                        ],
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": null,
                            "supports_reasoning_effort": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": [
                                "low",
                                "medium",
                                "high",
                                "minimal"
                            ],
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "google-ai-studio"
                    ],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-3-flash-preview",
                "model_variant_permaslug": "google/gemini-3-flash-preview-20251217",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-3-flash-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop",
                    "structured_outputs",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000005",
                    "completion": "0.000003",
                    "image": "0.0000005",
                    "audio": "0.000001",
                    "input_audio_cache": "0.0000001",
                    "input_cache_read": "0.00000005",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.000003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 5e-7,
                    "gemini:reasoning_tokens": 0.000003,
                    "gemini:cache_read_tokens": 5e-8,
                    "gemini:completion_tokens": 0.000003,
                    "gemini:text_input_tokens": 5e-7,
                    "gemini:audio_input_tokens": 0.000001,
                    "gemini:image_input_tokens": 5e-7,
                    "gemini:video_input_tokens": 5e-7,
                    "gemini:cache_read_text_tokens": 5e-8,
                    "gemini:cache_read_audio_tokens": 1e-7,
                    "gemini:cache_read_image_tokens": 5e-8,
                    "gemini:cache_read_video_tokens": 5e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 1e-7,
                    "gemini:cache_read_text_tokens_high_context": 1e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2e-7,
                    "gemini:cache_read_image_tokens_high_context": 1e-7,
                    "gemini:cache_read_video_tokens_high_context": 1e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "74036019-cef5-428a-b27f-0519ac4e5720",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "black-forest-labs/flux.2-max",
            "hf_slug": "",
            "updated_at": "2025-12-16T17:17:13.934433+00:00",
            "created_at": "2025-12-16T03:59:30.221034+00:00",
            "hf_updated_at": null,
            "name": "Black Forest Labs: FLUX.2 Max",
            "short_name": "FLUX.2 Max",
            "author": "black-forest-labs",
            "description": "FLUX.2 [max] is the new top-tier image model from Black Forest Labs, pushing image quality, prompt understanding, and editing consistency to the highest level yet.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nInput: We charge $0.03 for each megapixel on the input (i.e. reference images for editing)\nOutput: The first generated megapixel is charged $0.07. Each subsequent megapixel is charged $0.03.",
            "model_version_group_id": null,
            "context_length": 46864,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "black-forest-labs/flux.2-max",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": null,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": null,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "79c839a0-5da8-4cc4-8324-dab2dd6893b0",
                "name": "Black Forest Labs | black-forest-labs/flux.2-max",
                "context_length": 46864,
                "model": {
                    "slug": "black-forest-labs/flux.2-max",
                    "hf_slug": "",
                    "updated_at": "2025-12-16T17:17:13.934433+00:00",
                    "created_at": "2025-12-16T03:59:30.221034+00:00",
                    "hf_updated_at": null,
                    "name": "Black Forest Labs: FLUX.2 Max",
                    "short_name": "FLUX.2 Max",
                    "author": "black-forest-labs",
                    "description": "FLUX.2 [max] is the new top-tier image model from Black Forest Labs, pushing image quality, prompt understanding, and editing consistency to the highest level yet.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nInput: We charge $0.03 for each megapixel on the input (i.e. reference images for editing)\nOutput: The first generated megapixel is charged $0.07. Each subsequent megapixel is charged $0.03.",
                    "model_version_group_id": null,
                    "context_length": 46864,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "black-forest-labs/flux.2-max",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": null,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": null,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "black-forest-labs/flux.2-max",
                "model_variant_permaslug": "black-forest-labs/flux.2-max",
                "adapter_name": "BlackForestLabsAdapter",
                "provider_name": "Black Forest Labs",
                "provider_info": {
                    "name": "Black Forest Labs",
                    "displayName": "Black Forest Labs",
                    "slug": "black-forest-labs",
                    "baseUrl": "https://api.us3.bfl.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "BlackForestLabsAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://bfl.ai&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "bfl"
                },
                "provider_display_name": "Black Forest Labs",
                "provider_slug": "black-forest-labs",
                "provider_model_id": "flux-2-max",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_output": "0.00001708984375",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "bfl:upstream_cost_cents": "1",
                    "bfl:informational_output_megapixels": 0.07
                },
                "pricing_version_id": "56413436-161e-411a-852e-d10df3fb508b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.2-chat",
            "hf_slug": "",
            "updated_at": "2025-12-11T18:20:07.580251+00:00",
            "created_at": "2025-12-10T18:03:03.398082+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.2 Chat",
            "short_name": "GPT-5.2 Chat",
            "author": "openai",
            "description": "GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on harder queries, improving accuracy on math, coding, and multi-step tasks without slowing down typical conversations. The model is warmer and more conversational by default, with better instruction following and more stable short-form reasoning. GPT-5.2 Chat is designed for high-throughput, interactive workloads where responsiveness and consistency matter more than deep deliberation.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "openai/gpt-5.2-chat-20251211",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "e510ac71-5b26-4f05-b214-f95ba530d45d",
                "name": "OpenAI | openai/gpt-5.2-chat-20251211",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-5.2-chat",
                    "hf_slug": "",
                    "updated_at": "2025-12-11T18:20:07.580251+00:00",
                    "created_at": "2025-12-10T18:03:03.398082+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.2 Chat",
                    "short_name": "GPT-5.2 Chat",
                    "author": "openai",
                    "description": "GPT-5.2 Chat (AKA Instant) is the fast, lightweight member of the 5.2 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on harder queries, improving accuracy on math, coding, and multi-step tasks without slowing down typical conversations. The model is warmer and more conversational by default, with better instruction following and more stable short-form reasoning. GPT-5.2 Chat is designed for high-throughput, interactive workloads where responsiveness and consistency matter more than deep deliberation.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "openai/gpt-5.2-chat-20251211",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.2-chat",
                "model_variant_permaslug": "openai/gpt-5.2-chat-20251211",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.2-chat-latest",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000175",
                    "completion": "0.000014",
                    "input_cache_read": "0.000000175",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000175,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000014,
                    "openai_responses:cached_prompt_tokens": 1.75e-7
                },
                "pricing_version_id": "8b5b51b9-4341-46e1-a5aa-7dd5ffa66a3f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.2-pro",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-12-10T18:03:00.055991+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.2 Pro",
            "short_name": "GPT-5.2 Pro",
            "author": "openai",
            "description": "GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "openai/gpt-5.2-pro-20251211",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": [
                    "medium",
                    "high",
                    "xhigh"
                ],
                "default_reasoning_effort": null,
                "default_reasoning_enabled": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": [
                        "medium",
                        "high",
                        "xhigh"
                    ],
                    "default_reasoning_effort": null,
                    "default_reasoning_enabled": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "1abae580-6f7a-4092-ae6c-b87ce6067f61",
                "name": "OpenAI | openai/gpt-5.2-pro-20251211",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.2-pro",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-12-10T18:03:00.055991+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.2 Pro",
                    "short_name": "GPT-5.2 Pro",
                    "author": "openai",
                    "description": "GPT-5.2 Pro is OpenAI’s most advanced model, offering major improvements in agentic coding and long context performance over GPT-5 Pro. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "openai/gpt-5.2-pro-20251211",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": [
                            "medium",
                            "high",
                            "xhigh"
                        ],
                        "default_reasoning_effort": null,
                        "default_reasoning_enabled": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": [
                                "medium",
                                "high",
                                "xhigh"
                            ],
                            "default_reasoning_effort": null,
                            "default_reasoning_enabled": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.2-pro",
                "model_variant_permaslug": "openai/gpt-5.2-pro-20251211",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.2-pro-2025-12-11",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000021",
                    "completion": "0.000168",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000021,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000168
                },
                "pricing_version_id": "28cb6295-41bb-4331-80fc-0126e243b777",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.2",
            "hf_slug": "",
            "updated_at": "2025-12-11T18:20:09.990885+00:00",
            "created_at": "2025-12-10T18:02:55.765028+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.2",
            "short_name": "GPT-5.2",
            "author": "openai",
            "description": "GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to GPT-5.1. It uses adaptive reasoning to allocate computation dynamically, responding quickly to simple queries while spending more depth on complex tasks.\n\nBuilt for broad task coverage, GPT-5.2 delivers consistent gains across math, coding, sciende, and tool calling workloads, with more coherent long-form answers and improved tool-use reliability.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "openai/gpt-5.2-20251211",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f00142c2-6a93-49ce-9e36-5593b904ce3b",
                "name": "OpenAI | openai/gpt-5.2-20251211",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.2",
                    "hf_slug": "",
                    "updated_at": "2025-12-11T18:20:09.990885+00:00",
                    "created_at": "2025-12-10T18:02:55.765028+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.2",
                    "short_name": "GPT-5.2",
                    "author": "openai",
                    "description": "GPT-5.2 is the latest frontier-grade model in the GPT-5 series, offering stronger agentic and long context perfomance compared to GPT-5.1. It uses adaptive reasoning to allocate computation dynamically, responding quickly to simple queries while spending more depth on complex tasks.\n\nBuilt for broad task coverage, GPT-5.2 delivers consistent gains across math, coding, sciende, and tool calling workloads, with more coherent long-form answers and improved tool-use reliability.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "openai/gpt-5.2-20251211",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.2",
                "model_variant_permaslug": "openai/gpt-5.2-20251211",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.2-2025-12-11",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000175",
                    "completion": "0.000014",
                    "input_cache_read": "0.000000175",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000175,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000014,
                    "openai_responses:cached_prompt_tokens": 1.75e-7
                },
                "pricing_version_id": "cbf3dc18-db59-46fa-9a74-127ca74f3ab7",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "is_mandatory_reasoning": false,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "sourceful/riverflow-v2-max-preview",
            "hf_slug": "",
            "updated_at": "2025-12-09T14:33:09.632974+00:00",
            "created_at": "2025-12-08T23:50:49+00:00",
            "hf_updated_at": null,
            "name": "Sourceful: Riverflow V2 Max Preview",
            "short_name": "Riverflow V2 Max Preview",
            "author": "sourceful",
            "description": "Riverflow V2 Max Preview is the most powerful variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.075 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
            "model_version_group_id": null,
            "context_length": 8192,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "sourceful/riverflow-v2-max-preview",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "8db3f8c4-038a-41ba-924a-e5cf268ee330",
                "name": "Sourceful | sourceful/riverflow-v2-max-preview",
                "context_length": 8192,
                "model": {
                    "slug": "sourceful/riverflow-v2-max-preview",
                    "hf_slug": "",
                    "updated_at": "2025-12-09T14:33:09.632974+00:00",
                    "created_at": "2025-12-08T23:50:49+00:00",
                    "hf_updated_at": null,
                    "name": "Sourceful: Riverflow V2 Max Preview",
                    "short_name": "Riverflow V2 Max Preview",
                    "author": "sourceful",
                    "description": "Riverflow V2 Max Preview is the most powerful variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.075 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
                    "model_version_group_id": null,
                    "context_length": 8192,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "sourceful/riverflow-v2-max-preview",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "sourceful/riverflow-v2-max-preview",
                "model_variant_permaslug": "sourceful/riverflow-v2-max-preview",
                "adapter_name": "SourcefulAdapter",
                "provider_name": "Sourceful",
                "provider_info": {
                    "name": "Sourceful",
                    "displayName": "Sourceful",
                    "slug": "sourceful",
                    "baseUrl": "https://design-api.sourceful.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                        "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "SourcefulAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.sourceful.com&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "sourceful"
                },
                "provider_display_name": "Sourceful",
                "provider_slug": "sourceful",
                "provider_model_id": "sourceful/riverflow-v2-max-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                    "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_token": "0.00001796407185628743",
                    "image_output": "0.075",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "sourceful:cents_per_image_output": 7.5
                },
                "pricing_version_id": "a1b54c23-6587-47bb-b0f5-ccd18f46481f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "sourceful/riverflow-v2-standard-preview",
            "hf_slug": "",
            "updated_at": "2025-12-09T14:33:12.112144+00:00",
            "created_at": "2025-12-08T23:50:36+00:00",
            "hf_updated_at": null,
            "name": "Sourceful: Riverflow V2 Standard Preview",
            "short_name": "Riverflow V2 Standard Preview",
            "author": "sourceful",
            "description": "Riverflow V2 Standard Preview is the standard variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.035 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
            "model_version_group_id": null,
            "context_length": 8192,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "sourceful/riverflow-v2-standard-preview",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "69bbbbea-d1e2-47ed-8d2a-ee2e9a329005",
                "name": "Sourceful | sourceful/riverflow-v2-standard-preview",
                "context_length": 8192,
                "model": {
                    "slug": "sourceful/riverflow-v2-standard-preview",
                    "hf_slug": "",
                    "updated_at": "2025-12-09T14:33:12.112144+00:00",
                    "created_at": "2025-12-08T23:50:36+00:00",
                    "hf_updated_at": null,
                    "name": "Sourceful: Riverflow V2 Standard Preview",
                    "short_name": "Riverflow V2 Standard Preview",
                    "author": "sourceful",
                    "description": "Riverflow V2 Standard Preview is the standard variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.035 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
                    "model_version_group_id": null,
                    "context_length": 8192,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "sourceful/riverflow-v2-standard-preview",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "sourceful/riverflow-v2-standard-preview",
                "model_variant_permaslug": "sourceful/riverflow-v2-standard-preview",
                "adapter_name": "SourcefulAdapter",
                "provider_name": "Sourceful",
                "provider_info": {
                    "name": "Sourceful",
                    "displayName": "Sourceful",
                    "slug": "sourceful",
                    "baseUrl": "https://design-api.sourceful.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                        "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "SourcefulAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.sourceful.com&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "sourceful"
                },
                "provider_display_name": "Sourceful",
                "provider_slug": "sourceful",
                "provider_model_id": "sourceful/riverflow-v2-standard-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                    "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_token": "0.00000838323353293413",
                    "image_output": "0.035",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "sourceful:cents_per_image_output": 3.5
                },
                "pricing_version_id": "1172ed9d-3508-4dd6-a1da-8e463dede88e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "sourceful/riverflow-v2-fast-preview",
            "hf_slug": "",
            "updated_at": "2025-12-09T14:33:14.431363+00:00",
            "created_at": "2025-12-08T23:50:20+00:00",
            "hf_updated_at": null,
            "name": "Sourceful: Riverflow V2 Fast Preview",
            "short_name": "Riverflow V2 Fast Preview",
            "author": "sourceful",
            "description": "Riverflow V2 Fast Preview is the fastest variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.03 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
            "model_version_group_id": null,
            "context_length": 8192,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "sourceful/riverflow-v2-fast-preview",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ee33a0ab-9f6a-4121-aa4a-56d4b3fe630f",
                "name": "Sourceful | sourceful/riverflow-v2-fast-preview",
                "context_length": 8192,
                "model": {
                    "slug": "sourceful/riverflow-v2-fast-preview",
                    "hf_slug": "",
                    "updated_at": "2025-12-09T14:33:14.431363+00:00",
                    "created_at": "2025-12-08T23:50:20+00:00",
                    "hf_updated_at": null,
                    "name": "Sourceful: Riverflow V2 Fast Preview",
                    "short_name": "Riverflow V2 Fast Preview",
                    "author": "sourceful",
                    "description": "Riverflow V2 Fast Preview is the fastest variant of Sourceful's Riverflow V2 preview lineup. This preview version exceeds the performance of Riverflow 1 Family and is Sourceful's first unified text-to-image and image-to-image model family.\n\nPricing is $0.03 per output image, regardless of size.\n\nSourceful imposes a 4.5MB request size limit, therefore it is highly recommended to pass image URLs instead of Base64 data.",
                    "model_version_group_id": null,
                    "context_length": 8192,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "sourceful/riverflow-v2-fast-preview",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "sourceful/riverflow-v2-fast-preview",
                "model_variant_permaslug": "sourceful/riverflow-v2-fast-preview",
                "adapter_name": "SourcefulAdapter",
                "provider_name": "Sourceful",
                "provider_info": {
                    "name": "Sourceful",
                    "displayName": "Sourceful",
                    "slug": "sourceful",
                    "baseUrl": "https://design-api.sourceful.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                        "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "SourcefulAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.sourceful.com&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "sourceful"
                },
                "provider_display_name": "Sourceful",
                "provider_slug": "sourceful",
                "provider_model_id": "sourceful/riverflow-v2-fast-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.sourceful.com/legal/spring-terms-of-use",
                    "privacyPolicyURL": "https://www.sourceful.com/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_token": "0.00000718562874251497",
                    "image_output": "0.03",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "sourceful:cents_per_image_output": 3
                },
                "pricing_version_id": "0ebeb00e-efd5-4be3-93cf-7f57eb03eedb",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "z-ai/glm-4.6v",
            "hf_slug": "zai-org/GLM-4.6V",
            "updated_at": "2025-12-08T15:45:24.970322+00:00",
            "created_at": "2025-12-08T15:24:22.464154+00:00",
            "hf_updated_at": null,
            "name": "Z.AI: GLM 4.6V",
            "short_name": "GLM 4.6V",
            "author": "z-ai",
            "description": "GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media. It supports up to 128K tokens, processes complex page layouts and charts directly as visual inputs, and integrates native multimodal function calling to connect perception with downstream tool execution. The model also enables interleaved image-text generation and UI reconstruction workflows, including screenshot-to-HTML synthesis and iterative visual editing.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "z-ai/glm-4.6-20251208",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.8,
                "top_p": 0.6,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a341c9a0-4b18-429a-b620-9e4fd811803c",
                "name": "SiliconFlow | z-ai/glm-4.6-20251208",
                "context_length": 131072,
                "model": {
                    "slug": "z-ai/glm-4.6v",
                    "hf_slug": "zai-org/GLM-4.6V",
                    "updated_at": "2025-12-08T15:45:24.970322+00:00",
                    "created_at": "2025-12-08T15:24:22.464154+00:00",
                    "hf_updated_at": null,
                    "name": "Z.AI: GLM 4.6V",
                    "short_name": "GLM 4.6V",
                    "author": "z-ai",
                    "description": "GLM-4.6V is a large multimodal model designed for high-fidelity visual understanding and long-context reasoning across images, documents, and mixed media. It supports up to 128K tokens, processes complex page layouts and charts directly as visual inputs, and integrates native multimodal function calling to connect perception with downstream tool execution. The model also enables interleaved image-text generation and UI reconstruction workflows, including screenshot-to-HTML synthesis and iterative visual editing.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "image",
                        "text",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "z-ai/glm-4.6-20251208",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.8,
                        "top_p": 0.6,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "z-ai/glm-4.6v",
                "model_variant_permaslug": "z-ai/glm-4.6-20251208",
                "adapter_name": "SiliconFlowAdapter",
                "provider_name": "SiliconFlow",
                "provider_info": {
                    "name": "SiliconFlow",
                    "displayName": "SiliconFlow",
                    "slug": "siliconflow",
                    "baseUrl": "https://api.siliconflow.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                        "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "SiliconFlowAdapter",
                    "isMultipartSupported": false,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "/images/icons/SiliconFlow.svg"
                    },
                    "ignoredProviderModels": [
                        "inclusionAI/Ling-mini-2.0",
                        "inclusionAI/Ring-flash-2.0",
                        "inclusionAI/Ling-flash-2.0"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "SiliconFlow",
                "provider_slug": "siliconflow/fp8",
                "provider_model_id": "zai-org/GLM-4.6V",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 131072,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "temperature",
                    "top_p",
                    "top_k",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                    "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000003",
                    "completion": "0.0000009",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000003",
                    "openai:completion_tokens": "0.0000009"
                },
                "pricing_version_id": "12be62ec-1783-4c33-a291-7b82056a75df",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_base64_video_input": false,
                    "supports_video_urls": false,
                    "supports_tool_choice": {
                        "literal_none": false,
                        "literal_auto": true,
                        "literal_required": false,
                        "type_function": false
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.1-codex-max",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-12-04T20:08:54.10013+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.1-Codex-Max",
            "short_name": "GPT-5.1-Codex-Max",
            "author": "openai",
            "description": "GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks. It is based on an updated version of the 5.1 reasoning stack and trained on agentic workflows spanning software engineering, mathematics, and research. \nGPT-5.1-Codex-Max delivers faster performance, improved reasoning, and higher token efficiency across the development lifecycle. ",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "openai/gpt-5.1-codex-max-20251204",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f225ad30-4cb3-4e28-b677-0eff326af277",
                "name": "OpenAI | openai/gpt-5.1-codex-max-20251204",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.1-codex-max",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-12-04T20:08:54.10013+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.1-Codex-Max",
                    "short_name": "GPT-5.1-Codex-Max",
                    "author": "openai",
                    "description": "GPT-5.1-Codex-Max is OpenAI’s latest agentic coding model, designed for long-running, high-context software development tasks. It is based on an updated version of the 5.1 reasoning stack and trained on agentic workflows spanning software engineering, mathematics, and research. \nGPT-5.1-Codex-Max delivers faster performance, improved reasoning, and higher token efficiency across the development lifecycle. ",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "openai/gpt-5.1-codex-max-20251204",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.1-codex-max",
                "model_variant_permaslug": "openai/gpt-5.1-codex-max-20251204",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.1-codex-max",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "caa166de-dce5-44c0-a280-fef824e3d18e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "amazon/nova-2-lite-v1",
            "hf_slug": "",
            "updated_at": "2025-12-05T00:11:57.060181+00:00",
            "created_at": "2025-12-02T17:31:12+00:00",
            "hf_updated_at": null,
            "name": "Amazon: Nova 2 Lite",
            "short_name": "Nova 2 Lite",
            "author": "amazon",
            "description": "Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text. \n\nNova 2 Lite demonstrates standout capabilities in processing documents, extracting information from videos, generating code, providing accurate grounded answers, and automating multi-step agentic workflows.",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image",
                "video",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Nova",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "amazon/nova-2-lite-v1",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "b1b489e5-7029-4ab2-9e12-5415b55b4afa",
                "name": "Amazon Bedrock | amazon/nova-2-lite-v1",
                "context_length": 1000000,
                "model": {
                    "slug": "amazon/nova-2-lite-v1",
                    "hf_slug": "",
                    "updated_at": "2025-12-05T00:11:57.060181+00:00",
                    "created_at": "2025-12-02T17:31:12+00:00",
                    "hf_updated_at": null,
                    "name": "Amazon: Nova 2 Lite",
                    "short_name": "Nova 2 Lite",
                    "author": "amazon",
                    "description": "Nova 2 Lite is a fast, cost-effective reasoning model for everyday workloads that can process text, images, and videos to generate text. \n\nNova 2 Lite demonstrates standout capabilities in processing documents, extracting information from videos, generating code, providing accurate grounded answers, and automating multi-step agentic workflows.",
                    "model_version_group_id": null,
                    "context_length": 1000000,
                    "input_modalities": [
                        "text",
                        "image",
                        "video",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Nova",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "amazon/nova-2-lite-v1",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "amazon/nova-2-lite-v1",
                "model_variant_permaslug": "amazon/nova-2-lite-v1",
                "adapter_name": "AmazonBedrockConverseNovaReasoningAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseNovaReasoningAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.amazon.nova-2-lite-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000003",
                    "completion": "0.0000025",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": false,
                    "supports_base64_video_input": true,
                    "supports_video_urls": false,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "is_mandatory_reasoning": false,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/ministral-14b-2512",
            "hf_slug": "mistralai/Ministral-3-14B-Instruct-2512",
            "updated_at": "2025-12-10T16:54:21.432818+00:00",
            "created_at": "2025-12-02T13:22:15.851192+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Ministral 3 14B 2512",
            "short_name": "Ministral 3 14B 2512",
            "author": "mistralai",
            "description": "The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart. A powerful and efficient language model with vision capabilities.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "mistralai/ministral-14b-2512",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.3,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "0b53717b-9af5-4de3-80af-ebedd2adf981",
                "name": "Mistral | mistralai/ministral-14b-2512",
                "context_length": 262144,
                "model": {
                    "slug": "mistralai/ministral-14b-2512",
                    "hf_slug": "mistralai/Ministral-3-14B-Instruct-2512",
                    "updated_at": "2025-12-10T16:54:21.432818+00:00",
                    "created_at": "2025-12-02T13:22:15.851192+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Ministral 3 14B 2512",
                    "short_name": "Ministral 3 14B 2512",
                    "author": "mistralai",
                    "description": "The largest model in the Ministral 3 family, Ministral 3 14B offers frontier capabilities and performance comparable to its larger Mistral Small 3.2 24B counterpart. A powerful and efficient language model with vision capabilities.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "mistralai/ministral-14b-2512",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.3,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/ministral-14b-2512",
                "model_variant_permaslug": "mistralai/ministral-14b-2512",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "ministral-14b-2512",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000002",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 2e-7,
                    "mistral:completion_tokens": 2e-7
                },
                "pricing_version_id": "b0ff8ca8-ffa3-4feb-ad65-91090aa5c22b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/ministral-8b-2512",
            "hf_slug": "mistralai/Ministral-3-8B-Instruct-2512",
            "updated_at": "2025-12-10T16:54:03.715606+00:00",
            "created_at": "2025-12-02T13:20:54.103183+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Ministral 3 8B 2512",
            "short_name": "Ministral 3 8B 2512",
            "author": "mistralai",
            "description": "A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "mistralai/ministral-8b-2512",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.3,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "c85d26e1-1e0c-449b-9775-2afce7ae510b",
                "name": "Mistral | mistralai/ministral-8b-2512",
                "context_length": 262144,
                "model": {
                    "slug": "mistralai/ministral-8b-2512",
                    "hf_slug": "mistralai/Ministral-3-8B-Instruct-2512",
                    "updated_at": "2025-12-10T16:54:03.715606+00:00",
                    "created_at": "2025-12-02T13:20:54.103183+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Ministral 3 8B 2512",
                    "short_name": "Ministral 3 8B 2512",
                    "author": "mistralai",
                    "description": "A balanced model in the Ministral 3 family, Ministral 3 8B is a powerful, efficient tiny language model with vision capabilities.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "mistralai/ministral-8b-2512",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.3,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/ministral-8b-2512",
                "model_variant_permaslug": "mistralai/ministral-8b-2512",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "ministral-8b-2512",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.00000015",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 1.5e-7,
                    "mistral:completion_tokens": 1.5e-7
                },
                "pricing_version_id": "d683019f-fb1b-407c-9fef-5b0efff712e1",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/ministral-3b-2512",
            "hf_slug": "mistralai/Ministral-3-3B-Instruct-2512",
            "updated_at": "2025-12-10T16:53:53.577361+00:00",
            "created_at": "2025-12-02T13:19:20.726635+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Ministral 3 3B 2512",
            "short_name": "Ministral 3 3B 2512",
            "author": "mistralai",
            "description": "The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "mistralai/ministral-3b-2512",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.3,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "b9f6828f-aef9-498a-91f5-6816fbf72420",
                "name": "Mistral | mistralai/ministral-3b-2512",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/ministral-3b-2512",
                    "hf_slug": "mistralai/Ministral-3-3B-Instruct-2512",
                    "updated_at": "2025-12-10T16:53:53.577361+00:00",
                    "created_at": "2025-12-02T13:19:20.726635+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Ministral 3 3B 2512",
                    "short_name": "Ministral 3 3B 2512",
                    "author": "mistralai",
                    "description": "The smallest model in the Ministral 3 family, Ministral 3 3B is a powerful, efficient tiny language model with vision capabilities.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "mistralai/ministral-3b-2512",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.3,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/ministral-3b-2512",
                "model_variant_permaslug": "mistralai/ministral-3b-2512",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "ministral-3b-2512",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000001",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 1e-7,
                    "mistral:completion_tokens": 1e-7
                },
                "pricing_version_id": "ec8022e6-9795-4d78-a729-b7c198e0326d",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-large-2512",
            "hf_slug": "",
            "updated_at": "2025-12-02T15:19:24.969824+00:00",
            "created_at": "2025-12-01T21:27:52.65109+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Large 3 2512",
            "short_name": "Mistral Large 3 2512",
            "author": "mistralai",
            "description": "Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "",
            "permaslug": "mistralai/mistral-large-2512",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.0645,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "text",
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "fa718841-07ea-4b7e-b8a3-6069545c7e6a",
                "name": "Mistral | mistralai/mistral-large-2512",
                "context_length": 262144,
                "model": {
                    "slug": "mistralai/mistral-large-2512",
                    "hf_slug": "",
                    "updated_at": "2025-12-02T15:19:24.969824+00:00",
                    "created_at": "2025-12-01T21:27:52.65109+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Large 3 2512",
                    "short_name": "Mistral Large 3 2512",
                    "author": "mistralai",
                    "description": "Mistral Large 3 2512 is Mistral’s most capable model to date, featuring a sparse mixture-of-experts architecture with 41B active parameters (675B total), and released under the Apache 2.0 license.",
                    "model_version_group_id": null,
                    "context_length": 256000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "",
                    "permaslug": "mistralai/mistral-large-2512",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.0645,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "text",
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-large-2512",
                "model_variant_permaslug": "mistralai/mistral-large-2512",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "mistral-large-2512",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000005",
                    "completion": "0.0000015",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 5e-7,
                    "mistral:completion_tokens": 0.0000015
                },
                "pricing_version_id": "063c942f-5035-4cfc-8b26-911b375a5c4a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": false,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "black-forest-labs/flux.2-flex",
            "hf_slug": "",
            "updated_at": "2025-11-25T16:34:07.604557+00:00",
            "created_at": "2025-11-25T04:46:27.810953+00:00",
            "hf_updated_at": null,
            "name": "Black Forest Labs: FLUX.2 Flex",
            "short_name": "FLUX.2 Flex",
            "author": "black-forest-labs",
            "description": "FLUX.2 [flex] excels at rendering complex text, typography, and fine details, and supports multi-reference editing in the same unified architecture.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nWe charge $0.06 for each megapixel on both input and output side.",
            "model_version_group_id": null,
            "context_length": 67344,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "black-forest-labs/flux.2-flex",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ec92e60a-e4f4-474e-b1aa-7b48a509b343",
                "name": "Black Forest Labs | black-forest-labs/flux.2-flex",
                "context_length": 67344,
                "model": {
                    "slug": "black-forest-labs/flux.2-flex",
                    "hf_slug": "",
                    "updated_at": "2025-11-25T16:34:07.604557+00:00",
                    "created_at": "2025-11-25T04:46:27.810953+00:00",
                    "hf_updated_at": null,
                    "name": "Black Forest Labs: FLUX.2 Flex",
                    "short_name": "FLUX.2 Flex",
                    "author": "black-forest-labs",
                    "description": "FLUX.2 [flex] excels at rendering complex text, typography, and fine details, and supports multi-reference editing in the same unified architecture.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nWe charge $0.06 for each megapixel on both input and output side.",
                    "model_version_group_id": null,
                    "context_length": 67344,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "black-forest-labs/flux.2-flex",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "black-forest-labs/flux.2-flex",
                "model_variant_permaslug": "black-forest-labs/flux.2-flex",
                "adapter_name": "BlackForestLabsAdapter",
                "provider_name": "Black Forest Labs",
                "provider_info": {
                    "name": "Black Forest Labs",
                    "displayName": "Black Forest Labs",
                    "slug": "black-forest-labs",
                    "baseUrl": "https://api.us3.bfl.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "BlackForestLabsAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://bfl.ai&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "bfl"
                },
                "provider_display_name": "Black Forest Labs",
                "provider_slug": "black-forest-labs",
                "provider_model_id": "flux-2-flex",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_token": "0.0000146484375",
                    "image_output": "0.0000146484375",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "bfl:upstream_cost_cents": "1",
                    "bfl:informational_input_megapixels": 0.06,
                    "bfl:informational_output_megapixels": 0.06
                },
                "pricing_version_id": "9fbdc6b3-1cfc-40a8-ad76-5f6cf1c6a31c",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "black-forest-labs/flux.2-pro",
            "hf_slug": "",
            "updated_at": "2025-11-25T16:34:12.266076+00:00",
            "created_at": "2025-11-25T00:24:34.639016+00:00",
            "hf_updated_at": null,
            "name": "Black Forest Labs: FLUX.2 Pro",
            "short_name": "FLUX.2 Pro",
            "author": "black-forest-labs",
            "description": "A high-end image generation and editing model focused on frontier-level visual quality and reliability. It delivers strong prompt adherence, stable lighting, sharp textures, and consistent character/style reproduction across multi-reference inputs. Designed for production workloads, it balances speed and quality while supporting text-to-image and image editing up to 4 MP resolution.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nInput: We charge $0.015 for each megapixel on the input (i.e. reference images for editing)\nOutput: The first megapixel is charged $0.03 and then each subsequent MP will be charged $0.015. ",
            "model_version_group_id": null,
            "context_length": 46864,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "image"
            ],
            "has_text_output": false,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "black-forest-labs/flux.2-pro",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "660ad218-5dae-4429-83fa-528514aa9bb8",
                "name": "Black Forest Labs | black-forest-labs/flux.2-pro",
                "context_length": 46864,
                "model": {
                    "slug": "black-forest-labs/flux.2-pro",
                    "hf_slug": "",
                    "updated_at": "2025-11-25T16:34:12.266076+00:00",
                    "created_at": "2025-11-25T00:24:34.639016+00:00",
                    "hf_updated_at": null,
                    "name": "Black Forest Labs: FLUX.2 Pro",
                    "short_name": "FLUX.2 Pro",
                    "author": "black-forest-labs",
                    "description": "A high-end image generation and editing model focused on frontier-level visual quality and reliability. It delivers strong prompt adherence, stable lighting, sharp textures, and consistent character/style reproduction across multi-reference inputs. Designed for production workloads, it balances speed and quality while supporting text-to-image and image editing up to 4 MP resolution.\n\nPricing is as follows, [per the docs](https://bfl.ai/pricing?category=flux.2):\nInput: We charge $0.015 for each megapixel on the input (i.e. reference images for editing)\nOutput: The first megapixel is charged $0.03 and then each subsequent MP will be charged $0.015. ",
                    "model_version_group_id": null,
                    "context_length": 46864,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "image"
                    ],
                    "has_text_output": false,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "black-forest-labs/flux.2-pro",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "black-forest-labs/flux.2-pro",
                "model_variant_permaslug": "black-forest-labs/flux.2-pro",
                "adapter_name": "BlackForestLabsAdapter",
                "provider_name": "Black Forest Labs",
                "provider_info": {
                    "name": "Black Forest Labs",
                    "displayName": "Black Forest Labs",
                    "slug": "black-forest-labs",
                    "baseUrl": "https://api.bfl.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                    },
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "BlackForestLabsAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://bfl.ai&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "bfl"
                },
                "provider_display_name": "Black Forest Labs",
                "provider_slug": "black-forest-labs",
                "provider_model_id": "flux-2-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://bfl.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://bfl.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "image_output": "0.00000732421875",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "bfl:upstream_cost_cents": "1",
                    "bfl:informational_output_megapixels": 0.03
                },
                "pricing_version_id": "e091d2ff-e677-4f80-8303-6c2485098a3f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-opus-4.5",
            "hf_slug": "",
            "updated_at": "2026-01-15T17:57:03.680811+00:00",
            "created_at": "2025-11-24T18:56:20+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Opus 4.5",
            "short_name": "Claude Opus 4.5",
            "author": "anthropic",
            "description": "Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use. It offers strong multimodal capabilities, competitive performance across real-world coding and reasoning benchmarks, and improved robustness to prompt injection. The model is designed to operate efficiently across varied effort levels, enabling developers to trade off speed, depth, and token usage depending on task requirements. It comes with a new parameter to control token efficiency, which can be accessed using the OpenRouter Verbosity parameter with low, medium, or high.\n\nOpus 4.5 supports advanced tool use, extended context management, and coordinated multi-agent setups, making it well-suited for autonomous research, debugging, multi-step planning, and spreadsheet/browser manipulation. It delivers substantial gains in structured reasoning, execution reliability, and alignment compared to prior Opus generations, while reducing token overhead and improving performance on long-running tasks.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4.5-opus-20251124",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "amazon-bedrock",
                "google-vertex",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "be883404-eb42-4b2d-b6e4-c7daa3aa8d62",
                "name": "Anthropic | anthropic/claude-4.5-opus-20251124",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-opus-4.5",
                    "hf_slug": "",
                    "updated_at": "2026-01-15T17:57:03.680811+00:00",
                    "created_at": "2025-11-24T18:56:20+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Opus 4.5",
                    "short_name": "Claude Opus 4.5",
                    "author": "anthropic",
                    "description": "Claude Opus 4.5 is Anthropic’s frontier reasoning model optimized for complex software engineering, agentic workflows, and long-horizon computer use. It offers strong multimodal capabilities, competitive performance across real-world coding and reasoning benchmarks, and improved robustness to prompt injection. The model is designed to operate efficiently across varied effort levels, enabling developers to trade off speed, depth, and token usage depending on task requirements. It comes with a new parameter to control token efficiency, which can be accessed using the OpenRouter Verbosity parameter with low, medium, or high.\n\nOpus 4.5 supports advanced tool use, extended context management, and coordinated multi-agent setups, making it well-suited for autonomous research, debugging, multi-step planning, and spreadsheet/browser manipulation. It delivers substantial gains in structured reasoning, execution reliability, and alignment compared to prior Opus generations, while reducing token overhead and improving performance on long-running tasks.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4.5-opus-20251124",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "amazon-bedrock",
                        "google-vertex",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-opus-4.5",
                "model_variant_permaslug": "anthropic/claude-4.5-opus-20251124",
                "adapter_name": "AnthropicMessageAdapter",
                "provider_name": "Anthropic",
                "provider_info": {
                    "name": "Anthropic",
                    "displayName": "Anthropic",
                    "slug": "anthropic",
                    "baseUrl": "https://api.anthropic.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.anthropic.com/legal/commercial-terms",
                        "privacyPolicyURL": "https://www.anthropic.com/legal/privacy",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AnthropicMessageAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.anthropic.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Anthropic.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Anthropic",
                "provider_slug": "anthropic",
                "provider_model_id": "claude-opus-4-5-20251101",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "stop",
                    "reasoning",
                    "include_reasoning",
                    "tool_choice",
                    "tools",
                    "structured_outputs",
                    "response_format",
                    "verbosity"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.anthropic.com/legal/commercial-terms",
                    "privacyPolicyURL": "https://www.anthropic.com/legal/privacy",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000005",
                    "completion": "0.000025",
                    "input_cache_read": "0.0000005",
                    "input_cache_write": "0.00000625",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000005,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 5e-7,
                    "anthropic:completion_tokens": 0.000025,
                    "anthropic:cache_write_1h_tokens": 0.00001,
                    "anthropic:cache_write_5m_tokens": 0.00000625
                },
                "pricing_version_id": "2b155b3b-876e-446f-98ca-ad47df5dffce",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": 40,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-3-pro-image-preview",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-11-20T15:49:57.064095+00:00",
            "hf_updated_at": null,
            "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)",
            "short_name": "Nano Banana Pro (Gemini 3 Pro Image Preview)",
            "author": "google",
            "description": "Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro. It extends the original Nano Banana with significantly improved multimodal reasoning, real-world grounding, and high-fidelity visual synthesis. The model generates context-rich graphics, from infographics and diagrams to cinematic composites, and can incorporate real-time information via Search grounding.\n\nIt offers industry-leading text rendering in images (including long passages and multilingual layouts), consistent multi-image blending, and accurate identity preservation across up to five subjects. Nano Banana Pro adds fine-grained creative controls such as localized edits, lighting and focus adjustments, camera transformations, and support for 2K/4K outputs and flexible aspect ratios. It is designed for professional-grade design, product visualization, storyboarding, and complex multi-element compositions while remaining efficient for general image creation workflows.",
            "model_version_group_id": null,
            "context_length": 65536,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "image",
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "google/gemini-3-pro-image-preview-20251120",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": false,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": [],
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": false,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": [],
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f5a725e2-8f66-4754-9232-7550685ab3d0",
                "name": "Google AI Studio | google/gemini-3-pro-image-preview-20251120",
                "context_length": 65536,
                "model": {
                    "slug": "google/gemini-3-pro-image-preview",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-11-20T15:49:57.064095+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Nano Banana Pro (Gemini 3 Pro Image Preview)",
                    "short_name": "Nano Banana Pro (Gemini 3 Pro Image Preview)",
                    "author": "google",
                    "description": "Nano Banana Pro is Google’s most advanced image-generation and editing model, built on Gemini 3 Pro. It extends the original Nano Banana with significantly improved multimodal reasoning, real-world grounding, and high-fidelity visual synthesis. The model generates context-rich graphics, from infographics and diagrams to cinematic composites, and can incorporate real-time information via Search grounding.\n\nIt offers industry-leading text rendering in images (including long passages and multilingual layouts), consistent multi-image blending, and accurate identity preservation across up to five subjects. Nano Banana Pro adds fine-grained creative controls such as localized edits, lighting and focus adjustments, camera transformations, and support for 2K/4K outputs and flexible aspect ratios. It is designed for professional-grade design, product visualization, storyboarding, and complex multi-element compositions while remaining efficient for general image creation workflows.",
                    "model_version_group_id": null,
                    "context_length": 65536,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "image",
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "google/gemini-3-pro-image-preview-20251120",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": false,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": [],
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": false,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": [],
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-3-pro-image-preview",
                "model_variant_permaslug": "google/gemini-3-pro-image-preview-20251120",
                "adapter_name": "GoogleAIStudioGeminiAdapter",
                "provider_name": "Google AI Studio",
                "provider_info": {
                    "name": "Google AI Studio",
                    "displayName": "Google AI Studio",
                    "slug": "google-ai-studio",
                    "baseUrl": "https://generativelanguage.googleapis.com/v1beta",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 55,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleAIStudioGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleAIStudio.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-1p",
                        "gemini-2.5-pro-1p-recitation-off",
                        "gemini-2.5-flash-1p",
                        "gemini-2.5-flash-1p-recitation-off",
                        "gemini-2.5-flash-lite-preview-06-11-summarized",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-1.5-pro-latest",
                        "gemini-1.5-pro",
                        "gemini-1.5-flash-latest",
                        "gemini-1.5-flash",
                        "gemini-1.5-flash-8b",
                        "gemini-1.5-flash-8b-latest",
                        "gemini-2.5-pro-preview-03-25",
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-2.0-flash-lite-preview",
                        "gemini-2.0-pro-exp",
                        "gemini-2.0-flash-thinking-exp",
                        "gemini-2.5-flash-preview-tts",
                        "gemini-2.5-pro-preview-tts",
                        "learnlm-2.0-flash-experimental",
                        "gracefulgolem",
                        "gemini-2.5-flash-preview-05-20",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.0-flash-exp-image-generation",
                        "gemini-2.0-flash-preview-image-generation",
                        "gemini-2.0-flash-lite-preview-02-05",
                        "gemini-2.0-pro-exp-02-05",
                        "gemini-exp-1206",
                        "gemini-2.0-flash-thinking-exp-01-21",
                        "gemini-2.0-flash-thinking-exp-1219",
                        "gemma-3-1b-it",
                        "gemini-flash-latest",
                        "gemini-flash-lite-latest",
                        "gemini-pro-latest",
                        "gemini-robotics-er-1.5-preview",
                        "gemini-embedding-001",
                        "riftrunner-fst-rewind",
                        "gemini-3-pro-image-preview",
                        "nano-banana-pro-preview",
                        "fiercefalcon",
                        "fiercefalcon-inline-citation",
                        "fiercefalcon-blocked-sites"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google AI Studio",
                "provider_slug": "google-ai-studio",
                "provider_model_id": "gemini-3-pro-image-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000012",
                    "image": "0.000002",
                    "audio": "0.000002",
                    "input_audio_cache": "0.0000002",
                    "input_cache_read": "0.0000002",
                    "input_cache_write": "0.000000375",
                    "internal_reasoning": "0.000012",
                    "image_output": "0.00012",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 0.000002,
                    "gemini:reasoning_tokens": 0.000012,
                    "gemini:cache_read_tokens": 2e-7,
                    "gemini:completion_tokens": 0.000012,
                    "gemini:text_input_tokens": 0.000002,
                    "gemini:audio_input_tokens": 0.000002,
                    "gemini:image_input_tokens": 0.000002,
                    "gemini:video_input_tokens": 0.000002,
                    "gemini:image_output_tokens": 0.00012,
                    "gemini:cache_read_text_tokens": 2e-7,
                    "gemini:cache_read_audio_tokens": 2e-7,
                    "gemini:cache_read_image_tokens": 2e-7,
                    "gemini:cache_read_video_tokens": 2e-7,
                    "gemini:cache_write_storage_hours": 0.0000045,
                    "gemini:prompt_tokens_high_context": 0.000004,
                    "gemini:reasoning_tokens_high_context": 0.000018,
                    "gemini:cache_read_tokens_high_context": 4e-7,
                    "gemini:completion_tokens_high_context": 0.000018,
                    "gemini:cache_read_text_tokens_high_context": 4e-7,
                    "gemini:cache_read_audio_tokens_high_context": 4e-7,
                    "gemini:cache_read_image_tokens_high_context": 4e-7,
                    "gemini:cache_read_video_tokens_high_context": 4e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "4c53647d-b03e-43cf-a0eb-1ea158e4626f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": 250,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "x-ai/grok-4.1-fast",
            "hf_slug": "",
            "updated_at": "2025-12-03T20:06:03.459371+00:00",
            "created_at": "2025-11-19T21:25:02.724692+00:00",
            "hf_updated_at": null,
            "name": "xAI: Grok 4.1 Fast",
            "short_name": "Grok 4.1 Fast",
            "author": "x-ai",
            "description": "Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep research. 2M context window.\n\nReasoning can be enabled/disabled using the `reasoning` `enabled` parameter in the API. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#controlling-reasoning-tokens)",
            "model_version_group_id": null,
            "context_length": 2000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Grok",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "The free Grok 4.1 Fast period has ended. To continue using this model, please migrate to the paid slug: x-ai/grok-4.1-fast",
            "permaslug": "x-ai/grok-4.1-fast",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.95,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9821aa0e-dce3-4c27-9716-161359123d0b",
                "name": "xAI | x-ai/grok-4.1-fast",
                "context_length": 2000000,
                "model": {
                    "slug": "x-ai/grok-4.1-fast",
                    "hf_slug": "",
                    "updated_at": "2025-12-03T20:06:03.459371+00:00",
                    "created_at": "2025-11-19T21:25:02.724692+00:00",
                    "hf_updated_at": null,
                    "name": "xAI: Grok 4.1 Fast",
                    "short_name": "Grok 4.1 Fast",
                    "author": "x-ai",
                    "description": "Grok 4.1 Fast is xAI's best agentic tool calling model that shines in real-world use cases like customer support and deep research. 2M context window.\n\nReasoning can be enabled/disabled using the `reasoning` `enabled` parameter in the API. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#controlling-reasoning-tokens)",
                    "model_version_group_id": null,
                    "context_length": 2000000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Grok",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": "The free Grok 4.1 Fast period has ended. To continue using this model, please migrate to the paid slug: x-ai/grok-4.1-fast",
                    "permaslug": "x-ai/grok-4.1-fast",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.7,
                        "top_p": 0.95,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "x-ai/grok-4.1-fast",
                "model_variant_permaslug": "x-ai/grok-4.1-fast",
                "adapter_name": "XAIResponsesAdapter",
                "provider_name": "xAI",
                "provider_info": {
                    "name": "xAI",
                    "displayName": "xAI",
                    "slug": "xai",
                    "baseUrl": "https://api.x.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                        "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "XAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.x.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://x.ai/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "xAI",
                "provider_slug": "xai",
                "provider_model_id": "grok-4-1-fast-non-reasoning",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 30000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "logprobs",
                    "top_logprobs",
                    "response_format",
                    "tools",
                    "tool_choice",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                    "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000005",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0.00000005",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 128000,
                        "prompt": "0.0000004",
                        "completions": "0.000001",
                        "input_cache_read": "0.00000005"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-3-pro-preview",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-11-18T14:04:28+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 3 Pro Preview",
            "short_name": "Gemini 3 Pro Preview",
            "author": "google",
            "description": "Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context window. Reasoning Details must be preserved when using multi-turn tool calling, see our docs here: https://openrouter.ai/docs/use-cases/reasoning-tokens#preserving-reasoning-blocks. It delivers state-of-the-art benchmark results in general reasoning, STEM problem solving, factual QA, and multimodal understanding, including leading scores on LMArena, GPQA Diamond, MathArena Apex, MMMU-Pro, and Video-MMMU. Interactions emphasize depth and interpretability: the model is designed to infer intent with minimal prompting and produce direct, insight-focused responses.\n\nBuilt for advanced development and agentic workflows, Gemini 3 Pro provides robust tool-calling, long-horizon planning stability, and strong zero-shot generation for complex UI, visualization, and coding tasks. It excels at agentic coding (SWE-Bench Verified, Terminal-Bench 2.0), multimodal analysis, and structured long-form tasks such as research synthesis, planning, and interactive learning experiences. Suitable applications include autonomous agents, coding assistants, multimodal analytics, scientific reasoning, and high-context information processing.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "google/gemini-3-pro-preview-20251117",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": [
                    "high",
                    "low"
                ],
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": [
                        "high",
                        "low"
                    ],
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ca4e1f52-1f15-4258-a4eb-d6b56c0c4057",
                "name": "Google | google/gemini-3-pro-preview-20251117",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-3-pro-preview",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-11-18T14:04:28+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 3 Pro Preview",
                    "short_name": "Gemini 3 Pro Preview",
                    "author": "google",
                    "description": "Gemini 3 Pro is Google’s flagship frontier model for high-precision multimodal reasoning, combining strong performance across text, image, video, audio, and code with a 1M-token context window. Reasoning Details must be preserved when using multi-turn tool calling, see our docs here: https://openrouter.ai/docs/use-cases/reasoning-tokens#preserving-reasoning-blocks. It delivers state-of-the-art benchmark results in general reasoning, STEM problem solving, factual QA, and multimodal understanding, including leading scores on LMArena, GPQA Diamond, MathArena Apex, MMMU-Pro, and Video-MMMU. Interactions emphasize depth and interpretability: the model is designed to infer intent with minimal prompting and produce direct, insight-focused responses.\n\nBuilt for advanced development and agentic workflows, Gemini 3 Pro provides robust tool-calling, long-horizon planning stability, and strong zero-shot generation for complex UI, visualization, and coding tasks. It excels at agentic coding (SWE-Bench Verified, Terminal-Bench 2.0), multimodal analysis, and structured long-form tasks such as research synthesis, planning, and interactive learning experiences. Suitable applications include autonomous agents, coding assistants, multimodal analytics, scientific reasoning, and high-context information processing.",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "google/gemini-3-pro-preview-20251117",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": [
                            "high",
                            "low"
                        ],
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": [
                                "high",
                                "low"
                            ],
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-3-pro-preview",
                "model_variant_permaslug": "google/gemini-3-pro-preview-20251117",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-3-pro-preview",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65536,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000012",
                    "image": "0.000002",
                    "audio": "0.000002",
                    "input_audio_cache": "0.0000002",
                    "input_cache_read": "0.0000002",
                    "input_cache_write": "0.000000375",
                    "internal_reasoning": "0.000012",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.000004",
                        "completions": "0.000018",
                        "input_cache_read": "0.0000004",
                        "input_cache_write": "0.00000075"
                    }
                ],
                "pricing_json": {
                    "gemini:prompt_tokens": 0.000002,
                    "gemini:reasoning_tokens": 0.000012,
                    "gemini:cache_read_tokens": 2e-7,
                    "gemini:completion_tokens": 0.000012,
                    "gemini:text_input_tokens": 0.000002,
                    "gemini:audio_input_tokens": 0.000002,
                    "gemini:image_input_tokens": 0.000002,
                    "gemini:video_input_tokens": 0.000002,
                    "gemini:cache_read_text_tokens": 2e-7,
                    "gemini:cache_read_audio_tokens": 2e-7,
                    "gemini:cache_read_image_tokens": 2e-7,
                    "gemini:cache_read_video_tokens": 2e-7,
                    "gemini:cache_write_storage_hours": 0.0000045,
                    "gemini:prompt_tokens_high_context": 0.000004,
                    "gemini:reasoning_tokens_high_context": 0.000018,
                    "gemini:cache_read_tokens_high_context": 4e-7,
                    "gemini:completion_tokens_high_context": 0.000018,
                    "gemini:cache_read_text_tokens_high_context": 4e-7,
                    "gemini:cache_read_audio_tokens_high_context": 4e-7,
                    "gemini:cache_read_image_tokens_high_context": 4e-7,
                    "gemini:cache_read_video_tokens_high_context": 4e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "3b180fff-70f2-4a89-9a66-9d051e7b9bf9",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.1",
            "hf_slug": "",
            "updated_at": "2025-11-13T18:58:25.56227+00:00",
            "created_at": "2025-11-13T18:58:25+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.1",
            "short_name": "GPT-5.1",
            "author": "openai",
            "description": "GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to GPT-5. It uses adaptive reasoning to allocate computation dynamically, responding quickly to simple queries while spending more depth on complex tasks. The model produces clearer, more grounded explanations with reduced jargon, making it easier to follow even on technical or multi-step problems.\n\nBuilt for broad task coverage, GPT-5.1 delivers consistent gains across math, coding, and structured analysis workloads, with more coherent long-form answers and improved tool-use reliability. It also features refined conversational alignment, enabling warmer, more intuitive responses without compromising precision. GPT-5.1 serves as the primary full-capability successor to GPT-5",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5.1-20251113",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "764eb97f-8bab-4326-b29b-7a8799b00a70",
                "name": "OpenAI | openai/gpt-5.1-20251113",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.1",
                    "hf_slug": "",
                    "updated_at": "2025-11-13T18:58:25.56227+00:00",
                    "created_at": "2025-11-13T18:58:25+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.1",
                    "short_name": "GPT-5.1",
                    "author": "openai",
                    "description": "GPT-5.1 is the latest frontier-grade model in the GPT-5 series, offering stronger general-purpose reasoning, improved instruction adherence, and a more natural conversational style compared to GPT-5. It uses adaptive reasoning to allocate computation dynamically, responding quickly to simple queries while spending more depth on complex tasks. The model produces clearer, more grounded explanations with reduced jargon, making it easier to follow even on technical or multi-step problems.\n\nBuilt for broad task coverage, GPT-5.1 delivers consistent gains across math, coding, and structured analysis workloads, with more coherent long-form answers and improved tool-use reliability. It also features refined conversational alignment, enabling warmer, more intuitive responses without compromising precision. GPT-5.1 serves as the primary full-capability successor to GPT-5",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5.1-20251113",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.1",
                "model_variant_permaslug": "openai/gpt-5.1-20251113",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai/default",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai/default",
                "provider_model_id": "gpt-5.1-2025-11-13",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "177855b5-4b6e-4f70-a823-4eb03aa1322b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": false,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.1-chat",
            "hf_slug": "",
            "updated_at": "2025-11-13T18:58:22.624591+00:00",
            "created_at": "2025-11-13T18:58:22+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.1 Chat",
            "short_name": "GPT-5.1 Chat",
            "author": "openai",
            "description": "GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on harder queries, improving accuracy on math, coding, and multi-step tasks without slowing down typical conversations. The model is warmer and more conversational by default, with better instruction following and more stable short-form reasoning. GPT-5.1 Chat is designed for high-throughput, interactive workloads where responsiveness and consistency matter more than deep deliberation.\n",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5.1-chat-20251113",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f27c561c-0804-4e51-a96e-18bc1968212d",
                "name": "OpenAI | openai/gpt-5.1-chat-20251113",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-5.1-chat",
                    "hf_slug": "",
                    "updated_at": "2025-11-13T18:58:22.624591+00:00",
                    "created_at": "2025-11-13T18:58:22+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.1 Chat",
                    "short_name": "GPT-5.1 Chat",
                    "author": "openai",
                    "description": "GPT-5.1 Chat (AKA Instant is the fast, lightweight member of the 5.1 family, optimized for low-latency chat while retaining strong general intelligence. It uses adaptive reasoning to selectively “think” on harder queries, improving accuracy on math, coding, and multi-step tasks without slowing down typical conversations. The model is warmer and more conversational by default, with better instruction following and more stable short-form reasoning. GPT-5.1 Chat is designed for high-throughput, interactive workloads where responsiveness and consistency matter more than deep deliberation.\n",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5.1-chat-20251113",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.1-chat",
                "model_variant_permaslug": "openai/gpt-5.1-chat-20251113",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.1-chat-latest",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "2e4eef73-9912-412b-892f-833ea583790a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.1-codex",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-11-13T18:58:18+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.1-Codex",
            "short_name": "GPT-5.1-Codex",
            "author": "openai",
            "description": "GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5.1, Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5.1-codex-20251113",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "58caabab-f2a1-4a27-b098-b46b924efd27",
                "name": "OpenAI | openai/gpt-5.1-codex-20251113",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.1-codex",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-11-13T18:58:18+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.1-Codex",
                    "short_name": "GPT-5.1-Codex",
                    "author": "openai",
                    "description": "GPT-5.1-Codex is a specialized version of GPT-5.1 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5.1, Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5.1-codex-20251113",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.1-codex",
                "model_variant_permaslug": "openai/gpt-5.1-codex-20251113",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.1-codex",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "700f737d-f192-40f9-8c4a-c74b295e3881",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5.1-codex-mini",
            "hf_slug": "",
            "updated_at": "2025-11-13T18:54:22.09584+00:00",
            "created_at": "2025-11-13T18:17:00.379348+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5.1-Codex-Mini",
            "short_name": "GPT-5.1-Codex-Mini",
            "author": "openai",
            "description": "GPT-5.1-Codex-Mini is a smaller and faster version of GPT-5.1-Codex",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5.1-codex-mini-20251113",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "27923ab8-2d0e-47ac-b04c-fc79d77ddbd5",
                "name": "OpenAI | openai/gpt-5.1-codex-mini-20251113",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5.1-codex-mini",
                    "hf_slug": "",
                    "updated_at": "2025-11-13T18:54:22.09584+00:00",
                    "created_at": "2025-11-13T18:17:00.379348+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5.1-Codex-Mini",
                    "short_name": "GPT-5.1-Codex-Mini",
                    "author": "openai",
                    "description": "GPT-5.1-Codex-Mini is a smaller and faster version of GPT-5.1-Codex",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5.1-codex-mini-20251113",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5.1-codex-mini",
                "model_variant_permaslug": "openai/gpt-5.1-codex-mini-20251113",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5.1-codex-mini",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000025",
                    "completion": "0.000002",
                    "input_cache_read": "0.000000025",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 2.5e-7,
                    "openai_responses:completion_tokens": 0.000002,
                    "openai_responses:cached_prompt_tokens": 2.5e-8
                },
                "pricing_version_id": "b2297b73-9598-4b1a-942f-fdcb3733ddf5",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "amazon/nova-premier-v1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-31T22:38:52.074161+00:00",
            "hf_updated_at": null,
            "name": "Amazon: Nova Premier 1.0",
            "short_name": "Nova Premier 1.0",
            "author": "amazon",
            "description": "Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Nova",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "amazon/nova-premier-v1",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "6e4da481-6c8d-45d0-a3f5-11a9ba527485",
                "name": "Amazon Bedrock | amazon/nova-premier-v1",
                "context_length": 1000000,
                "model": {
                    "slug": "amazon/nova-premier-v1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-31T22:38:52.074161+00:00",
                    "hf_updated_at": null,
                    "name": "Amazon: Nova Premier 1.0",
                    "short_name": "Nova Premier 1.0",
                    "author": "amazon",
                    "description": "Amazon Nova Premier is the most capable of Amazon’s multimodal models for complex reasoning tasks and for use as the best teacher for distilling custom models.",
                    "model_version_group_id": null,
                    "context_length": 1000000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Nova",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "amazon/nova-premier-v1",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "amazon/nova-premier-v1",
                "model_variant_permaslug": "amazon/nova-premier-v1",
                "adapter_name": "AmazonBedrockConverseAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.amazon.nova-premier-v1:0\t",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000025",
                    "completion": "0.0000125",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0.000000625",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "perplexity/sonar-pro-search",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-30T19:59:26+00:00",
            "hf_updated_at": null,
            "name": "Perplexity: Sonar Pro Search",
            "short_name": "Sonar Pro Search",
            "author": "perplexity",
            "description": "Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system. It is designed for deeper reasoning and analysis. Pricing is based on tokens plus $18 per thousand requests. This model powers the Pro Search mode on the Perplexity platform.\n\nSonar Pro Search adds autonomous, multi-step reasoning to Sonar Pro. So, instead of just one query + synthesis, it plans and executes entire research workflows using tools.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "perplexity/sonar-pro-search",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "c78926bd-fa25-4883-8794-22de8c1ce79c",
                "name": "Perplexity | perplexity/sonar-pro-search",
                "context_length": 200000,
                "model": {
                    "slug": "perplexity/sonar-pro-search",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-30T19:59:26+00:00",
                    "hf_updated_at": null,
                    "name": "Perplexity: Sonar Pro Search",
                    "short_name": "Sonar Pro Search",
                    "author": "perplexity",
                    "description": "Exclusively available on the OpenRouter API, Sonar Pro's new Pro Search mode is Perplexity's most advanced agentic search system. It is designed for deeper reasoning and analysis. Pricing is based on tokens plus $18 per thousand requests. This model powers the Pro Search mode on the Perplexity platform.\n\nSonar Pro Search adds autonomous, multi-step reasoning to Sonar Pro. So, instead of just one query + synthesis, it plans and executes entire research workflows using tools.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "perplexity/sonar-pro-search",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "perplexity/sonar-pro-search",
                "model_variant_permaslug": "perplexity/sonar-pro-search",
                "adapter_name": "PerplexityAdapter",
                "provider_name": "Perplexity",
                "provider_info": {
                    "name": "Perplexity",
                    "displayName": "Perplexity",
                    "slug": "perplexity",
                    "baseUrl": "https://api.perplexity.ai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                        "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "PerplexityAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.perplexity.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Perplexity.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Perplexity",
                "provider_slug": "perplexity",
                "provider_model_id": "sonar-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                    "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "image": "0",
                    "request": "0.018",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.022"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.018"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.014"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "nvidia/nemotron-nano-12b-v2-vl",
            "hf_slug": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL-BF16",
            "updated_at": "2025-11-12T02:19:07.557675+00:00",
            "created_at": "2025-10-28T18:19:25.723503+00:00",
            "hf_updated_at": null,
            "name": "NVIDIA: Nemotron Nano 12B 2 VL (free)",
            "short_name": "Nemotron Nano 12B 2 VL (free)",
            "author": "nvidia",
            "description": "NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence. It introduces a hybrid Transformer-Mamba architecture, combining transformer-level accuracy with Mamba’s memory-efficient sequence modeling for significantly higher throughput and lower latency.\n\nThe model supports inputs of text and multi-image documents, producing natural-language outputs. It is trained on high-quality NVIDIA-curated synthetic datasets optimized for optical-character recognition, chart reasoning, and multimodal comprehension.\n\nNemotron Nano 2 VL achieves leading results on OCRBench v2 and scores ≈ 74 average across MMMU, MathVista, AI2D, OCRBench, OCR-Reasoning, ChartQA, DocVQA, and Video-MME—surpassing prior open VL baselines. With Efficient Video Sampling (EVS), it handles long-form videos while reducing inference cost.\n\nOpen-weights, training data, and fine-tuning recipes are released under a permissive NVIDIA open license, with deployment supported across NeMo, NIM, and major inference runtimes.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "image",
                "text",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "nvidia/nemotron-nano-12b-v2-vl",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "28304d1d-c2b9-4291-ba4d-dc63e798227e",
                "name": "Nvidia | nvidia/nemotron-nano-12b-v2-vl:free",
                "context_length": 128000,
                "model": {
                    "slug": "nvidia/nemotron-nano-12b-v2-vl",
                    "hf_slug": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL-BF16",
                    "updated_at": "2025-11-12T02:19:07.557675+00:00",
                    "created_at": "2025-10-28T18:19:25.723503+00:00",
                    "hf_updated_at": null,
                    "name": "NVIDIA: Nemotron Nano 12B 2 VL",
                    "short_name": "Nemotron Nano 12B 2 VL",
                    "author": "nvidia",
                    "description": "NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence. It introduces a hybrid Transformer-Mamba architecture, combining transformer-level accuracy with Mamba’s memory-efficient sequence modeling for significantly higher throughput and lower latency.\n\nThe model supports inputs of text and multi-image documents, producing natural-language outputs. It is trained on high-quality NVIDIA-curated synthetic datasets optimized for optical-character recognition, chart reasoning, and multimodal comprehension.\n\nNemotron Nano 2 VL achieves leading results on OCRBench v2 and scores ≈ 74 average across MMMU, MathVista, AI2D, OCRBench, OCR-Reasoning, ChartQA, DocVQA, and Video-MME—surpassing prior open VL baselines. With Efficient Video Sampling (EVS), it handles long-form videos while reducing inference cost.\n\nOpen-weights, training data, and fine-tuning recipes are released under a permissive NVIDIA open license, with deployment supported across NeMo, NIM, and major inference runtimes.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "image",
                        "text",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "nvidia/nemotron-nano-12b-v2-vl",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "nvidia/nemotron-nano-12b-v2-vl:free",
                "model_variant_permaslug": "nvidia/nemotron-nano-12b-v2-vl:free",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "Nvidia",
                "provider_info": {
                    "name": "Nvidia",
                    "displayName": "NVIDIA",
                    "slug": "nvidia",
                    "baseUrl": "https://1afcd6e8-59bf-4102-95ed-7ec410f6959f.invocation.api.nvcf.nvidia.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://assets.ngc.nvidia.com/products/api-catalog/legal/NVIDIA%20API%20Trial%20Terms%20of%20Service.pdf",
                        "privacyPolicyURL": "https://www.nvidia.com/en-us/about-nvidia/privacy-policy/"
                    },
                    "headquarters": "US",
                    "datacenters": [
                        "US"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.nvidia.com/en-us/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NVIDIA",
                "provider_slug": "nvidia",
                "provider_model_id": "nvidia/nvidia-nemotron-nano-12b-v2-vl",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "temperature",
                    "max_tokens",
                    "seed",
                    "top_p",
                    "tool_choice",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": true,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://assets.ngc.nvidia.com/products/api-catalog/legal/NVIDIA%20API%20Trial%20Terms%20of%20Service.pdf",
                    "privacyPolicyURL": "https://www.nvidia.com/en-us/about-nvidia/privacy-policy/"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0",
                    "openai:completion_tokens": "0",
                    "openai:cached_prompt_tokens": "0"
                },
                "pricing_version_id": "f11f3cb2-257d-47c5-a74a-4d3c7fb63962",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "disable_free_endpoint_limits": false,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "nvidia/nemotron-nano-12b-v2-vl",
            "hf_slug": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL-BF16",
            "updated_at": "2025-11-12T02:19:07.557675+00:00",
            "created_at": "2025-10-28T18:19:25.723503+00:00",
            "hf_updated_at": null,
            "name": "NVIDIA: Nemotron Nano 12B 2 VL",
            "short_name": "Nemotron Nano 12B 2 VL",
            "author": "nvidia",
            "description": "NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence. It introduces a hybrid Transformer-Mamba architecture, combining transformer-level accuracy with Mamba’s memory-efficient sequence modeling for significantly higher throughput and lower latency.\n\nThe model supports inputs of text and multi-image documents, producing natural-language outputs. It is trained on high-quality NVIDIA-curated synthetic datasets optimized for optical-character recognition, chart reasoning, and multimodal comprehension.\n\nNemotron Nano 2 VL achieves leading results on OCRBench v2 and scores ≈ 74 average across MMMU, MathVista, AI2D, OCRBench, OCR-Reasoning, ChartQA, DocVQA, and Video-MME—surpassing prior open VL baselines. With Efficient Video Sampling (EVS), it handles long-form videos while reducing inference cost.\n\nOpen-weights, training data, and fine-tuning recipes are released under a permissive NVIDIA open license, with deployment supported across NeMo, NIM, and major inference runtimes.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "nvidia/nemotron-nano-12b-v2-vl",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "da29268d-2dd6-4eb5-bb11-1f5a1f86b91a",
                "name": "DeepInfra | nvidia/nemotron-nano-12b-v2-vl",
                "context_length": 131072,
                "model": {
                    "slug": "nvidia/nemotron-nano-12b-v2-vl",
                    "hf_slug": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL-BF16",
                    "updated_at": "2025-11-12T02:19:07.557675+00:00",
                    "created_at": "2025-10-28T18:19:25.723503+00:00",
                    "hf_updated_at": null,
                    "name": "NVIDIA: Nemotron Nano 12B 2 VL",
                    "short_name": "Nemotron Nano 12B 2 VL",
                    "author": "nvidia",
                    "description": "NVIDIA Nemotron Nano 2 VL is a 12-billion-parameter open multimodal reasoning model designed for video understanding and document intelligence. It introduces a hybrid Transformer-Mamba architecture, combining transformer-level accuracy with Mamba’s memory-efficient sequence modeling for significantly higher throughput and lower latency.\n\nThe model supports inputs of text and multi-image documents, producing natural-language outputs. It is trained on high-quality NVIDIA-curated synthetic datasets optimized for optical-character recognition, chart reasoning, and multimodal comprehension.\n\nNemotron Nano 2 VL achieves leading results on OCRBench v2 and scores ≈ 74 average across MMMU, MathVista, AI2D, OCRBench, OCR-Reasoning, ChartQA, DocVQA, and Video-MME—surpassing prior open VL baselines. With Efficient Video Sampling (EVS), it handles long-form videos while reducing inference cost.\n\nOpen-weights, training data, and fine-tuning recipes are released under a permissive NVIDIA open license, with deployment supported across NeMo, NIM, and major inference runtimes.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "image",
                        "text",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "nvidia/nemotron-nano-12b-v2-vl",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "nvidia/nemotron-nano-12b-v2-vl",
                "model_variant_permaslug": "nvidia/nemotron-nano-12b-v2-vl",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/fp8",
                "provider_model_id": "nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000006",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000002",
                    "openai:completion_tokens": "0.0000006"
                },
                "pricing_version_id": "43757121-36e7-49de-814c-1f542ffb49ae",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-32b-instruct",
            "hf_slug": "Qwen/Qwen3-VL-32B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-23T14:55:32.53917+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 32B Instruct",
            "short_name": "Qwen3 VL 32B Instruct",
            "author": "qwen",
            "description": "Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video. With 32 billion parameters, it combines deep visual perception with advanced text comprehension, enabling fine-grained spatial reasoning, document and scene analysis, and long-horizon video understanding.Robust OCR in 32 languages, and enhanced multimodal fusion through Interleaved-MRoPE and DeepStack architectures. Optimized for agentic interaction and visual tool use, Qwen3-VL-32B delivers state-of-the-art performance for complex real-world multimodal tasks.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-32b-instruct",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "cc9ec262-af0e-4a84-9ce3-218a517f85b3",
                "name": "Together | qwen/qwen3-vl-32b-instruct",
                "context_length": 262144,
                "model": {
                    "slug": "qwen/qwen3-vl-32b-instruct",
                    "hf_slug": "Qwen/Qwen3-VL-32B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-23T14:55:32.53917+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 32B Instruct",
                    "short_name": "Qwen3 VL 32B Instruct",
                    "author": "qwen",
                    "description": "Qwen3-VL-32B-Instruct is a large-scale multimodal vision-language model designed for high-precision understanding and reasoning across text, images, and video. With 32 billion parameters, it combines deep visual perception with advanced text comprehension, enabling fine-grained spatial reasoning, document and scene analysis, and long-horizon video understanding.Robust OCR in 32 languages, and enhanced multimodal fusion through Interleaved-MRoPE and DeepStack architectures. Optimized for agentic interaction and visual tool use, Qwen3-VL-32B delivers state-of-the-art performance for complex real-world multimodal tasks.",
                    "model_version_group_id": null,
                    "context_length": 262144,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-32b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-32b-instruct",
                "model_variant_permaslug": "qwen/qwen3-vl-32b-instruct",
                "adapter_name": "TogetherAdapter",
                "provider_name": "Together",
                "provider_info": {
                    "name": "Together",
                    "displayName": "Together",
                    "slug": "together",
                    "baseUrl": "https://api.together.xyz/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                        "privacyPolicyURL": "https://www.together.ai/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "TogetherAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.together.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.together.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "mixedbread-ai/Mxbai-Rerank-Large-V2",
                        "BAAI/bge-base-en-v1.5-vllm",
                        "scb10x/scb10x-typhoon-2-1-gemma3-12b",
                        "arcee-ai/AFM-4.5B-Preview",
                        "deepseek-ai/DeepSeek-R1-0528-tput",
                        "black-forest-labs/FLUX.1-kontext-dev",
                        "google/gemma-3-27b-it",
                        "Qwen/Qwen3-32B-FP8",
                        "openai/whisper-large-v3",
                        "eddie/Qwen3-32B",
                        "eddiehou/meta-llama/Llama-3.1-405B",
                        "yan/deepseek-ai-deepseek-v3",
                        "moz/Llama-3.3-70B-Instruct-Turbo",
                        "serverless-qwen-qwen3-32b-fp8",
                        "qwen-qwen3-32b-fp8-serverless",
                        "moz-llama-3-3-70b-instruct-turbo",
                        "moonshotai/Kimi-K2-Instruct-tgl-testing",
                        "VirtueAIxTogether/VirtueGuard-Text-Lite",
                        "Virtue-AI/VirtueGuard-Text-Lite",
                        "black-forest-labs/FLUX.1-krea-dev",
                        "prosus/qwen-qwen3-32b-fp8-long-context",
                        "meta-llama/Llama-4-Scout-17B-16E-Instruct-batch",
                        "deepseek-ai/DeepSeek-R1-DE",
                        "arize-ai/qwen-2-1.5b-instruct",
                        "openai/gpt-oss-120b",
                        "meta-llama/Llama-3-70b-hf",
                        "Qwen/Qwen2.5-72B-Instruct",
                        "meta-llama/Meta-Llama-3.1-70B-Instruct-Reference",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Reference",
                        "meta-llama/Meta-Llama-3-8B-Instruct",
                        "meta-llama/Llama-3.1-405B-Instruct",
                        "cartesia/sonic",
                        "cartesia/sonic-2",
                        "togethercomputer/MoA-1",
                        "Salesforce/Llama-Rank-V1",
                        "black-forest-labs/FLUX.1-schnell",
                        "lgai/exaone-3-5-32b-instruct",
                        "lgai/exaone-deep-32b",
                        "black-forest-labs/FLUX.1-dev",
                        "marin-community/marin-8b-instruct",
                        "togethercomputer/Refuel-Llm-V2-Small",
                        "meta-llama/Llama-3-70b-chat-hf",
                        "Alibaba-NLP/gte-modernbert-base",
                        "black-forest-labs/FLUX.1-pro",
                        "black-forest-labs/FLUX.1.1-pro",
                        "togethercomputer/MoA-1-Turbo",
                        "black-forest-labs/FLUX.1-dev-lora",
                        "meta-llama/Llama-2-70b-hf",
                        "togethercomputer/m2-bert-80M-32k-retrieval",
                        "togethercomputer/Refuel-Llm-V2",
                        "intfloat/multilingual-e5-large-instruct",
                        "black-forest-labs/FLUX.1-kontext-max",
                        "black-forest-labs/FLUX.1-schnell-Free",
                        "black-forest-labs/FLUX.1-kontext-pro",
                        "BAAI/bge-large-en-v1.5",
                        "BAAI/bge-base-en-v1.5",
                        "Qwen/Qwen3-Next-80B-A3B-Instruct",
                        "ServiceNow-AI/Apriel-1.5-15b-Thinker",
                        "openai/whisper-large-v3-test",
                        "codellama/CodeLlama-34b-Instruct-hf",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "togethercomputer/m2-bert-80M-8k-retrieval",
                        "WhereIsAI/UAE-Large-V1",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct-Lite-Pro",
                        "togethercomputer/m2-bert-80M-2k-retrieval",
                        "meta-llama/Meta-Llama-3-70B-Instruct-Lite",
                        "Meta-Llama/Llama-Guard-7b",
                        "Gryphe/MythoMax-L2-13b-Lite",
                        "upstage/SOLAR-10.7B-Instruct-v1.0",
                        "Qwen/Qwen2.5-14B-Instruct",
                        "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free",
                        "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free",
                        "zai-org/GLM-4.5-Air-FP8",
                        "kwaivgI/kling-1.6-standard",
                        "HiDream-ai/HiDream-I1-Full",
                        "ByteDance-Seed/Seedream-3.0",
                        "ByteDance-Seed/Seedream-4.0",
                        "Lykon/DreamShaper",
                        "HiDream-ai/HiDream-I1-Dev",
                        "Qwen/Qwen-Image",
                        "RunDiffusion/Juggernaut-pro-flux",
                        "google/imagen-4.0-preview",
                        "google/imagen-4.0-ultra",
                        "google/veo-3.0",
                        "minimax/hailuo-02",
                        "stabilityai/stable-diffusion-3-medium",
                        "black-forest-labs/FLUX.1-Canny-pro",
                        "google/imagen-4.0-fast",
                        "minimax/video-01-director",
                        "HiDream-ai/HiDream-I1-Fast",
                        "Wan-AI/Wan2.2-T2V-A14B",
                        "ByteDance/Seedance-1.0-pro",
                        "google/veo-3.0-fast-audio",
                        "vidu/vidu-q1",
                        "kwaivgI/kling-2.1-master",
                        "google/veo-3.0-audio",
                        "Rundiffusion/Juggernaut-Lightning-Flux",
                        "Wan-AI/Wan2.2-I2V-A14B",
                        "google/flash-image-2.5",
                        "google/veo-2.0",
                        "openai/sora-2",
                        "google/veo-3.0-fast",
                        "ideogram/ideogram-3.0",
                        "kwaivgI/kling-2.0-master",
                        "kwaivgI/kling-2.1-standard",
                        "pixverse/pixverse-v5",
                        "stabilityai/stable-diffusion-xl-base-1.0",
                        "openai/sora-2-pro",
                        "ByteDance/Seedance-1.0-lite",
                        "kwaivgI/kling-1.6-pro",
                        "vidu/vidu-2.0",
                        "kwaivgI/kling-2.1-pro",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
                        "canopylabs/orpheus-3b-0.1-ft",
                        "hexgrad/Kokoro-82M",
                        "eddie/gemma-2b-it",
                        "mistralai/Voxtral-Mini-3B-2507",
                        "arcee-ai/coder-large",
                        "arcee-ai/virtuoso-large",
                        "arcee-ai/maestro-reasoning",
                        "deepcogito/cogito-v2-1-671b",
                        "arcee_ai/arcee-spotlight",
                        "google/gemini-3-pro-image",
                        "mercor/cwm",
                        "black-forest-labs/FLUX.2-flex",
                        "keith-aditya/kimi-k2-instruct",
                        "pangram/mistral-small-2501",
                        "black-forest-labs/FLUX.2-pro",
                        "black-forest-labs/FLUX.2-dev",
                        "ServiceNow-AI/Apriel-1.6-15b-Thinker"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Together",
                "provider_slug": "together",
                "provider_model_id": "Qwen/Qwen3-VL-32B-Instruct",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "top_k",
                    "repetition_penalty",
                    "logit_bias",
                    "min_p",
                    "structured_outputs",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                    "privacyPolicyURL": "https://www.together.ai/privacy"
                },
                "pricing": {
                    "prompt": "0.0000005",
                    "completion": "0.0000015",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000005",
                    "openai:completion_tokens": "0.0000015"
                },
                "pricing_version_id": "65677213-46f1-457c-abb0-4cfeaec61a6f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-image-mini",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-16T14:23:03.143259+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Image Mini",
            "short_name": "GPT-5 Image Mini",
            "author": "openai",
            "description": "GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation. This natively multimodal model features superior instruction following, text rendering, and detailed image editing with reduced latency and cost. It excels at high-quality visual creation while maintaining strong text understanding, making it ideal for applications that require both efficient image generation and text processing at scale.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "image",
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-image-mini",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "7c09094a-64ec-4d53-bd69-c165ac31c465",
                "name": "OpenAI | openai/gpt-5-image-mini",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-image-mini",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-16T14:23:03.143259+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Image Mini",
                    "short_name": "GPT-5 Image Mini",
                    "author": "openai",
                    "description": "GPT-5 Image Mini combines OpenAI's advanced language capabilities, powered by [GPT-5 Mini](https://openrouter.ai/openai/gpt-5-mini), with GPT Image 1 Mini for efficient image generation. This natively multimodal model features superior instruction following, text rendering, and detailed image editing with reduced latency and cost. It excels at high-quality visual creation while maintaining strong text understanding, making it ideal for applications that require both efficient image generation and text processing at scale.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "image",
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-image-mini",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-image-mini",
                "model_variant_permaslug": "openai/gpt-5-image-mini",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-mini-2025-08-07",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000025",
                    "completion": "0.000002",
                    "input_cache_read": "0.00000025",
                    "web_search": "0.01",
                    "image_output": "0.000008",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.0000025,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000002,
                    "openai_responses:image_output_tokens": 0.000008,
                    "openai_responses:cached_prompt_tokens": 2.5e-7
                },
                "pricing_version_id": "f2440c26-2f98-41c2-8d81-fcbca956e29a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-haiku-4.5",
            "hf_slug": "",
            "updated_at": "2025-12-05T21:53:18.541396+00:00",
            "created_at": "2025-10-15T17:00:38+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Haiku 4.5",
            "short_name": "Claude Haiku 4.5",
            "author": "anthropic",
            "description": "Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models. Matching Claude Sonnet 4’s performance across reasoning, coding, and computer-use tasks, Haiku 4.5 brings frontier-level capability to real-time and high-volume applications.\n\nIt introduces extended thinking to the Haiku line; enabling controllable reasoning depth, summarized or interleaved thought output, and tool-assisted workflows with full support for coding, bash, web search, and computer-use tools. Scoring >73% on SWE-bench Verified, Haiku 4.5 ranks among the world’s best coding models while maintaining exceptional responsiveness for sub-agents, parallelized execution, and scaled deployment.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4.5-haiku-20251001",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "amazon-bedrock",
                "google-vertex",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "8a5e69a1-ea0d-4af6-899e-8b7e1c93a7a9",
                "name": "Google | anthropic/claude-4.5-haiku-20251001",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-haiku-4.5",
                    "hf_slug": "",
                    "updated_at": "2025-12-05T21:53:18.541396+00:00",
                    "created_at": "2025-10-15T17:00:38+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Haiku 4.5",
                    "short_name": "Claude Haiku 4.5",
                    "author": "anthropic",
                    "description": "Claude Haiku 4.5 is Anthropic’s fastest and most efficient model, delivering near-frontier intelligence at a fraction of the cost and latency of larger Claude models. Matching Claude Sonnet 4’s performance across reasoning, coding, and computer-use tasks, Haiku 4.5 brings frontier-level capability to real-time and high-volume applications.\n\nIt introduces extended thinking to the Haiku line; enabling controllable reasoning depth, summarized or interleaved thought output, and tool-assisted workflows with full support for coding, bash, web search, and computer-use tools. Scoring >73% on SWE-bench Verified, Haiku 4.5 ranks among the world’s best coding models while maintaining exceptional responsiveness for sub-agents, parallelized execution, and scaled deployment.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4.5-haiku-20251001",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "amazon-bedrock",
                        "google-vertex",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-haiku-4.5",
                "model_variant_permaslug": "anthropic/claude-4.5-haiku-20251001",
                "adapter_name": "GoogleVertexAnthropicAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "claude-haiku-4-5@20251001",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "top_p",
                    "temperature",
                    "stop",
                    "reasoning",
                    "include_reasoning",
                    "tools",
                    "tool_choice",
                    "top_k"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000001",
                    "completion": "0.000005",
                    "input_cache_read": "0.0000001",
                    "input_cache_write": "0.00000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000001,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 1e-7,
                    "anthropic:completion_tokens": 0.000005,
                    "anthropic:cache_write_1h_tokens": 0.000002,
                    "anthropic:cache_write_5m_tokens": 0.00000125
                },
                "pricing_version_id": "2f1bce8a-465d-4d77-9efa-5f1c83f908dc",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_native_web_search": false,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-8b-thinking",
            "hf_slug": "Qwen/Qwen3-VL-8B-Thinking",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-14T17:42:26.552544+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 8B Thinking",
            "short_name": "Qwen3 VL 8B Thinking",
            "author": "qwen",
            "description": "Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences. It integrates enhanced multimodal alignment and long-context processing (native 256K, expandable to 1M tokens) for tasks such as scientific visual analysis, causal inference, and mathematical reasoning over image or video inputs.\n\nCompared to the Instruct edition, the Thinking version introduces deeper visual-language fusion and deliberate reasoning pathways that improve performance on long-chain logic tasks, STEM problem-solving, and multi-step video understanding. It achieves stronger temporal grounding via Interleaved-MRoPE and timestamp-aware embeddings, while maintaining robust OCR, multilingual comprehension, and text generation on par with large text-only LLMs.",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-8b-thinking",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {
                "temperature": 1,
                "top_p": 0.95
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "6cb46014-347b-4d67-aefa-7b83e065b8c3",
                "name": "Alibaba | qwen/qwen3-vl-8b-thinking",
                "context_length": 256000,
                "model": {
                    "slug": "qwen/qwen3-vl-8b-thinking",
                    "hf_slug": "Qwen/Qwen3-VL-8B-Thinking",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-14T17:42:26.552544+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 8B Thinking",
                    "short_name": "Qwen3 VL 8B Thinking",
                    "author": "qwen",
                    "description": "Qwen3-VL-8B-Thinking is the reasoning-optimized variant of the Qwen3-VL-8B multimodal model, designed for advanced visual and textual reasoning across complex scenes, documents, and temporal sequences. It integrates enhanced multimodal alignment and long-context processing (native 256K, expandable to 1M tokens) for tasks such as scientific visual analysis, causal inference, and mathematical reasoning over image or video inputs.\n\nCompared to the Instruct edition, the Thinking version introduces deeper visual-language fusion and deliberate reasoning pathways that improve performance on long-chain logic tasks, STEM problem-solving, and multi-step video understanding. It achieves stronger temporal grounding via Interleaved-MRoPE and timestamp-aware embeddings, while maintaining robust OCR, multilingual comprehension, and text generation on par with large text-only LLMs.",
                    "model_version_group_id": null,
                    "context_length": 256000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-8b-thinking",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {
                        "temperature": 1,
                        "top_p": 0.95
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-8b-thinking",
                "model_variant_permaslug": "qwen/qwen3-vl-8b-thinking",
                "adapter_name": "AlibabaAdapter",
                "provider_name": "Alibaba",
                "provider_info": {
                    "name": "Alibaba",
                    "displayName": "Alibaba Cloud Int.",
                    "slug": "alibaba",
                    "baseUrl": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                        "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [
                        "SG",
                        "CN"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AlibabaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.alibabacloud.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.alibabacloud.com/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Alibaba Cloud Int.",
                "provider_slug": "alibaba",
                "provider_model_id": "qwen3-vl-8b-thinking",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "presence_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                    "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000018",
                    "completion": "0.0000021",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-8b-instruct",
            "hf_slug": "Qwen/Qwen3-VL-8B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-14T17:35:08.402158+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 8B Instruct",
            "short_name": "Qwen3 VL 8B Instruct",
            "author": "qwen",
            "description": "Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and video. It features improved multimodal fusion with Interleaved-MRoPE for long-horizon temporal reasoning, DeepStack for fine-grained visual-text alignment, and text-timestamp alignment for precise event localization.\n\nThe model supports a native 256K-token context window, extensible to 1M tokens, and handles both static and dynamic media inputs for tasks like document parsing, visual question answering, spatial reasoning, and GUI control. It achieves text understanding comparable to leading LLMs while expanding OCR coverage to 32 languages and enhancing robustness under varied visual conditions.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-8b-instruct",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.8,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "6bfd6b5b-ff8c-436f-ae3f-d28c02bcfce3",
                "name": "Novita | qwen/qwen3-vl-8b-instruct",
                "context_length": 131072,
                "model": {
                    "slug": "qwen/qwen3-vl-8b-instruct",
                    "hf_slug": "Qwen/Qwen3-VL-8B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-14T17:35:08.402158+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 8B Instruct",
                    "short_name": "Qwen3 VL 8B Instruct",
                    "author": "qwen",
                    "description": "Qwen3-VL-8B-Instruct is a multimodal vision-language model from the Qwen3-VL series, built for high-fidelity understanding and reasoning across text, images, and video. It features improved multimodal fusion with Interleaved-MRoPE for long-horizon temporal reasoning, DeepStack for fine-grained visual-text alignment, and text-timestamp alignment for precise event localization.\n\nThe model supports a native 256K-token context window, extensible to 1M tokens, and handles both static and dynamic media inputs for tasks like document parsing, visual question answering, spatial reasoning, and GUI control. It achieves text understanding comparable to leading LLMs while expanding OCR coverage to 32 languages and enhancing robustness under varied visual conditions.",
                    "model_version_group_id": null,
                    "context_length": 256000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-8b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.7,
                        "top_p": 0.8,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-8b-instruct",
                "model_variant_permaslug": "qwen/qwen3-vl-8b-instruct",
                "adapter_name": "NovitaAdapter",
                "provider_name": "Novita",
                "provider_info": {
                    "name": "Novita",
                    "displayName": "NovitaAI",
                    "slug": "novita",
                    "baseUrl": "https://api.novita.ai/v3/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P2zP0TCZwbzCC8QkH8m8o1i8M"
                    ],
                    "adapterName": "NovitaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.novita.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://novita.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "google/gemma-3-1b-it",
                        "baichuan/baichuan-m2-32b",
                        "baidu/ernie-4.5-0.3b",
                        "qwen/qwen-mt-plus",
                        "qwen/qwen3-4b-fp8",
                        "meta-llama/llama-3.2-1b-instruct",
                        "sophosympatheia/midnight-rose-70b",
                        "deepseek/deepseek-prover-v2-671b",
                        "Sao10K/L3-8B-Stheno-v3.2",
                        "thudm/glm-4-32b-0414",
                        "qwen/qwen3-omni-30b-a3b-thinking",
                        "qwen/qwen3-omni-30b-a3b-instruct",
                        "paddlepaddle/paddleocr-vl",
                        "deepseek/deepseek-ocr",
                        "skywork/r1v4-lite",
                        "baidu/ernie-4.5-vl-28b-a3b-thinking",
                        "zai-org/autoglm-phone-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NovitaAI",
                "provider_slug": "novita/fp8",
                "provider_model_id": "qwen/qwen3-vl-8b-instruct",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000008",
                    "completion": "0.0000005",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000008",
                    "openai:completion_tokens": "0.0000005"
                },
                "pricing_version_id": "9e2dd497-044e-4748-b403-b4743fad861d",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-image",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-14T13:19:46.029021+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Image",
            "short_name": "GPT-5 Image",
            "author": "openai",
            "description": "[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities. It offers major improvements in reasoning, code quality, and user experience while incorporating GPT Image 1's superior instruction following, text rendering, and detailed image editing.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "image",
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-image",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "image_generation",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "be0ed145-8bfc-4aec-a62d-685ed334fe17",
                "name": "OpenAI | openai/gpt-5-image",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-image",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-14T13:19:46.029021+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Image",
                    "short_name": "GPT-5 Image",
                    "author": "openai",
                    "description": "[GPT-5](https://openrouter.ai/openai/gpt-5) Image combines OpenAI's GPT-5 model with state-of-the-art image generation capabilities. It offers major improvements in reasoning, code quality, and user experience while incorporating GPT Image 1's superior instruction following, text rendering, and detailed image editing.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "image",
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-image",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "image_generation",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-image",
                "model_variant_permaslug": "openai/gpt-5-image",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-2025-08-07",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00001",
                    "completion": "0.00001",
                    "input_cache_read": "0.00000125",
                    "web_search": "0.01",
                    "image_output": "0.00004",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00001,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:image_output_tokens": 0.00004,
                    "openai_responses:cached_prompt_tokens": 0.00000125
                },
                "pricing_version_id": "b9d2cf4c-5f0e-41c0-b7ba-082300d4a127",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o3-deep-research",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-10T20:54:21.971349+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o3 Deep Research",
            "short_name": "o3 Deep Research",
            "author": "openai",
            "description": "o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.\n\nNote: This model always uses the 'web_search' tool which adds additional cost.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/o3-deep-research-2025-06-26",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a697c6df-cbb4-4a6b-8b1e-04e92f00146a",
                "name": "OpenAI | openai/o3-deep-research-2025-06-26",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o3-deep-research",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-10T20:54:21.971349+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o3 Deep Research",
                    "short_name": "o3 Deep Research",
                    "author": "openai",
                    "description": "o3-deep-research is OpenAI's advanced model for deep research, designed to tackle complex, multi-step research tasks.\n\nNote: This model always uses the 'web_search' tool which adds additional cost.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/o3-deep-research-2025-06-26",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o3-deep-research",
                "model_variant_permaslug": "openai/o3-deep-research-2025-06-26",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o3-deep-research-2025-06-26",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00001",
                    "completion": "0.00004",
                    "input_cache_read": "0.0000025",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00001,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00004,
                    "openai_responses:cached_prompt_tokens": 0.0000025
                },
                "pricing_version_id": "46ca33ba-23c1-4a17-a248-30cb67033660",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o4-mini-deep-research",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-10T20:54:02.725273+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o4 Mini Deep Research",
            "short_name": "o4 Mini Deep Research",
            "author": "openai",
            "description": "o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.\n\nNote: This model always uses the 'web_search' tool which adds additional cost.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/o4-mini-deep-research-2025-06-26",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "97f9f7c3-9e55-4f6d-8de4-459d4f23e2a9",
                "name": "OpenAI | openai/o4-mini-deep-research-2025-06-26",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o4-mini-deep-research",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-10T20:54:02.725273+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o4 Mini Deep Research",
                    "short_name": "o4 Mini Deep Research",
                    "author": "openai",
                    "description": "o4-mini-deep-research is OpenAI's faster, more affordable deep research model—ideal for tackling complex, multi-step research tasks.\n\nNote: This model always uses the 'web_search' tool which adds additional cost.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/o4-mini-deep-research-2025-06-26",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o4-mini-deep-research",
                "model_variant_permaslug": "openai/o4-mini-deep-research-2025-06-26",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o4-mini-deep-research-2025-06-26",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000008",
                    "input_cache_read": "0.0000005",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000002,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000008,
                    "openai_responses:cached_prompt_tokens": 5e-7
                },
                "pricing_version_id": "aecfa236-8c7d-479b-b3fe-7450fb7d299f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-flash-image",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-07T20:53:51+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash Image (Nano Banana)",
            "short_name": "Gemini 2.5 Flash Image (Nano Banana)",
            "author": "google",
            "description": "Gemini 2.5 Flash Image, a.k.a. \"Nano Banana,\" is now generally available. It is a state of the art image generation model with contextual understanding. It is capable of image generation, edits, and multi-turn conversations. Aspect ratios can be controlled with the [image_config API Parameter](https://openrouter.ai/docs/features/multimodal/image-generation#image-aspect-ratio-configuration)",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "image",
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash-image",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "2341e1bc-99ea-46ab-ae2d-9a83846afb43",
                "name": "Google AI Studio | google/gemini-2.5-flash-image",
                "context_length": 32768,
                "model": {
                    "slug": "google/gemini-2.5-flash-image",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-07T20:53:51+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Flash Image (Nano Banana)",
                    "short_name": "Gemini 2.5 Flash Image (Nano Banana)",
                    "author": "google",
                    "description": "Gemini 2.5 Flash Image, a.k.a. \"Nano Banana,\" is now generally available. It is a state of the art image generation model with contextual understanding. It is capable of image generation, edits, and multi-turn conversations. Aspect ratios can be controlled with the [image_config API Parameter](https://openrouter.ai/docs/features/multimodal/image-generation#image-aspect-ratio-configuration)",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "image",
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-flash-image",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-flash-image",
                "model_variant_permaslug": "google/gemini-2.5-flash-image",
                "adapter_name": "GoogleAIStudioGeminiAdapter",
                "provider_name": "Google AI Studio",
                "provider_info": {
                    "name": "Google AI Studio",
                    "displayName": "Google AI Studio",
                    "slug": "google-ai-studio",
                    "baseUrl": "https://generativelanguage.googleapis.com/v1beta",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 55,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleAIStudioGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleAIStudio.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-1p",
                        "gemini-2.5-pro-1p-recitation-off",
                        "gemini-2.5-flash-1p",
                        "gemini-2.5-flash-1p-recitation-off",
                        "gemini-2.5-flash-lite-preview-06-11-summarized",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-1.5-pro-latest",
                        "gemini-1.5-pro",
                        "gemini-1.5-flash-latest",
                        "gemini-1.5-flash",
                        "gemini-1.5-flash-8b",
                        "gemini-1.5-flash-8b-latest",
                        "gemini-2.5-pro-preview-03-25",
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-2.0-flash-lite-preview",
                        "gemini-2.0-pro-exp",
                        "gemini-2.0-flash-thinking-exp",
                        "gemini-2.5-flash-preview-tts",
                        "gemini-2.5-pro-preview-tts",
                        "learnlm-2.0-flash-experimental",
                        "gracefulgolem",
                        "gemini-2.5-flash-preview-05-20",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.0-flash-exp-image-generation",
                        "gemini-2.0-flash-preview-image-generation",
                        "gemini-2.0-flash-lite-preview-02-05",
                        "gemini-2.0-pro-exp-02-05",
                        "gemini-exp-1206",
                        "gemini-2.0-flash-thinking-exp-01-21",
                        "gemini-2.0-flash-thinking-exp-1219",
                        "gemma-3-1b-it",
                        "gemini-flash-latest",
                        "gemini-flash-lite-latest",
                        "gemini-pro-latest",
                        "gemini-robotics-er-1.5-preview",
                        "gemini-embedding-001",
                        "riftrunner-fst-rewind",
                        "gemini-3-pro-image-preview",
                        "nano-banana-pro-preview",
                        "fiercefalcon",
                        "fiercefalcon-inline-citation",
                        "fiercefalcon-blocked-sites"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google AI Studio",
                "provider_slug": "google-ai-studio",
                "provider_model_id": "gemini-2.5-flash-image",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                },
                "pricing": {
                    "prompt": "0.0000003",
                    "completion": "0.0000025",
                    "image": "0.0000003",
                    "audio": "0.000001",
                    "input_audio_cache": "0.0000001",
                    "input_cache_read": "0.00000003",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000025",
                    "image_output": "0.00003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 3e-7,
                    "gemini:reasoning_tokens": 0.0000025,
                    "gemini:cache_read_tokens": 3e-8,
                    "gemini:completion_tokens": 0.0000025,
                    "gemini:text_input_tokens": 3e-7,
                    "gemini:audio_input_tokens": 0.000001,
                    "gemini:image_input_tokens": 3e-7,
                    "gemini:video_input_tokens": 3e-7,
                    "gemini:image_output_tokens": 0.00003,
                    "gemini:cache_read_text_tokens": 3e-8,
                    "gemini:cache_read_audio_tokens": 1e-7,
                    "gemini:cache_read_image_tokens": 3e-8,
                    "gemini:cache_read_video_tokens": 3e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 1e-7,
                    "gemini:cache_read_text_tokens_high_context": 1e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2e-7,
                    "gemini:cache_read_image_tokens_high_context": 1e-7,
                    "gemini:cache_read_video_tokens_high_context": 1e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "549376c3-3914-47e7-9801-c410ca4dc4dd",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": 1000,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-30b-a3b-thinking",
            "hf_slug": "Qwen/Qwen3-VL-30B-A3B-Thinking",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-06T23:47:59.575824+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 30B A3B Thinking",
            "short_name": "Qwen3 VL 30B A3B Thinking",
            "author": "qwen",
            "description": "Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Thinking variant enhances reasoning in STEM, math, and complex tasks. It excels in perception of real-world/synthetic categories, 2D/3D spatial grounding, and long-form visual comprehension, achieving competitive multimodal benchmark results. For agentic use, it handles multi-image multi-turn instructions, video timeline alignments, GUI automation, and visual coding from sketches to debugged UI. Text performance matches flagship Qwen3 models, suiting document AI, OCR, UI assistance, spatial tasks, and agent research.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-30b-a3b-thinking",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {
                "temperature": 0.8,
                "top_p": 0.95
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "38ee90ad-31ec-4a90-925c-a95d9829636a",
                "name": "Novita | qwen/qwen3-vl-30b-a3b-thinking",
                "context_length": 131072,
                "model": {
                    "slug": "qwen/qwen3-vl-30b-a3b-thinking",
                    "hf_slug": "Qwen/Qwen3-VL-30B-A3B-Thinking",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-06T23:47:59.575824+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 30B A3B Thinking",
                    "short_name": "Qwen3 VL 30B A3B Thinking",
                    "author": "qwen",
                    "description": "Qwen3-VL-30B-A3B-Thinking is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Thinking variant enhances reasoning in STEM, math, and complex tasks. It excels in perception of real-world/synthetic categories, 2D/3D spatial grounding, and long-form visual comprehension, achieving competitive multimodal benchmark results. For agentic use, it handles multi-image multi-turn instructions, video timeline alignments, GUI automation, and visual coding from sketches to debugged UI. Text performance matches flagship Qwen3 models, suiting document AI, OCR, UI assistance, spatial tasks, and agent research.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-30b-a3b-thinking",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.8,
                        "top_p": 0.95
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-30b-a3b-thinking",
                "model_variant_permaslug": "qwen/qwen3-vl-30b-a3b-thinking",
                "adapter_name": "NovitaAdapter",
                "provider_name": "Novita",
                "provider_info": {
                    "name": "Novita",
                    "displayName": "NovitaAI",
                    "slug": "novita",
                    "baseUrl": "https://api.novita.ai/v3/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P2zP0TCZwbzCC8QkH8m8o1i8M"
                    ],
                    "adapterName": "NovitaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.novita.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://novita.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "google/gemma-3-1b-it",
                        "baichuan/baichuan-m2-32b",
                        "baidu/ernie-4.5-0.3b",
                        "qwen/qwen-mt-plus",
                        "qwen/qwen3-4b-fp8",
                        "meta-llama/llama-3.2-1b-instruct",
                        "sophosympatheia/midnight-rose-70b",
                        "deepseek/deepseek-prover-v2-671b",
                        "Sao10K/L3-8B-Stheno-v3.2",
                        "thudm/glm-4-32b-0414",
                        "qwen/qwen3-omni-30b-a3b-thinking",
                        "qwen/qwen3-omni-30b-a3b-instruct",
                        "paddlepaddle/paddleocr-vl",
                        "deepseek/deepseek-ocr",
                        "skywork/r1v4-lite",
                        "baidu/ernie-4.5-vl-28b-a3b-thinking",
                        "zai-org/autoglm-phone-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NovitaAI",
                "provider_slug": "novita/fp16",
                "provider_model_id": "qwen/qwen3-vl-30b-a3b-thinking",
                "quantization": "fp16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.000001",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000002",
                    "openai:completion_tokens": "0.000001"
                },
                "pricing_version_id": "5224499e-cd5b-4c1e-a1ff-a79b4af53aa1",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-30b-a3b-instruct",
            "hf_slug": "Qwen/Qwen3-VL-30B-A3B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-06T23:47:56.430294+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 30B A3B Instruct",
            "short_name": "Qwen3 VL 30B A3B Instruct",
            "author": "qwen",
            "description": "Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Instruct variant optimizes instruction-following for general multimodal tasks. It excels in perception of real-world/synthetic categories, 2D/3D spatial grounding, and long-form visual comprehension, achieving competitive multimodal benchmark results. For agentic use, it handles multi-image multi-turn instructions, video timeline alignments, GUI automation, and visual coding from sketches to debugged UI. Text performance matches flagship Qwen3 models, suiting document AI, OCR, UI assistance, spatial tasks, and agent research.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-30b-a3b-instruct",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.8,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "dbb294c1-20cd-4d67-b225-2ff03a050cc8",
                "name": "Fireworks | qwen/qwen3-vl-30b-a3b-instruct",
                "context_length": 262144,
                "model": {
                    "slug": "qwen/qwen3-vl-30b-a3b-instruct",
                    "hf_slug": "Qwen/Qwen3-VL-30B-A3B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-10-06T23:47:56.430294+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 30B A3B Instruct",
                    "short_name": "Qwen3 VL 30B A3B Instruct",
                    "author": "qwen",
                    "description": "Qwen3-VL-30B-A3B-Instruct is a multimodal model that unifies strong text generation with visual understanding for images and videos. Its Instruct variant optimizes instruction-following for general multimodal tasks. It excels in perception of real-world/synthetic categories, 2D/3D spatial grounding, and long-form visual comprehension, achieving competitive multimodal benchmark results. For agentic use, it handles multi-image multi-turn instructions, video timeline alignments, GUI automation, and visual coding from sketches to debugged UI. Text performance matches flagship Qwen3 models, suiting document AI, OCR, UI assistance, spatial tasks, and agent research.",
                    "model_version_group_id": null,
                    "context_length": 262144,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-30b-a3b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": 0.7,
                        "top_p": 0.8,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-30b-a3b-instruct",
                "model_variant_permaslug": "qwen/qwen3-vl-30b-a3b-instruct",
                "adapter_name": "FireworksAdapter",
                "provider_name": "Fireworks",
                "provider_info": {
                    "name": "Fireworks",
                    "displayName": "Fireworks",
                    "slug": "fireworks",
                    "baseUrl": "https://api.fireworks.ai/inference/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://fireworks.ai/terms-of-service",
                        "privacyPolicyURL": "https://fireworks.ai/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34k70EDz4tN23XFsU2l3tSqm4wF"
                    ],
                    "adapterName": "FireworksAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.fireworks.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Fireworks.png"
                    },
                    "ignoredProviderModels": [
                        "accounts/fireworks/models/qwen2-vl-72b-instruct",
                        "accounts/fireworks/models/llama4-scout-instruct-basic",
                        "accounts/scale-ai/models/arctic-text2sql-r1-7b-public",
                        "accounts/fireworks/models/qwen3-embedding-8b",
                        "accounts/fireworks/models/glm-4p5-air",
                        "accounts/fireworks/models/qwen3-30b-a3b-instruct-2507",
                        "accounts/fireworks/models/qwen3-coder-30b-a3b-instruct",
                        "accounts/lukablaskovic2000-738cce/models/bio-mistral-7b",
                        "accounts/perplexity/models/r1-1776",
                        "accounts/sentientfoundation/models/dobby-unhinged-llama-3-3-70b-new",
                        "accounts/fireworks/models/qwen3-reranker-8b",
                        "accounts/fireworks/models/deepseek-v3p1-terminus",
                        "accounts/sentientfoundation-serverless/models/dobby-mini-unhinged-plus-llama-3-1-8b",
                        "accounts/fireworks/models/deepseek-r1-basic"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Fireworks",
                "provider_slug": "fireworks",
                "provider_model_id": "accounts/fireworks/models/qwen3-vl-30b-a3b-instruct",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "top_k",
                    "repetition_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://fireworks.ai/terms-of-service",
                    "privacyPolicyURL": "https://fireworks.ai/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.0000006",
                    "input_cache_read": "0.000000075",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000015",
                    "openai:completion_tokens": "0.0000006",
                    "openai:cached_prompt_tokens": "0.000000075"
                },
                "pricing_version_id": "589bf4b0-9c5c-4004-a748-58881360475c",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-pro",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-10-06T18:51:03.215373+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Pro",
            "short_name": "GPT-5 Pro",
            "author": "openai",
            "description": "GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-pro-2025-10-06",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": [
                    "high"
                ],
                "default_reasoning_effort": null,
                "default_reasoning_enabled": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": [
                        "high"
                    ],
                    "default_reasoning_effort": null,
                    "default_reasoning_enabled": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "86e3e664-d291-415d-a769-8e08b96a79e9",
                "name": "OpenAI | openai/gpt-5-pro-2025-10-06",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-pro",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-10-06T18:51:03.215373+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Pro",
                    "short_name": "GPT-5 Pro",
                    "author": "openai",
                    "description": "GPT-5 Pro is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-pro-2025-10-06",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": [
                            "high"
                        ],
                        "default_reasoning_effort": null,
                        "default_reasoning_enabled": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": [
                                "high"
                            ],
                            "default_reasoning_effort": null,
                            "default_reasoning_enabled": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": "reasoning",
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-pro",
                "model_variant_permaslug": "openai/gpt-5-pro-2025-10-06",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-pro-2025-10-06",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000015",
                    "completion": "0.00012",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000015,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00012
                },
                "pricing_version_id": "f10148f9-4c52-440d-8ba0-7b474ed90068",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-sonnet-4.5",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-29T16:01:16.552976+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Sonnet 4.5",
            "short_name": "Claude Sonnet 4.5",
            "author": "anthropic",
            "description": "Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows. It delivers state-of-the-art performance on coding benchmarks such as SWE-bench Verified, with improvements across system design, code security, and specification adherence. The model is designed for extended autonomous operation, maintaining task continuity across sessions and providing fact-based progress tracking.\n\nSonnet 4.5 also introduces stronger agentic capabilities, including improved tool orchestration, speculative parallel execution, and more efficient context and memory management. With enhanced context tracking and awareness of token usage across tool calls, it is particularly well-suited for multi-context and long-running workflows. Use cases span software engineering, cybersecurity, financial analysis, research agents, and other domains requiring sustained reasoning and tool use.",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4.5-sonnet-20250929",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 1,
                "top_p": 1,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d8bee848-f020-454a-b2be-4a7ce868f99f",
                "name": "Amazon Bedrock | anthropic/claude-4.5-sonnet-20250929",
                "context_length": 1000000,
                "model": {
                    "slug": "anthropic/claude-sonnet-4.5",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-29T16:01:16.552976+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Sonnet 4.5",
                    "short_name": "Claude Sonnet 4.5",
                    "author": "anthropic",
                    "description": "Claude Sonnet 4.5 is Anthropic’s most advanced Sonnet model to date, optimized for real-world agents and coding workflows. It delivers state-of-the-art performance on coding benchmarks such as SWE-bench Verified, with improvements across system design, code security, and specification adherence. The model is designed for extended autonomous operation, maintaining task continuity across sessions and providing fact-based progress tracking.\n\nSonnet 4.5 also introduces stronger agentic capabilities, including improved tool orchestration, speculative parallel execution, and more efficient context and memory management. With enhanced context tracking and awareness of token usage across tool calls, it is particularly well-suited for multi-context and long-running workflows. Use cases span software engineering, cybersecurity, financial analysis, research agents, and other domains requiring sustained reasoning and tool use.",
                    "model_version_group_id": null,
                    "context_length": 1000000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4.5-sonnet-20250929",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 1,
                        "top_p": 1,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-sonnet-4.5",
                "model_variant_permaslug": "anthropic/claude-4.5-sonnet-20250929",
                "adapter_name": "AmazonBedrockInvokeAnthropicAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "global.anthropic.claude-sonnet-4-5-20250929-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "input_cache_read": "0.0000003",
                    "input_cache_write": "0.00000375",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.000006",
                        "completions": "0.0000225",
                        "input_cache_read": "0.0000006",
                        "input_cache_write": "0.0000075"
                    }
                ],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000003,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 3e-7,
                    "anthropic:completion_tokens": 0.000015,
                    "anthropic:cache_write_1h_tokens": 0.000006,
                    "anthropic:cache_write_5m_tokens": 0.00000375,
                    "anthropic:long_context_threshold": 200000,
                    "anthropic:prompt_tokens_long_context": 0.000006,
                    "anthropic:cache_read_tokens_long_context": 6e-7,
                    "anthropic:completion_tokens_long_context": 0.0000225,
                    "anthropic:cache_write_1h_tokens_long_context": 0.000012,
                    "anthropic:cache_write_5m_tokens_long_context": 0.0000075
                },
                "pricing_version_id": "f1afe5e8-55e9-4d00-bc49-33b73ac3d69e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-flash-preview-09-2025",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-25T17:09:38.646963+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash Preview 09-2025",
            "short_name": "Gemini 2.5 Flash Preview 09-2025",
            "author": "google",
            "description": "Gemini 2.5 Flash Preview September 2025 Checkpoint is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in \"thinking\" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling. \n\nAdditionally, Gemini 2.5 Flash is configurable through the \"max tokens for reasoning\" parameter, as described in the documentation (https://openrouter.ai/docs/use-cases/reasoning-tokens#max-tokens-for-reasoning).",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "image",
                "file",
                "text",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash-preview-09-2025",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "3135cae6-b7a4-49be-9994-12aebe3caf27",
                "name": "Google | google/gemini-2.5-flash-preview-09-2025",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-flash-preview-09-2025",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-25T17:09:38.646963+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Flash Preview 09-2025",
                    "short_name": "Gemini 2.5 Flash Preview 09-2025",
                    "author": "google",
                    "description": "Gemini 2.5 Flash Preview September 2025 Checkpoint is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in \"thinking\" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling. \n\nAdditionally, Gemini 2.5 Flash is configurable through the \"max tokens for reasoning\" parameter, as described in the documentation (https://openrouter.ai/docs/use-cases/reasoning-tokens#max-tokens-for-reasoning).",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "image",
                        "file",
                        "text",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-flash-preview-09-2025",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-flash-preview-09-2025",
                "model_variant_permaslug": "google/gemini-2.5-flash-preview-09-2025",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex (Global)",
                    "slug": "google-vertex/global",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex (Global)",
                "provider_slug": "google-vertex/global",
                "provider_model_id": "gemini-2.5-flash-preview-09-2025",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000003",
                    "completion": "0.0000025",
                    "image": "0.0000003",
                    "audio": "0.000001",
                    "input_audio_cache": "0.0000001",
                    "input_cache_read": "0.00000003",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000025",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 3e-7,
                    "gemini:reasoning_tokens": 0.0000025,
                    "gemini:cache_read_tokens": 3e-8,
                    "gemini:completion_tokens": 0.0000025,
                    "gemini:text_input_tokens": 3e-7,
                    "gemini:audio_input_tokens": 0.000001,
                    "gemini:image_input_tokens": 3e-7,
                    "gemini:video_input_tokens": 3e-7,
                    "gemini:cache_read_text_tokens": 3e-8,
                    "gemini:cache_read_audio_tokens": 1e-7,
                    "gemini:cache_read_image_tokens": 3e-8,
                    "gemini:cache_read_video_tokens": 3e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 1e-7,
                    "gemini:cache_read_text_tokens_high_context": 1e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2e-7,
                    "gemini:cache_read_image_tokens_high_context": 1e-7,
                    "gemini:cache_read_video_tokens_high_context": 1e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "2fe6cb2f-c190-4a31-bd69-15f6c4b81c84",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_video_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": "global",
                "deprecation_date": "2026-02-17"
            }
        },
        {
            "slug": "google/gemini-2.5-flash-lite-preview-09-2025",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-25T17:01:26.198818+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025",
            "short_name": "Gemini 2.5 Flash Lite Preview 09-2025",
            "author": "google",
            "description": "Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance across common benchmarks compared to earlier Flash models. By default, \"thinking\" (i.e. multi-pass reasoning) is disabled to prioritize speed, but developers can enable it via the [Reasoning API parameter](https://openrouter.ai/docs/use-cases/reasoning-tokens) to selectively trade off cost for intelligence. ",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash-lite-preview-09-2025",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "6e63b201-b2cc-45d9-b0c0-da687a96efa0",
                "name": "Google | google/gemini-2.5-flash-lite-preview-09-2025",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-flash-lite-preview-09-2025",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-25T17:01:26.198818+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Flash Lite Preview 09-2025",
                    "short_name": "Gemini 2.5 Flash Lite Preview 09-2025",
                    "author": "google",
                    "description": "Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance across common benchmarks compared to earlier Flash models. By default, \"thinking\" (i.e. multi-pass reasoning) is disabled to prioritize speed, but developers can enable it via the [Reasoning API parameter](https://openrouter.ai/docs/use-cases/reasoning-tokens) to selectively trade off cost for intelligence. ",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-flash-lite-preview-09-2025",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-flash-lite-preview-09-2025",
                "model_variant_permaslug": "google/gemini-2.5-flash-lite-preview-09-2025",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.5-flash-lite-preview-09-2025",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000004",
                    "image": "0.0000001",
                    "audio": "0.0000003",
                    "input_audio_cache": "0.00000003",
                    "input_cache_read": "0.00000001",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000004",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 1e-7,
                    "gemini:reasoning_tokens": 4e-7,
                    "gemini:cache_read_tokens": 1e-8,
                    "gemini:completion_tokens": 4e-7,
                    "gemini:text_input_tokens": 1e-7,
                    "gemini:audio_input_tokens": 3e-7,
                    "gemini:image_input_tokens": 1e-7,
                    "gemini:video_input_tokens": 1e-7,
                    "gemini:cache_read_text_tokens": 1e-8,
                    "gemini:cache_read_audio_tokens": 3e-8,
                    "gemini:cache_read_image_tokens": 1e-8,
                    "gemini:cache_read_video_tokens": 1e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 3e-8,
                    "gemini:cache_read_text_tokens_high_context": 3e-8,
                    "gemini:cache_read_audio_tokens_high_context": 6e-8,
                    "gemini:cache_read_image_tokens_high_context": 3e-8,
                    "gemini:cache_read_video_tokens_high_context": 3e-8,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "b52b655f-9872-4089-9ec1-fabaaa9f6a5f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-235b-a22b-thinking",
            "hf_slug": "Qwen/Qwen3-VL-235B-A22B-Thinking",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-09-23T23:04:50+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 235B A22B Thinking",
            "short_name": "Qwen3 VL 235B A22B Thinking",
            "author": "qwen",
            "description": "Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video. The Thinking model is optimized for multimodal reasoning in STEM and math. The series emphasizes robust perception (recognition of diverse real-world and synthetic categories), spatial understanding (2D/3D grounding), and long-form visual comprehension, with competitive results on public multimodal benchmarks for both perception and reasoning.\n\nBeyond analysis, Qwen3-VL supports agentic interaction and tool use: it can follow complex instructions over multi-image, multi-turn dialogues; align text to video timelines for precise temporal queries; and operate GUI elements for automation tasks. The models also enable visual coding workflows, turning sketches or mockups into code and assisting with UI debugging, while maintaining strong text-only performance comparable to the flagship Qwen3 language models. This makes Qwen3-VL suitable for production scenarios spanning document AI, multilingual OCR, software/UI assistance, spatial/embodied tasks, and research on vision-language agents.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-235b-a22b-thinking",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {
                "temperature": 0.8,
                "top_p": 0.95,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "37f02013-5c66-4800-bf34-dac4804abd14",
                "name": "SiliconFlow | qwen/qwen3-vl-235b-a22b-thinking",
                "context_length": 262144,
                "model": {
                    "slug": "qwen/qwen3-vl-235b-a22b-thinking",
                    "hf_slug": "Qwen/Qwen3-VL-235B-A22B-Thinking",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-09-23T23:04:50+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 235B A22B Thinking",
                    "short_name": "Qwen3 VL 235B A22B Thinking",
                    "author": "qwen",
                    "description": "Qwen3-VL-235B-A22B Thinking is a multimodal model that unifies strong text generation with visual understanding across images and video. The Thinking model is optimized for multimodal reasoning in STEM and math. The series emphasizes robust perception (recognition of diverse real-world and synthetic categories), spatial understanding (2D/3D grounding), and long-form visual comprehension, with competitive results on public multimodal benchmarks for both perception and reasoning.\n\nBeyond analysis, Qwen3-VL supports agentic interaction and tool use: it can follow complex instructions over multi-image, multi-turn dialogues; align text to video timelines for precise temporal queries; and operate GUI elements for automation tasks. The models also enable visual coding workflows, turning sketches or mockups into code and assisting with UI debugging, while maintaining strong text-only performance comparable to the flagship Qwen3 language models. This makes Qwen3-VL suitable for production scenarios spanning document AI, multilingual OCR, software/UI assistance, spatial/embodied tasks, and research on vision-language agents.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-235b-a22b-thinking",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.8,
                        "top_p": 0.95,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-235b-a22b-thinking",
                "model_variant_permaslug": "qwen/qwen3-vl-235b-a22b-thinking",
                "adapter_name": "SiliconFlowAdapter",
                "provider_name": "SiliconFlow",
                "provider_info": {
                    "name": "SiliconFlow",
                    "displayName": "SiliconFlow",
                    "slug": "siliconflow",
                    "baseUrl": "https://api.siliconflow.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                        "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "SiliconFlowAdapter",
                    "isMultipartSupported": false,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "/images/icons/SiliconFlow.svg"
                    },
                    "ignoredProviderModels": [
                        "inclusionAI/Ling-mini-2.0",
                        "inclusionAI/Ring-flash-2.0",
                        "inclusionAI/Ling-flash-2.0"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "SiliconFlow",
                "provider_slug": "siliconflow/fp8",
                "provider_model_id": "Qwen/Qwen3-VL-235B-A22B-Thinking",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 262144,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                    "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000045",
                    "completion": "0.0000035",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000045",
                    "openai:completion_tokens": "0.0000035"
                },
                "pricing_version_id": "75357189-5294-4f42-8678-e406f1c9fbcd",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen3-vl-235b-a22b-instruct",
            "hf_slug": "Qwen/Qwen3-VL-235B-A22B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-23T23:04:47+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen3 VL 235B A22B Instruct",
            "short_name": "Qwen3 VL 235B A22B Instruct",
            "author": "qwen",
            "description": "Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video. The Instruct model targets general vision-language use (VQA, document parsing, chart/table extraction, multilingual OCR). The series emphasizes robust perception (recognition of diverse real-world and synthetic categories), spatial understanding (2D/3D grounding), and long-form visual comprehension, with competitive results on public multimodal benchmarks for both perception and reasoning.\n\nBeyond analysis, Qwen3-VL supports agentic interaction and tool use: it can follow complex instructions over multi-image, multi-turn dialogues; align text to video timelines for precise temporal queries; and operate GUI elements for automation tasks. The models also enable visual coding workflows—turning sketches or mockups into code and assisting with UI debugging—while maintaining strong text-only performance comparable to the flagship Qwen3 language models. This makes Qwen3-VL suitable for production scenarios spanning document AI, multilingual OCR, software/UI assistance, spatial/embodied tasks, and research on vision-language agents.",
            "model_version_group_id": null,
            "context_length": 262144,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen3",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "qwen/qwen3-vl-235b-a22b-instruct",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.8,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a352cc82-2bdb-411b-9f99-bd7829655412",
                "name": "DeepInfra | qwen/qwen3-vl-235b-a22b-instruct",
                "context_length": 262144,
                "model": {
                    "slug": "qwen/qwen3-vl-235b-a22b-instruct",
                    "hf_slug": "Qwen/Qwen3-VL-235B-A22B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-23T23:04:47+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen3 VL 235B A22B Instruct",
                    "short_name": "Qwen3 VL 235B A22B Instruct",
                    "author": "qwen",
                    "description": "Qwen3-VL-235B-A22B Instruct is an open-weight multimodal model that unifies strong text generation with visual understanding across images and video. The Instruct model targets general vision-language use (VQA, document parsing, chart/table extraction, multilingual OCR). The series emphasizes robust perception (recognition of diverse real-world and synthetic categories), spatial understanding (2D/3D grounding), and long-form visual comprehension, with competitive results on public multimodal benchmarks for both perception and reasoning.\n\nBeyond analysis, Qwen3-VL supports agentic interaction and tool use: it can follow complex instructions over multi-image, multi-turn dialogues; align text to video timelines for precise temporal queries; and operate GUI elements for automation tasks. The models also enable visual coding workflows—turning sketches or mockups into code and assisting with UI debugging—while maintaining strong text-only performance comparable to the flagship Qwen3 language models. This makes Qwen3-VL suitable for production scenarios spanning document AI, multilingual OCR, software/UI assistance, spatial/embodied tasks, and research on vision-language agents.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen3",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen3-vl-235b-a22b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.7,
                        "top_p": 0.8,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen3-vl-235b-a22b-instruct",
                "model_variant_permaslug": "qwen/qwen3-vl-235b-a22b-instruct",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/fp8",
                "provider_model_id": "Qwen/Qwen3-VL-235B-A22B-Instruct",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000012",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000002",
                    "openai:completion_tokens": "0.0000012"
                },
                "pricing_version_id": "e564dec6-f9d2-4049-bd90-bc07dbd96bd3",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": false,
                        "structured_outputs": false
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-codex",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-09-23T16:03:23.098042+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Codex",
            "short_name": "GPT-5 Codex",
            "author": "openai",
            "description": "GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5, Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-codex",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f10a63bc-2bcd-4726-9e75-1e482efd080c",
                "name": "OpenAI | openai/gpt-5-codex",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-codex",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-09-23T16:03:23.098042+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Codex",
                    "short_name": "GPT-5 Codex",
                    "author": "openai",
                    "description": "GPT-5-Codex is a specialized version of GPT-5 optimized for software engineering and coding workflows. It is designed for both interactive development sessions and long, independent execution of complex engineering tasks. The model supports building projects from scratch, feature development, debugging, large-scale refactoring, and code review. Compared to GPT-5, Codex is more steerable, adheres closely to developer instructions, and produces cleaner, higher-quality code outputs. Reasoning effort can be adjusted with the `reasoning.effort` parameter. Read the [docs here](https://openrouter.ai/docs/use-cases/reasoning-tokens#reasoning-effort-level)\n\nCodex integrates into developer environments including the CLI, IDE extensions, GitHub, and cloud tasks. It adapts reasoning effort dynamically—providing fast responses for small tasks while sustaining extended multi-hour runs for large projects. The model is trained to perform structured code reviews, catching critical flaws by reasoning over dependencies and validating behavior against tests. It also supports multimodal inputs such as images or screenshots for UI development and integrates tool use for search, dependency installation, and environment setup. Codex is intended specifically for agentic coding applications.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-codex",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-codex",
                "model_variant_permaslug": "openai/gpt-5-codex",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-codex",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "a7ad56ea-d51d-4add-b41a-b2c02e411b01",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "x-ai/grok-4-fast",
            "hf_slug": "",
            "updated_at": "2025-11-19T22:48:00.44912+00:00",
            "created_at": "2025-09-19T00:01:30.267569+00:00",
            "hf_updated_at": null,
            "name": "xAI: Grok 4 Fast",
            "short_name": "Grok 4 Fast",
            "author": "x-ai",
            "description": "Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window. It comes in two flavors: non-reasoning and reasoning. Read more about the model on xAI's [news post](http://x.ai/news/grok-4-fast).\n\nReasoning can be enabled/disabled using the `reasoning` `enabled` parameter in the API. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#controlling-reasoning-tokens)",
            "model_version_group_id": null,
            "context_length": 2000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Grok",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "x-ai/grok-4-fast",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "c9586d9d-97ff-40ca-ae94-22504d6f9b7e",
                "name": "xAI | x-ai/grok-4-fast",
                "context_length": 2000000,
                "model": {
                    "slug": "x-ai/grok-4-fast",
                    "hf_slug": "",
                    "updated_at": "2025-11-19T22:48:00.44912+00:00",
                    "created_at": "2025-09-19T00:01:30.267569+00:00",
                    "hf_updated_at": null,
                    "name": "xAI: Grok 4 Fast",
                    "short_name": "Grok 4 Fast",
                    "author": "x-ai",
                    "description": "Grok 4 Fast is xAI's latest multimodal model with SOTA cost-efficiency and a 2M token context window. It comes in two flavors: non-reasoning and reasoning. Read more about the model on xAI's [news post](http://x.ai/news/grok-4-fast).\n\nReasoning can be enabled/disabled using the `reasoning` `enabled` parameter in the API. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#controlling-reasoning-tokens)",
                    "model_version_group_id": null,
                    "context_length": 2000000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Grok",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "x-ai/grok-4-fast",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "x-ai/grok-4-fast",
                "model_variant_permaslug": "x-ai/grok-4-fast",
                "adapter_name": "XAIResponsesAdapter",
                "provider_name": "xAI",
                "provider_info": {
                    "name": "xAI",
                    "displayName": "xAI",
                    "slug": "xai",
                    "baseUrl": "https://api.x.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                        "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "XAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.x.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://x.ai/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "xAI",
                "provider_slug": "xai",
                "provider_model_id": "grok-4-fast-non-reasoning",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 30000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                    "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000005",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0.00000005",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 128000,
                        "prompt": "0.0000004",
                        "completions": "0.000001",
                        "input_cache_read": "0.00000005"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_native_web_search": true,
                    "disable_free_endpoint_limits": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "opengvlab/internvl3-78b",
            "hf_slug": "OpenGVLab/InternVL3-78B",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-15T18:55:55.952936+00:00",
            "hf_updated_at": null,
            "name": "OpenGVLab: InternVL3 78B",
            "short_name": "InternVL3 78B",
            "author": "opengvlab",
            "description": "The InternVL3 series is an advanced multimodal large language model (MLLM). Compared to InternVL 2.5, InternVL3 demonstrates stronger multimodal perception and reasoning capabilities. \n\nIn addition, InternVL3 is benchmarked against the Qwen2.5 Chat models, whose pre-trained base models serve as the initialization for its language component. Benefiting from Native Multimodal Pre-Training, the InternVL3 series surpasses the Qwen2.5 series in overall text performance.",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "opengvlab/internvl3-78b",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "832d7038-1b47-4530-ba1e-ce6668e1fdfa",
                "name": "Chutes | opengvlab/internvl3-78b",
                "context_length": 32768,
                "model": {
                    "slug": "opengvlab/internvl3-78b",
                    "hf_slug": "OpenGVLab/InternVL3-78B",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-15T18:55:55.952936+00:00",
                    "hf_updated_at": null,
                    "name": "OpenGVLab: InternVL3 78B",
                    "short_name": "InternVL3 78B",
                    "author": "opengvlab",
                    "description": "The InternVL3 series is an advanced multimodal large language model (MLLM). Compared to InternVL 2.5, InternVL3 demonstrates stronger multimodal perception and reasoning capabilities. \n\nIn addition, InternVL3 is benchmarked against the Qwen2.5 Chat models, whose pre-trained base models serve as the initialization for its language component. Benefiting from Native Multimodal Pre-Training, the InternVL3 series surpasses the Qwen2.5 series in overall text performance.",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "opengvlab/internvl3-78b",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "opengvlab/internvl3-78b",
                "model_variant_permaslug": "opengvlab/internvl3-78b",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "OpenGVLab/InternVL3-78B-TEE",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.00000039",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000001",
                    "openai:completion_tokens": "0.00000039"
                },
                "pricing_version_id": "c6552ee8-61f8-4cce-8350-41844cfd6986",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "deepcogito/cogito-v2-preview-llama-109b-moe",
            "hf_slug": "deepcogito/cogito-v2-preview-llama-109B-MoE",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-02T16:46:08.407814+00:00",
            "hf_updated_at": null,
            "name": "Cogito V2 Preview Llama 109B",
            "short_name": "Cogito V2 Preview Llama 109B",
            "author": "deepcogito",
            "description": "An instruction-tuned, hybrid-reasoning Mixture-of-Experts model built on Llama-4-Scout-17B-16E. Cogito v2 can answer directly or engage an extended “thinking” phase, with alignment guided by Iterated Distillation & Amplification (IDA). It targets coding, STEM, instruction following, and general helpfulness, with stronger multilingual, tool-calling, and reasoning performance than size-equivalent baselines. The model supports long-context use (up to 10M tokens) and standard Transformers workflows. Users can control the reasoning behaviour with the `reasoning` `enabled` boolean. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#enable-reasoning-with-default-config)",
            "model_version_group_id": null,
            "context_length": 32767,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama4",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "deepcogito/cogito-v2-preview-llama-109b-moe",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": "Enable deep thinking subroutine."
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": "Enable deep thinking subroutine."
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "349f6bd6-3722-4ffd-a1af-cee16a5d6784",
                "name": "Together | deepcogito/cogito-v2-preview-llama-109b-moe",
                "context_length": 32767,
                "model": {
                    "slug": "deepcogito/cogito-v2-preview-llama-109b-moe",
                    "hf_slug": "deepcogito/cogito-v2-preview-llama-109B-MoE",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-09-02T16:46:08.407814+00:00",
                    "hf_updated_at": null,
                    "name": "Cogito V2 Preview Llama 109B",
                    "short_name": "Cogito V2 Preview Llama 109B",
                    "author": "deepcogito",
                    "description": "An instruction-tuned, hybrid-reasoning Mixture-of-Experts model built on Llama-4-Scout-17B-16E. Cogito v2 can answer directly or engage an extended “thinking” phase, with alignment guided by Iterated Distillation & Amplification (IDA). It targets coding, STEM, instruction following, and general helpfulness, with stronger multilingual, tool-calling, and reasoning performance than size-equivalent baselines. The model supports long-context use (up to 10M tokens) and standard Transformers workflows. Users can control the reasoning behaviour with the `reasoning` `enabled` boolean. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#enable-reasoning-with-default-config)",
                    "model_version_group_id": null,
                    "context_length": 32767,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Llama4",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "deepcogito/cogito-v2-preview-llama-109b-moe",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": "Enable deep thinking subroutine."
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": "Enable deep thinking subroutine."
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "deepcogito/cogito-v2-preview-llama-109b-moe",
                "model_variant_permaslug": "deepcogito/cogito-v2-preview-llama-109b-moe",
                "adapter_name": "TogetherAdapter",
                "provider_name": "Together",
                "provider_info": {
                    "name": "Together",
                    "displayName": "Together",
                    "slug": "together",
                    "baseUrl": "https://api.together.xyz/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                        "privacyPolicyURL": "https://www.together.ai/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "TogetherAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.together.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.together.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "mixedbread-ai/Mxbai-Rerank-Large-V2",
                        "BAAI/bge-base-en-v1.5-vllm",
                        "scb10x/scb10x-typhoon-2-1-gemma3-12b",
                        "arcee-ai/AFM-4.5B-Preview",
                        "deepseek-ai/DeepSeek-R1-0528-tput",
                        "black-forest-labs/FLUX.1-kontext-dev",
                        "google/gemma-3-27b-it",
                        "Qwen/Qwen3-32B-FP8",
                        "openai/whisper-large-v3",
                        "eddie/Qwen3-32B",
                        "eddiehou/meta-llama/Llama-3.1-405B",
                        "yan/deepseek-ai-deepseek-v3",
                        "moz/Llama-3.3-70B-Instruct-Turbo",
                        "serverless-qwen-qwen3-32b-fp8",
                        "qwen-qwen3-32b-fp8-serverless",
                        "moz-llama-3-3-70b-instruct-turbo",
                        "moonshotai/Kimi-K2-Instruct-tgl-testing",
                        "VirtueAIxTogether/VirtueGuard-Text-Lite",
                        "Virtue-AI/VirtueGuard-Text-Lite",
                        "black-forest-labs/FLUX.1-krea-dev",
                        "prosus/qwen-qwen3-32b-fp8-long-context",
                        "meta-llama/Llama-4-Scout-17B-16E-Instruct-batch",
                        "deepseek-ai/DeepSeek-R1-DE",
                        "arize-ai/qwen-2-1.5b-instruct",
                        "openai/gpt-oss-120b",
                        "meta-llama/Llama-3-70b-hf",
                        "Qwen/Qwen2.5-72B-Instruct",
                        "meta-llama/Meta-Llama-3.1-70B-Instruct-Reference",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Reference",
                        "meta-llama/Meta-Llama-3-8B-Instruct",
                        "meta-llama/Llama-3.1-405B-Instruct",
                        "cartesia/sonic",
                        "cartesia/sonic-2",
                        "togethercomputer/MoA-1",
                        "Salesforce/Llama-Rank-V1",
                        "black-forest-labs/FLUX.1-schnell",
                        "lgai/exaone-3-5-32b-instruct",
                        "lgai/exaone-deep-32b",
                        "black-forest-labs/FLUX.1-dev",
                        "marin-community/marin-8b-instruct",
                        "togethercomputer/Refuel-Llm-V2-Small",
                        "meta-llama/Llama-3-70b-chat-hf",
                        "Alibaba-NLP/gte-modernbert-base",
                        "black-forest-labs/FLUX.1-pro",
                        "black-forest-labs/FLUX.1.1-pro",
                        "togethercomputer/MoA-1-Turbo",
                        "black-forest-labs/FLUX.1-dev-lora",
                        "meta-llama/Llama-2-70b-hf",
                        "togethercomputer/m2-bert-80M-32k-retrieval",
                        "togethercomputer/Refuel-Llm-V2",
                        "intfloat/multilingual-e5-large-instruct",
                        "black-forest-labs/FLUX.1-kontext-max",
                        "black-forest-labs/FLUX.1-schnell-Free",
                        "black-forest-labs/FLUX.1-kontext-pro",
                        "BAAI/bge-large-en-v1.5",
                        "BAAI/bge-base-en-v1.5",
                        "Qwen/Qwen3-Next-80B-A3B-Instruct",
                        "ServiceNow-AI/Apriel-1.5-15b-Thinker",
                        "openai/whisper-large-v3-test",
                        "codellama/CodeLlama-34b-Instruct-hf",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "togethercomputer/m2-bert-80M-8k-retrieval",
                        "WhereIsAI/UAE-Large-V1",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct-Lite-Pro",
                        "togethercomputer/m2-bert-80M-2k-retrieval",
                        "meta-llama/Meta-Llama-3-70B-Instruct-Lite",
                        "Meta-Llama/Llama-Guard-7b",
                        "Gryphe/MythoMax-L2-13b-Lite",
                        "upstage/SOLAR-10.7B-Instruct-v1.0",
                        "Qwen/Qwen2.5-14B-Instruct",
                        "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free",
                        "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free",
                        "zai-org/GLM-4.5-Air-FP8",
                        "kwaivgI/kling-1.6-standard",
                        "HiDream-ai/HiDream-I1-Full",
                        "ByteDance-Seed/Seedream-3.0",
                        "ByteDance-Seed/Seedream-4.0",
                        "Lykon/DreamShaper",
                        "HiDream-ai/HiDream-I1-Dev",
                        "Qwen/Qwen-Image",
                        "RunDiffusion/Juggernaut-pro-flux",
                        "google/imagen-4.0-preview",
                        "google/imagen-4.0-ultra",
                        "google/veo-3.0",
                        "minimax/hailuo-02",
                        "stabilityai/stable-diffusion-3-medium",
                        "black-forest-labs/FLUX.1-Canny-pro",
                        "google/imagen-4.0-fast",
                        "minimax/video-01-director",
                        "HiDream-ai/HiDream-I1-Fast",
                        "Wan-AI/Wan2.2-T2V-A14B",
                        "ByteDance/Seedance-1.0-pro",
                        "google/veo-3.0-fast-audio",
                        "vidu/vidu-q1",
                        "kwaivgI/kling-2.1-master",
                        "google/veo-3.0-audio",
                        "Rundiffusion/Juggernaut-Lightning-Flux",
                        "Wan-AI/Wan2.2-I2V-A14B",
                        "google/flash-image-2.5",
                        "google/veo-2.0",
                        "openai/sora-2",
                        "google/veo-3.0-fast",
                        "ideogram/ideogram-3.0",
                        "kwaivgI/kling-2.0-master",
                        "kwaivgI/kling-2.1-standard",
                        "pixverse/pixverse-v5",
                        "stabilityai/stable-diffusion-xl-base-1.0",
                        "openai/sora-2-pro",
                        "ByteDance/Seedance-1.0-lite",
                        "kwaivgI/kling-1.6-pro",
                        "vidu/vidu-2.0",
                        "kwaivgI/kling-2.1-pro",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
                        "canopylabs/orpheus-3b-0.1-ft",
                        "hexgrad/Kokoro-82M",
                        "eddie/gemma-2b-it",
                        "mistralai/Voxtral-Mini-3B-2507",
                        "arcee-ai/coder-large",
                        "arcee-ai/virtuoso-large",
                        "arcee-ai/maestro-reasoning",
                        "deepcogito/cogito-v2-1-671b",
                        "arcee_ai/arcee-spotlight",
                        "google/gemini-3-pro-image",
                        "mercor/cwm",
                        "black-forest-labs/FLUX.2-flex",
                        "keith-aditya/kimi-k2-instruct",
                        "pangram/mistral-small-2501",
                        "black-forest-labs/FLUX.2-pro",
                        "black-forest-labs/FLUX.2-dev",
                        "ServiceNow-AI/Apriel-1.6-15b-Thinker"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Together",
                "provider_slug": "together",
                "provider_model_id": "deepcogito/cogito-v2-preview-llama-109B-MoE",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "top_k",
                    "repetition_penalty",
                    "logit_bias",
                    "min_p",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                    "privacyPolicyURL": "https://www.together.ai/privacy"
                },
                "pricing": {
                    "prompt": "0.00000018",
                    "completion": "0.00000059",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000018",
                    "openai:completion_tokens": "0.00000059"
                },
                "pricing_version_id": "bf29ccf8-e7d6-4fed-8e34-100d2a2172c4",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": "2026-02-04"
            }
        },
        {
            "slug": "stepfun-ai/step3",
            "hf_slug": "stepfun-ai/step3",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-08-28T21:09:35.282323+00:00",
            "hf_updated_at": null,
            "name": "StepFun: Step3",
            "short_name": "Step3",
            "author": "stepfun-ai",
            "description": "Step3 is a cutting-edge multimodal reasoning model—built on a Mixture-of-Experts architecture with 321B total parameters and 38B active. It is designed end-to-end to minimize decoding costs while delivering top-tier performance in vision–language reasoning. Through the co-design of Multi-Matrix Factorization Attention (MFA) and Attention-FFN Disaggregation (AFD), Step3 maintains exceptional efficiency across both flagship and low-end accelerators.",
            "model_version_group_id": null,
            "context_length": 65536,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "stepfun-ai/step3",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d07c4675-6f77-4783-b2ab-2123a5064d2c",
                "name": "SiliconFlow | stepfun-ai/step3",
                "context_length": 65536,
                "model": {
                    "slug": "stepfun-ai/step3",
                    "hf_slug": "stepfun-ai/step3",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-08-28T21:09:35.282323+00:00",
                    "hf_updated_at": null,
                    "name": "StepFun: Step3",
                    "short_name": "Step3",
                    "author": "stepfun-ai",
                    "description": "Step3 is a cutting-edge multimodal reasoning model—built on a Mixture-of-Experts architecture with 321B total parameters and 38B active. It is designed end-to-end to minimize decoding costs while delivering top-tier performance in vision–language reasoning. Through the co-design of Multi-Matrix Factorization Attention (MFA) and Attention-FFN Disaggregation (AFD), Step3 maintains exceptional efficiency across both flagship and low-end accelerators.",
                    "model_version_group_id": null,
                    "context_length": 65536,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "stepfun-ai/step3",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "stepfun-ai/step3",
                "model_variant_permaslug": "stepfun-ai/step3",
                "adapter_name": "SiliconFlowAdapter",
                "provider_name": "SiliconFlow",
                "provider_info": {
                    "name": "SiliconFlow",
                    "displayName": "SiliconFlow",
                    "slug": "siliconflow",
                    "baseUrl": "https://api.siliconflow.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                        "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "SiliconFlowAdapter",
                    "isMultipartSupported": false,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "/images/icons/SiliconFlow.svg"
                    },
                    "ignoredProviderModels": [
                        "inclusionAI/Ling-mini-2.0",
                        "inclusionAI/Ring-flash-2.0",
                        "inclusionAI/Ling-flash-2.0"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "SiliconFlow",
                "provider_slug": "siliconflow/fp8",
                "provider_model_id": "stepfun-ai/step3",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65536,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://docs.siliconflow.com/en/legals/terms-of-service",
                    "privacyPolicyURL": "https://docs.siliconflow.com/en/legals/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000057",
                    "completion": "0.00000142",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000057",
                    "openai:completion_tokens": "0.00000142"
                },
                "pricing_version_id": "691bbba1-c72e-4d5a-85f4-89fe9fe29f3b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-medium-3.1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-13T14:33:59.459114+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Medium 3.1",
            "short_name": "Mistral Medium 3.1",
            "author": "mistralai",
            "description": "Mistral Medium 3.1 is an updated version of Mistral Medium 3, which is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.\n\nThe model excels in domains such as coding, STEM reasoning, and enterprise adaptation. It supports hybrid, on-prem, and in-VPC deployments and is optimized for integration into custom workflows. Mistral Medium 3.1 offers competitive accuracy relative to larger models like Claude Sonnet 3.5/3.7, Llama 4 Maverick, and Command R+, while maintaining broad compatibility across cloud environments.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/mistral-medium-3.1",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "13c5002b-8c5b-490c-8a5f-52ec0242804f",
                "name": "Mistral | mistralai/mistral-medium-3.1",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/mistral-medium-3.1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-08-13T14:33:59.459114+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Medium 3.1",
                    "short_name": "Mistral Medium 3.1",
                    "author": "mistralai",
                    "description": "Mistral Medium 3.1 is an updated version of Mistral Medium 3, which is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.\n\nThe model excels in domains such as coding, STEM reasoning, and enterprise adaptation. It supports hybrid, on-prem, and in-VPC deployments and is optimized for integration into custom workflows. Mistral Medium 3.1 offers competitive accuracy relative to larger models like Claude Sonnet 3.5/3.7, Llama 4 Maverick, and Command R+, while maintaining broad compatibility across cloud environments.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/mistral-medium-3.1",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-medium-3.1",
                "model_variant_permaslug": "mistralai/mistral-medium-3.1",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "mistral-medium-2508",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000004",
                    "completion": "0.000002",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 4e-7,
                    "mistral:completion_tokens": 0.000002
                },
                "pricing_version_id": "2fd2a6a7-7579-4e66-88b2-3ff4e4d7e68d",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "baidu/ernie-4.5-vl-28b-a3b",
            "hf_slug": "baidu/ERNIE-4.5-VL-28B-A3B-PT",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-12T21:07:16.565993+00:00",
            "hf_updated_at": null,
            "name": "Baidu: ERNIE 4.5 VL 28B A3B",
            "short_name": "ERNIE 4.5 VL 28B A3B",
            "author": "baidu",
            "description": "A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneous MoE structure with modality-isolated routing. Built with scaling-efficient infrastructure for high-throughput training and inference, the model leverages advanced post-training techniques including SFT, DPO, and UPO for optimized performance, while supporting an impressive 131K context length and RLVR alignment for superior cross-modal reasoning and generation capabilities.",
            "model_version_group_id": null,
            "context_length": 30000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "baidu/ernie-4.5-vl-28b-a3b",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "75e64609-6b51-4e35-96ea-5065c6fbda63",
                "name": "Novita | baidu/ernie-4.5-vl-28b-a3b",
                "context_length": 30000,
                "model": {
                    "slug": "baidu/ernie-4.5-vl-28b-a3b",
                    "hf_slug": "baidu/ERNIE-4.5-VL-28B-A3B-PT",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-08-12T21:07:16.565993+00:00",
                    "hf_updated_at": null,
                    "name": "Baidu: ERNIE 4.5 VL 28B A3B",
                    "short_name": "ERNIE 4.5 VL 28B A3B",
                    "author": "baidu",
                    "description": "A powerful multimodal Mixture-of-Experts chat model featuring 28B total parameters with 3B activated per token, delivering exceptional text and vision understanding through its innovative heterogeneous MoE structure with modality-isolated routing. Built with scaling-efficient infrastructure for high-throughput training and inference, the model leverages advanced post-training techniques including SFT, DPO, and UPO for optimized performance, while supporting an impressive 131K context length and RLVR alignment for superior cross-modal reasoning and generation capabilities.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "baidu/ernie-4.5-vl-28b-a3b",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "baidu/ernie-4.5-vl-28b-a3b",
                "model_variant_permaslug": "baidu/ernie-4.5-vl-28b-a3b",
                "adapter_name": "NovitaAdapter",
                "provider_name": "Novita",
                "provider_info": {
                    "name": "Novita",
                    "displayName": "NovitaAI",
                    "slug": "novita",
                    "baseUrl": "https://api.novita.ai/v3/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P2zP0TCZwbzCC8QkH8m8o1i8M"
                    ],
                    "adapterName": "NovitaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.novita.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://novita.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "google/gemma-3-1b-it",
                        "baichuan/baichuan-m2-32b",
                        "baidu/ernie-4.5-0.3b",
                        "qwen/qwen-mt-plus",
                        "qwen/qwen3-4b-fp8",
                        "meta-llama/llama-3.2-1b-instruct",
                        "sophosympatheia/midnight-rose-70b",
                        "deepseek/deepseek-prover-v2-671b",
                        "Sao10K/L3-8B-Stheno-v3.2",
                        "thudm/glm-4-32b-0414",
                        "qwen/qwen3-omni-30b-a3b-thinking",
                        "qwen/qwen3-omni-30b-a3b-instruct",
                        "paddlepaddle/paddleocr-vl",
                        "deepseek/deepseek-ocr",
                        "skywork/r1v4-lite",
                        "baidu/ernie-4.5-vl-28b-a3b-thinking",
                        "zai-org/autoglm-phone-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NovitaAI",
                "provider_slug": "novita/fp16",
                "provider_model_id": "baidu/ernie-4.5-vl-28b-a3b",
                "quantization": "fp16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000014",
                    "completion": "0.00000056",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000014",
                    "openai:completion_tokens": "0.00000056"
                },
                "pricing_version_id": "2b814f58-4fa0-4308-ae26-03d5ed15732f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "z-ai/glm-4.5v",
            "hf_slug": "zai-org/GLM-4.5V",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-11T14:24:48.340676+00:00",
            "hf_updated_at": null,
            "name": "Z.AI: GLM 4.5V",
            "short_name": "GLM 4.5V",
            "author": "z-ai",
            "description": "GLM-4.5V is a vision-language foundation model for multimodal agent applications. Built on a Mixture-of-Experts (MoE) architecture with 106B parameters and 12B activated parameters, it achieves state-of-the-art results in video understanding, image Q&A, OCR, and document parsing, with strong gains in front-end web coding, grounding, and spatial reasoning. It offers a hybrid inference mode: a \"thinking mode\" for deep reasoning and a \"non-thinking mode\" for fast responses. Reasoning behavior can be toggled via the `reasoning` `enabled` boolean. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#enable-reasoning-with-default-config)",
            "model_version_group_id": null,
            "context_length": 65536,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "z-ai/glm-4.5v",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.75,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "30f10717-f218-430f-a3d7-858bf5fdf303",
                "name": "Novita | z-ai/glm-4.5v",
                "context_length": 65536,
                "model": {
                    "slug": "z-ai/glm-4.5v",
                    "hf_slug": "zai-org/GLM-4.5V",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-08-11T14:24:48.340676+00:00",
                    "hf_updated_at": null,
                    "name": "Z.AI: GLM 4.5V",
                    "short_name": "GLM 4.5V",
                    "author": "z-ai",
                    "description": "GLM-4.5V is a vision-language foundation model for multimodal agent applications. Built on a Mixture-of-Experts (MoE) architecture with 106B parameters and 12B activated parameters, it achieves state-of-the-art results in video understanding, image Q&A, OCR, and document parsing, with strong gains in front-end web coding, grounding, and spatial reasoning. It offers a hybrid inference mode: a \"thinking mode\" for deep reasoning and a \"non-thinking mode\" for fast responses. Reasoning behavior can be toggled via the `reasoning` `enabled` boolean. [Learn more in our docs](https://openrouter.ai/docs/use-cases/reasoning-tokens#enable-reasoning-with-default-config)",
                    "model_version_group_id": null,
                    "context_length": 65536,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "z-ai/glm-4.5v",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.75,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "z-ai/glm-4.5v",
                "model_variant_permaslug": "z-ai/glm-4.5v",
                "adapter_name": "NovitaAdapter",
                "provider_name": "Novita",
                "provider_info": {
                    "name": "Novita",
                    "displayName": "NovitaAI",
                    "slug": "novita",
                    "baseUrl": "https://api.novita.ai/v3/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P2zP0TCZwbzCC8QkH8m8o1i8M"
                    ],
                    "adapterName": "NovitaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.novita.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://novita.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "google/gemma-3-1b-it",
                        "baichuan/baichuan-m2-32b",
                        "baidu/ernie-4.5-0.3b",
                        "qwen/qwen-mt-plus",
                        "qwen/qwen3-4b-fp8",
                        "meta-llama/llama-3.2-1b-instruct",
                        "sophosympatheia/midnight-rose-70b",
                        "deepseek/deepseek-prover-v2-671b",
                        "Sao10K/L3-8B-Stheno-v3.2",
                        "thudm/glm-4-32b-0414",
                        "qwen/qwen3-omni-30b-a3b-thinking",
                        "qwen/qwen3-omni-30b-a3b-instruct",
                        "paddlepaddle/paddleocr-vl",
                        "deepseek/deepseek-ocr",
                        "skywork/r1v4-lite",
                        "baidu/ernie-4.5-vl-28b-a3b-thinking",
                        "zai-org/autoglm-phone-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NovitaAI",
                "provider_slug": "novita/fp8",
                "provider_model_id": "zai-org/glm-4.5v",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000006",
                    "completion": "0.0000018",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0.00000011",
                    "input_cache_write": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000006",
                    "openai:completion_tokens": "0.0000018",
                    "openai:cached_prompt_tokens": "0.00000011"
                },
                "pricing_version_id": "e6847a35-8151-4bb4-893d-caa884086509",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-chat",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-07T17:30:37.42514+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Chat",
            "short_name": "GPT-5 Chat",
            "author": "openai",
            "description": "GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "file",
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-chat-2025-08-07",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "8f8398f5-523f-4676-8ba4-e82e3484efb1",
                "name": "OpenAI | openai/gpt-5-chat-2025-08-07",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-5-chat",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-08-07T17:30:37.42514+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Chat",
                    "short_name": "GPT-5 Chat",
                    "author": "openai",
                    "description": "GPT-5 Chat is designed for advanced, natural, multimodal, and context-aware conversations for enterprise applications.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "file",
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-chat-2025-08-07",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-chat",
                "model_variant_permaslug": "openai/gpt-5-chat-2025-08-07",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-chat-latest",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "3895cfdc-b31b-4b8e-b29a-e5b9d384a71e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-08-07T17:23:33+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5",
            "short_name": "GPT-5",
            "author": "openai",
            "description": "GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-2025-08-07",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "openai/discounted",
                "openai/default",
                "azure"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "7c2f859a-7890-4e8e-b1de-1cd1c0a800b4",
                "name": "OpenAI | openai/gpt-5-2025-08-07",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-08-07T17:23:33+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5",
                    "short_name": "GPT-5",
                    "author": "openai",
                    "description": "GPT-5 is OpenAI’s most advanced model, offering major improvements in reasoning, code quality, and user experience. It is optimized for complex tasks that require step-by-step reasoning, instruction following, and accuracy in high-stakes use cases. It supports test-time routing features and advanced prompt understanding, including user-specified intent like \"think hard about this.\" Improvements include reductions in hallucination, sycophancy, and better performance in coding, writing, and health-related tasks.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": "",
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-2025-08-07",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "openai/discounted",
                        "openai/default",
                        "azure"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5",
                "model_variant_permaslug": "openai/gpt-5-2025-08-07",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai/default",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai/default",
                "provider_model_id": "gpt-5-2025-08-07",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "input_cache_read": "0.000000125",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00000125,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00001,
                    "openai_responses:cached_prompt_tokens": 1.25e-7
                },
                "pricing_version_id": "c6d64142-2e88-4d34-8469-6b1dd34b407a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-mini",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-08-07T17:23:27+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Mini",
            "short_name": "GPT-5 Mini",
            "author": "openai",
            "description": "GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks. It provides the same instruction-following and safety-tuning benefits as GPT-5, but with reduced latency and cost. GPT-5 Mini is the successor to OpenAI's o4-mini model.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-mini-2025-08-07",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "c4f66d01-20b0-4c27-a225-438ea22fda43",
                "name": "OpenAI | openai/gpt-5-mini-2025-08-07",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-mini",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-08-07T17:23:27+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Mini",
                    "short_name": "GPT-5 Mini",
                    "author": "openai",
                    "description": "GPT-5 Mini is a compact version of GPT-5, designed to handle lighter-weight reasoning tasks. It provides the same instruction-following and safety-tuning benefits as GPT-5, but with reduced latency and cost. GPT-5 Mini is the successor to OpenAI's o4-mini model.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-mini-2025-08-07",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-mini",
                "model_variant_permaslug": "openai/gpt-5-mini-2025-08-07",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-mini-2025-08-07",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000025",
                    "completion": "0.000002",
                    "input_cache_read": "0.000000025",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 2.5e-7,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000002,
                    "openai_responses:cached_prompt_tokens": 2.5e-8
                },
                "pricing_version_id": "e3e873c5-5dc5-476b-9720-a23c7d318945",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-5-nano",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-08-07T17:23:22+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-5 Nano",
            "short_name": "GPT-5 Nano",
            "author": "openai",
            "description": "GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments. While limited in reasoning depth compared to its larger counterparts, it retains key instruction-following and safety features. It is the successor to GPT-4.1-nano and offers a lightweight option for cost-sensitive or real-time applications.",
            "model_version_group_id": null,
            "context_length": 400000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-5-nano-2025-08-07",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "50329d77-04e1-4979-a184-c33030289476",
                "name": "OpenAI | openai/gpt-5-nano-2025-08-07",
                "context_length": 400000,
                "model": {
                    "slug": "openai/gpt-5-nano",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-08-07T17:23:22+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-5 Nano",
                    "short_name": "GPT-5 Nano",
                    "author": "openai",
                    "description": "GPT-5-Nano is the smallest and fastest variant in the GPT-5 system, optimized for developer tools, rapid interactions, and ultra-low latency environments. While limited in reasoning depth compared to its larger counterparts, it retains key instruction-following and safety features. It is the successor to GPT-4.1-nano and offers a lightweight option for cost-sensitive or real-time applications.",
                    "model_version_group_id": null,
                    "context_length": 400000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-5-nano-2025-08-07",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-5-nano",
                "model_variant_permaslug": "openai/gpt-5-nano-2025-08-07",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-5-nano-2025-08-07",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": 272000,
                "max_completion_tokens": 128000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000005",
                    "completion": "0.0000004",
                    "input_cache_read": "0.000000005",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 5e-8,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 4e-7,
                    "openai_responses:cached_prompt_tokens": 5e-9
                },
                "pricing_version_id": "ea868e66-5993-4315-9540-a5f7cd5d9d07",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_implicit_caching": true,
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-opus-4.1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-05T16:33:11.634562+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Opus 4.1",
            "short_name": "Claude Opus 4.1",
            "author": "anthropic",
            "description": "Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic tasks. It achieves 74.5% on SWE-bench Verified and shows notable gains in multi-file code refactoring, debugging precision, and detail-oriented reasoning. The model supports extended thinking up to 64K tokens and is optimized for tasks involving research, data analysis, and tool-assisted reasoning.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4.1-opus-20250805",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ece5c3c6-e437-4297-92fc-150a1771ec56",
                "name": "Amazon Bedrock | anthropic/claude-4.1-opus-20250805",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-opus-4.1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-08-05T16:33:11.634562+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Opus 4.1",
                    "short_name": "Claude Opus 4.1",
                    "author": "anthropic",
                    "description": "Claude Opus 4.1 is an updated version of Anthropic’s flagship model, offering improved performance in coding, reasoning, and agentic tasks. It achieves 74.5% on SWE-bench Verified and shows notable gains in multi-file code refactoring, debugging precision, and detail-oriented reasoning. The model supports extended thinking up to 64K tokens and is optimized for tasks involving research, data analysis, and tool-assisted reasoning.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4.1-opus-20250805",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-opus-4.1",
                "model_variant_permaslug": "anthropic/claude-4.1-opus-20250805",
                "adapter_name": "AmazonBedrockInvokeAnthropicAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.anthropic.claude-opus-4-1-20250805-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.000015",
                    "completion": "0.000075",
                    "input_cache_read": "0.0000015",
                    "input_cache_write": "0.00001875",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000015,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 0.0000015,
                    "anthropic:completion_tokens": 0.000075,
                    "anthropic:cache_write_1h_tokens": 0.00003,
                    "anthropic:cache_write_5m_tokens": 0.00001875
                },
                "pricing_version_id": "ce33ad08-2e47-4675-9bac-0d5dbf2173f3",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "bytedance/ui-tars-1.5-7b",
            "hf_slug": "ByteDance-Seed/UI-TARS-1.5-7B",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-07-22T17:24:16.94785+00:00",
            "hf_updated_at": null,
            "name": "ByteDance: UI-TARS 7B ",
            "short_name": "UI-TARS 7B ",
            "author": "bytedance",
            "description": "UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games. Built by ByteDance, it builds upon the UI-TARS framework with reinforcement learning-based reasoning, enabling robust action planning and execution across virtual interfaces.\n\nThis model achieves state-of-the-art results on a range of interactive and grounding benchmarks, including OSworld, WebVoyager, AndroidWorld, and ScreenSpot. It also demonstrates perfect task completion across diverse Poki games and outperforms prior models in Minecraft agent tasks. UI-TARS-1.5 supports thought decomposition during inference and shows strong scaling across variants, with the 1.5 version notably exceeding the performance of earlier 72B and 7B checkpoints.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "bytedance/ui-tars-1.5-7b",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "22a474a1-cb4e-42d2-b19a-c1be103f5abd",
                "name": "Parasail | bytedance/ui-tars-1.5-7b",
                "context_length": 128000,
                "model": {
                    "slug": "bytedance/ui-tars-1.5-7b",
                    "hf_slug": "ByteDance-Seed/UI-TARS-1.5-7B",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-07-22T17:24:16.94785+00:00",
                    "hf_updated_at": null,
                    "name": "ByteDance: UI-TARS 7B ",
                    "short_name": "UI-TARS 7B ",
                    "author": "bytedance",
                    "description": "UI-TARS-1.5 is a multimodal vision-language agent optimized for GUI-based environments, including desktop interfaces, web browsers, mobile systems, and games. Built by ByteDance, it builds upon the UI-TARS framework with reinforcement learning-based reasoning, enabling robust action planning and execution across virtual interfaces.\n\nThis model achieves state-of-the-art results on a range of interactive and grounding benchmarks, including OSworld, WebVoyager, AndroidWorld, and ScreenSpot. It also demonstrates perfect task completion across diverse Poki games and outperforms prior models in Minecraft agent tasks. UI-TARS-1.5 supports thought decomposition during inference and shows strong scaling across variants, with the 1.5 version notably exceeding the performance of earlier 72B and 7B checkpoints.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "bytedance/ui-tars-1.5-7b",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "bytedance/ui-tars-1.5-7b",
                "model_variant_permaslug": "bytedance/ui-tars-1.5-7b",
                "adapter_name": "ParasailAdapter",
                "provider_name": "Parasail",
                "provider_info": {
                    "name": "Parasail",
                    "displayName": "Parasail",
                    "slug": "parasail",
                    "baseUrl": "https://api.parasail.io/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.parasail.io/legal/terms",
                        "privacyPolicyURL": "https://www.parasail.io/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P5Ca01in28Ek1oxb5OtfZdEjQ",
                        "user_37qaJKhqfUEFgVF46sarwDHxE50"
                    ],
                    "adapterName": "ParasailAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.parasail.io/&size=256"
                    },
                    "ignoredProviderModels": [
                        "parasail-olmo-2-1124-7b-instruct",
                        "parasail-qwen3-omni-30b-a3b-thinking",
                        "parasail-qwen3-omni-30b-a3b-instruct",
                        "parasail-dots-ocr",
                        "parasail-auto-glm-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Parasail",
                "provider_slug": "parasail/bf16",
                "provider_model_id": "parasail-ui-tars-1p5-7b",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 2048,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "seed",
                    "stop",
                    "top_k",
                    "logit_bias"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.parasail.io/legal/terms",
                    "privacyPolicyURL": "https://www.parasail.io/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000002",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000001",
                    "openai:completion_tokens": "0.0000002"
                },
                "pricing_version_id": "1b8708ef-a746-47f0-9c63-2fb0a1367dab",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-flash-lite",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-07-22T16:04:36.283638+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash Lite",
            "short_name": "Gemini 2.5 Flash Lite",
            "author": "google",
            "description": "Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance across common benchmarks compared to earlier Flash models. By default, \"thinking\" (i.e. multi-pass reasoning) is disabled to prioritize speed, but developers can enable it via the [Reasoning API parameter](https://openrouter.ai/docs/use-cases/reasoning-tokens) to selectively trade off cost for intelligence. ",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash-lite",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ebdbef25-737d-4ac3-9e98-fd3928724e45",
                "name": "Google | google/gemini-2.5-flash-lite",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-flash-lite",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-07-22T16:04:36.283638+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Flash Lite",
                    "short_name": "Gemini 2.5 Flash Lite",
                    "author": "google",
                    "description": "Gemini 2.5 Flash-Lite is a lightweight reasoning model in the Gemini 2.5 family, optimized for ultra-low latency and cost efficiency. It offers improved throughput, faster token generation, and better performance across common benchmarks compared to earlier Flash models. By default, \"thinking\" (i.e. multi-pass reasoning) is disabled to prioritize speed, but developers can enable it via the [Reasoning API parameter](https://openrouter.ai/docs/use-cases/reasoning-tokens) to selectively trade off cost for intelligence. ",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-flash-lite",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-flash-lite",
                "model_variant_permaslug": "google/gemini-2.5-flash-lite",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.5-flash-lite",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000004",
                    "image": "0.0000001",
                    "audio": "0.0000003",
                    "input_audio_cache": "0.00000003",
                    "input_cache_read": "0.00000001",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000004",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 1e-7,
                    "gemini:reasoning_tokens": 4e-7,
                    "gemini:cache_read_tokens": 1e-8,
                    "gemini:completion_tokens": 4e-7,
                    "gemini:text_input_tokens": 1e-7,
                    "gemini:audio_input_tokens": 3e-7,
                    "gemini:image_input_tokens": 1e-7,
                    "gemini:video_input_tokens": 1e-7,
                    "gemini:cache_read_text_tokens": 1e-8,
                    "gemini:cache_read_audio_tokens": 3e-8,
                    "gemini:cache_read_image_tokens": 1e-8,
                    "gemini:cache_read_video_tokens": 1e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 3e-8,
                    "gemini:cache_read_text_tokens_high_context": 3e-8,
                    "gemini:cache_read_audio_tokens_high_context": 6e-8,
                    "gemini:cache_read_image_tokens_high_context": 3e-8,
                    "gemini:cache_read_video_tokens_high_context": 3e-8,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "ca89601f-77de-41b0-b355-c79b0503e789",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "x-ai/grok-4",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-07-09T19:01:29.595463+00:00",
            "hf_updated_at": null,
            "name": "xAI: Grok 4",
            "short_name": "Grok 4",
            "author": "x-ai",
            "description": "Grok 4 is xAI's latest reasoning model with a 256k context window. It supports parallel tool calling, structured outputs, and both image and text inputs. Note that reasoning is not exposed, reasoning cannot be disabled, and the reasoning effort cannot be specified. Pricing increases once the total tokens in a given request is greater than 128k tokens. See more details on the [xAI docs](https://docs.x.ai/docs/models/grok-4-0709)",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Grok",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "x-ai/grok-4-07-09",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d40bef9d-6936-4c57-9749-bf7399de4a77",
                "name": "xAI | x-ai/grok-4-07-09",
                "context_length": 256000,
                "model": {
                    "slug": "x-ai/grok-4",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-07-09T19:01:29.595463+00:00",
                    "hf_updated_at": null,
                    "name": "xAI: Grok 4",
                    "short_name": "Grok 4",
                    "author": "x-ai",
                    "description": "Grok 4 is xAI's latest reasoning model with a 256k context window. It supports parallel tool calling, structured outputs, and both image and text inputs. Note that reasoning is not exposed, reasoning cannot be disabled, and the reasoning effort cannot be specified. Pricing increases once the total tokens in a given request is greater than 128k tokens. See more details on the [xAI docs](https://docs.x.ai/docs/models/grok-4-0709)",
                    "model_version_group_id": null,
                    "context_length": 256000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Grok",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "x-ai/grok-4-07-09",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "x-ai/grok-4",
                "model_variant_permaslug": "x-ai/grok-4-07-09",
                "adapter_name": "XAIResponsesAdapter",
                "provider_name": "xAI",
                "provider_info": {
                    "name": "xAI",
                    "displayName": "xAI",
                    "slug": "xai",
                    "baseUrl": "https://api.x.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                        "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "XAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.x.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://x.ai/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "xAI",
                "provider_slug": "xai",
                "provider_model_id": "grok-4-0709",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "logprobs",
                    "top_logprobs",
                    "response_format",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://x.ai/legal/terms-of-service-enterprise",
                    "privacyPolicyURL": "https://x.ai/legal/privacy-policy",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "image": "0",
                    "request": "0",
                    "input_cache_read": "0.00000075",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 128000,
                        "prompt": "0.000006",
                        "completions": "0.00003",
                        "input_cache_read": "0.00000075"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "baidu/ernie-4.5-vl-424b-a47b",
            "hf_slug": "baidu/ERNIE-4.5-VL-424B-A47B-PT",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-06-30T16:28:23.022047+00:00",
            "hf_updated_at": null,
            "name": "Baidu: ERNIE 4.5 VL 424B A47B ",
            "short_name": "ERNIE 4.5 VL 424B A47B ",
            "author": "baidu",
            "description": "ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token. It is trained jointly on text and image data using a heterogeneous MoE architecture and modality-isolated routing to enable high-fidelity cross-modal reasoning, image understanding, and long-context generation (up to 131k tokens). Fine-tuned with techniques like SFT, DPO, UPO, and RLVR, this model supports both “thinking” and non-thinking inference modes. Designed for vision-language tasks in English and Chinese, it is optimized for efficient scaling and can operate under 4-bit/8-bit quantization.",
            "model_version_group_id": null,
            "context_length": 123000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "baidu/ernie-4.5-vl-424b-a47b",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "1fe59382-263d-4107-a768-d7d2007bd3b6",
                "name": "Novita | baidu/ernie-4.5-vl-424b-a47b",
                "context_length": 123000,
                "model": {
                    "slug": "baidu/ernie-4.5-vl-424b-a47b",
                    "hf_slug": "baidu/ERNIE-4.5-VL-424B-A47B-PT",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-06-30T16:28:23.022047+00:00",
                    "hf_updated_at": null,
                    "name": "Baidu: ERNIE 4.5 VL 424B A47B ",
                    "short_name": "ERNIE 4.5 VL 424B A47B ",
                    "author": "baidu",
                    "description": "ERNIE-4.5-VL-424B-A47B is a multimodal Mixture-of-Experts (MoE) model from Baidu’s ERNIE 4.5 series, featuring 424B total parameters with 47B active per token. It is trained jointly on text and image data using a heterogeneous MoE architecture and modality-isolated routing to enable high-fidelity cross-modal reasoning, image understanding, and long-context generation (up to 131k tokens). Fine-tuned with techniques like SFT, DPO, UPO, and RLVR, this model supports both “thinking” and non-thinking inference modes. Designed for vision-language tasks in English and Chinese, it is optimized for efficient scaling and can operate under 4-bit/8-bit quantization.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "baidu/ernie-4.5-vl-424b-a47b",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>",
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>",
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "baidu/ernie-4.5-vl-424b-a47b",
                "model_variant_permaslug": "baidu/ernie-4.5-vl-424b-a47b",
                "adapter_name": "NovitaAdapter",
                "provider_name": "Novita",
                "provider_info": {
                    "name": "Novita",
                    "displayName": "NovitaAI",
                    "slug": "novita",
                    "baseUrl": "https://api.novita.ai/v3/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                        "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "org_34P2zP0TCZwbzCC8QkH8m8o1i8M"
                    ],
                    "adapterName": "NovitaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.novita.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://novita.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "google/gemma-3-1b-it",
                        "baichuan/baichuan-m2-32b",
                        "baidu/ernie-4.5-0.3b",
                        "qwen/qwen-mt-plus",
                        "qwen/qwen3-4b-fp8",
                        "meta-llama/llama-3.2-1b-instruct",
                        "sophosympatheia/midnight-rose-70b",
                        "deepseek/deepseek-prover-v2-671b",
                        "Sao10K/L3-8B-Stheno-v3.2",
                        "thudm/glm-4-32b-0414",
                        "qwen/qwen3-omni-30b-a3b-thinking",
                        "qwen/qwen3-omni-30b-a3b-instruct",
                        "paddlepaddle/paddleocr-vl",
                        "deepseek/deepseek-ocr",
                        "skywork/r1v4-lite",
                        "baidu/ernie-4.5-vl-28b-a3b-thinking",
                        "zai-org/autoglm-phone-9b-multilingual"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "NovitaAI",
                "provider_slug": "novita/fp16",
                "provider_model_id": "baidu/ernie-4.5-vl-424b-a47b",
                "quantization": "fp16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://novita.ai/legal/terms-of-service",
                    "privacyPolicyURL": "https://novita.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000042",
                    "completion": "0.00000125",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000042",
                    "openai:completion_tokens": "0.00000125"
                },
                "pricing_version_id": "e58a9bae-ceb6-44a8-be53-c128c4e5511c",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": false,
                        "structured_outputs": false
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-small-3.2-24b-instruct",
            "hf_slug": "mistralai/Mistral-Small-3.2-24B-Instruct-2506",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-06-20T18:10:16.960494+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Small 3.2 24B",
            "short_name": "Mistral Small 3.2 24B",
            "author": "mistralai",
            "description": "Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling. Compared to the 3.1 release, version 3.2 significantly improves accuracy on WildBench and Arena Hard, reduces infinite generations, and delivers gains in tool use and structured output tasks.\n\nIt supports image and text inputs with structured outputs, function/tool calling, and strong performance across coding (HumanEval+, MBPP), STEM (MMLU, MATH, GPQA), and vision benchmarks (ChartQA, DocVQA).",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/mistral-small-3.2-24b-instruct-2506",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a19c2a4a-f3dc-451f-ae9f-07ae51a6b234",
                "name": "Chutes | mistralai/mistral-small-3.2-24b-instruct-2506",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/mistral-small-3.2-24b-instruct",
                    "hf_slug": "mistralai/Mistral-Small-3.2-24B-Instruct-2506",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-06-20T18:10:16.960494+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Small 3.2 24B",
                    "short_name": "Mistral Small 3.2 24B",
                    "author": "mistralai",
                    "description": "Mistral-Small-3.2-24B-Instruct-2506 is an updated 24B parameter model from Mistral optimized for instruction following, repetition reduction, and improved function calling. Compared to the 3.1 release, version 3.2 significantly improves accuracy on WildBench and Arena Hard, reduces infinite generations, and delivers gains in tool use and structured output tasks.\n\nIt supports image and text inputs with structured outputs, function/tool calling, and strong performance across coding (HumanEval+, MBPP), STEM (MMLU, MATH, GPQA), and vision benchmarks (ChartQA, DocVQA).",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/mistral-small-3.2-24b-instruct-2506",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-small-3.2-24b-instruct",
                "model_variant_permaslug": "mistralai/mistral-small-3.2-24b-instruct-2506",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "chutesai/Mistral-Small-3.2-24B-Instruct-2506",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 131072,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "structured_outputs",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000006",
                    "completion": "0.00000018",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000006",
                    "openai:completion_tokens": "0.00000018"
                },
                "pricing_version_id": "1d6d5961-adba-4451-802e-a5184f1d881a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-flash",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-06-17T15:01:28.103313+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash",
            "short_name": "Gemini 2.5 Flash",
            "author": "google",
            "description": "Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in \"thinking\" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling. \n\nAdditionally, Gemini 2.5 Flash is configurable through the \"max tokens for reasoning\" parameter, as described in the documentation (https://openrouter.ai/docs/use-cases/reasoning-tokens#max-tokens-for-reasoning).",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "file",
                "image",
                "text",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "b9b095f0-6448-46bb-8e4c-0111ba2bf1b0",
                "name": "Google | google/gemini-2.5-flash",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-flash",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-06-17T15:01:28.103313+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Flash",
                    "short_name": "Gemini 2.5 Flash",
                    "author": "google",
                    "description": "Gemini 2.5 Flash is Google's state-of-the-art workhorse model, specifically designed for advanced reasoning, coding, mathematics, and scientific tasks. It includes built-in \"thinking\" capabilities, enabling it to provide responses with greater accuracy and nuanced context handling. \n\nAdditionally, Gemini 2.5 Flash is configurable through the \"max tokens for reasoning\" parameter, as described in the documentation (https://openrouter.ai/docs/use-cases/reasoning-tokens#max-tokens-for-reasoning).",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "file",
                        "image",
                        "text",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-flash",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-flash",
                "model_variant_permaslug": "google/gemini-2.5-flash",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex (Global)",
                    "slug": "google-vertex/global",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex (Global)",
                "provider_slug": "google-vertex/global",
                "provider_model_id": "gemini-2.5-flash",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000003",
                    "completion": "0.0000025",
                    "image": "0.0000003",
                    "audio": "0.000001",
                    "input_audio_cache": "0.0000001",
                    "input_cache_read": "0.00000003",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000025",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 3e-7,
                    "gemini:reasoning_tokens": 0.0000025,
                    "gemini:cache_read_tokens": 3e-8,
                    "gemini:completion_tokens": 0.0000025,
                    "gemini:text_input_tokens": 3e-7,
                    "gemini:audio_input_tokens": 0.000001,
                    "gemini:image_input_tokens": 3e-7,
                    "gemini:video_input_tokens": 3e-7,
                    "gemini:cache_read_text_tokens": 3e-8,
                    "gemini:cache_read_audio_tokens": 1e-7,
                    "gemini:cache_read_image_tokens": 3e-8,
                    "gemini:cache_read_video_tokens": 3e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 1e-7,
                    "gemini:cache_read_text_tokens_high_context": 1e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2e-7,
                    "gemini:cache_read_image_tokens_high_context": 1e-7,
                    "gemini:cache_read_video_tokens_high_context": 1e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "797f6b33-5ecc-4010-bdf0-d1db8d4d4c00",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-pro",
            "hf_slug": "",
            "updated_at": "2026-01-08T23:55:54.79011+00:00",
            "created_at": "2025-06-17T14:12:24+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Pro",
            "short_name": "Gemini 2.5 Pro",
            "author": "google",
            "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-pro",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_max_tokens": null,
                "supported_reasoning_efforts": null,
                "default_reasoning_effort": null,
                "default_reasoning_enabled": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_max_tokens": null,
                    "supported_reasoning_efforts": null,
                    "default_reasoning_effort": null,
                    "default_reasoning_enabled": null
                },
                "chat_template_config": {
                    "should_hoist_and_merge_system_messages": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "43106252-bd69-498f-84f5-1fde678783f7",
                "name": "Google | google/gemini-2.5-pro",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-pro",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T23:55:54.79011+00:00",
                    "created_at": "2025-06-17T14:12:24+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Pro",
                    "short_name": "Gemini 2.5 Pro",
                    "author": "google",
                    "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-pro",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_max_tokens": null,
                        "supported_reasoning_efforts": null,
                        "default_reasoning_effort": null,
                        "default_reasoning_enabled": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_max_tokens": null,
                            "supported_reasoning_efforts": null,
                            "default_reasoning_effort": null,
                            "default_reasoning_enabled": null
                        },
                        "chat_template_config": {
                            "should_hoist_and_merge_system_messages": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-pro",
                "model_variant_permaslug": "google/gemini-2.5-pro",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex (Global)",
                    "slug": "google-vertex/global",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex (Global)",
                "provider_slug": "google-vertex/global",
                "provider_model_id": "gemini-2.5-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65536,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "image": "0.00000125",
                    "audio": "0.00000125",
                    "input_audio_cache": "0.000000125",
                    "input_cache_read": "0.000000125",
                    "input_cache_write": "0.000000375",
                    "internal_reasoning": "0.00001",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.0000025",
                        "completions": "0.000015",
                        "input_cache_read": "0.00000025",
                        "input_cache_write": "0.00000075"
                    }
                ],
                "pricing_json": {
                    "gemini:prompt_tokens": 0.00000125,
                    "gemini:reasoning_tokens": 0.00001,
                    "gemini:cache_read_tokens": 1.25e-7,
                    "gemini:completion_tokens": 0.00001,
                    "gemini:text_input_tokens": 0.00000125,
                    "gemini:audio_input_tokens": 0.00000125,
                    "gemini:image_input_tokens": 0.00000125,
                    "gemini:video_input_tokens": 0.00000125,
                    "gemini:cache_read_text_tokens": 1.25e-7,
                    "gemini:cache_read_audio_tokens": 1.25e-7,
                    "gemini:cache_read_image_tokens": 1.25e-7,
                    "gemini:cache_read_video_tokens": 1.25e-7,
                    "gemini:cache_write_storage_hours": 0.0000045,
                    "gemini:prompt_tokens_high_context": 0.0000025,
                    "gemini:reasoning_tokens_high_context": 0.000015,
                    "gemini:cache_read_tokens_high_context": 2.5e-7,
                    "gemini:completion_tokens_high_context": 0.000015,
                    "gemini:cache_read_text_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_image_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_video_tokens_high_context": 2.5e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "30d9e9ac-2660-46f4-8467-957c8615eb9a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": 300,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true,
                    "supports_input_audio": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o3-pro",
            "hf_slug": "",
            "updated_at": "2026-01-14T02:46:50.629344+00:00",
            "created_at": "2025-06-10T23:32:32.266087+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o3 Pro",
            "short_name": "o3 Pro",
            "author": "openai",
            "description": "The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o3-pro model uses more compute to think harder and provide consistently better answers.\n\nNote that BYOK is required for this model. Set up here: https://openrouter.ai/settings/integrations",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "file",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o3-pro-2025-06-10",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "b8222376-66ee-4b89-a7c9-e627ba35db79",
                "name": "OpenAI | openai/o3-pro-2025-06-10",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o3-pro",
                    "hf_slug": "",
                    "updated_at": "2026-01-14T02:46:50.629344+00:00",
                    "created_at": "2025-06-10T23:32:32.266087+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o3 Pro",
                    "short_name": "o3 Pro",
                    "author": "openai",
                    "description": "The o-series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o3-pro model uses more compute to think harder and provide consistently better answers.\n\nNote that BYOK is required for this model. Set up here: https://openrouter.ai/settings/integrations",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "file",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o3-pro-2025-06-10",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o3-pro",
                "model_variant_permaslug": "openai/o3-pro-2025-06-10",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o3-pro-2025-06-10",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00002",
                    "completion": "0.00008",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00002,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.00008
                },
                "pricing_version_id": "1f6bd1f8-e039-4a39-818c-0c098678cc9b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-pro-preview",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-06-05T15:27:37.538116+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Pro Preview 06-05",
            "short_name": "Gemini 2.5 Pro Preview 06-05",
            "author": "google",
            "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.\n",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "file",
                "image",
                "text",
                "audio"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-pro-preview-06-05",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "018040ae-9cda-43cd-8813-d8ca83f6c7ed",
                "name": "Google | google/gemini-2.5-pro-preview-06-05",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-pro-preview",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-06-05T15:27:37.538116+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Pro Preview 06-05",
                    "short_name": "Gemini 2.5 Pro Preview 06-05",
                    "author": "google",
                    "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.\n",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "file",
                        "image",
                        "text",
                        "audio"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-pro-preview-06-05",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-pro-preview",
                "model_variant_permaslug": "google/gemini-2.5-pro-preview-06-05",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.5-pro-preview-06-05",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65536,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "image": "0.00000125",
                    "audio": "0.00000125",
                    "input_audio_cache": "0.000000125",
                    "input_cache_read": "0.000000125",
                    "input_cache_write": "0.000000375",
                    "internal_reasoning": "0.00001",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.0000025",
                        "completions": "0.000015",
                        "input_cache_read": "0.000000625",
                        "input_cache_write": "0.00000075"
                    }
                ],
                "pricing_json": {
                    "gemini:prompt_tokens": 0.00000125,
                    "gemini:reasoning_tokens": 0.00001,
                    "gemini:cache_read_tokens": 1.25e-7,
                    "gemini:completion_tokens": 0.00001,
                    "gemini:text_input_tokens": 0.00000125,
                    "gemini:audio_input_tokens": 0.00000125,
                    "gemini:image_input_tokens": 0.00000125,
                    "gemini:video_input_tokens": 0.00000125,
                    "gemini:cache_read_text_tokens": 1.25e-7,
                    "gemini:cache_read_audio_tokens": 1.25e-7,
                    "gemini:cache_read_image_tokens": 1.25e-7,
                    "gemini:cache_read_video_tokens": 1.25e-7,
                    "gemini:cache_write_storage_hours": 0.0000045,
                    "gemini:prompt_tokens_high_context": 0.0000025,
                    "gemini:reasoning_tokens_high_context": 0.000015,
                    "gemini:cache_read_tokens_high_context": 2.5e-7,
                    "gemini:completion_tokens_high_context": 0.000015,
                    "gemini:cache_read_text_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_image_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_video_tokens_high_context": 2.5e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "5e816caa-530e-4a3d-be95-5a26323e7b48",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": "global",
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-opus-4",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-05-22T16:27:25.029961+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Opus 4",
            "short_name": "Claude Opus 4",
            "author": "anthropic",
            "description": "Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows. It sets new benchmarks in software engineering, achieving leading results on SWE-bench (72.5%) and Terminal-bench (43.2%). Opus 4 supports extended, agentic workflows, handling thousands of task steps continuously for hours without degradation. \n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-4)",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4-opus-20250522",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a1d11e23-4e05-42cf-9fa3-6cacdb8d384a",
                "name": "Amazon Bedrock | anthropic/claude-4-opus-20250522",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-opus-4",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-05-22T16:27:25.029961+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Opus 4",
                    "short_name": "Claude Opus 4",
                    "author": "anthropic",
                    "description": "Claude Opus 4 is benchmarked as the world’s best coding model, at time of release, bringing sustained performance on complex, long-running tasks and agent workflows. It sets new benchmarks in software engineering, achieving leading results on SWE-bench (72.5%) and Terminal-bench (43.2%). Opus 4 supports extended, agentic workflows, handling thousands of task steps continuously for hours without degradation. \n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-4)",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4-opus-20250522",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-opus-4",
                "model_variant_permaslug": "anthropic/claude-4-opus-20250522",
                "adapter_name": "AmazonBedrockInvokeAnthropicAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.anthropic.claude-opus-4-20250514-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.000015",
                    "completion": "0.000075",
                    "input_cache_read": "0.0000015",
                    "input_cache_write": "0.00001875",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000015,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 0.0000015,
                    "anthropic:completion_tokens": 0.000075,
                    "anthropic:cache_write_1h_tokens": 0.00003,
                    "anthropic:cache_write_5m_tokens": 0.00001875
                },
                "pricing_version_id": "20a35276-23ac-4521-a7cb-ef4e84ed336e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-sonnet-4",
            "hf_slug": "",
            "updated_at": "2025-12-05T21:53:41.372783+00:00",
            "created_at": "2025-05-22T16:12:51.381897+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude Sonnet 4",
            "short_name": "Claude Sonnet 4",
            "author": "anthropic",
            "description": "Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability. Achieving state-of-the-art performance on SWE-bench (72.7%), Sonnet 4 balances capability and computational efficiency, making it suitable for a broad range of applications from routine coding tasks to complex software development projects. Key enhancements include improved autonomous codebase navigation, reduced error rates in agent-driven workflows, and increased reliability in following intricate instructions. Sonnet 4 is optimized for practical everyday use, providing advanced reasoning capabilities while maintaining efficiency and responsiveness in diverse internal and external scenarios.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-4)",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-4-sonnet-20250522",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "5e3f0568-c089-416a-ab7b-6c432999b571",
                "name": "Google | anthropic/claude-4-sonnet-20250522",
                "context_length": 1000000,
                "model": {
                    "slug": "anthropic/claude-sonnet-4",
                    "hf_slug": "",
                    "updated_at": "2025-12-05T21:53:41.372783+00:00",
                    "created_at": "2025-05-22T16:12:51.381897+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude Sonnet 4",
                    "short_name": "Claude Sonnet 4",
                    "author": "anthropic",
                    "description": "Claude Sonnet 4 significantly enhances the capabilities of its predecessor, Sonnet 3.7, excelling in both coding and reasoning tasks with improved precision and controllability. Achieving state-of-the-art performance on SWE-bench (72.7%), Sonnet 4 balances capability and computational efficiency, making it suitable for a broad range of applications from routine coding tasks to complex software development projects. Key enhancements include improved autonomous codebase navigation, reduced error rates in agent-driven workflows, and increased reliability in following intricate instructions. Sonnet 4 is optimized for practical everyday use, providing advanced reasoning capabilities while maintaining efficiency and responsiveness in diverse internal and external scenarios.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-4)",
                    "model_version_group_id": null,
                    "context_length": 1000000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-4-sonnet-20250522",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-sonnet-4",
                "model_variant_permaslug": "anthropic/claude-4-sonnet-20250522",
                "adapter_name": "GoogleVertexAnthropicAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "claude-sonnet-4@20250514",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "top_p",
                    "temperature",
                    "stop",
                    "reasoning",
                    "include_reasoning",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "input_cache_read": "0.0000003",
                    "input_cache_write": "0.00000375",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.000006",
                        "completions": "0.0000225",
                        "input_cache_read": "0.0000006",
                        "input_cache_write": "0.0000075"
                    }
                ],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000003,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 3e-7,
                    "anthropic:completion_tokens": 0.000015,
                    "anthropic:cache_write_1h_tokens": 0.000006,
                    "anthropic:cache_write_5m_tokens": 0.00000375,
                    "anthropic:long_context_threshold": 200000,
                    "anthropic:prompt_tokens_long_context": 0.000006,
                    "anthropic:cache_read_tokens_long_context": 6e-7,
                    "anthropic:completion_tokens_long_context": 0.0000225,
                    "anthropic:cache_write_1h_tokens_long_context": 0.000012,
                    "anthropic:cache_write_5m_tokens_long_context": 0.0000075
                },
                "pricing_version_id": "7a5a3265-459b-49f7-9a79-938da5dd2363",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-medium-3",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-05-07T14:15:41.980763+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Medium 3",
            "short_name": "Mistral Medium 3",
            "author": "mistralai",
            "description": "Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.\n\nThe model excels in domains such as coding, STEM reasoning, and enterprise adaptation. It supports hybrid, on-prem, and in-VPC deployments and is optimized for integration into custom workflows. Mistral Medium 3 offers competitive accuracy relative to larger models like Claude Sonnet 3.5/3.7, Llama 4 Maverick, and Command R+, while maintaining broad compatibility across cloud environments.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/mistral-medium-3",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9d5ba5bf-8465-46df-9185-1330820338f5",
                "name": "Mistral | mistralai/mistral-medium-3",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/mistral-medium-3",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-05-07T14:15:41.980763+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Medium 3",
                    "short_name": "Mistral Medium 3",
                    "author": "mistralai",
                    "description": "Mistral Medium 3 is a high-performance enterprise-grade language model designed to deliver frontier-level capabilities at significantly reduced operational cost. It balances state-of-the-art reasoning and multimodal performance with 8× lower cost compared to traditional large models, making it suitable for scalable deployments across professional and industrial use cases.\n\nThe model excels in domains such as coding, STEM reasoning, and enterprise adaptation. It supports hybrid, on-prem, and in-VPC deployments and is optimized for integration into custom workflows. Mistral Medium 3 offers competitive accuracy relative to larger models like Claude Sonnet 3.5/3.7, Llama 4 Maverick, and Command R+, while maintaining broad compatibility across cloud environments.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/mistral-medium-3",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-medium-3",
                "model_variant_permaslug": "mistralai/mistral-medium-3",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "mistral-medium-2505",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000004",
                    "completion": "0.000002",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 4e-7,
                    "mistral:completion_tokens": 0.000002
                },
                "pricing_version_id": "25450ac1-aa83-42d4-b87b-3a37014630c6",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.5-pro-preview-05-06",
            "hf_slug": "",
            "updated_at": "2026-01-08T19:23:52.555156+00:00",
            "created_at": "2025-05-07T00:41:53+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Pro Preview 05-06",
            "short_name": "Gemini 2.5 Pro Preview 05-06",
            "author": "google",
            "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-pro-preview-03-25",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9d2cac4d-81d4-4e67-ac7a-6c73040655ee",
                "name": "Google | google/gemini-2.5-pro-preview-03-25",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.5-pro-preview-05-06",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T19:23:52.555156+00:00",
                    "created_at": "2025-05-07T00:41:53+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.5 Pro Preview 05-06",
                    "short_name": "Gemini 2.5 Pro Preview 05-06",
                    "author": "google",
                    "description": "Gemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.5-pro-preview-03-25",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.5-pro-preview-05-06",
                "model_variant_permaslug": "google/gemini-2.5-pro-preview-03-25",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.5-pro-preview-05-06",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65535,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000125",
                    "completion": "0.00001",
                    "image": "0.00000125",
                    "audio": "0.00000125",
                    "input_audio_cache": "0.000000125",
                    "input_cache_read": "0.000000125",
                    "input_cache_write": "0.000000375",
                    "internal_reasoning": "0.00001",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "prompt-threshold",
                        "threshold": 200000,
                        "prompt": "0.0000025",
                        "completions": "0.000015",
                        "input_cache_read": "0.000000625",
                        "input_cache_write": "0.00000075"
                    }
                ],
                "pricing_json": {
                    "gemini:prompt_tokens": 0.00000125,
                    "gemini:reasoning_tokens": 0.00001,
                    "gemini:cache_read_tokens": 1.25e-7,
                    "gemini:completion_tokens": 0.00001,
                    "gemini:text_input_tokens": 0.00000125,
                    "gemini:audio_input_tokens": 0.00000125,
                    "gemini:image_input_tokens": 0.00000125,
                    "gemini:video_input_tokens": 0.00000125,
                    "gemini:cache_read_text_tokens": 1.25e-7,
                    "gemini:cache_read_audio_tokens": 1.25e-7,
                    "gemini:cache_read_image_tokens": 1.25e-7,
                    "gemini:cache_read_video_tokens": 1.25e-7,
                    "gemini:cache_write_storage_hours": 0.0000045,
                    "gemini:prompt_tokens_high_context": 0.0000025,
                    "gemini:reasoning_tokens_high_context": 0.000015,
                    "gemini:cache_read_tokens_high_context": 2.5e-7,
                    "gemini:completion_tokens_high_context": 0.000015,
                    "gemini:cache_read_text_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_audio_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_image_tokens_high_context": 2.5e-7,
                    "gemini:cache_read_video_tokens_high_context": 2.5e-7,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "9da9fe0b-1701-41e2-8b01-775ec4b54ffa",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    },
                    "is_mandatory_reasoning": true
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "arcee-ai/spotlight",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-05-05T21:45:52.249082+00:00",
            "hf_updated_at": null,
            "name": "Arcee AI: Spotlight",
            "short_name": "Spotlight",
            "author": "arcee-ai",
            "description": "Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks. It offers a 32 k‑token context window, enabling rich multimodal conversations that combine lengthy documents with one or more images. Training emphasized fast inference on consumer GPUs while retaining strong captioning, visual‐question‑answering, and diagram‑analysis accuracy. As a result, Spotlight slots neatly into agent workflows where screenshots, charts or UI mock‑ups need to be interpreted on the fly. Early benchmarks show it matching or out‑scoring larger VLMs such as LLaVA‑1.6 13 B on popular VQA and POPE alignment tests. ",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "arcee-ai/spotlight",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a9b3fe6f-e21f-4f3c-9ea7-f70d856939d6",
                "name": "Together | arcee-ai/spotlight",
                "context_length": 131072,
                "model": {
                    "slug": "arcee-ai/spotlight",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-05-05T21:45:52.249082+00:00",
                    "hf_updated_at": null,
                    "name": "Arcee AI: Spotlight",
                    "short_name": "Spotlight",
                    "author": "arcee-ai",
                    "description": "Spotlight is a 7‑billion‑parameter vision‑language model derived from Qwen 2.5‑VL and fine‑tuned by Arcee AI for tight image‑text grounding tasks. It offers a 32 k‑token context window, enabling rich multimodal conversations that combine lengthy documents with one or more images. Training emphasized fast inference on consumer GPUs while retaining strong captioning, visual‐question‑answering, and diagram‑analysis accuracy. As a result, Spotlight slots neatly into agent workflows where screenshots, charts or UI mock‑ups need to be interpreted on the fly. Early benchmarks show it matching or out‑scoring larger VLMs such as LLaVA‑1.6 13 B on popular VQA and POPE alignment tests. ",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "arcee-ai/spotlight",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "arcee-ai/spotlight",
                "model_variant_permaslug": "arcee-ai/spotlight",
                "adapter_name": "TogetherAdapter",
                "provider_name": "Together",
                "provider_info": {
                    "name": "Together",
                    "displayName": "Together",
                    "slug": "together",
                    "baseUrl": "https://api.together.xyz/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                        "privacyPolicyURL": "https://www.together.ai/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "TogetherAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.together.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.together.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "mixedbread-ai/Mxbai-Rerank-Large-V2",
                        "BAAI/bge-base-en-v1.5-vllm",
                        "scb10x/scb10x-typhoon-2-1-gemma3-12b",
                        "arcee-ai/AFM-4.5B-Preview",
                        "deepseek-ai/DeepSeek-R1-0528-tput",
                        "black-forest-labs/FLUX.1-kontext-dev",
                        "google/gemma-3-27b-it",
                        "Qwen/Qwen3-32B-FP8",
                        "openai/whisper-large-v3",
                        "eddie/Qwen3-32B",
                        "eddiehou/meta-llama/Llama-3.1-405B",
                        "yan/deepseek-ai-deepseek-v3",
                        "moz/Llama-3.3-70B-Instruct-Turbo",
                        "serverless-qwen-qwen3-32b-fp8",
                        "qwen-qwen3-32b-fp8-serverless",
                        "moz-llama-3-3-70b-instruct-turbo",
                        "moonshotai/Kimi-K2-Instruct-tgl-testing",
                        "VirtueAIxTogether/VirtueGuard-Text-Lite",
                        "Virtue-AI/VirtueGuard-Text-Lite",
                        "black-forest-labs/FLUX.1-krea-dev",
                        "prosus/qwen-qwen3-32b-fp8-long-context",
                        "meta-llama/Llama-4-Scout-17B-16E-Instruct-batch",
                        "deepseek-ai/DeepSeek-R1-DE",
                        "arize-ai/qwen-2-1.5b-instruct",
                        "openai/gpt-oss-120b",
                        "meta-llama/Llama-3-70b-hf",
                        "Qwen/Qwen2.5-72B-Instruct",
                        "meta-llama/Meta-Llama-3.1-70B-Instruct-Reference",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Reference",
                        "meta-llama/Meta-Llama-3-8B-Instruct",
                        "meta-llama/Llama-3.1-405B-Instruct",
                        "cartesia/sonic",
                        "cartesia/sonic-2",
                        "togethercomputer/MoA-1",
                        "Salesforce/Llama-Rank-V1",
                        "black-forest-labs/FLUX.1-schnell",
                        "lgai/exaone-3-5-32b-instruct",
                        "lgai/exaone-deep-32b",
                        "black-forest-labs/FLUX.1-dev",
                        "marin-community/marin-8b-instruct",
                        "togethercomputer/Refuel-Llm-V2-Small",
                        "meta-llama/Llama-3-70b-chat-hf",
                        "Alibaba-NLP/gte-modernbert-base",
                        "black-forest-labs/FLUX.1-pro",
                        "black-forest-labs/FLUX.1.1-pro",
                        "togethercomputer/MoA-1-Turbo",
                        "black-forest-labs/FLUX.1-dev-lora",
                        "meta-llama/Llama-2-70b-hf",
                        "togethercomputer/m2-bert-80M-32k-retrieval",
                        "togethercomputer/Refuel-Llm-V2",
                        "intfloat/multilingual-e5-large-instruct",
                        "black-forest-labs/FLUX.1-kontext-max",
                        "black-forest-labs/FLUX.1-schnell-Free",
                        "black-forest-labs/FLUX.1-kontext-pro",
                        "BAAI/bge-large-en-v1.5",
                        "BAAI/bge-base-en-v1.5",
                        "Qwen/Qwen3-Next-80B-A3B-Instruct",
                        "ServiceNow-AI/Apriel-1.5-15b-Thinker",
                        "openai/whisper-large-v3-test",
                        "codellama/CodeLlama-34b-Instruct-hf",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "togethercomputer/m2-bert-80M-8k-retrieval",
                        "WhereIsAI/UAE-Large-V1",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct-Lite-Pro",
                        "togethercomputer/m2-bert-80M-2k-retrieval",
                        "meta-llama/Meta-Llama-3-70B-Instruct-Lite",
                        "Meta-Llama/Llama-Guard-7b",
                        "Gryphe/MythoMax-L2-13b-Lite",
                        "upstage/SOLAR-10.7B-Instruct-v1.0",
                        "Qwen/Qwen2.5-14B-Instruct",
                        "meta-llama/Llama-3.3-70B-Instruct-Turbo-Free",
                        "deepseek-ai/DeepSeek-R1-Distill-Llama-70B-free",
                        "zai-org/GLM-4.5-Air-FP8",
                        "kwaivgI/kling-1.6-standard",
                        "HiDream-ai/HiDream-I1-Full",
                        "ByteDance-Seed/Seedream-3.0",
                        "ByteDance-Seed/Seedream-4.0",
                        "Lykon/DreamShaper",
                        "HiDream-ai/HiDream-I1-Dev",
                        "Qwen/Qwen-Image",
                        "RunDiffusion/Juggernaut-pro-flux",
                        "google/imagen-4.0-preview",
                        "google/imagen-4.0-ultra",
                        "google/veo-3.0",
                        "minimax/hailuo-02",
                        "stabilityai/stable-diffusion-3-medium",
                        "black-forest-labs/FLUX.1-Canny-pro",
                        "google/imagen-4.0-fast",
                        "minimax/video-01-director",
                        "HiDream-ai/HiDream-I1-Fast",
                        "Wan-AI/Wan2.2-T2V-A14B",
                        "ByteDance/Seedance-1.0-pro",
                        "google/veo-3.0-fast-audio",
                        "vidu/vidu-q1",
                        "kwaivgI/kling-2.1-master",
                        "google/veo-3.0-audio",
                        "Rundiffusion/Juggernaut-Lightning-Flux",
                        "Wan-AI/Wan2.2-I2V-A14B",
                        "google/flash-image-2.5",
                        "google/veo-2.0",
                        "openai/sora-2",
                        "google/veo-3.0-fast",
                        "ideogram/ideogram-3.0",
                        "kwaivgI/kling-2.0-master",
                        "kwaivgI/kling-2.1-standard",
                        "pixverse/pixverse-v5",
                        "stabilityai/stable-diffusion-xl-base-1.0",
                        "openai/sora-2-pro",
                        "ByteDance/Seedance-1.0-lite",
                        "kwaivgI/kling-1.6-pro",
                        "vidu/vidu-2.0",
                        "kwaivgI/kling-2.1-pro",
                        "meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo",
                        "canopylabs/orpheus-3b-0.1-ft",
                        "hexgrad/Kokoro-82M",
                        "eddie/gemma-2b-it",
                        "mistralai/Voxtral-Mini-3B-2507",
                        "arcee-ai/coder-large",
                        "arcee-ai/virtuoso-large",
                        "arcee-ai/maestro-reasoning",
                        "deepcogito/cogito-v2-1-671b",
                        "arcee_ai/arcee-spotlight",
                        "google/gemini-3-pro-image",
                        "mercor/cwm",
                        "black-forest-labs/FLUX.2-flex",
                        "keith-aditya/kimi-k2-instruct",
                        "pangram/mistral-small-2501",
                        "black-forest-labs/FLUX.2-pro",
                        "black-forest-labs/FLUX.2-dev",
                        "ServiceNow-AI/Apriel-1.6-15b-Thinker"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Together",
                "provider_slug": "together",
                "provider_model_id": "arcee_ai/arcee-spotlight",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 65537,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "top_k",
                    "repetition_penalty",
                    "logit_bias",
                    "min_p"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.together.ai/terms-of-service",
                    "privacyPolicyURL": "https://www.together.ai/privacy"
                },
                "pricing": {
                    "prompt": "0.00000018",
                    "completion": "0.00000018",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000018",
                    "openai:completion_tokens": "0.00000018"
                },
                "pricing_version_id": "2f14e880-0538-46ad-914f-5bda86d9d5fa",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "meta-llama/llama-guard-4-12b",
            "hf_slug": "meta-llama/Llama-Guard-4-12B",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-30T01:06:33.531556+00:00",
            "hf_updated_at": null,
            "name": "Meta: Llama Guard 4 12B",
            "short_name": "Llama Guard 4 12B",
            "author": "meta-llama",
            "description": "Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification. Similar to previous versions, it can be used to classify content in both LLM inputs (prompt classification) and in LLM responses (response classification). It acts as an LLM—generating text in its output that indicates whether a given prompt or response is safe or unsafe, and if unsafe, it also lists the content categories violated.\n\nLlama Guard 4 was aligned to safeguard against the standardized MLCommons hazards taxonomy and designed to support multimodal Llama 4 capabilities. Specifically, it combines features from previous Llama Guard models, providing content moderation for English and multiple supported languages, along with enhanced capabilities to handle mixed text-and-image prompts, including multiple images. Additionally, Llama Guard 4 is integrated into the Llama Moderations API, extending robust safety classification to text and images.",
            "model_version_group_id": null,
            "context_length": 163840,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "meta-llama/llama-guard-4-12b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "850b84c3-42a7-4cec-99c0-b5582d0da66b",
                "name": "DeepInfra | meta-llama/llama-guard-4-12b",
                "context_length": 163840,
                "model": {
                    "slug": "meta-llama/llama-guard-4-12b",
                    "hf_slug": "meta-llama/Llama-Guard-4-12B",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-30T01:06:33.531556+00:00",
                    "hf_updated_at": null,
                    "name": "Meta: Llama Guard 4 12B",
                    "short_name": "Llama Guard 4 12B",
                    "author": "meta-llama",
                    "description": "Llama Guard 4 is a Llama 4 Scout-derived multimodal pretrained model, fine-tuned for content safety classification. Similar to previous versions, it can be used to classify content in both LLM inputs (prompt classification) and in LLM responses (response classification). It acts as an LLM—generating text in its output that indicates whether a given prompt or response is safe or unsafe, and if unsafe, it also lists the content categories violated.\n\nLlama Guard 4 was aligned to safeguard against the standardized MLCommons hazards taxonomy and designed to support multimodal Llama 4 capabilities. Specifically, it combines features from previous Llama Guard models, providing content moderation for English and multiple supported languages, along with enhanced capabilities to handle mixed text-and-image prompts, including multiple images. Additionally, Llama Guard 4 is integrated into the Llama Moderations API, extending robust safety classification to text and images.",
                    "model_version_group_id": null,
                    "context_length": 163840,
                    "input_modalities": [
                        "image",
                        "text"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "meta-llama/llama-guard-4-12b",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "meta-llama/llama-guard-4-12b",
                "model_variant_permaslug": "meta-llama/llama-guard-4-12b",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/bf16",
                "provider_model_id": "meta-llama/Llama-Guard-4-12B",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.00000018",
                    "completion": "0.00000018",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000018",
                    "openai:completion_tokens": "0.00000018"
                },
                "pricing_version_id": "48e5a11b-06e3-4455-a22f-3a3af4cea914",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o4-mini-high",
            "hf_slug": "",
            "updated_at": "2026-01-08T00:53:50.4178+00:00",
            "created_at": "2025-04-16T17:23:32.042157+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o4 Mini High",
            "short_name": "o4 Mini High",
            "author": "openai",
            "description": "OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high. \n\nOpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities. It supports tool use and demonstrates competitive reasoning and coding performance across benchmarks like AIME (99.5% with Python) and SWE-bench, outperforming its predecessor o3-mini and even approaching o3 in some domains.\n\nDespite its smaller size, o4-mini exhibits high accuracy in STEM tasks, visual problem solving (e.g., MathVista, MMMU), and code editing. It is especially well-suited for high-throughput scenarios where latency or cost is critical. Thanks to its efficient architecture and refined reinforcement learning training, o4-mini can chain tools, generate structured outputs, and solve multi-step tasks with minimal delay—often in under a minute.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o4-mini-high-2025-04-16",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null,
                "is_mandatory_reasoning": true,
                "supports_reasoning_effort": true,
                "supported_reasoning_efforts": [
                    "high"
                ]
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null,
                    "is_mandatory_reasoning": true,
                    "supports_reasoning_effort": true,
                    "supported_reasoning_efforts": [
                        "high"
                    ]
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "60020533-2fb2-4aa1-9454-181029fd52de",
                "name": "OpenAI | openai/o4-mini-high-2025-04-16",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o4-mini-high",
                    "hf_slug": "",
                    "updated_at": "2026-01-08T00:53:50.4178+00:00",
                    "created_at": "2025-04-16T17:23:32.042157+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o4 Mini High",
                    "short_name": "o4 Mini High",
                    "author": "openai",
                    "description": "OpenAI o4-mini-high is the same model as [o4-mini](/openai/o4-mini) with reasoning_effort set to high. \n\nOpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities. It supports tool use and demonstrates competitive reasoning and coding performance across benchmarks like AIME (99.5% with Python) and SWE-bench, outperforming its predecessor o3-mini and even approaching o3 in some domains.\n\nDespite its smaller size, o4-mini exhibits high accuracy in STEM tasks, visual problem solving (e.g., MathVista, MMMU), and code editing. It is especially well-suited for high-throughput scenarios where latency or cost is critical. Thanks to its efficient architecture and refined reinforcement learning training, o4-mini can chain tools, generate structured outputs, and solve multi-step tasks with minimal delay—often in under a minute.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o4-mini-high-2025-04-16",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null,
                        "is_mandatory_reasoning": true,
                        "supports_reasoning_effort": true,
                        "supported_reasoning_efforts": [
                            "high"
                        ]
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null,
                            "is_mandatory_reasoning": true,
                            "supports_reasoning_effort": true,
                            "supported_reasoning_efforts": [
                                "high"
                            ]
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o4-mini-high",
                "model_variant_permaslug": "openai/o4-mini-high-2025-04-16",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o4-mini-2025-04-16",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000011",
                    "completion": "0.0000044",
                    "input_cache_read": "0.000000275",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.0000011,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.0000044,
                    "openai_responses:cached_prompt_tokens": 2.75e-7
                },
                "pricing_version_id": "4bc59a87-2c2a-4682-809b-e495ce4af791",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o3",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-16T17:10:57.049467+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o3",
            "short_name": "o3",
            "author": "openai",
            "description": "o3 is a well-rounded and powerful model across domains. It sets a new standard for math, science, coding, and visual reasoning tasks. It also excels at technical writing and instruction-following. Use it to think through multi-step problems that involve analysis across text, code, and images. ",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o3-2025-04-16",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "42e72619-d01c-411c-a201-f991644768b7",
                "name": "OpenAI | openai/o3-2025-04-16",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o3",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-16T17:10:57.049467+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o3",
                    "short_name": "o3",
                    "author": "openai",
                    "description": "o3 is a well-rounded and powerful model across domains. It sets a new standard for math, science, coding, and visual reasoning tasks. It also excels at technical writing and instruction-following. Use it to think through multi-step problems that involve analysis across text, code, and images. ",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o3-2025-04-16",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o3",
                "model_variant_permaslug": "openai/o3-2025-04-16",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o3-2025-04-16",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000008",
                    "input_cache_read": "0.0000005",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000002,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000008,
                    "openai_responses:cached_prompt_tokens": 5e-7
                },
                "pricing_version_id": "a6ec168c-ce39-40e5-82e9-5847d89c27dd",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o4-mini",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-16T16:29:02.980764+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o4 Mini",
            "short_name": "o4 Mini",
            "author": "openai",
            "description": "OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities. It supports tool use and demonstrates competitive reasoning and coding performance across benchmarks like AIME (99.5% with Python) and SWE-bench, outperforming its predecessor o3-mini and even approaching o3 in some domains.\n\nDespite its smaller size, o4-mini exhibits high accuracy in STEM tasks, visual problem solving (e.g., MathVista, MMMU), and code editing. It is especially well-suited for high-throughput scenarios where latency or cost is critical. Thanks to its efficient architecture and refined reinforcement learning training, o4-mini can chain tools, generate structured outputs, and solve multi-step tasks with minimal delay—often in under a minute.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o4-mini-2025-04-16",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "bd121898-b27c-4e2c-bc92-278627465a54",
                "name": "OpenAI | openai/o4-mini-2025-04-16",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o4-mini",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-16T16:29:02.980764+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o4 Mini",
                    "short_name": "o4 Mini",
                    "author": "openai",
                    "description": "OpenAI o4-mini is a compact reasoning model in the o-series, optimized for fast, cost-efficient performance while retaining strong multimodal and agentic capabilities. It supports tool use and demonstrates competitive reasoning and coding performance across benchmarks like AIME (99.5% with Python) and SWE-bench, outperforming its predecessor o3-mini and even approaching o3 in some domains.\n\nDespite its smaller size, o4-mini exhibits high accuracy in STEM tasks, visual problem solving (e.g., MathVista, MMMU), and code editing. It is especially well-suited for high-throughput scenarios where latency or cost is critical. Thanks to its efficient architecture and refined reinforcement learning training, o4-mini can chain tools, generate structured outputs, and solve multi-step tasks with minimal delay—often in under a minute.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o4-mini-2025-04-16",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o4-mini",
                "model_variant_permaslug": "openai/o4-mini-2025-04-16",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o4-mini-2025-04-16",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "structured_outputs",
                    "response_format",
                    "seed",
                    "max_tokens",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000011",
                    "completion": "0.0000044",
                    "input_cache_read": "0.000000275",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.0000011,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.0000044,
                    "openai_responses:cached_prompt_tokens": 2.75e-7
                },
                "pricing_version_id": "b9791ed2-0245-490a-9ba2-eb793e43b0ec",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4.1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-14T17:23:05+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4.1",
            "short_name": "GPT-4.1",
            "author": "openai",
            "description": "GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context reasoning. It supports a 1 million token context window and outperforms GPT-4o and GPT-4.5 across coding (54.6% SWE-bench Verified), instruction compliance (87.4% IFEval), and multimodal understanding benchmarks. It is tuned for precise code diffs, agent reliability, and high recall in large document contexts, making it ideal for agents, IDE tooling, and enterprise knowledge retrieval.",
            "model_version_group_id": null,
            "context_length": 1047576,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4.1-2025-04-14",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "c235abe8-11cc-42d3-95ad-72f4d198287a",
                "name": "OpenAI | openai/gpt-4.1-2025-04-14",
                "context_length": 1047576,
                "model": {
                    "slug": "openai/gpt-4.1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-14T17:23:05+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4.1",
                    "short_name": "GPT-4.1",
                    "author": "openai",
                    "description": "GPT-4.1 is a flagship large language model optimized for advanced instruction following, real-world software engineering, and long-context reasoning. It supports a 1 million token context window and outperforms GPT-4o and GPT-4.5 across coding (54.6% SWE-bench Verified), instruction compliance (87.4% IFEval), and multimodal understanding benchmarks. It is tuned for precise code diffs, agent reliability, and high recall in large document contexts, making it ideal for agents, IDE tooling, and enterprise knowledge retrieval.",
                    "model_version_group_id": null,
                    "context_length": 1047576,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4.1-2025-04-14",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4.1",
                "model_variant_permaslug": "openai/gpt-4.1-2025-04-14",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4.1-2025-04-14",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice",
                    "temperature",
                    "top_p"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000008",
                    "input_cache_read": "0.0000005",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000002,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.000008,
                    "openai_responses:cached_prompt_tokens": 5e-7
                },
                "pricing_version_id": "ca78388e-e63c-4cea-a999-e421ab69bfe9",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4.1-mini",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-14T17:23:01+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4.1 Mini",
            "short_name": "GPT-4.1 Mini",
            "author": "openai",
            "description": "GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost. It retains a 1 million token context window and scores 45.1% on hard instruction evals, 35.8% on MultiChallenge, and 84.1% on IFEval. Mini also shows strong coding ability (e.g., 31.6% on Aider’s polyglot diff benchmark) and vision understanding, making it suitable for interactive applications with tight performance constraints.",
            "model_version_group_id": null,
            "context_length": 1047576,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4.1-mini-2025-04-14",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "872eccb7-9c85-45fc-974a-ff7c8e2407e6",
                "name": "OpenAI | openai/gpt-4.1-mini-2025-04-14",
                "context_length": 1047576,
                "model": {
                    "slug": "openai/gpt-4.1-mini",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-14T17:23:01+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4.1 Mini",
                    "short_name": "GPT-4.1 Mini",
                    "author": "openai",
                    "description": "GPT-4.1 Mini is a mid-sized model delivering performance competitive with GPT-4o at substantially lower latency and cost. It retains a 1 million token context window and scores 45.1% on hard instruction evals, 35.8% on MultiChallenge, and 84.1% on IFEval. Mini also shows strong coding ability (e.g., 31.6% on Aider’s polyglot diff benchmark) and vision understanding, making it suitable for interactive applications with tight performance constraints.",
                    "model_version_group_id": null,
                    "context_length": 1047576,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4.1-mini-2025-04-14",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4.1-mini",
                "model_variant_permaslug": "openai/gpt-4.1-mini-2025-04-14",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4.1-mini-2025-04-14",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice",
                    "temperature",
                    "top_p"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000004",
                    "completion": "0.0000016",
                    "input_cache_read": "0.0000001",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.03"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.0275"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.025"
                    }
                ],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 4e-7,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 0.0000016,
                    "openai_responses:cached_prompt_tokens": 1e-7
                },
                "pricing_version_id": "2ec08c1d-41c8-4a5c-a05a-14ff60a6fdd5",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4.1-nano",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-14T17:22:49+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4.1 Nano",
            "short_name": "GPT-4.1 Nano",
            "author": "openai",
            "description": "For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series. It delivers exceptional performance at a small size with its 1 million token context window, and scores 80.1% on MMLU, 50.3% on GPQA, and 9.8% on Aider polyglot coding – even higher than GPT‑4o mini. It’s ideal for tasks like classification or autocompletion.",
            "model_version_group_id": null,
            "context_length": 1047576,
            "input_modalities": [
                "image",
                "text",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4.1-nano-2025-04-14",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9251cee5-5503-4be9-9439-7ae21ff062a3",
                "name": "OpenAI | openai/gpt-4.1-nano-2025-04-14",
                "context_length": 1047576,
                "model": {
                    "slug": "openai/gpt-4.1-nano",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-14T17:22:49+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4.1 Nano",
                    "short_name": "GPT-4.1 Nano",
                    "author": "openai",
                    "description": "For tasks that demand low latency, GPT‑4.1 nano is the fastest and cheapest model in the GPT-4.1 series. It delivers exceptional performance at a small size with its 1 million token context window, and scores 80.1% on MMLU, 50.3% on GPQA, and 9.8% on Aider polyglot coding – even higher than GPT‑4o mini. It’s ideal for tasks like classification or autocompletion.",
                    "model_version_group_id": null,
                    "context_length": 1047576,
                    "input_modalities": [
                        "image",
                        "text",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4.1-nano-2025-04-14",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4.1-nano",
                "model_variant_permaslug": "openai/gpt-4.1-nano-2025-04-14",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4.1-nano-2025-04-14",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice",
                    "temperature",
                    "top_p"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000004",
                    "input_cache_read": "0.000000025",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 1e-7,
                    "openai_responses:web_search_calls": 0.01,
                    "openai_responses:completion_tokens": 4e-7,
                    "openai_responses:cached_prompt_tokens": 2.5e-8
                },
                "pricing_version_id": "e9e74600-ce43-43ee-8cfc-ee5f7a13c045",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_native_web_search": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "meta-llama/llama-4-maverick",
            "hf_slug": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-05T19:37:02.129674+00:00",
            "hf_updated_at": null,
            "name": "Meta: Llama 4 Maverick",
            "short_name": "Llama 4 Maverick",
            "author": "meta-llama",
            "description": "Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forward pass (400B total). It supports multilingual text and image input, and produces multilingual text and code output across 12 supported languages. Optimized for vision-language tasks, Maverick is instruction-tuned for assistant-like behavior, image reasoning, and general-purpose multimodal interaction.\n\nMaverick features early fusion for native multimodality and a 1 million token context window. It was trained on a curated mixture of public, licensed, and Meta-platform data, covering ~22 trillion tokens, with a knowledge cutoff in August 2024. Released on April 5, 2025 under the Llama 4 Community License, Maverick is suited for research and commercial applications requiring advanced multimodal understanding and high model throughput.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama4",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "meta-llama/llama-4-maverick-17b-128e-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "69a5d06e-1935-4aa5-903f-71058e64399f",
                "name": "DeepInfra | meta-llama/llama-4-maverick-17b-128e-instruct",
                "context_length": 1048576,
                "model": {
                    "slug": "meta-llama/llama-4-maverick",
                    "hf_slug": "meta-llama/Llama-4-Maverick-17B-128E-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-05T19:37:02.129674+00:00",
                    "hf_updated_at": null,
                    "name": "Meta: Llama 4 Maverick",
                    "short_name": "Llama 4 Maverick",
                    "author": "meta-llama",
                    "description": "Llama 4 Maverick 17B Instruct (128E) is a high-capacity multimodal language model from Meta, built on a mixture-of-experts (MoE) architecture with 128 experts and 17 billion active parameters per forward pass (400B total). It supports multilingual text and image input, and produces multilingual text and code output across 12 supported languages. Optimized for vision-language tasks, Maverick is instruction-tuned for assistant-like behavior, image reasoning, and general-purpose multimodal interaction.\n\nMaverick features early fusion for native multimodality and a 1 million token context window. It was trained on a curated mixture of public, licensed, and Meta-platform data, covering ~22 trillion tokens, with a knowledge cutoff in August 2024. Released on April 5, 2025 under the Llama 4 Community License, Maverick is suited for research and commercial applications requiring advanced multimodal understanding and high model throughput.",
                    "model_version_group_id": null,
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Llama4",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "meta-llama/llama-4-maverick-17b-128e-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "meta-llama/llama-4-maverick",
                "model_variant_permaslug": "meta-llama/llama-4-maverick-17b-128e-instruct",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra/base",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/base",
                "provider_model_id": "meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": 3342,
                "supported_parameters": [
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.0000006",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000015",
                    "openai:completion_tokens": "0.0000006"
                },
                "pricing_version_id": "8e632947-d4e4-4b41-9854-9d81e10a9e02",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "meta-llama/llama-4-scout",
            "hf_slug": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-05T19:31:59.735804+00:00",
            "hf_updated_at": null,
            "name": "Meta: Llama 4 Scout",
            "short_name": "Llama 4 Scout",
            "author": "meta-llama",
            "description": "Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B. It supports native multimodal input (text and image) and multilingual output (text and code) across 12 supported languages. Designed for assistant-style interaction and visual reasoning, Scout uses 16 experts per forward pass and features a context length of 10 million tokens, with a training corpus of ~40 trillion tokens.\n\nBuilt for high efficiency and local or commercial deployment, Llama 4 Scout incorporates early fusion for seamless modality integration. It is instruction-tuned for use in multilingual chat, captioning, and image understanding tasks. Released under the Llama 4 Community License, it was last trained on data up to August 2024 and launched publicly on April 5, 2025.",
            "model_version_group_id": null,
            "context_length": 327680,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama4",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "meta-llama/llama-4-scout-17b-16e-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "9cf05ded-eefe-41b4-8c08-0c6460feffea",
                "name": "DeepInfra | meta-llama/llama-4-scout-17b-16e-instruct",
                "context_length": 327680,
                "model": {
                    "slug": "meta-llama/llama-4-scout",
                    "hf_slug": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-04-05T19:31:59.735804+00:00",
                    "hf_updated_at": null,
                    "name": "Meta: Llama 4 Scout",
                    "short_name": "Llama 4 Scout",
                    "author": "meta-llama",
                    "description": "Llama 4 Scout 17B Instruct (16E) is a mixture-of-experts (MoE) language model developed by Meta, activating 17 billion parameters out of a total of 109B. It supports native multimodal input (text and image) and multilingual output (text and code) across 12 supported languages. Designed for assistant-style interaction and visual reasoning, Scout uses 16 experts per forward pass and features a context length of 10 million tokens, with a training corpus of ~40 trillion tokens.\n\nBuilt for high efficiency and local or commercial deployment, Llama 4 Scout incorporates early fusion for seamless modality integration. It is instruction-tuned for use in multilingual chat, captioning, and image understanding tasks. Released under the Llama 4 Community License, it was last trained on data up to August 2024 and launched publicly on April 5, 2025.",
                    "model_version_group_id": null,
                    "context_length": 10000000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Llama4",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "meta-llama/llama-4-scout-17b-16e-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "meta-llama/llama-4-scout",
                "model_variant_permaslug": "meta-llama/llama-4-scout-17b-16e-instruct",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/fp8",
                "provider_model_id": "meta-llama/Llama-4-Scout-17B-16E-Instruct",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": 3342,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.00000008",
                    "completion": "0.0000003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000008",
                    "openai:completion_tokens": "0.0000003"
                },
                "pricing_version_id": "f1a26530-5938-49e1-aff6-64820dd4754c",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": false,
                        "type_function": false
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen2.5-vl-32b-instruct",
            "hf_slug": "Qwen/Qwen2.5-VL-32B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-24T18:10:38.542849+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen2.5 VL 32B Instruct",
            "short_name": "Qwen2.5 VL 32B Instruct",
            "author": "qwen",
            "description": "Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving capabilities. It excels at visual analysis tasks, including object recognition, textual interpretation within images, and precise event localization in extended videos. Qwen2.5-VL-32B demonstrates state-of-the-art performance across multimodal benchmarks such as MMMU, MathVista, and VideoMME, while maintaining strong reasoning and clarity in text-based tasks like MMLU, mathematical problem-solving, and code generation.",
            "model_version_group_id": null,
            "context_length": 16384,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen2.5-vl-32b-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "da25176f-4fdf-4f1c-8cbd-11aa2d943ec3",
                "name": "Chutes | qwen/qwen2.5-vl-32b-instruct",
                "context_length": 16384,
                "model": {
                    "slug": "qwen/qwen2.5-vl-32b-instruct",
                    "hf_slug": "Qwen/Qwen2.5-VL-32B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-24T18:10:38.542849+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen2.5 VL 32B Instruct",
                    "short_name": "Qwen2.5 VL 32B Instruct",
                    "author": "qwen",
                    "description": "Qwen2.5-VL-32B is a multimodal vision-language model fine-tuned through reinforcement learning for enhanced mathematical reasoning, structured outputs, and visual problem-solving capabilities. It excels at visual analysis tasks, including object recognition, textual interpretation within images, and precise event localization in extended videos. Qwen2.5-VL-32B demonstrates state-of-the-art performance across multimodal benchmarks such as MMMU, MathVista, and VideoMME, while maintaining strong reasoning and clarity in text-based tasks like MMLU, mathematical problem-solving, and code generation.",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen2.5-vl-32b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen2.5-vl-32b-instruct",
                "model_variant_permaslug": "qwen/qwen2.5-vl-32b-instruct",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "Qwen/Qwen2.5-VL-32B-Instruct",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000005",
                    "completion": "0.00000022",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000005",
                    "openai:completion_tokens": "0.00000022"
                },
                "pricing_version_id": "f15cc17b-4cc0-4f96-a76b-e1664fb8ed62",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o1-pro",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-19T22:26:51.610039+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o1-pro",
            "short_name": "o1-pro",
            "author": "openai",
            "description": "The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o1-pro model uses more compute to think harder and provide consistently better answers.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o1-pro",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "046ae30d-fe99-44b4-b020-21127e4342c7",
                "name": "OpenAI | openai/o1-pro",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o1-pro",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-19T22:26:51.610039+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o1-pro",
                    "short_name": "o1-pro",
                    "author": "openai",
                    "description": "The o1 series of models are trained with reinforcement learning to think before they answer and perform complex reasoning. The o1-pro model uses more compute to think harder and provide consistently better answers.",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o1-pro",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o1-pro",
                "model_variant_permaslug": "openai/o1-pro",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o1-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00015",
                    "completion": "0.0006",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.00015,
                    "openai_responses:completion_tokens": 0.0006
                },
                "pricing_version_id": "af47ffe6-72c7-4a72-8bf4-1922ed5d6d65",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-small-3.1-24b-instruct",
            "hf_slug": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-17T19:15:37.00423+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Small 3.1 24B (free)",
            "short_name": "Mistral Small 3.1 24B (free)",
            "author": "mistralai",
            "description": "Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and vision tasks, including image analysis, programming, mathematical reasoning, and multilingual support across dozens of languages. Equipped with an extensive 128k token context window and optimized for efficient local inference, it supports use cases such as conversational agents, function calling, long-document comprehension, and privacy-sensitive deployments. The updated version is [Mistral Small 3.2](mistralai/mistral-small-3.2-24b-instruct)",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ecbdc9f1-ecca-4f91-83cf-b3495a60e874",
                "name": "Venice | mistralai/mistral-small-3.1-24b-instruct-2503:free",
                "context_length": 128000,
                "model": {
                    "slug": "mistralai/mistral-small-3.1-24b-instruct",
                    "hf_slug": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-17T19:15:37.00423+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Small 3.1 24B",
                    "short_name": "Mistral Small 3.1 24B",
                    "author": "mistralai",
                    "description": "Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and vision tasks, including image analysis, programming, mathematical reasoning, and multilingual support across dozens of languages. Equipped with an extensive 128k token context window and optimized for efficient local inference, it supports use cases such as conversational agents, function calling, long-document comprehension, and privacy-sensitive deployments. The updated version is [Mistral Small 3.2](mistralai/mistral-small-3.2-24b-instruct)",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-small-3.1-24b-instruct:free",
                "model_variant_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503:free",
                "adapter_name": "VeniceAdapter",
                "provider_name": "Venice",
                "provider_info": {
                    "name": "Venice",
                    "displayName": "Venice",
                    "slug": "venice",
                    "baseUrl": "https://api.venice.ai/api/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://venice.ai/legal/tos",
                        "privacyPolicyURL": "https://venice.ai/legal/privacy-policy"
                    },
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "VeniceAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://venice.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "llama-3.2-3b",
                        "deepseek-coder-v2-lite",
                        "dolphin-2.9.2-qwen2-72b",
                        "mistral-32-24b",
                        "zai-org-glm-4.6",
                        "qwen3-235b-a22b-thinking-2507",
                        "qwen3-235b-a22b-instruct-2507",
                        "google-gemma-3-27b-it",
                        "openai-gpt-oss-120b",
                        "deepseek-ai-DeepSeek-R1",
                        "grok-41-fast",
                        "gemini-3-pro-preview",
                        "claude-opus-45",
                        "kimi-k2-thinking",
                        "deepseek-v3.2",
                        "openai-gpt-52",
                        "gemini-3-flash-preview",
                        "grok-code-fast-1",
                        "claude-sonnet-45",
                        "openai-gpt-52-codex",
                        "venice-uncensored",
                        "qwen3-4b",
                        "mistral-31-24b",
                        "qwen3-next-80b",
                        "qwen3-coder-480b-a35b-instruct",
                        "hermes-3-llama-3.1-405b",
                        "llama-3.3-70b"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Venice",
                "provider_slug": "venice/fp8",
                "provider_model_id": "mistral-31-24b",
                "quantization": "fp8",
                "variant": "free",
                "is_free": true,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "structured_outputs",
                    "response_format",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "top_k",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://venice.ai/legal/tos",
                    "privacyPolicyURL": "https://venice.ai/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0",
                    "openai:completion_tokens": "0"
                },
                "pricing_version_id": "ea23abca-d690-46fc-bfe7-f9b7131fec90",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": 8,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "disable_free_endpoint_limits": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "response_format": true,
                        "structured_outputs": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/mistral-small-3.1-24b-instruct",
            "hf_slug": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-17T19:15:37.00423+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Mistral Small 3.1 24B",
            "short_name": "Mistral Small 3.1 24B",
            "author": "mistralai",
            "description": "Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and vision tasks, including image analysis, programming, mathematical reasoning, and multilingual support across dozens of languages. Equipped with an extensive 128k token context window and optimized for efficient local inference, it supports use cases such as conversational agents, function calling, long-document comprehension, and privacy-sensitive deployments. The updated version is [Mistral Small 3.2](mistralai/mistral-small-3.2-24b-instruct)",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "5f981bd9-b098-4757-b075-06d51d37cc65",
                "name": "Chutes | mistralai/mistral-small-3.1-24b-instruct-2503",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/mistral-small-3.1-24b-instruct",
                    "hf_slug": "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-17T19:15:37.00423+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Mistral Small 3.1 24B",
                    "short_name": "Mistral Small 3.1 24B",
                    "author": "mistralai",
                    "description": "Mistral Small 3.1 24B Instruct is an upgraded variant of Mistral Small 3 (2501), featuring 24 billion parameters with advanced multimodal capabilities. It provides state-of-the-art performance in text-based reasoning and vision tasks, including image analysis, programming, mathematical reasoning, and multilingual support across dozens of languages. Equipped with an extensive 128k token context window and optimized for efficient local inference, it supports use cases such as conversational agents, function calling, long-document comprehension, and privacy-sensitive deployments. The updated version is [Mistral Small 3.2](mistralai/mistral-small-3.2-24b-instruct)",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/mistral-small-3.1-24b-instruct",
                "model_variant_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "chutesai/Mistral-Small-3.1-24B-Instruct-2503",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 131072,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "tools",
                    "tool_choice",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000003",
                    "completion": "0.00000011",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000003",
                    "openai:completion_tokens": "0.00000011"
                },
                "pricing_version_id": "8f9bd506-357e-41cb-b7e8-f8f5b7b4d123",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-4b-it",
            "hf_slug": "google/gemma-3-4b-it",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-13T22:38:30.653142+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 4B (free)",
            "short_name": "Gemma 3 4B (free)",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling.",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-4b-it",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "90fbd988-266d-4ef4-b345-63b46ab6caca",
                "name": "Google AI Studio | google/gemma-3-4b-it:free",
                "context_length": 32768,
                "model": {
                    "slug": "google/gemma-3-4b-it",
                    "hf_slug": "google/gemma-3-4b-it",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-13T22:38:30.653142+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 4B",
                    "short_name": "Gemma 3 4B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling.",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-4b-it",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-4b-it:free",
                "model_variant_permaslug": "google/gemma-3-4b-it:free",
                "adapter_name": "GoogleAIStudioGeminiAdapter",
                "provider_name": "Google AI Studio",
                "provider_info": {
                    "name": "Google AI Studio",
                    "displayName": "Google AI Studio",
                    "slug": "google-ai-studio",
                    "baseUrl": "https://generativelanguage.googleapis.com/v1beta",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 55,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleAIStudioGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleAIStudio.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-1p",
                        "gemini-2.5-pro-1p-recitation-off",
                        "gemini-2.5-flash-1p",
                        "gemini-2.5-flash-1p-recitation-off",
                        "gemini-2.5-flash-lite-preview-06-11-summarized",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-1.5-pro-latest",
                        "gemini-1.5-pro",
                        "gemini-1.5-flash-latest",
                        "gemini-1.5-flash",
                        "gemini-1.5-flash-8b",
                        "gemini-1.5-flash-8b-latest",
                        "gemini-2.5-pro-preview-03-25",
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-2.0-flash-lite-preview",
                        "gemini-2.0-pro-exp",
                        "gemini-2.0-flash-thinking-exp",
                        "gemini-2.5-flash-preview-tts",
                        "gemini-2.5-pro-preview-tts",
                        "learnlm-2.0-flash-experimental",
                        "gracefulgolem",
                        "gemini-2.5-flash-preview-05-20",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.0-flash-exp-image-generation",
                        "gemini-2.0-flash-preview-image-generation",
                        "gemini-2.0-flash-lite-preview-02-05",
                        "gemini-2.0-pro-exp-02-05",
                        "gemini-exp-1206",
                        "gemini-2.0-flash-thinking-exp-01-21",
                        "gemini-2.0-flash-thinking-exp-1219",
                        "gemma-3-1b-it",
                        "gemini-flash-latest",
                        "gemini-flash-lite-latest",
                        "gemini-pro-latest",
                        "gemini-robotics-er-1.5-preview",
                        "gemini-embedding-001",
                        "riftrunner-fst-rewind",
                        "gemini-3-pro-image-preview",
                        "nano-banana-pro-preview",
                        "fiercefalcon",
                        "fiercefalcon-inline-citation",
                        "fiercefalcon-blocked-sites"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google AI Studio",
                "provider_slug": "google-ai-studio",
                "provider_model_id": "gemma-3-4b-it",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 0,
                    "gemini:reasoning_tokens": 0,
                    "gemini:completion_tokens": 0,
                    "gemini:text_input_tokens": 0,
                    "gemini:audio_input_tokens": 0,
                    "gemini:image_input_tokens": 0,
                    "gemini:video_input_tokens": 0,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "5910cac3-cd98-4e8a-8aa1-95d0ecfd5f88",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "structured_outputs": false
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-4b-it",
            "hf_slug": "google/gemma-3-4b-it",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-13T22:38:30.653142+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 4B",
            "short_name": "Gemma 3 4B",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling.",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 96000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-4b-it",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "82b95f58-a96f-4ace-bbfa-8ab8443c9d15",
                "name": "Chutes | google/gemma-3-4b-it",
                "context_length": 96000,
                "model": {
                    "slug": "google/gemma-3-4b-it",
                    "hf_slug": "google/gemma-3-4b-it",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-13T22:38:30.653142+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 4B",
                    "short_name": "Gemma 3 4B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling.",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-4b-it",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-4b-it",
                "model_variant_permaslug": "google/gemma-3-4b-it",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes",
                "provider_model_id": "unsloth/gemma-3-4b-it",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000001703012",
                    "completion": "0.0000000681536",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000001703012",
                    "openai:completion_tokens": "0.0000000681536"
                },
                "pricing_version_id": "f1fa869b-f892-461c-858e-c77dc890f169",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-12b-it",
            "hf_slug": "google/gemma-3-12b-it",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-13T21:50:25.140801+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 12B (free)",
            "short_name": "Gemma 3 12B (free)",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 12B is the second largest in the family of Gemma 3 models after [Gemma 3 27B](google/gemma-3-27b-it)",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-12b-it",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "a6489e9a-e430-438f-9aa9-d6a664362e6e",
                "name": "Google AI Studio | google/gemma-3-12b-it:free",
                "context_length": 32768,
                "model": {
                    "slug": "google/gemma-3-12b-it",
                    "hf_slug": "google/gemma-3-12b-it",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-13T21:50:25.140801+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 12B",
                    "short_name": "Gemma 3 12B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 12B is the second largest in the family of Gemma 3 models after [Gemma 3 27B](google/gemma-3-27b-it)",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-12b-it",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-12b-it:free",
                "model_variant_permaslug": "google/gemma-3-12b-it:free",
                "adapter_name": "GoogleAIStudioGeminiAdapter",
                "provider_name": "Google AI Studio",
                "provider_info": {
                    "name": "Google AI Studio",
                    "displayName": "Google AI Studio",
                    "slug": "google-ai-studio",
                    "baseUrl": "https://generativelanguage.googleapis.com/v1beta",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 55,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleAIStudioGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleAIStudio.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-1p",
                        "gemini-2.5-pro-1p-recitation-off",
                        "gemini-2.5-flash-1p",
                        "gemini-2.5-flash-1p-recitation-off",
                        "gemini-2.5-flash-lite-preview-06-11-summarized",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-1.5-pro-latest",
                        "gemini-1.5-pro",
                        "gemini-1.5-flash-latest",
                        "gemini-1.5-flash",
                        "gemini-1.5-flash-8b",
                        "gemini-1.5-flash-8b-latest",
                        "gemini-2.5-pro-preview-03-25",
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-2.0-flash-lite-preview",
                        "gemini-2.0-pro-exp",
                        "gemini-2.0-flash-thinking-exp",
                        "gemini-2.5-flash-preview-tts",
                        "gemini-2.5-pro-preview-tts",
                        "learnlm-2.0-flash-experimental",
                        "gracefulgolem",
                        "gemini-2.5-flash-preview-05-20",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.0-flash-exp-image-generation",
                        "gemini-2.0-flash-preview-image-generation",
                        "gemini-2.0-flash-lite-preview-02-05",
                        "gemini-2.0-pro-exp-02-05",
                        "gemini-exp-1206",
                        "gemini-2.0-flash-thinking-exp-01-21",
                        "gemini-2.0-flash-thinking-exp-1219",
                        "gemma-3-1b-it",
                        "gemini-flash-latest",
                        "gemini-flash-lite-latest",
                        "gemini-pro-latest",
                        "gemini-robotics-er-1.5-preview",
                        "gemini-embedding-001",
                        "riftrunner-fst-rewind",
                        "gemini-3-pro-image-preview",
                        "nano-banana-pro-preview",
                        "fiercefalcon",
                        "fiercefalcon-inline-citation",
                        "fiercefalcon-blocked-sites"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google AI Studio",
                "provider_slug": "google-ai-studio",
                "provider_model_id": "gemma-3-12b-it",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "stop"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 0,
                    "gemini:reasoning_tokens": 0,
                    "gemini:completion_tokens": 0,
                    "gemini:text_input_tokens": 0,
                    "gemini:audio_input_tokens": 0,
                    "gemini:image_input_tokens": 0,
                    "gemini:video_input_tokens": 0,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "0140f5a5-97fd-4ac9-ac62-e7132fb22336",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {
                        "structured_outputs": false
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-12b-it",
            "hf_slug": "google/gemma-3-12b-it",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-13T21:50:25.140801+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 12B",
            "short_name": "Gemma 3 12B",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 12B is the second largest in the family of Gemma 3 models after [Gemma 3 27B](google/gemma-3-27b-it)",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-12b-it",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "3d994016-72a0-497c-a16a-22eff393ab2a",
                "name": "Chutes | google/gemma-3-12b-it",
                "context_length": 131072,
                "model": {
                    "slug": "google/gemma-3-12b-it",
                    "hf_slug": "google/gemma-3-12b-it",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-13T21:50:25.140801+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 12B",
                    "short_name": "Gemma 3 12B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 12B is the second largest in the family of Gemma 3 models after [Gemma 3 27B](google/gemma-3-27b-it)",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-12b-it",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-12b-it",
                "model_variant_permaslug": "google/gemma-3-12b-it",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "unsloth/gemma-3-12b-it",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 131072,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000003",
                    "completion": "0.0000001",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000003",
                    "openai:completion_tokens": "0.0000001"
                },
                "pricing_version_id": "410a115b-b30c-4039-9667-726659fdd9ff",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-27b-it",
            "hf_slug": "google/gemma-3-27b-it",
            "updated_at": "2026-01-07T04:36:03.22387+00:00",
            "created_at": "2025-03-12T05:12:39.645813+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 27B (free)",
            "short_name": "Gemma 3 27B (free)",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to [Gemma 2](google/gemma-2-27b-it)",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-27b-it",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f4276f71-4f8b-48e5-a823-42260e7c0965",
                "name": "ModelRun | google/gemma-3-27b-it:free",
                "context_length": 131072,
                "model": {
                    "slug": "google/gemma-3-27b-it",
                    "hf_slug": "google/gemma-3-27b-it",
                    "updated_at": "2026-01-07T04:36:03.22387+00:00",
                    "created_at": "2025-03-12T05:12:39.645813+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 27B",
                    "short_name": "Gemma 3 27B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to [Gemma 2](google/gemma-2-27b-it)",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-27b-it",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-27b-it:free",
                "model_variant_permaslug": "google/gemma-3-27b-it:free",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "ModelRun",
                "provider_info": {
                    "name": "ModelRun",
                    "displayName": "ModelRun",
                    "slug": "modelrun",
                    "baseUrl": "https://api.runmodelrun.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.runmodelrun.com/TOS.html",
                        "privacyPolicyURL": "https://www.runmodelrun.com/privacy-policy.html"
                    },
                    "headquarters": "US",
                    "datacenters": [
                        "US"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://api.runmodelrun.com&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "ModelRun",
                "provider_slug": "modelrun",
                "provider_model_id": "google/gemma-3-27b-it",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "presence_penalty",
                    "repetition_penalty",
                    "frequency_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.runmodelrun.com/TOS.html",
                    "privacyPolicyURL": "https://www.runmodelrun.com/privacy-policy.html"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": 0,
                    "openai:completion_tokens": 0
                },
                "pricing_version_id": "d2453ad7-a13c-4d55-99d7-bdc5162c7d4e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": false,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": false,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemma-3-27b-it",
            "hf_slug": "google/gemma-3-27b-it",
            "updated_at": "2026-01-07T04:36:03.22387+00:00",
            "created_at": "2025-03-12T05:12:39.645813+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 27B",
            "short_name": "Gemma 3 27B",
            "author": "google",
            "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to [Gemma 2](google/gemma-2-27b-it)",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 96000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-27b-it",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "0618de82-14d9-41e5-98f9-51bccf805320",
                "name": "Chutes | google/gemma-3-27b-it",
                "context_length": 96000,
                "model": {
                    "slug": "google/gemma-3-27b-it",
                    "hf_slug": "google/gemma-3-27b-it",
                    "updated_at": "2026-01-07T04:36:03.22387+00:00",
                    "created_at": "2025-03-12T05:12:39.645813+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemma 3 27B",
                    "short_name": "Gemma 3 27B",
                    "author": "google",
                    "description": "Gemma 3 introduces multimodality, supporting vision-language input and text outputs. It handles context windows up to 128k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Gemma 3 27B is Google's latest open source model, successor to [Gemma 2](google/gemma-2-27b-it)",
                    "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": "gemma",
                    "default_system": null,
                    "default_stops": [
                        "<start_of_turn>",
                        "<end_of_turn>",
                        "<eos>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemma-3-27b-it",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemma-3-27b-it",
                "model_variant_permaslug": "google/gemma-3-27b-it",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "unsloth/gemma-3-27b-it",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 96000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "tools",
                    "tool_choice",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000004",
                    "completion": "0.00000015",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000004",
                    "openai:completion_tokens": "0.00000015"
                },
                "pricing_version_id": "280251e1-c249-418e-85fd-31963ef6b92a",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "perplexity/sonar-reasoning-pro",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-07T02:08:28.125446+00:00",
            "hf_updated_at": null,
            "name": "Perplexity: Sonar Reasoning Pro",
            "short_name": "Sonar Reasoning Pro",
            "author": "perplexity",
            "description": "Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro)\n\nSonar Reasoning Pro is a premier reasoning model powered by DeepSeek R1 with Chain of Thought (CoT). Designed for advanced use cases, it supports in-depth, multi-step queries with a larger context window and can surface more citations per search, enabling more comprehensive and extensible responses.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": "deepseek-r1",
            "default_system": null,
            "default_stops": [
                "<｜User｜>",
                "<｜end▁of▁sentence｜>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "perplexity/sonar-reasoning-pro",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>"
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>"
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "0d28660e-435a-4853-a2c6-9d916df28fc7",
                "name": "Perplexity | perplexity/sonar-reasoning-pro",
                "context_length": 128000,
                "model": {
                    "slug": "perplexity/sonar-reasoning-pro",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-07T02:08:28.125446+00:00",
                    "hf_updated_at": null,
                    "name": "Perplexity: Sonar Reasoning Pro",
                    "short_name": "Sonar Reasoning Pro",
                    "author": "perplexity",
                    "description": "Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro)\n\nSonar Reasoning Pro is a premier reasoning model powered by DeepSeek R1 with Chain of Thought (CoT). Designed for advanced use cases, it supports in-depth, multi-step queries with a larger context window and can surface more citations per search, enabling more comprehensive and extensible responses.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": "deepseek-r1",
                    "default_system": null,
                    "default_stops": [
                        "<｜User｜>",
                        "<｜end▁of▁sentence｜>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "perplexity/sonar-reasoning-pro",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": "<think>",
                        "end_token": "</think>"
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": "<think>",
                            "end_token": "</think>"
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "perplexity/sonar-reasoning-pro",
                "model_variant_permaslug": "perplexity/sonar-reasoning-pro",
                "adapter_name": "PerplexityAdapter",
                "provider_name": "Perplexity",
                "provider_info": {
                    "name": "Perplexity",
                    "displayName": "Perplexity",
                    "slug": "perplexity",
                    "baseUrl": "https://api.perplexity.ai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                        "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "PerplexityAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.perplexity.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Perplexity.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Perplexity",
                "provider_slug": "perplexity",
                "provider_model_id": "sonar-reasoning-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "reasoning",
                    "include_reasoning",
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                    "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000008",
                    "image": "0",
                    "request": "0",
                    "web_search": "0.005",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.014"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.01"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.006"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "perplexity/sonar-pro",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-07T01:53:43+00:00",
            "hf_updated_at": null,
            "name": "Perplexity: Sonar Pro",
            "short_name": "Sonar Pro",
            "author": "perplexity",
            "description": "Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro)\n\nFor enterprises seeking more advanced capabilities, the Sonar Pro API can handle in-depth, multi-step queries with added extensibility, like double the number of citations per search as Sonar on average. Plus, with a larger context window, it can handle longer and more nuanced searches and follow-up questions. ",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "perplexity/sonar-pro",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "e19b1036-fab9-4f97-9579-8ea67959cc9b",
                "name": "Perplexity | perplexity/sonar-pro",
                "context_length": 200000,
                "model": {
                    "slug": "perplexity/sonar-pro",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-03-07T01:53:43+00:00",
                    "hf_updated_at": null,
                    "name": "Perplexity: Sonar Pro",
                    "short_name": "Sonar Pro",
                    "author": "perplexity",
                    "description": "Note: Sonar Pro pricing includes Perplexity search pricing. See [details here](https://docs.perplexity.ai/guides/pricing#detailed-pricing-breakdown-for-sonar-reasoning-pro-and-sonar-pro)\n\nFor enterprises seeking more advanced capabilities, the Sonar Pro API can handle in-depth, multi-step queries with added extensibility, like double the number of citations per search as Sonar on average. Plus, with a larger context window, it can handle longer and more nuanced searches and follow-up questions. ",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "perplexity/sonar-pro",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "perplexity/sonar-pro",
                "model_variant_permaslug": "perplexity/sonar-pro",
                "adapter_name": "PerplexityAdapter",
                "provider_name": "Perplexity",
                "provider_info": {
                    "name": "Perplexity",
                    "displayName": "Perplexity",
                    "slug": "perplexity",
                    "baseUrl": "https://api.perplexity.ai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                        "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "PerplexityAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.perplexity.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Perplexity.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Perplexity",
                "provider_slug": "perplexity",
                "provider_model_id": "sonar-pro",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                    "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "image": "0",
                    "request": "0",
                    "web_search": "0.005",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.014"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.01"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.006"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_multipart": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.0-flash-lite-001",
            "hf_slug": "",
            "updated_at": "2025-11-14T23:32:47.563595+00:00",
            "created_at": "2025-02-25T17:56:52.206054+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.0 Flash Lite",
            "short_name": "Gemini 2.0 Flash Lite",
            "author": "google",
            "description": "Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5), all at extremely economical token prices.",
            "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.0-flash-lite-001",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "4dc03b46-4015-495b-acff-1dcacb6c3311",
                "name": "Google | google/gemini-2.0-flash-lite-001",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.0-flash-lite-001",
                    "hf_slug": "",
                    "updated_at": "2025-11-14T23:32:47.563595+00:00",
                    "created_at": "2025-02-25T17:56:52.206054+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.0 Flash Lite",
                    "short_name": "Gemini 2.0 Flash Lite",
                    "author": "google",
                    "description": "Gemini 2.0 Flash Lite offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5), all at extremely economical token prices.",
                    "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.0-flash-lite-001",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.0-flash-lite-001",
                "model_variant_permaslug": "google/gemini-2.0-flash-lite-001",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.0-flash-lite-001",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000000075",
                    "completion": "0.0000003",
                    "image": "0.000000075",
                    "audio": "0.000000075",
                    "internal_reasoning": "0.0000003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 7.5e-8,
                    "gemini:reasoning_tokens": 3e-7,
                    "gemini:completion_tokens": 3e-7,
                    "gemini:text_input_tokens": 7.5e-8,
                    "gemini:audio_input_tokens": 7.5e-8,
                    "gemini:image_input_tokens": 7.5e-8,
                    "gemini:video_input_tokens": 7.5e-8,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "34326346-6ef6-4ae4-812f-8efa6243856d",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {},
                    "supports_input_audio": true
                },
                "provider_region": null,
                "deprecation_date": "2026-03-03"
            }
        },
        {
            "slug": "anthropic/claude-3.7-sonnet",
            "hf_slug": "",
            "updated_at": "2025-12-05T21:54:07.586262+00:00",
            "created_at": "2025-02-24T18:35:10.00008+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.7 Sonnet (thinking)",
            "short_name": "Claude 3.7 Sonnet (thinking)",
            "author": "anthropic",
            "description": "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)",
            "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-7-sonnet-20250219",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "aa1ee54a-c660-496a-8f2d-d8470ef3f11b",
                "name": "Google | anthropic/claude-3-7-sonnet-20250219:thinking",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-3.7-sonnet",
                    "hf_slug": "",
                    "updated_at": "2025-12-05T21:54:07.586262+00:00",
                    "created_at": "2025-02-24T18:35:10.00008+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude 3.7 Sonnet",
                    "short_name": "Claude 3.7 Sonnet",
                    "author": "anthropic",
                    "description": "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)",
                    "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-3-7-sonnet-20250219",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-3.7-sonnet:thinking",
                "model_variant_permaslug": "anthropic/claude-3-7-sonnet-20250219:thinking",
                "adapter_name": "GoogleVertexAnthropicAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "claude-3-7-sonnet@20250219",
                "quantization": "unknown",
                "variant": "thinking",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "top_p",
                    "temperature",
                    "stop",
                    "reasoning",
                    "include_reasoning",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "input_cache_read": "0.0000003",
                    "input_cache_write": "0.00000375",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000003,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 3e-7,
                    "anthropic:completion_tokens": 0.000015,
                    "anthropic:cache_write_1h_tokens": 0.000006,
                    "anthropic:cache_write_5m_tokens": 0.00000375
                },
                "pricing_version_id": "42f7eb91-30f9-4d8e-bd2e-a584e9b6edaa",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-3.7-sonnet",
            "hf_slug": "",
            "updated_at": "2025-12-05T21:54:07.586262+00:00",
            "created_at": "2025-02-24T18:35:10.00008+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.7 Sonnet",
            "short_name": "Claude 3.7 Sonnet",
            "author": "anthropic",
            "description": "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)",
            "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-7-sonnet-20250219",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "amazon-bedrock",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "1c9b8776-e266-4efb-b5ba-19a6753e7736",
                "name": "Google | anthropic/claude-3-7-sonnet-20250219",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-3.7-sonnet",
                    "hf_slug": "",
                    "updated_at": "2025-12-05T21:54:07.586262+00:00",
                    "created_at": "2025-02-24T18:35:10.00008+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude 3.7 Sonnet",
                    "short_name": "Claude 3.7 Sonnet",
                    "author": "anthropic",
                    "description": "Claude 3.7 Sonnet is an advanced large language model with improved reasoning, coding, and problem-solving capabilities. It introduces a hybrid reasoning approach, allowing users to choose between rapid responses and extended, step-by-step processing for complex tasks. The model demonstrates notable improvements in coding, particularly in front-end development and full-stack updates, and excels in agentic workflows, where it can autonomously navigate multi-step processes. \n\nClaude 3.7 Sonnet maintains performance parity with its predecessor in standard mode while offering an extended reasoning mode for enhanced accuracy in math, coding, and instruction-following tasks.\n\nRead more at the [blog post here](https://www.anthropic.com/news/claude-3-7-sonnet)",
                    "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-3-7-sonnet-20250219",
                    "supports_reasoning": true,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "google-vertex",
                        "amazon-bedrock",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-3.7-sonnet",
                "model_variant_permaslug": "anthropic/claude-3-7-sonnet-20250219",
                "adapter_name": "GoogleVertexAnthropicAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex/us",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex/us",
                "provider_model_id": "claude-3-7-sonnet@20250219",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "top_p",
                    "temperature",
                    "stop",
                    "reasoning",
                    "include_reasoning",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000003",
                    "completion": "0.000015",
                    "input_cache_read": "0.0000003",
                    "input_cache_write": "0.00000375",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000003,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 3e-7,
                    "anthropic:completion_tokens": 0.000015,
                    "anthropic:cache_write_1h_tokens": 0.000006,
                    "anthropic:cache_write_5m_tokens": 0.00000375
                },
                "pricing_version_id": "0c3c8e44-3744-4eb9-b1ef-59291e23b8fd",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": true,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.0-flash-001",
            "hf_slug": "",
            "updated_at": "2025-11-14T23:34:05.685679+00:00",
            "created_at": "2025-02-05T15:30:13.144552+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.0 Flash",
            "short_name": "Gemini 2.0 Flash",
            "author": "google",
            "description": "Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5). It introduces notable enhancements in multimodal understanding, coding capabilities, complex instruction following, and function calling. These advancements come together to deliver more seamless and robust agentic experiences.",
            "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file",
                "audio",
                "video"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.0-flash-001",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "8b6c3ec6-e6a0-43f7-9e09-a5487a5756c9",
                "name": "Google AI Studio | google/gemini-2.0-flash-001",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.0-flash-001",
                    "hf_slug": "",
                    "updated_at": "2025-11-14T23:34:05.685679+00:00",
                    "created_at": "2025-02-05T15:30:13.144552+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.0 Flash",
                    "short_name": "Gemini 2.0 Flash",
                    "author": "google",
                    "description": "Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5). It introduces notable enhancements in multimodal understanding, coding capabilities, complex instruction following, and function calling. These advancements come together to deliver more seamless and robust agentic experiences.",
                    "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
                    "context_length": 1000000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file",
                        "audio",
                        "video"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.0-flash-001",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.0-flash-001",
                "model_variant_permaslug": "google/gemini-2.0-flash-001",
                "adapter_name": "GoogleAIStudioGeminiAdapter",
                "provider_name": "Google AI Studio",
                "provider_info": {
                    "name": "Google AI Studio",
                    "displayName": "Google AI Studio",
                    "slug": "google-ai-studio",
                    "baseUrl": "https://generativelanguage.googleapis.com/v1beta",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 55,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleAIStudioGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleAIStudio.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-1p",
                        "gemini-2.5-pro-1p-recitation-off",
                        "gemini-2.5-flash-1p",
                        "gemini-2.5-flash-1p-recitation-off",
                        "gemini-2.5-flash-lite-preview-06-11-summarized",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-1.5-pro-latest",
                        "gemini-1.5-pro",
                        "gemini-1.5-flash-latest",
                        "gemini-1.5-flash",
                        "gemini-1.5-flash-8b",
                        "gemini-1.5-flash-8b-latest",
                        "gemini-2.5-pro-preview-03-25",
                        "gemini-2.0-flash",
                        "gemini-2.0-flash-lite",
                        "gemini-2.0-flash-lite-preview",
                        "gemini-2.0-pro-exp",
                        "gemini-2.0-flash-thinking-exp",
                        "gemini-2.5-flash-preview-tts",
                        "gemini-2.5-pro-preview-tts",
                        "learnlm-2.0-flash-experimental",
                        "gracefulgolem",
                        "gemini-2.5-flash-preview-05-20",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.0-flash-exp-image-generation",
                        "gemini-2.0-flash-preview-image-generation",
                        "gemini-2.0-flash-lite-preview-02-05",
                        "gemini-2.0-pro-exp-02-05",
                        "gemini-exp-1206",
                        "gemini-2.0-flash-thinking-exp-01-21",
                        "gemini-2.0-flash-thinking-exp-1219",
                        "gemma-3-1b-it",
                        "gemini-flash-latest",
                        "gemini-flash-lite-latest",
                        "gemini-pro-latest",
                        "gemini-robotics-er-1.5-preview",
                        "gemini-embedding-001",
                        "riftrunner-fst-rewind",
                        "gemini-3-pro-image-preview",
                        "nano-banana-pro-preview",
                        "fiercefalcon",
                        "fiercefalcon-inline-citation",
                        "fiercefalcon-blocked-sites"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google AI Studio",
                "provider_slug": "google-ai-studio",
                "provider_model_id": "gemini-2.0-flash-001",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice"
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000004",
                    "image": "0.0000001",
                    "audio": "0.0000007",
                    "input_audio_cache": "0.000000175",
                    "input_cache_read": "0.000000025",
                    "input_cache_write": "0.00000008333333333333334",
                    "internal_reasoning": "0.0000004",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": 1e-7,
                    "gemini:reasoning_tokens": 4e-7,
                    "gemini:cache_read_tokens": 2.5e-8,
                    "gemini:completion_tokens": 4e-7,
                    "gemini:text_input_tokens": 1e-7,
                    "gemini:audio_input_tokens": 7e-7,
                    "gemini:image_input_tokens": 1e-7,
                    "gemini:video_input_tokens": 1e-7,
                    "gemini:cache_read_text_tokens": 2.5e-8,
                    "gemini:cache_read_audio_tokens": 1.75e-7,
                    "gemini:cache_read_image_tokens": 2.5e-8,
                    "gemini:cache_read_video_tokens": 2.5e-8,
                    "gemini:cache_write_storage_hours": 0.000001,
                    "gemini:cache_read_tokens_high_context": 5e-8,
                    "gemini:cache_read_text_tokens_high_context": 5e-8,
                    "gemini:cache_read_audio_tokens_high_context": 3.5e-7,
                    "gemini:cache_read_image_tokens_high_context": 5e-8,
                    "gemini:cache_read_video_tokens_high_context": 5e-8,
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "f232c68f-eb0d-4d69-948e-a854a9b49d01",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_base64_video_input": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": true
                },
                "provider_region": null,
                "deprecation_date": "2026-03-31"
            }
        },
        {
            "slug": "qwen/qwen-vl-plus",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-02-05T04:54:15.216448+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen VL Plus",
            "short_name": "Qwen VL Plus",
            "author": "qwen",
            "description": "Qwen's Enhanced Large Visual Language Model. Significantly upgraded for detailed recognition capabilities and text recognition abilities, supporting ultra-high pixel resolutions up to millions of pixels and extreme aspect ratios for image input. It delivers significant performance across a broad range of visual tasks.\n",
            "model_version_group_id": null,
            "context_length": 7500,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen-vl-plus",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "df9c15ac-870b-40e5-aa43-e4b3b44951f7",
                "name": "Alibaba | qwen/qwen-vl-plus",
                "context_length": 7500,
                "model": {
                    "slug": "qwen/qwen-vl-plus",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-02-05T04:54:15.216448+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen VL Plus",
                    "short_name": "Qwen VL Plus",
                    "author": "qwen",
                    "description": "Qwen's Enhanced Large Visual Language Model. Significantly upgraded for detailed recognition capabilities and text recognition abilities, supporting ultra-high pixel resolutions up to millions of pixels and extreme aspect ratios for image input. It delivers significant performance across a broad range of visual tasks.\n",
                    "model_version_group_id": null,
                    "context_length": 7500,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen-vl-plus",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen-vl-plus",
                "model_variant_permaslug": "qwen/qwen-vl-plus",
                "adapter_name": "AlibabaAdapter",
                "provider_name": "Alibaba",
                "provider_info": {
                    "name": "Alibaba",
                    "displayName": "Alibaba Cloud Int.",
                    "slug": "alibaba",
                    "baseUrl": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                        "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [
                        "SG",
                        "CN"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AlibabaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.alibabacloud.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.alibabacloud.com/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Alibaba Cloud Int.",
                "provider_slug": "alibaba",
                "provider_model_id": "qwen-vl-plus",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": 6000,
                "max_completion_tokens": 1500,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "presence_penalty",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                    "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                },
                "pricing": {
                    "prompt": "0.00000021",
                    "completion": "0.00000063",
                    "image": "0.0002688",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen-vl-max",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-02-01T18:25:04.223655+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen VL Max",
            "short_name": "Qwen VL Max",
            "author": "qwen",
            "description": "Qwen VL Max is a visual understanding model with 7500 tokens context length. It excels in delivering optimal performance for a broader spectrum of complex tasks.\n",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen-vl-max-2025-01-25",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "40a33c72-3801-49f3-ac2a-966d0b249981",
                "name": "Alibaba | qwen/qwen-vl-max-2025-01-25",
                "context_length": 131072,
                "model": {
                    "slug": "qwen/qwen-vl-max",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-02-01T18:25:04.223655+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen VL Max",
                    "short_name": "Qwen VL Max",
                    "author": "qwen",
                    "description": "Qwen VL Max is a visual understanding model with 7500 tokens context length. It excels in delivering optimal performance for a broader spectrum of complex tasks.\n",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen-vl-max-2025-01-25",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen-vl-max",
                "model_variant_permaslug": "qwen/qwen-vl-max-2025-01-25",
                "adapter_name": "AlibabaAdapter",
                "provider_name": "Alibaba",
                "provider_info": {
                    "name": "Alibaba",
                    "displayName": "Alibaba Cloud Int.",
                    "slug": "alibaba",
                    "baseUrl": "https://dashscope-intl.aliyuncs.com/compatible-mode/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                        "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [
                        "SG",
                        "CN"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AlibabaAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.alibabacloud.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://www.alibabacloud.com/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Alibaba Cloud Int.",
                "provider_slug": "alibaba",
                "provider_model_id": "qwen-vl-max-2025-08-13",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": 129024,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "presence_penalty",
                    "response_format",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-product-terms-of-service-v-3-8-0",
                    "privacyPolicyURL": "https://www.alibabacloud.com/help/en/legal/latest/alibaba-cloud-international-website-privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000008",
                    "completion": "0.0000032",
                    "image": "0.001024",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen2.5-vl-72b-instruct",
            "hf_slug": "Qwen/Qwen2.5-VL-72B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-02-01T11:45:11.997326+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen2.5 VL 72B Instruct",
            "short_name": "Qwen2.5 VL 72B Instruct",
            "author": "qwen",
            "description": "Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects. It is also highly capable of analyzing texts, charts, icons, graphics, and layouts within images.",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen2.5-vl-72b-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "f80f9c7d-2b54-4ee2-bb8f-c8a46fde38d2",
                "name": "Chutes | qwen/qwen2.5-vl-72b-instruct",
                "context_length": 32768,
                "model": {
                    "slug": "qwen/qwen2.5-vl-72b-instruct",
                    "hf_slug": "Qwen/Qwen2.5-VL-72B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-02-01T11:45:11.997326+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen2.5 VL 72B Instruct",
                    "short_name": "Qwen2.5 VL 72B Instruct",
                    "author": "qwen",
                    "description": "Qwen2.5-VL is proficient in recognizing common objects such as flowers, birds, fish, and insects. It is also highly capable of analyzing texts, charts, icons, graphics, and layouts within images.",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen2.5-vl-72b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen2.5-vl-72b-instruct",
                "model_variant_permaslug": "qwen/qwen2.5-vl-72b-instruct",
                "adapter_name": "ChutesAdapter",
                "provider_name": "Chutes",
                "provider_info": {
                    "name": "Chutes",
                    "displayName": "Chutes",
                    "slug": "chutes",
                    "baseUrl": "https://llm.chutes.ai/v1",
                    "dataPolicy": {
                        "training": true,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://chutes.ai/tos"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "ChutesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://chutes.ai/&size=256"
                    },
                    "ignoredProviderModels": [
                        "openbmb/MiniCPM4-8B",
                        "agentica-org/DeepSWE-Preview",
                        "moonshotai/Kimi-K2-Instruct-tools",
                        "internlm/Intern-S1",
                        "TheDrummer/Gemmasutra-Pro-27B-v1.1",
                        "all-hands/openhands-lm-32b-v0.1-ep3",
                        "TheDrummer/Tunguska-39B-v1",
                        "Meridian",
                        "Zenith",
                        "Proxima",
                        "agentica-org/DeepCoder-14B-Preview",
                        "TheDrummer/Cydonia-24B-v2.1",
                        "Tesslate/UIGEN-X-32B-0727",
                        "NousResearch/Hermes-4-14B",
                        "unsloth/gemma-3-4b-it",
                        "tencent/Hunyuan-A13B-Instruct",
                        "unsloth/Llama-3.2-3B-Instruct",
                        "unsloth/Llama-3.2-1B-Instruct",
                        "zai-org/GLM-4.5-turbo",
                        "zai-org/GLM-4.6-turbo",
                        "rednote-hilab/dots.ocr",
                        "deepseek-ai/DeepSeek-V3-0324-turbo",
                        "deepseek-ai/DeepSeek-V3.1-turbo",
                        "moonshotai/Kimi-K2-Thinking",
                        "zai-org/GLM-4.5",
                        "deepseek-ai/DeepSeek-V3.1",
                        "zai-org/GLM-4.6-FP8",
                        "zai-org/GLM-4.7-FP8",
                        "zai-org/GLM-4.5-FP8"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Chutes",
                "provider_slug": "chutes/bf16",
                "provider_model_id": "Qwen/Qwen2.5-VL-72B-Instruct-TEE",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 32768,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "top_k",
                    "repetition_penalty",
                    "response_format",
                    "structured_outputs"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://chutes.ai/tos"
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.0000006",
                    "image": "0",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.00000015",
                    "openai:completion_tokens": "0.0000006"
                },
                "pricing_version_id": "ef3a118d-6cc7-498d-a4df-3c3f82eb2f6e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "perplexity/sonar",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-01-27T21:36:48.666939+00:00",
            "hf_updated_at": null,
            "name": "Perplexity: Sonar",
            "short_name": "Sonar",
            "author": "perplexity",
            "description": "Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources. It is designed for companies seeking to integrate lightweight question-and-answer features optimized for speed.",
            "model_version_group_id": null,
            "context_length": 127072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "perplexity/sonar",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "5f831e7a-c555-4d3a-b228-88286347558a",
                "name": "Perplexity | perplexity/sonar",
                "context_length": 127072,
                "model": {
                    "slug": "perplexity/sonar",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-01-27T21:36:48.666939+00:00",
                    "hf_updated_at": null,
                    "name": "Perplexity: Sonar",
                    "short_name": "Sonar",
                    "author": "perplexity",
                    "description": "Sonar is lightweight, affordable, fast, and simple to use — now featuring citations and the ability to customize sources. It is designed for companies seeking to integrate lightweight question-and-answer features optimized for speed.",
                    "model_version_group_id": null,
                    "context_length": 127072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "perplexity/sonar",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "perplexity/sonar",
                "model_variant_permaslug": "perplexity/sonar",
                "adapter_name": "PerplexityAdapter",
                "provider_name": "Perplexity",
                "provider_info": {
                    "name": "Perplexity",
                    "displayName": "Perplexity",
                    "slug": "perplexity",
                    "baseUrl": "https://api.perplexity.ai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                        "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "PerplexityAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.perplexity.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Perplexity.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Perplexity",
                "provider_slug": "perplexity",
                "provider_model_id": "sonar",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.perplexity.ai/hub/legal/perplexity-api-terms-of-service",
                    "privacyPolicyURL": "https://www.perplexity.ai/hub/legal/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000001",
                    "completion": "0.000001",
                    "image": "0",
                    "request": "0.005",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.012"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.008"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.005"
                    }
                ],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "minimax/minimax-01",
            "hf_slug": "MiniMaxAI/MiniMax-Text-01",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-01-15T04:31:02.677929+00:00",
            "hf_updated_at": null,
            "name": "MiniMax: MiniMax-01",
            "short_name": "MiniMax-01",
            "author": "minimax",
            "description": "MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding. It has 456 billion parameters, with 45.9 billion parameters activated per inference, and can handle a context of up to 4 million tokens.\n\nThe text model adopts a hybrid architecture that combines Lightning Attention, Softmax Attention, and Mixture-of-Experts (MoE). The image model adopts the “ViT-MLP-LLM” framework and is trained on top of the text model.\n\nTo read more about the release, see: https://www.minimaxi.com/en/news/minimax-01-series-2",
            "model_version_group_id": null,
            "context_length": 1000192,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "minimax/minimax-01",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "352546d2-3758-4aa1-9e98-e1a83748aa4e",
                "name": "Minimax | minimax/minimax-01",
                "context_length": 1000192,
                "model": {
                    "slug": "minimax/minimax-01",
                    "hf_slug": "MiniMaxAI/MiniMax-Text-01",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2025-01-15T04:31:02.677929+00:00",
                    "hf_updated_at": null,
                    "name": "MiniMax: MiniMax-01",
                    "short_name": "MiniMax-01",
                    "author": "minimax",
                    "description": "MiniMax-01 is a combines MiniMax-Text-01 for text generation and MiniMax-VL-01 for image understanding. It has 456 billion parameters, with 45.9 billion parameters activated per inference, and can handle a context of up to 4 million tokens.\n\nThe text model adopts a hybrid architecture that combines Lightning Attention, Softmax Attention, and Mixture-of-Experts (MoE). The image model adopts the “ViT-MLP-LLM” framework and is trained on top of the text model.\n\nTo read more about the release, see: https://www.minimaxi.com/en/news/minimax-01-series-2",
                    "model_version_group_id": null,
                    "context_length": 1000000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Other",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "minimax/minimax-01",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "minimax/minimax-01",
                "model_variant_permaslug": "minimax/minimax-01",
                "adapter_name": "MinimaxAdapter",
                "provider_name": "Minimax",
                "provider_info": {
                    "name": "Minimax",
                    "displayName": "MiniMax",
                    "slug": "minimax",
                    "baseUrl": "https://api.minimaxi.chat/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.minimax.io/platform/protocol/terms-of-service",
                        "privacyPolicyURL": "https://www.minimax.io/platform/protocol/privacy-policy"
                    },
                    "headquarters": "SG",
                    "datacenters": [
                        "US"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MinimaxAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://minimaxi.com/&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "MiniMax",
                "provider_slug": "minimax",
                "provider_model_id": "MiniMax-Text-01",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 1000192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.minimax.io/platform/protocol/terms-of-service",
                    "privacyPolicyURL": "https://www.minimax.io/platform/protocol/privacy-policy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000011",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000002",
                    "openai:completion_tokens": "0.0000011"
                },
                "pricing_version_id": "6bea1ceb-8249-4f88-b48c-f90eb7df1ab0",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/o1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-12-17T18:26:39.576639+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: o1",
            "short_name": "o1",
            "author": "openai",
            "description": "The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before responding. The o1 model series is trained with large-scale reinforcement learning to reason using chain of thought. \n\nThe o1 models are optimized for math, science, programming, and other STEM-related tasks. They consistently exhibit PhD-level accuracy on benchmarks in physics, chemistry, and biology. Learn more in the [launch announcement](https://openai.com/o1).\n",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/o1-2024-12-17",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "82738f61-f3cb-44a5-b5d1-e6787ae64e3b",
                "name": "OpenAI | openai/o1-2024-12-17",
                "context_length": 200000,
                "model": {
                    "slug": "openai/o1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-12-17T18:26:39.576639+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: o1",
                    "short_name": "o1",
                    "author": "openai",
                    "description": "The latest and strongest model family from OpenAI, o1 is designed to spend more time thinking before responding. The o1 model series is trained with large-scale reinforcement learning to reason using chain of thought. \n\nThe o1 models are optimized for math, science, programming, and other STEM-related tasks. They consistently exhibit PhD-level accuracy on benchmarks in physics, chemistry, and biology. Learn more in the [launch announcement](https://openai.com/o1).\n",
                    "model_version_group_id": null,
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": "",
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/o1-2024-12-17",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/o1",
                "model_variant_permaslug": "openai/o1-2024-12-17",
                "adapter_name": "OpenAIResponsesAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIResponsesAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_responses"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "o1-2024-12-17",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 100000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000015",
                    "completion": "0.00006",
                    "input_cache_read": "0.0000075",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai_responses:prompt_tokens": 0.000015,
                    "openai_responses:completion_tokens": 0.00006,
                    "openai_responses:cached_prompt_tokens": 0.0000075
                },
                "pricing_version_id": "c7fe5d08-4ae8-494a-80a6-7452307c6540",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_file_urls": true,
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "google/gemini-2.0-flash-exp",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-12-11T17:18:43.999311+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.0 Flash Experimental (free)",
            "short_name": "Gemini 2.0 Flash Experimental (free)",
            "author": "google",
            "description": "Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5). It introduces notable enhancements in multimodal understanding, coding capabilities, complex instruction following, and function calling. These advancements come together to deliver more seamless and robust agentic experiences.",
            "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.0-flash-exp",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "65df650a-3eae-46b0-b5b0-87546ca90cc3",
                "name": "Google | google/gemini-2.0-flash-exp:free",
                "context_length": 1048576,
                "model": {
                    "slug": "google/gemini-2.0-flash-exp",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-12-11T17:18:43.999311+00:00",
                    "hf_updated_at": null,
                    "name": "Google: Gemini 2.0 Flash Experimental",
                    "short_name": "Gemini 2.0 Flash Experimental",
                    "author": "google",
                    "description": "Gemini Flash 2.0 offers a significantly faster time to first token (TTFT) compared to [Gemini Flash 1.5](/google/gemini-flash-1.5), while maintaining quality on par with larger models like [Gemini Pro 1.5](/google/gemini-pro-1.5). It introduces notable enhancements in multimodal understanding, coding capabilities, complex instruction following, and function calling. These advancements come together to deliver more seamless and robust agentic experiences.",
                    "model_version_group_id": "e993dfbf-2cbd-4680-b866-c05bbdcc8f4d",
                    "context_length": 1048576,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Gemini",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "google/gemini-2.0-flash-exp",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "google/gemini-2.0-flash-exp:free",
                "model_variant_permaslug": "google/gemini-2.0-flash-exp:free",
                "adapter_name": "GoogleVertexGeminiAdapter",
                "provider_name": "Google",
                "provider_info": {
                    "name": "Google",
                    "displayName": "Google Vertex",
                    "slug": "google-vertex",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://cloud.google.com/terms/",
                        "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "not-used"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "GoogleVertexGeminiAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.cloud.google.com/products/sdXM79fz1FS6ekNpu37K/history",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/GoogleVertex.svg"
                    },
                    "ignoredProviderModels": [
                        "gemini-2.5-pro-exp-03-25",
                        "gemini-2.0-flash-exp",
                        "gemini-1.5-flash-002",
                        "gemini-2.0-flash-lite-001",
                        "gemini-2.5-flash-lite-preview-06-17",
                        "gemini-2.5-flash-lite",
                        "gemini-2.0-flash-001",
                        "llama-4-scout-17b-16e-instruct-maas",
                        "qwen3-235b-a22b-instruct-2507-maas",
                        "gemini-2.5-flash",
                        "gemini-2.5-flash-image-preview",
                        "llama-4-maverick-17b-128e-instruct-maas",
                        "llama-3.3-70b-instruct-maas",
                        "claude-3-5-haiku@20241022",
                        "qwen3-coder-480b-a35b-instruct-maas",
                        "gemini-1.5-pro-002",
                        "gemini-2.5-pro-preview-06-05",
                        "gemini-2.5-pro-preview-05-06",
                        "gemini-2.5-pro",
                        "deepseek-r1-0528-maas",
                        "claude-3-7-sonnet@20250219",
                        "claude-3-5-sonnet-v2@20241022",
                        "claude-sonnet-4@20250514",
                        "claude-opus-4-1@20250805",
                        "claude-opus-4@20250514",
                        "claude-3-haiku@20240307",
                        "claude-3-5-sonnet@20240620",
                        "claude-3-opus@20240229",
                        "gemini-2.5-flash-lite-preview-09-2025",
                        "gemini-2.5-flash-preview-09-2025",
                        "gemini-2.5-flash-image",
                        "claude-sonnet-4-5@20250929",
                        "claude-haiku-4-5@20251001",
                        "minimax/minimax-m2-maas",
                        "gemini-3-pro-preview",
                        "gemini-3-pro-image-preview",
                        "claude-opus-4-5@20251101"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "gemini"
                },
                "provider_display_name": "Google Vertex",
                "provider_slug": "google-vertex",
                "provider_model_id": "gemini-2.0-flash-exp",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "seed",
                    "response_format",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": true,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 55,
                    "canPublish": false,
                    "termsOfServiceURL": "https://cloud.google.com/terms/",
                    "privacyPolicyURL": "https://cloud.google.com/terms/cloud-privacy-notice",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "gemini:prompt_tokens": "0",
                    "gemini:reasoning_tokens": "0",
                    "gemini:cache_read_tokens": "0",
                    "gemini:completion_tokens": "0",
                    "gemini:text_input_tokens": "0",
                    "gemini:audio_input_tokens": "0",
                    "gemini:image_input_tokens": "0",
                    "gemini:video_input_tokens": "0",
                    "gemini:cache_read_text_tokens": "0",
                    "gemini:cache_read_audio_tokens": "0",
                    "gemini:cache_read_image_tokens": "0",
                    "gemini:cache_read_video_tokens": "0",
                    "gemini:cache_write_storage_hours": "0",
                    "gemini:cache_read_tokens_high_context": "0",
                    "gemini:cache_read_text_tokens_high_context": "0",
                    "gemini:cache_read_audio_tokens_high_context": "0",
                    "gemini:cache_read_image_tokens_high_context": "0",
                    "gemini:cache_read_video_tokens_high_context": "0",
                    "gemini:informational_cache_write_tokens_count": 0
                },
                "pricing_version_id": "66d10a89-12f4-4443-8fe8-436118617f33",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": "2026-03-03"
            }
        },
        {
            "slug": "amazon/nova-lite-v1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-12-05T22:22:43.403315+00:00",
            "hf_updated_at": null,
            "name": "Amazon: Nova Lite 1.0",
            "short_name": "Nova Lite 1.0",
            "author": "amazon",
            "description": "Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite can handle real-time customer interactions, document analysis, and visual question-answering tasks with high accuracy.\n\nWith an input context of 300K tokens, it can analyze multiple images or up to 30 minutes of video in a single input.",
            "model_version_group_id": null,
            "context_length": 300000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Nova",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "amazon/nova-lite-v1",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "72eda073-d180-4482-8e4f-81051cb66f7e",
                "name": "Amazon Bedrock | amazon/nova-lite-v1",
                "context_length": 300000,
                "model": {
                    "slug": "amazon/nova-lite-v1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-12-05T22:22:43.403315+00:00",
                    "hf_updated_at": null,
                    "name": "Amazon: Nova Lite 1.0",
                    "short_name": "Nova Lite 1.0",
                    "author": "amazon",
                    "description": "Amazon Nova Lite 1.0 is a very low-cost multimodal model from Amazon that focused on fast processing of image, video, and text inputs to generate text output. Amazon Nova Lite can handle real-time customer interactions, document analysis, and visual question-answering tasks with high accuracy.\n\nWith an input context of 300K tokens, it can analyze multiple images or up to 30 minutes of video in a single input.",
                    "model_version_group_id": null,
                    "context_length": 300000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Nova",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "amazon/nova-lite-v1",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "amazon/nova-lite-v1",
                "model_variant_permaslug": "amazon/nova-lite-v1",
                "adapter_name": "AmazonBedrockConverseAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.amazon.nova-lite-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 5120,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.00000006",
                    "completion": "0.00000024",
                    "image": "0.00009",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "amazon/nova-pro-v1",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-12-05T22:05:03.587216+00:00",
            "hf_updated_at": null,
            "name": "Amazon: Nova Pro 1.0",
            "short_name": "Nova Pro 1.0",
            "author": "amazon",
            "description": "Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).\n\nAmazon Nova Pro demonstrates strong capabilities in processing both visual and textual information and at analyzing financial documents.\n\n**NOTE**: Video input is not supported at this time.",
            "model_version_group_id": null,
            "context_length": 300000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Nova",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "amazon/nova-pro-v1",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "959381a4-8054-450f-9daf-5fcab64ba9aa",
                "name": "Amazon Bedrock | amazon/nova-pro-v1",
                "context_length": 300000,
                "model": {
                    "slug": "amazon/nova-pro-v1",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-12-05T22:05:03.587216+00:00",
                    "hf_updated_at": null,
                    "name": "Amazon: Nova Pro 1.0",
                    "short_name": "Nova Pro 1.0",
                    "author": "amazon",
                    "description": "Amazon Nova Pro 1.0 is a capable multimodal model from Amazon focused on providing a combination of accuracy, speed, and cost for a wide range of tasks. As of December 2024, it achieves state-of-the-art performance on key benchmarks including visual question answering (TextVQA) and video understanding (VATEX).\n\nAmazon Nova Pro demonstrates strong capabilities in processing both visual and textual information and at analyzing financial documents.\n\n**NOTE**: Video input is not supported at this time.",
                    "model_version_group_id": null,
                    "context_length": 300000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Nova",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "amazon/nova-pro-v1",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "amazon/nova-pro-v1",
                "model_variant_permaslug": "amazon/nova-pro-v1",
                "adapter_name": "AmazonBedrockConverseAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": null
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.amazon.nova-pro-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 5120,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000008",
                    "completion": "0.0000032",
                    "image": "0.0012",
                    "request": "0",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o-2024-11-20",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-20T18:33:14.771895+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o (2024-11-20)",
            "short_name": "GPT-4o (2024-11-20)",
            "author": "openai",
            "description": "The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability. It’s also better at working with uploaded files, providing deeper insights & more thorough responses.\n\nGPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.",
            "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o-2024-11-20",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "3e86b7c5-bffe-4b60-a3dd-b36451978775",
                "name": "OpenAI | openai/gpt-4o-2024-11-20",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o-2024-11-20",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-11-20T18:33:14.771895+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o (2024-11-20)",
                    "short_name": "GPT-4o (2024-11-20)",
                    "author": "openai",
                    "description": "The 2024-11-20 version of GPT-4o offers a leveled-up creative writing ability with more natural, engaging, and tailored writing to improve relevance & readability. It’s also better at working with uploaded files, providing deeper insights & more thorough responses.\n\nGPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.",
                    "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o-2024-11-20",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o-2024-11-20",
                "model_variant_permaslug": "openai/gpt-4o-2024-11-20",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o-2024-11-20",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000025",
                    "completion": "0.00001",
                    "input_cache_read": "0.00000125",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 0.0000025,
                    "openai:completion_tokens": 0.00001,
                    "openai:cached_prompt_tokens": 0.00000125
                },
                "pricing_version_id": "8359b48b-204e-47a6-aea1-737dba83e20c",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/pixtral-large-2411",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-19T00:49:48.873161+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Pixtral Large 2411",
            "short_name": "Pixtral Large 2411",
            "author": "mistralai",
            "description": "Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411). The model is able to understand documents, charts and natural images.\n\nThe model is available under the Mistral Research License (MRL) for research and educational use, and the Mistral Commercial License for experimentation, testing, and production for commercial purposes.\n\n",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/pixtral-large-2411",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "1a41639e-c1cf-422e-a871-27bc67f03928",
                "name": "Mistral | mistralai/pixtral-large-2411",
                "context_length": 131072,
                "model": {
                    "slug": "mistralai/pixtral-large-2411",
                    "hf_slug": "",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-11-19T00:49:48.873161+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Pixtral Large 2411",
                    "short_name": "Pixtral Large 2411",
                    "author": "mistralai",
                    "description": "Pixtral Large is a 124B parameter, open-weight, multimodal model built on top of [Mistral Large 2](/mistralai/mistral-large-2411). The model is able to understand documents, charts and natural images.\n\nThe model is available under the Mistral Research License (MRL) for research and educational use, and the Mistral Commercial License for experimentation, testing, and production for commercial purposes.\n\n",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/pixtral-large-2411",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/pixtral-large-2411",
                "model_variant_permaslug": "mistralai/pixtral-large-2411",
                "adapter_name": "MistralAdapter",
                "provider_name": "Mistral",
                "provider_info": {
                    "name": "Mistral",
                    "displayName": "Mistral",
                    "slug": "mistral",
                    "baseUrl": "https://api.mistral.ai/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                        "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                    },
                    "headquarters": "FR",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "MistralAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.mistral.ai/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Mistral.png"
                    },
                    "ignoredProviderModels": [
                        "mistral-moderation-2411-all",
                        "voxtral-mini-2507",
                        "voxtral-small-2507",
                        "voxtral-mini-transcribe-2507",
                        "mistral-medium",
                        "mistral-tiny",
                        "mistral-tiny-2312",
                        "open-mistral-nemo",
                        "mistral-tiny-2407",
                        "open-mixtral-8x7b",
                        "mistral-small",
                        "mistral-small-2312",
                        "open-mixtral-8x22b-2404",
                        "mistral-large-pixtral-2411",
                        "codestral-2412",
                        "codestral-2411-rc5",
                        "pixtral-12b",
                        "mistral-moderation-2411",
                        "mistral-ocr-2503",
                        "mistral-ocr-2505",
                        "mistral-saba-2502",
                        "open-mixtral-8x22b",
                        "mistral-large-2407",
                        "magistral-medium-2507",
                        "mistral-embed",
                        "codestral-embed",
                        "codestral-2501",
                        "mistral-small-2501",
                        "mistral-ocr-2512",
                        "labs-devstral-small-2512"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "mistral"
                },
                "provider_display_name": "Mistral",
                "provider_slug": "mistral",
                "provider_model_id": "pixtral-large-2411",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://mistral.ai/terms/#terms-of-use",
                    "privacyPolicyURL": "https://mistral.ai/terms/#privacy-policy"
                },
                "pricing": {
                    "prompt": "0.000002",
                    "completion": "0.000006",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "mistral:prompt_tokens": 0.000002,
                    "mistral:completion_tokens": 0.000006
                },
                "pricing_version_id": "b80bc0f8-6b6c-4dd4-9205-041df98e8a5f",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-3.5-haiku",
            "hf_slug": null,
            "updated_at": "2025-12-05T21:54:21.40359+00:00",
            "created_at": "2024-11-04T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.5 Haiku",
            "short_name": "Claude 3.5 Haiku",
            "author": "anthropic",
            "description": "Claude 3.5 Haiku offers enhanced capabilities in speed, coding accuracy, and tool use. Engineered to excel in real-time applications, it delivers quick response times that are essential for dynamic tasks such as chat interactions and immediate coding suggestions.\n\nThis makes it highly suitable for environments that demand both speed and precision, such as software development, customer service bots, and data management systems.\n\nThis model is currently pointing to [Claude 3.5 Haiku (2024-10-22)](/anthropic/claude-3-5-haiku-20241022).",
            "model_version_group_id": "028ec497-a034-40fd-81fe-f51d0a0c640c",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-5-haiku",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "amazon-bedrock",
                "google-vertex",
                "anthropic"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "50d15f84-5009-4962-a843-90401118ddd2",
                "name": "Amazon Bedrock | anthropic/claude-3-5-haiku",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-3.5-haiku",
                    "hf_slug": null,
                    "updated_at": "2025-12-05T21:54:21.40359+00:00",
                    "created_at": "2024-11-04T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude 3.5 Haiku",
                    "short_name": "Claude 3.5 Haiku",
                    "author": "anthropic",
                    "description": "Claude 3.5 Haiku offers enhanced capabilities in speed, coding accuracy, and tool use. Engineered to excel in real-time applications, it delivers quick response times that are essential for dynamic tasks such as chat interactions and immediate coding suggestions.\n\nThis makes it highly suitable for environments that demand both speed and precision, such as software development, customer service bots, and data management systems.\n\nThis model is currently pointing to [Claude 3.5 Haiku (2024-10-22)](/anthropic/claude-3-5-haiku-20241022).",
                    "model_version_group_id": "028ec497-a034-40fd-81fe-f51d0a0c640c",
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-3-5-haiku",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        },
                        "chat_template_config": {}
                    },
                    "default_parameters": {
                        "temperature": null,
                        "top_p": null,
                        "frequency_penalty": null
                    },
                    "default_order": [
                        "amazon-bedrock",
                        "google-vertex",
                        "anthropic"
                    ],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-3.5-haiku",
                "model_variant_permaslug": "anthropic/claude-3-5-haiku",
                "adapter_name": "AmazonBedrockInvokeAnthropicAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.anthropic.claude-3-5-haiku-20241022-v1:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.0000008",
                    "completion": "0.000004",
                    "input_cache_read": "0.00000008",
                    "input_cache_write": "0.000001",
                    "web_search": "0.01",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 8e-7,
                    "anthropic:web_search_calls": 0.01,
                    "anthropic:cache_read_tokens": 8e-8,
                    "anthropic:completion_tokens": 0.000004,
                    "anthropic:cache_write_1h_tokens": 0.0000016,
                    "anthropic:cache_write_5m_tokens": 0.000001
                },
                "pricing_version_id": "dcdd1da5-3a78-4f57-8122-d38c1110c682",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-3.5-sonnet",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-10-22T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.5 Sonnet",
            "short_name": "Claude 3.5 Sonnet",
            "author": "anthropic",
            "description": "New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:\n\n- Coding: Scores ~49% on SWE-Bench Verified, higher than the last best score, and without any fancy prompt scaffolding\n- Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights\n- Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone\n- Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)\n\n#multimodal",
            "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3.5-sonnet",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "d4fb79bd-9786-4932-af81-b83040e9f4e4",
                "name": "Amazon Bedrock | anthropic/claude-3.5-sonnet",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-3.5-sonnet",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-10-22T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude 3.5 Sonnet",
                    "short_name": "Claude 3.5 Sonnet",
                    "author": "anthropic",
                    "description": "New Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:\n\n- Coding: Scores ~49% on SWE-Bench Verified, higher than the last best score, and without any fancy prompt scaffolding\n- Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights\n- Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone\n- Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)\n\n#multimodal",
                    "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-3.5-sonnet",
                    "supports_reasoning": false,
                    "reasoning_config": {
                        "start_token": null,
                        "end_token": null,
                        "system_prompt": null
                    },
                    "features": {
                        "reasoning_config": {
                            "start_token": null,
                            "end_token": null,
                            "system_prompt": null
                        }
                    },
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-3.5-sonnet",
                "model_variant_permaslug": "anthropic/claude-3.5-sonnet",
                "adapter_name": "AmazonBedrockInvokeAnthropicAdapter",
                "provider_name": "Amazon Bedrock",
                "provider_info": {
                    "name": "Amazon Bedrock",
                    "displayName": "Amazon Bedrock",
                    "slug": "amazon-bedrock",
                    "baseUrl": "not_used",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                        "privacyPolicyURL": "https://aws.amazon.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "dummy-value"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": false,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AmazonBedrockConverseAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://health.aws.amazon.com/health/status",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Bedrock.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Amazon Bedrock",
                "provider_slug": "amazon-bedrock",
                "provider_model_id": "us.anthropic.claude-3-5-sonnet-20241022-v2:0",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": false,
                "max_prompt_tokens": null,
                "max_completion_tokens": 8192,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://aws.amazon.com/service-terms/",
                    "privacyPolicyURL": "https://aws.amazon.com/privacy"
                },
                "pricing": {
                    "prompt": "0.000006",
                    "completion": "0.00003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 0.000006,
                    "anthropic:completion_tokens": 0.00003
                },
                "pricing_version_id": "eb96ddba-9cd5-4a4b-bb70-4f88db92ecb1",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "meta-llama/llama-3.2-11b-vision-instruct",
            "hf_slug": "meta-llama/Llama-3.2-11B-Vision-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-09-25T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Meta: Llama 3.2 11B Vision Instruct",
            "short_name": "Llama 3.2 11B Vision Instruct",
            "author": "meta-llama",
            "description": "Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data. It excels in tasks such as image captioning and visual question answering, bridging the gap between language generation and visual reasoning. Pre-trained on a massive dataset of image-text pairs, it performs well in complex, high-accuracy image analysis.\n\nIts ability to integrate visual understanding with language processing makes it an ideal solution for industries requiring comprehensive visual-linguistic AI applications, such as content creation, AI-driven customer service, and research.\n\nClick here for the [original model card](https://github.com/meta-llama/llama-models/blob/main/models/llama3_2/MODEL_CARD_VISION.md).\n\nUsage of this model is subject to [Meta's Acceptable Use Policy](https://www.llama.com/llama3/use-policy/).",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama3",
            "instruct_type": "llama3",
            "default_system": null,
            "default_stops": [
                "<|eot_id|>",
                "<|end_of_text|>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "meta-llama/llama-3.2-11b-vision-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "4a07b512-e030-412d-b1d6-39773a8b8dcf",
                "name": "DeepInfra | meta-llama/llama-3.2-11b-vision-instruct",
                "context_length": 131072,
                "model": {
                    "slug": "meta-llama/llama-3.2-11b-vision-instruct",
                    "hf_slug": "meta-llama/Llama-3.2-11B-Vision-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-09-25T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Meta: Llama 3.2 11B Vision Instruct",
                    "short_name": "Llama 3.2 11B Vision Instruct",
                    "author": "meta-llama",
                    "description": "Llama 3.2 11B Vision is a multimodal model with 11 billion parameters, designed to handle tasks combining visual and textual data. It excels in tasks such as image captioning and visual question answering, bridging the gap between language generation and visual reasoning. Pre-trained on a massive dataset of image-text pairs, it performs well in complex, high-accuracy image analysis.\n\nIts ability to integrate visual understanding with language processing makes it an ideal solution for industries requiring comprehensive visual-linguistic AI applications, such as content creation, AI-driven customer service, and research.\n\nClick here for the [original model card](https://github.com/meta-llama/llama-models/blob/main/models/llama3_2/MODEL_CARD_VISION.md).\n\nUsage of this model is subject to [Meta's Acceptable Use Policy](https://www.llama.com/llama3/use-policy/).",
                    "model_version_group_id": null,
                    "context_length": 131072,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Llama3",
                    "instruct_type": "llama3",
                    "default_system": null,
                    "default_stops": [
                        "<|eot_id|>",
                        "<|end_of_text|>"
                    ],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "meta-llama/llama-3.2-11b-vision-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "meta-llama/llama-3.2-11b-vision-instruct",
                "model_variant_permaslug": "meta-llama/llama-3.2-11b-vision-instruct",
                "adapter_name": "DeepInfraAdapter",
                "provider_name": "DeepInfra",
                "provider_info": {
                    "name": "DeepInfra",
                    "displayName": "DeepInfra",
                    "slug": "deepinfra",
                    "baseUrl": "https://api.deepinfra.com/v1/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://deepinfra.com/terms",
                        "privacyPolicyURL": "https://deepinfra.com/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}",
                        "org_38GSfr7NVq111kyg6iXh1TTpKuz"
                    ],
                    "adapterName": "DeepInfraAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.deepinfra.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/DeepInfra.webp"
                    },
                    "ignoredProviderModels": [
                        "anthropic/claude-4-opus",
                        "anthropic/claude-4-sonnet",
                        "deepseek-ai/DeepSeek-R1-0528-Turbo",
                        "meta-llama/Llama-2-70b-chat-hf",
                        "mistralai/Mixtral-8x22B-Instruct-v0.1",
                        "google/gemma-1.1-7b-it",
                        "microsoft/Phi-3-medium-4k-instruct",
                        "google/gemma-2-27b-it",
                        "microsoft/WizardLM-2-7B",
                        "mattshumer/Reflection-Llama-3.1-70B",
                        "Sao10K/L3-8B-Lunaris-v1",
                        "openbmb/MiniCPM-Llama3-V-2_5",
                        "Qwen/QVQ-72B-Preview",
                        "deepinfra/airoboros-70b",
                        "Qwen/QwQ-32B-Preview",
                        "Phind/Phind-CodeLlama-34B-v2",
                        "lizpreciatior/lzlv_70b_fp16_hf",
                        "mistralai/Mistral-7B-Instruct-v0.2",
                        "cognitivecomputations/dolphin-2.6-mixtral-8x7b",
                        "cognitivecomputations/dolphin-2.9.1-llama-3-70b",
                        "Qwen/Qwen2-72B-Instruct",
                        "Qwen/Qwen2-7B-Instruct",
                        "google/gemma-2-9b-it",
                        "Sao10K/L3-70B-Euryale-v2.1",
                        "google/codegemma-7b-it",
                        "mistralai/Mistral-7B-Instruct-v0.1",
                        "KoboldAI/LLaMA2-13B-Tiefighter",
                        "meta-llama/Llama-2-13b-chat-hf",
                        "openchat/openchat_3.5",
                        "openchat/openchat-3.6-8b",
                        "bigcode/starcoder2-15b-instruct-v0.1",
                        "Gryphe/MythoMax-L2-13b-turbo",
                        "Austism/chronos-hermes-13b-v2",
                        "Qwen/Qwen2.5-Coder-7B",
                        "moonshotai/Kimi-K2-Instruct",
                        "google/gemini-1.5-flash",
                        "google/gemini-2.5-flash",
                        "google/gemini-2.0-flash-001",
                        "anthropic/claude-3-7-sonnet-latest",
                        "google/gemini-1.5-flash-8b",
                        "google/gemini-2.5-pro",
                        "NovaSky-AI/Sky-T1-32B-Preview",
                        "allenai/olmOCR-7B-0725-FP8",
                        "allenai/olmOCR-7B-0825",
                        "deepseek-ai/DeepSeek-V3-0324-Turbo",
                        "PaddlePaddle/PaddleOCR-VL-0.9B",
                        "allenai/olmOCR-7B-1025",
                        "allenai/olmOCR-2-7B-1025",
                        "allenai/olmOCR-2",
                        "deepseek-ai/DeepSeek-OCR",
                        "meta-llama/Llama-3.2-1B-Instruct",
                        "sentence-transformers/clip-ViT-B-32-multilingual-v1",
                        "shibing624/text2vec-base-chinese",
                        "sentence-transformers/clip-ViT-B-32",
                        "BAAI/bge-en-icl",
                        "Qwen/Qwen3-Embedding-8B-batch",
                        "Qwen/Qwen3-Embedding-4B-batch",
                        "mistralai/Mistral-Small-3.1-24B-Instruct-2503",
                        "meta-llama/Meta-Llama-3.1-405B-Instruct",
                        "BAAI/bge-m3-multi",
                        "google/embeddinggemma-300m",
                        "Qwen/Qwen3-Embedding-0.6B-batch",
                        "meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo",
                        "microsoft/Phi-4-multimodal-instruct",
                        "deepseek-ai/DeepSeek-V3.2-Exp",
                        "meta-llama/Llama-3.2-90B-Vision-Instruct",
                        "meta-llama/Meta-Llama-3-70B-Instruct",
                        "deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "DeepInfra",
                "provider_slug": "deepinfra/fp8",
                "provider_model_id": "meta-llama/Llama-3.2-11B-Vision-Instruct",
                "quantization": "fp8",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "repetition_penalty",
                    "top_k",
                    "seed",
                    "min_p",
                    "response_format"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://deepinfra.com/terms",
                    "privacyPolicyURL": "https://deepinfra.com/privacy"
                },
                "pricing": {
                    "prompt": "0.000000049",
                    "completion": "0.000000049",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.000000049",
                    "openai:completion_tokens": "0.000000049"
                },
                "pricing_version_id": "66e3a91d-e4dd-4721-b500-9f23d2365917",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "mistralai/pixtral-12b",
            "hf_slug": "mistralai/Pixtral-12B-2409",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-09-10T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Mistral: Pixtral 12B",
            "short_name": "Pixtral 12B",
            "author": "mistralai",
            "description": "The first multi-modal, text+image-to-text model from Mistral AI. Its weights were launched via torrent: https://x.com/mistralai/status/1833758285167722836.",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "mistralai/pixtral-12b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {
                "temperature": 0.3
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "b550f7af-571a-45fd-b442-b3327afaf38c",
                "name": "Hyperbolic | mistralai/pixtral-12b",
                "context_length": 32768,
                "model": {
                    "slug": "mistralai/pixtral-12b",
                    "hf_slug": "mistralai/Pixtral-12B-2409",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-09-10T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Mistral: Pixtral 12B",
                    "short_name": "Pixtral 12B",
                    "author": "mistralai",
                    "description": "The first multi-modal, text+image-to-text model from Mistral AI. Its weights were launched via torrent: https://x.com/mistralai/status/1833758285167722836.",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Mistral",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "mistralai/pixtral-12b",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {
                        "temperature": 0.3
                    },
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "mistralai/pixtral-12b",
                "model_variant_permaslug": "mistralai/pixtral-12b",
                "adapter_name": "HyperbolicAdapter",
                "provider_name": "Hyperbolic",
                "provider_info": {
                    "name": "Hyperbolic",
                    "displayName": "Hyperbolic",
                    "slug": "hyperbolic",
                    "baseUrl": "https://api.hyperbolic.xyz/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://hyperbolic.xyz/terms",
                        "privacyPolicyURL": "https://hyperbolic.xyz/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "HyperbolicAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://hyperbolic.xyz/&size=256"
                    },
                    "ignoredProviderModels": [
                        "Qwen/Qwen3-Coder-480B-A35B-Instruct"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Hyperbolic",
                "provider_slug": "hyperbolic/bf16",
                "provider_model_id": "mistralai/Pixtral-12B-2409",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "logit_bias",
                    "top_k",
                    "min_p",
                    "repetition_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://hyperbolic.xyz/terms",
                    "privacyPolicyURL": "https://hyperbolic.xyz/privacy"
                },
                "pricing": {
                    "prompt": "0.0000001",
                    "completion": "0.0000001",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000001",
                    "openai:completion_tokens": "0.0000001"
                },
                "pricing_version_id": "bd22699d-f1d8-49fe-afc3-99a0936757d6",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen-2.5-vl-7b-instruct",
            "hf_slug": "Qwen/Qwen2.5-VL-7B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-28T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen2.5-VL 7B Instruct (free)",
            "short_name": "Qwen2.5-VL 7B Instruct (free)",
            "author": "qwen",
            "description": "Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performance on visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, MTVQA, etc.\n\n- Understanding videos of 20min+: Qwen2.5-VL can understand videos over 20 minutes for high-quality video-based question answering, dialog, content creation, etc.\n\n- Agent that can operate your mobiles, robots, etc.: with the abilities of complex reasoning and decision making, Qwen2.5-VL can be integrated with devices like mobile phones, robots, etc., for automatic operation based on visual environment and text instructions.\n\n- Multilingual Support: to serve global users, besides English and Chinese, Qwen2.5-VL now supports the understanding of texts in different languages inside images, including most European languages, Japanese, Korean, Arabic, Vietnamese, etc.\n\nFor more details, see this [blog post](https://qwenlm.github.io/blog/qwen2-vl/) and [GitHub repo](https://github.com/QwenLM/Qwen2-VL).\n\nUsage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://huggingface.co/Qwen/Qwen1.5-110B-Chat/blob/main/LICENSE).",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen-2-vl-7b-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "77ef6e4c-601d-4bd6-b168-c88a5b44a792",
                "name": "ModelRun | qwen/qwen-2-vl-7b-instruct:free",
                "context_length": 32768,
                "model": {
                    "slug": "qwen/qwen-2.5-vl-7b-instruct",
                    "hf_slug": "Qwen/Qwen2.5-VL-7B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-08-28T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen2.5-VL 7B Instruct",
                    "short_name": "Qwen2.5-VL 7B Instruct",
                    "author": "qwen",
                    "description": "Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performance on visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, MTVQA, etc.\n\n- Understanding videos of 20min+: Qwen2.5-VL can understand videos over 20 minutes for high-quality video-based question answering, dialog, content creation, etc.\n\n- Agent that can operate your mobiles, robots, etc.: with the abilities of complex reasoning and decision making, Qwen2.5-VL can be integrated with devices like mobile phones, robots, etc., for automatic operation based on visual environment and text instructions.\n\n- Multilingual Support: to serve global users, besides English and Chinese, Qwen2.5-VL now supports the understanding of texts in different languages inside images, including most European languages, Japanese, Korean, Arabic, Vietnamese, etc.\n\nFor more details, see this [blog post](https://qwenlm.github.io/blog/qwen2-vl/) and [GitHub repo](https://github.com/QwenLM/Qwen2-VL).\n\nUsage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://huggingface.co/Qwen/Qwen1.5-110B-Chat/blob/main/LICENSE).",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen-2-vl-7b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen-2.5-vl-7b-instruct:free",
                "model_variant_permaslug": "qwen/qwen-2-vl-7b-instruct:free",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "ModelRun",
                "provider_info": {
                    "name": "ModelRun",
                    "displayName": "ModelRun",
                    "slug": "modelrun",
                    "baseUrl": "https://api.runmodelrun.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.runmodelrun.com/TOS.html",
                        "privacyPolicyURL": "https://www.runmodelrun.com/privacy-policy.html"
                    },
                    "headquarters": "US",
                    "datacenters": [
                        "US"
                    ],
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [],
                    "owners": [],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": false,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://api.runmodelrun.com&size=256"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "ModelRun",
                "provider_slug": "modelrun",
                "provider_model_id": "Qwen/Qwen2.5-VL-7B-Instruct",
                "quantization": "unknown",
                "variant": "free",
                "is_free": true,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "presence_penalty",
                    "repetition_penalty",
                    "frequency_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.runmodelrun.com/TOS.html",
                    "privacyPolicyURL": "https://www.runmodelrun.com/privacy-policy.html"
                },
                "pricing": {
                    "prompt": "0",
                    "completion": "0",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0",
                    "openai:completion_tokens": "0"
                },
                "pricing_version_id": "22606844-5b89-4cf3-9031-5175f3f83d81",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supports_input_audio": false
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "qwen/qwen-2.5-vl-7b-instruct",
            "hf_slug": "Qwen/Qwen2.5-VL-7B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-28T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen2.5-VL 7B Instruct",
            "short_name": "Qwen2.5-VL 7B Instruct",
            "author": "qwen",
            "description": "Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performance on visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, MTVQA, etc.\n\n- Understanding videos of 20min+: Qwen2.5-VL can understand videos over 20 minutes for high-quality video-based question answering, dialog, content creation, etc.\n\n- Agent that can operate your mobiles, robots, etc.: with the abilities of complex reasoning and decision making, Qwen2.5-VL can be integrated with devices like mobile phones, robots, etc., for automatic operation based on visual environment and text instructions.\n\n- Multilingual Support: to serve global users, besides English and Chinese, Qwen2.5-VL now supports the understanding of texts in different languages inside images, including most European languages, Japanese, Korean, Arabic, Vietnamese, etc.\n\nFor more details, see this [blog post](https://qwenlm.github.io/blog/qwen2-vl/) and [GitHub repo](https://github.com/QwenLM/Qwen2-VL).\n\nUsage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://huggingface.co/Qwen/Qwen1.5-110B-Chat/blob/main/LICENSE).",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen-2-vl-7b-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": {
                "id": "fae5bc3c-f799-4657-8d05-3cf6f489ed0c",
                "name": "Hyperbolic | qwen/qwen-2-vl-7b-instruct",
                "context_length": 32768,
                "model": {
                    "slug": "qwen/qwen-2.5-vl-7b-instruct",
                    "hf_slug": "Qwen/Qwen2.5-VL-7B-Instruct",
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-08-28T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Qwen: Qwen2.5-VL 7B Instruct",
                    "short_name": "Qwen2.5-VL 7B Instruct",
                    "author": "qwen",
                    "description": "Qwen2.5 VL 7B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performance on visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, MTVQA, etc.\n\n- Understanding videos of 20min+: Qwen2.5-VL can understand videos over 20 minutes for high-quality video-based question answering, dialog, content creation, etc.\n\n- Agent that can operate your mobiles, robots, etc.: with the abilities of complex reasoning and decision making, Qwen2.5-VL can be integrated with devices like mobile phones, robots, etc., for automatic operation based on visual environment and text instructions.\n\n- Multilingual Support: to serve global users, besides English and Chinese, Qwen2.5-VL now supports the understanding of texts in different languages inside images, including most European languages, Japanese, Korean, Arabic, Vietnamese, etc.\n\nFor more details, see this [blog post](https://qwenlm.github.io/blog/qwen2-vl/) and [GitHub repo](https://github.com/QwenLM/Qwen2-VL).\n\nUsage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://huggingface.co/Qwen/Qwen1.5-110B-Chat/blob/main/LICENSE).",
                    "model_version_group_id": null,
                    "context_length": 32768,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Qwen",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "qwen/qwen-2-vl-7b-instruct",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": true,
                    "is_trainable_image": null
                },
                "model_variant_slug": "qwen/qwen-2.5-vl-7b-instruct",
                "model_variant_permaslug": "qwen/qwen-2-vl-7b-instruct",
                "adapter_name": "HyperbolicAdapter",
                "provider_name": "Hyperbolic",
                "provider_info": {
                    "name": "Hyperbolic",
                    "displayName": "Hyperbolic",
                    "slug": "hyperbolic",
                    "baseUrl": "https://api.hyperbolic.xyz/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://hyperbolic.xyz/terms",
                        "privacyPolicyURL": "https://hyperbolic.xyz/privacy"
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "HyperbolicAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": null,
                    "byokEnabled": true,
                    "icon": {
                        "url": "https://t0.gstatic.com/faviconV2?client=SOCIAL&type=FAVICON&fallback_opts=TYPE,SIZE,URL&url=https://hyperbolic.xyz/&size=256"
                    },
                    "ignoredProviderModels": [
                        "Qwen/Qwen3-Coder-480B-A35B-Instruct"
                    ],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Hyperbolic",
                "provider_slug": "hyperbolic/bf16",
                "provider_model_id": "Qwen/Qwen2.5-VL-7B-Instruct",
                "quantization": "bf16",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": null,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "seed",
                    "logit_bias",
                    "top_k",
                    "min_p",
                    "repetition_penalty"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://hyperbolic.xyz/terms",
                    "privacyPolicyURL": "https://hyperbolic.xyz/privacy"
                },
                "pricing": {
                    "prompt": "0.0000002",
                    "completion": "0.0000002",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": "0.0000002",
                    "openai:completion_tokens": "0.0000002"
                },
                "pricing_version_id": "92bd83cb-246a-4525-b1b2-497cb23f093e",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    },
                    "supported_parameters": {}
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/chatgpt-4o-latest",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-14T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: ChatGPT-4o",
            "short_name": "ChatGPT-4o",
            "author": "openai",
            "description": "OpenAI ChatGPT 4o is continually updated by OpenAI to point to the current version of GPT-4o used by ChatGPT. It therefore differs slightly from the API version of [GPT-4o](/models/openai/gpt-4o) in that it has additional RLHF. It is intended for research and evaluation.\n\nOpenAI notes that this model is not suited for production use-cases as it may be removed or redirected to another model in the future.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/chatgpt-4o-latest",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "aff4b825-af10-4633-9ab2-9ac68c547988",
                "name": "OpenAI | openai/chatgpt-4o-latest",
                "context_length": 128000,
                "model": {
                    "slug": "openai/chatgpt-4o-latest",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-08-14T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: ChatGPT-4o",
                    "short_name": "ChatGPT-4o",
                    "author": "openai",
                    "description": "OpenAI ChatGPT 4o is continually updated by OpenAI to point to the current version of GPT-4o used by ChatGPT. It therefore differs slightly from the API version of [GPT-4o](/models/openai/gpt-4o) in that it has additional RLHF. It is intended for research and evaluation.\n\nOpenAI notes that this model is not suited for production use-cases as it may be removed or redirected to another model in the future.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/chatgpt-4o-latest",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/chatgpt-4o-latest",
                "model_variant_permaslug": "openai/chatgpt-4o-latest",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "chatgpt-4o-latest",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000005",
                    "completion": "0.000015",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": 0.000005,
                    "openai:completion_tokens": 0.000015
                },
                "pricing_version_id": "7ba48c60-6be4-495f-beb5-c2a7b5b22639",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": false,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o-2024-08-06",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-06T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o (2024-08-06)",
            "short_name": "GPT-4o (2024-08-06)",
            "author": "openai",
            "description": "The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format. Read more [here](https://openai.com/index/introducing-structured-outputs-in-the-api/).\n\nGPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)",
            "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o-2024-08-06",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "59ea8d2a-1b1b-47f1-83de-a358a724caeb",
                "name": "Azure | openai/gpt-4o-2024-08-06",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o-2024-08-06",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-08-06T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o (2024-08-06)",
                    "short_name": "GPT-4o (2024-08-06)",
                    "author": "openai",
                    "description": "The 2024-08-06 version of GPT-4o offers improved performance in structured outputs, with the ability to supply a JSON schema in the respone_format. Read more [here](https://openai.com/index/introducing-structured-outputs-in-the-api/).\n\nGPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)",
                    "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o-2024-08-06",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o-2024-08-06",
                "model_variant_permaslug": "openai/gpt-4o-2024-08-06",
                "adapter_name": "AzureOpenAIAdapter",
                "provider_name": "Azure",
                "provider_info": {
                    "name": "Azure",
                    "displayName": "Azure",
                    "slug": "azure",
                    "baseUrl": "https://openrouter-east-us-2.openai.azure.com/openai",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": false,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.microsoft.com/en-us/legal/terms-of-use?oneroute=true",
                        "privacyPolicyURL": "https://www.microsoft.com/en-us/privacy/privacystatement"
                    },
                    "headquarters": "US",
                    "regionOverrides": {
                        "europe": {
                            "baseUrl": "https://openrouter-eu-resource.cognitiveservices.azure.com/openai"
                        }
                    },
                    "hasChatCompletions": true,
                    "hasCompletions": false,
                    "isAbortable": true,
                    "moderationRequired": false,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AzureOpenAIAdapter",
                    "isMultipartSupported": false,
                    "statusPageUrl": "https://status.azure.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Azure.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "Azure",
                "provider_slug": "azure",
                "provider_model_id": "gpt-4o",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "seed",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "response_format",
                    "structured_outputs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": false,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": false,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.microsoft.com/en-us/legal/terms-of-use?oneroute=true",
                    "privacyPolicyURL": "https://www.microsoft.com/en-us/privacy/privacystatement"
                },
                "pricing": {
                    "prompt": "0.0000025",
                    "completion": "0.00001",
                    "image": "0.003613",
                    "request": "0",
                    "input_cache_read": "0.00000125",
                    "web_search": "0",
                    "internal_reasoning": "0",
                    "image_output": "0",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 0.0000025,
                    "openai:completion_tokens": 0.00001,
                    "openai:cached_prompt_tokens": 0.00000125
                },
                "pricing_version_id": "35fabd0d-b247-41ac-8e48-9f3ef3031f55",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": false,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o-mini-2024-07-18",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-07-18T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o-mini (2024-07-18)",
            "short_name": "GPT-4o-mini (2024-07-18)",
            "author": "openai",
            "description": "GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.\n\nAs their most advanced small model, it is many multiples more affordable than other recent frontier models, and more than 60% cheaper than [GPT-3.5 Turbo](/models/openai/gpt-3.5-turbo). It maintains SOTA intelligence, while being significantly more cost-effective.\n\nGPT-4o mini achieves an 82% score on MMLU and presently ranks higher than GPT-4 on chat preferences [common leaderboards](https://arena.lmsys.org/).\n\nCheck out the [launch announcement](https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/) to learn more.\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o-mini-2024-07-18",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "ebcc1f0a-6621-4cdc-a93f-88a6e2cc2e15",
                "name": "OpenAI | openai/gpt-4o-mini-2024-07-18",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o-mini-2024-07-18",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-07-18T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o-mini (2024-07-18)",
                    "short_name": "GPT-4o-mini (2024-07-18)",
                    "author": "openai",
                    "description": "GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.\n\nAs their most advanced small model, it is many multiples more affordable than other recent frontier models, and more than 60% cheaper than [GPT-3.5 Turbo](/models/openai/gpt-3.5-turbo). It maintains SOTA intelligence, while being significantly more cost-effective.\n\nGPT-4o mini achieves an 82% score on MMLU and presently ranks higher than GPT-4 on chat preferences [common leaderboards](https://arena.lmsys.org/).\n\nCheck out the [launch announcement](https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/) to learn more.\n\n#multimodal",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o-mini-2024-07-18",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o-mini-2024-07-18",
                "model_variant_permaslug": "openai/gpt-4o-mini-2024-07-18",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o-mini-2024-07-18",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.0000006",
                    "input_cache_read": "0.000000075",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.03"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.0275"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.025"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 1.5e-7,
                    "openai:completion_tokens": 6e-7,
                    "openai:cached_prompt_tokens": 7.5e-8
                },
                "pricing_version_id": "bb978658-5598-4ad9-8224-e8e5d57794cd",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o-mini",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-07-18T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o-mini",
            "short_name": "GPT-4o-mini",
            "author": "openai",
            "description": "GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.\n\nAs their most advanced small model, it is many multiples more affordable than other recent frontier models, and more than 60% cheaper than [GPT-3.5 Turbo](/models/openai/gpt-3.5-turbo). It maintains SOTA intelligence, while being significantly more cost-effective.\n\nGPT-4o mini achieves an 82% score on MMLU and presently ranks higher than GPT-4 on chat preferences [common leaderboards](https://arena.lmsys.org/).\n\nCheck out the [launch announcement](https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/) to learn more.\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o-mini",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "77e40332-6f2a-4c48-bc14-e44596b30ce2",
                "name": "OpenAI | openai/gpt-4o-mini",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o-mini",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-07-18T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o-mini",
                    "short_name": "GPT-4o-mini",
                    "author": "openai",
                    "description": "GPT-4o mini is OpenAI's newest model after [GPT-4 Omni](/models/openai/gpt-4o), supporting both text and image inputs with text outputs.\n\nAs their most advanced small model, it is many multiples more affordable than other recent frontier models, and more than 60% cheaper than [GPT-3.5 Turbo](/models/openai/gpt-3.5-turbo). It maintains SOTA intelligence, while being significantly more cost-effective.\n\nGPT-4o mini achieves an 82% score on MMLU and presently ranks higher than GPT-4 on chat preferences [common leaderboards](https://arena.lmsys.org/).\n\nCheck out the [launch announcement](https://openai.com/index/gpt-4o-mini-advancing-cost-efficient-intelligence/) to learn more.\n\n#multimodal",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o-mini",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o-mini",
                "model_variant_permaslug": "openai/gpt-4o-mini",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o-mini",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000015",
                    "completion": "0.0000006",
                    "input_cache_read": "0.000000075",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.03"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.0275"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.025"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 1.5e-7,
                    "openai:completion_tokens": 6e-7,
                    "openai:cached_prompt_tokens": 7.5e-8
                },
                "pricing_version_id": "496e0c4b-dfc8-40e3-97e1-d0eeeab62195",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o-2024-05-13",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-05-13T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o (2024-05-13)",
            "short_name": "GPT-4o (2024-05-13)",
            "author": "openai",
            "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
            "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o-2024-05-13",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "3d6584e7-a2bb-48d6-903d-24e3d90e7e55",
                "name": "OpenAI | openai/gpt-4o-2024-05-13",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o-2024-05-13",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-05-13T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o (2024-05-13)",
                    "short_name": "GPT-4o (2024-05-13)",
                    "author": "openai",
                    "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
                    "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o-2024-05-13",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o-2024-05-13",
                "model_variant_permaslug": "openai/gpt-4o-2024-05-13",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o-2024-05-13",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 4096,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000005",
                    "completion": "0.000015",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 0.000005,
                    "openai:completion_tokens": 0.000015
                },
                "pricing_version_id": "dab5f507-2c79-4281-bc39-5346d8549075",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-05-13T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o",
            "short_name": "GPT-4o",
            "author": "openai",
            "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
            "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "452a72a0-2c24-4e31-98cb-d6cc1084fb99",
                "name": "OpenAI | openai/gpt-4o",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-05-13T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o",
                    "short_name": "GPT-4o",
                    "author": "openai",
                    "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
                    "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o",
                "model_variant_permaslug": "openai/gpt-4o",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 16384,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.0000025",
                    "completion": "0.00001",
                    "input_cache_read": "0.00000125",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 0.0000025,
                    "openai:completion_tokens": 0.00001,
                    "openai:cached_prompt_tokens": 0.00000125
                },
                "pricing_version_id": "9a09c5e1-25e5-4027-ac71-8ada7a7a80b9",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4o",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-05-13T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4o (extended)",
            "short_name": "GPT-4o (extended)",
            "author": "openai",
            "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
            "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4o",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "3f4c883a-bd8b-4e01-ac1b-25cc9a17dd61",
                "name": "OpenAI | openai/gpt-4o:extended",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4o",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-05-13T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4o",
                    "short_name": "GPT-4o",
                    "author": "openai",
                    "description": "GPT-4o (\"o\" for \"omni\") is OpenAI's latest AI model, supporting both text and image inputs with text outputs. It maintains the intelligence level of [GPT-4 Turbo](/models/openai/gpt-4-turbo) while being twice as fast and 50% more cost-effective. GPT-4o also offers improved performance in processing non-English languages and enhanced visual capabilities.\n\nFor benchmarking against other models, it was briefly called [\"im-also-a-good-gpt2-chatbot\"](https://twitter.com/LiamFedus/status/1790064963966370209)\n\n#multimodal",
                    "model_version_group_id": "76e36b33-358e-477a-be24-09f954fcea74",
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image",
                        "file"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4o",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4o:extended",
                "model_variant_permaslug": "openai/gpt-4o:extended",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4o-64k-output-alpha",
                "quantization": "unknown",
                "variant": "extended",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 64000,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "web_search_options",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.000006",
                    "completion": "0.000018",
                    "discount": 0
                },
                "variable_pricings": [
                    {
                        "type": "search-threshold",
                        "threshold": "high",
                        "request": "0.05"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "medium",
                        "request": "0.035"
                    },
                    {
                        "type": "search-threshold",
                        "threshold": "low",
                        "request": "0.03"
                    }
                ],
                "pricing_json": {
                    "openai:prompt_tokens": 0.000006,
                    "openai:completion_tokens": 0.000018
                },
                "pricing_version_id": "1a91197b-4d58-49bd-9658-0563b513b7da",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openai/gpt-4-turbo",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-04-09T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4 Turbo",
            "short_name": "GPT-4 Turbo",
            "author": "openai",
            "description": "The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling.\n\nTraining data: up to December 2023.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4-turbo",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "da16824f-3ba0-43a1-86f8-a6131837f457",
                "name": "OpenAI | openai/gpt-4-turbo",
                "context_length": 128000,
                "model": {
                    "slug": "openai/gpt-4-turbo",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-04-09T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "OpenAI: GPT-4 Turbo",
                    "short_name": "GPT-4 Turbo",
                    "author": "openai",
                    "description": "The latest GPT-4 Turbo model with vision capabilities. Vision requests can now use JSON mode and function calling.\n\nTraining data: up to December 2023.",
                    "model_version_group_id": null,
                    "context_length": 128000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "GPT",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "openai/gpt-4-turbo",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "openai/gpt-4-turbo",
                "model_variant_permaslug": "openai/gpt-4-turbo",
                "adapter_name": "OpenAIAdapter",
                "provider_name": "OpenAI",
                "provider_info": {
                    "name": "OpenAI",
                    "displayName": "OpenAI",
                    "slug": "openai",
                    "baseUrl": "https://api.openai.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "canPublish": false,
                        "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                        "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "OpenAIAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.openai.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/OpenAI.svg",
                        "className": "invert-0 dark:invert"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "openai_chat_completions"
                },
                "provider_display_name": "OpenAI",
                "provider_slug": "openai",
                "provider_model_id": "gpt-4-turbo",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 4096,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "seed",
                    "max_tokens",
                    "response_format",
                    "structured_outputs",
                    "temperature",
                    "top_p",
                    "stop",
                    "frequency_penalty",
                    "presence_penalty",
                    "logit_bias",
                    "logprobs",
                    "top_logprobs",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "canPublish": false,
                    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
                    "privacyPolicyURL": "https://openai.com/policies/privacy-policy/",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00001",
                    "completion": "0.00003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "openai:prompt_tokens": 0.00001,
                    "openai:completion_tokens": 0.00003
                },
                "pricing_version_id": "48751c0f-27b9-45d7-9b9a-ec343acdf97b",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "anthropic/claude-3-haiku",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-03-13T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3 Haiku",
            "short_name": "Claude 3 Haiku",
            "author": "anthropic",
            "description": "Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-haiku)\n\n#multimodal",
            "model_version_group_id": "028ec497-a034-40fd-81fe-f51d0a0c640c",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-haiku",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": {
                "id": "8661a1db-b0cf-4eb2-ba04-c2a79f698682",
                "name": "Anthropic | anthropic/claude-3-haiku",
                "context_length": 200000,
                "model": {
                    "slug": "anthropic/claude-3-haiku",
                    "hf_slug": null,
                    "updated_at": "2025-11-10T16:00:38.246665+00:00",
                    "created_at": "2024-03-13T00:00:00+00:00",
                    "hf_updated_at": null,
                    "name": "Anthropic: Claude 3 Haiku",
                    "short_name": "Claude 3 Haiku",
                    "author": "anthropic",
                    "description": "Claude 3 Haiku is Anthropic's fastest and most compact model for\nnear-instant responsiveness. Quick and accurate targeted performance.\n\nSee the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-haiku)\n\n#multimodal",
                    "model_version_group_id": "028ec497-a034-40fd-81fe-f51d0a0c640c",
                    "context_length": 200000,
                    "input_modalities": [
                        "text",
                        "image"
                    ],
                    "output_modalities": [
                        "text"
                    ],
                    "has_text_output": true,
                    "group": "Claude",
                    "instruct_type": null,
                    "default_system": null,
                    "default_stops": [],
                    "hidden": false,
                    "router": null,
                    "warning_message": null,
                    "promotion_message": null,
                    "routing_error_message": null,
                    "permaslug": "anthropic/claude-3-haiku",
                    "supports_reasoning": false,
                    "reasoning_config": null,
                    "features": {},
                    "default_parameters": {},
                    "default_order": [],
                    "quick_start_example_type": null,
                    "is_trainable_text": null,
                    "is_trainable_image": null
                },
                "model_variant_slug": "anthropic/claude-3-haiku",
                "model_variant_permaslug": "anthropic/claude-3-haiku",
                "adapter_name": "AnthropicMessageAdapter",
                "provider_name": "Anthropic",
                "provider_info": {
                    "name": "Anthropic",
                    "displayName": "Anthropic",
                    "slug": "anthropic",
                    "baseUrl": "https://api.anthropic.com/v1",
                    "dataPolicy": {
                        "training": false,
                        "trainingOpenRouter": false,
                        "retainsPrompts": true,
                        "retentionDays": 30,
                        "canPublish": false,
                        "termsOfServiceURL": "https://www.anthropic.com/legal/commercial-terms",
                        "privacyPolicyURL": "https://www.anthropic.com/legal/privacy",
                        "requiresUserIDs": true
                    },
                    "headquarters": "US",
                    "regionOverrides": {},
                    "hasChatCompletions": true,
                    "hasCompletions": true,
                    "isAbortable": true,
                    "moderationRequired": true,
                    "editors": [
                        "{}"
                    ],
                    "owners": [
                        "{}"
                    ],
                    "adapterName": "AnthropicMessageAdapter",
                    "isMultipartSupported": true,
                    "statusPageUrl": "https://status.anthropic.com/",
                    "byokEnabled": true,
                    "icon": {
                        "url": "/images/icons/Anthropic.svg"
                    },
                    "ignoredProviderModels": [],
                    "sendClientIp": false,
                    "pricingStrategy": "anthropic"
                },
                "provider_display_name": "Anthropic",
                "provider_slug": "anthropic",
                "provider_model_id": "claude-3-haiku-20240307",
                "quantization": "unknown",
                "variant": "standard",
                "is_free": false,
                "can_abort": true,
                "max_prompt_tokens": null,
                "max_completion_tokens": 4096,
                "max_tokens_per_image": null,
                "supported_parameters": [
                    "max_tokens",
                    "temperature",
                    "top_p",
                    "top_k",
                    "stop",
                    "tools",
                    "tool_choice"
                ],
                "is_byok": false,
                "moderation_required": true,
                "data_policy": {
                    "training": false,
                    "trainingOpenRouter": false,
                    "retainsPrompts": true,
                    "retentionDays": 30,
                    "canPublish": false,
                    "termsOfServiceURL": "https://www.anthropic.com/legal/commercial-terms",
                    "privacyPolicyURL": "https://www.anthropic.com/legal/privacy",
                    "requiresUserIDs": true
                },
                "pricing": {
                    "prompt": "0.00000025",
                    "completion": "0.00000125",
                    "input_cache_read": "0.00000003",
                    "input_cache_write": "0.0000003",
                    "discount": 0
                },
                "variable_pricings": [],
                "pricing_json": {
                    "anthropic:prompt_tokens": 2.5e-7,
                    "anthropic:cache_read_tokens": 3e-8,
                    "anthropic:completion_tokens": 0.00000125,
                    "anthropic:cache_write_1h_tokens": 5e-7,
                    "anthropic:cache_write_5m_tokens": 3e-7
                },
                "pricing_version_id": "6e785387-5305-4e6a-84e2-76c9ab02b414",
                "is_hidden": false,
                "is_deranked": false,
                "is_disabled": false,
                "supports_tool_parameters": true,
                "supports_reasoning": false,
                "supports_multipart": true,
                "limit_rpm": null,
                "limit_rpd": null,
                "limit_rpm_cf": null,
                "has_completions": true,
                "has_chat_completions": true,
                "features": {
                    "supports_tool_choice": {
                        "literal_none": true,
                        "literal_auto": true,
                        "literal_required": true,
                        "type_function": true
                    }
                },
                "provider_region": null,
                "deprecation_date": null
            }
        },
        {
            "slug": "openrouter/bert-nebulon-alpha",
            "hf_slug": "",
            "updated_at": "2025-12-02T15:25:47.01144+00:00",
            "created_at": "2025-11-24T17:24:18+00:00",
            "hf_updated_at": null,
            "name": "Bert-Nebulon Alpha",
            "short_name": "Bert-Nebulon Alpha",
            "author": "openrouter",
            "description": "This model was an early testing version of Mistral Large 3. Try the official launch of Mistral Large 3 [here](/mistralai/mistral-large-2512)\n\nThis is a cloaked model provided to the community to gather feedback. A general-purpose multimodal model (text/image in, text out) designed for reliability, long-context comprehension, and adaptive logic. It is engineered for production-grade assistants, retrieval-augmented systems, science workloads, and complex agentic workflows.\n\n**Note:** All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": "",
            "routing_error_message": "Bert-Nebulon Alpha was a stealth model revealed on December 2nd as an early testing version of Mistral Large 3. Find it here: {{SITE_URL}}/mistralai/mistral-large-2512",
            "permaslug": "openrouter/bert-nebulon-alpha",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.0645,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "text",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/sherlock-dash-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-19T23:50:42.801865+00:00",
            "created_at": "2025-11-15T17:49:49+00:00",
            "hf_updated_at": null,
            "name": "Sherlock Dash Alpha",
            "short_name": "Sherlock Dash Alpha",
            "author": "openrouter",
            "description": "This model was an early snapshot of Grok 4.1 Fast with reasoning disabled. Try the official launch of Grok 4.1 Fast [here](/x-ai/grok-4.1-fast)\n\nThis is a cloaked model provided to the community to gather feedback. A frontier non-reasoning model that excels at tool calling, with a 1.8M context window and multimodal support.\n\n**Note:** All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 1840000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "This model was an early snapshot of Grok 4.1 Fast with reasoning disabled. Try the official launch of Grok 4.1 Fast [here](/x-ai/grok-4.1-fast)\n\nAll prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openrouter/sherlock-dash-alpha",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.95,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/sherlock-think-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-20T02:01:49.950758+00:00",
            "created_at": "2025-11-15T17:49:46+00:00",
            "hf_updated_at": null,
            "name": "Sherlock Think Alpha",
            "short_name": "Sherlock Think Alpha",
            "author": "openrouter",
            "description": "This model was an early snapshot of Grok 4.1 Fast with reasoning enabled. Try the official launch of Grok 4.1 Fast [here](/x-ai/grok-4.1-fast)\n\nThis is a cloaked model provided to the community to gather feedback. A frontier reasoning model that excels at tool calling, with a 1.8M context window and multimodal support.\n\n**Note:** All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 1840000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "This model was an early snapshot of Grok 4.1 Fast with reasoning enabled. Try the official launch of Grok 4.1 Fast [here](/x-ai/grok-4.1-fast)\n\nAll prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openrouter/sherlock-think-alpha",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": 0.7,
                "top_p": 0.95,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/polaris-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-19T23:49:14.889425+00:00",
            "created_at": "2025-11-06T17:55:07.695182+00:00",
            "hf_updated_at": null,
            "name": "Polaris Alpha",
            "short_name": "Polaris Alpha",
            "author": "openrouter",
            "description": "This model was an early snapshot of GPT-5.1 with reasoning effort set to minimal. Try the official launch of GPT-5.1 [here](/openai/gpt-5.1)\n\nThis is a cloaked model provided to the community to gather feedback. A powerful, general-purpose model that excels across real-world tasks, with standout performance in coding, tool calling, and instruction following.\n\n**Note:** All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "This model was an early snapshot of GPT-5.1 with reasoning effort set to minimal. Try the official launch of GPT-5.1 here: /openai/gpt-5.1\n\nAll prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openrouter/polaris-alpha",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                },
                "chat_template_config": {}
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": "reasoning",
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/andromeda-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-10-21T20:03:14+00:00",
            "hf_updated_at": null,
            "name": "Andromeda Alpha",
            "short_name": "Andromeda Alpha",
            "author": "openrouter",
            "description": "This model has been revealed as NVIDIA Nemotron Nano 2 VL. It continues to be offered for free by NVIDIA [here](https://openrouter.ai/nvidia/nemotron-nano-12b-v2-vl:free). \n\nThis is a small reasoning VLM trained for image understanding. Its strengths include multi-image comprehension (6+ images), especially those containing charts and text. This is a cloaked model provided to the community to gather feedback.\n\nNote: All prompts and output are logged to improve the provider’s model and its product and services. Please do not upload any personal, confidential, or otherwise sensitive information. This is a trial use only. Do not use for production or business-critical systems.",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "All prompts and output are logged to improve the provider’s model and its product and services. Please do not upload any personal, confidential, or otherwise sensitive information. This is a trial use only. Do not use for production or business-critical systems.",
            "promotion_message": "",
            "routing_error_message": null,
            "permaslug": "openrouter/andromeda-alpha",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/sonoma-dusk-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-05T17:27:27.26817+00:00",
            "hf_updated_at": null,
            "name": "Sonoma Dusk Alpha",
            "short_name": "Sonoma Dusk Alpha",
            "author": "openrouter",
            "description": "This is a cloaked model provided to the community to gather feedback. A fast and intelligent general-purpose frontier model with a 2 million token context window. Supports image inputs and parallel tool calling.\n\nNote: It’s free to use during this testing period, and prompts and completions are logged by the model creator for feedback and training.",
            "model_version_group_id": null,
            "context_length": 2000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "Sonoma Dusk Alpha was an early test version of [Grok 4 Fast](/x-ai/grok-4-fast:free), which is free to use for a limited time.\n\nAll prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/sonoma-dusk-alpha",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/sonoma-sky-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-09-05T17:23:21.168091+00:00",
            "hf_updated_at": null,
            "name": "Sonoma Sky Alpha",
            "short_name": "Sonoma Sky Alpha",
            "author": "openrouter",
            "description": "This is a cloaked model provided to the community to gather feedback. A maximally intelligent general-purpose frontier model with a 2 million token context window. Supports image inputs and parallel tool calling.\n\nNote: It’s free to use during this testing period, and prompts and completions are logged by the model creator for feedback and training.",
            "model_version_group_id": null,
            "context_length": 2000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "Sonoma Sky Alpha was an early test version of [Grok 4 Fast](/x-ai/grok-4-fast:free), which is free to use for a limited time.\n\nAll prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/sonoma-sky-alpha",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-2.5-flash-image-preview",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-26T14:36:17+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Flash Image Preview (Nano Banana)",
            "short_name": "Gemini 2.5 Flash Image Preview (Nano Banana)",
            "author": "google",
            "description": "Gemini 2.5 Flash Image Preview, a.k.a. \"Nano Banana,\" is a state of the art image generation model with contextual understanding. It is capable of image generation, edits, and multi-turn conversations.",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "image",
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-flash-image-preview",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {
                "temperature": null,
                "top_p": null,
                "frequency_penalty": null
            },
            "default_order": [
                "google-vertex",
                "google-ai-studio"
            ],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/horizon-beta",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-08-01T23:03:39.887977+00:00",
            "hf_updated_at": null,
            "name": "Horizon Beta",
            "short_name": "Horizon Beta",
            "author": "openrouter",
            "description": "This is a cloaked model provided to the community to gather feedback. This is an improved version of [Horizon Alpha](/openrouter/horizon-alpha)\n\nNote: It’s free to use during this testing period, and prompts and completions are logged by the model creator for feedback and training.",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/horizon-beta",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/horizon-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-07-30T22:18:04+00:00",
            "hf_updated_at": null,
            "name": "Horizon Alpha",
            "short_name": "Horizon Alpha",
            "author": "openrouter",
            "description": "This was a cloaked model provided to the community to gather feedback. It has been deprecated - see [Horizon Beta](/openrouter/horizon-beta).\n\nNote: It’s free to use during this testing period, and prompts and completions are logged by the model creator for feedback and training.",
            "model_version_group_id": null,
            "context_length": 256000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "All prompts and completions for this model are logged by the provider and may be used to improve the model and other products and services.",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/horizon-alpha",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "thudm/glm-4.1v-9b-thinking",
            "hf_slug": "THUDM/GLM-4.1V-9B-Thinking",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-07-11T14:33:05.378045+00:00",
            "hf_updated_at": null,
            "name": "THUDM: GLM 4.1V 9B Thinking",
            "short_name": "GLM 4.1V 9B Thinking",
            "author": "thudm",
            "description": "GLM-4.1V-9B-Thinking is a 9B parameter vision-language model developed by THUDM, based on the GLM-4-9B foundation. It introduces a reasoning-centric \"thinking paradigm\" enhanced with reinforcement learning to improve multimodal reasoning, long-context understanding (up to 64K tokens), and complex problem solving. It achieves state-of-the-art performance among models in its class, outperforming even larger models like Qwen-2.5-VL-72B on a majority of benchmark tasks. ",
            "model_version_group_id": null,
            "context_length": 65536,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "thudm/glm-4.1v-9b-thinking",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": "<think>",
                "end_token": "</think>",
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": "<think>",
                    "end_token": "</think>",
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openai/codex-mini",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-05-16T15:36:01.081688+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: Codex Mini",
            "short_name": "Codex Mini",
            "author": "openai",
            "description": "codex-mini-latest is a fine-tuned version of o4-mini specifically for use in Codex CLI. For direct use in the API, we recommend starting with gpt-4.1.",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/codex-mini",
            "supports_reasoning": true,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "opengvlab/internvl3-14b",
            "hf_slug": "OpenGVLab/InternVL3-14B",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-30T13:55:55.014183+00:00",
            "hf_updated_at": null,
            "name": "OpenGVLab: InternVL3 14B",
            "short_name": "InternVL3 14B",
            "author": "opengvlab",
            "description": "The 14b version of the InternVL3 series. An advanced multimodal large language model (MLLM) series that demonstrates superior overall performance. Compared to InternVL 2.5, InternVL3 exhibits superior multimodal perception and reasoning capabilities, while further extending its multimodal capabilities to encompass tool usage, GUI agents, industrial image analysis, 3D vision perception, and more.",
            "model_version_group_id": null,
            "context_length": 32000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "opengvlab/internvl3-14b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "opengvlab/internvl3-2b",
            "hf_slug": "OpenGVLab/InternVL3-2B",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-30T13:30:07.912688+00:00",
            "hf_updated_at": null,
            "name": "OpenGVLab: InternVL3 2B",
            "short_name": "InternVL3 2B",
            "author": "opengvlab",
            "description": "The 2b version of the InternVL3 series, for an even higher inference speed and very reasonable performance. An advanced multimodal large language model (MLLM) series that demonstrates superior overall performance. Compared to InternVL 2.5, InternVL3 exhibits superior multimodal perception and reasoning capabilities, while further extending its multimodal capabilities to encompass tool usage, GUI agents, industrial image analysis, 3D vision perception, and more.",
            "model_version_group_id": null,
            "context_length": 32000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "opengvlab/internvl3-2b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "moonshotai/kimi-vl-a3b-thinking",
            "hf_slug": "moonshotai/Kimi-VL-A3B-Thinking",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-10T17:07:21.175402+00:00",
            "hf_updated_at": null,
            "name": "MoonshotAI: Kimi VL A3B Thinking",
            "short_name": "Kimi VL A3B Thinking",
            "author": "moonshotai",
            "description": "Kimi-VL is a lightweight Mixture-of-Experts vision-language model that activates only 2.8B parameters per step while delivering strong performance on multimodal reasoning and long-context tasks. The Kimi-VL-A3B-Thinking variant, fine-tuned with chain-of-thought and reinforcement learning, excels in math and visual reasoning benchmarks like MathVision, MMMU, and MathVista, rivaling much larger models such as Qwen2.5-VL-7B and Gemma-3-12B. It supports 128K context and high-resolution input via its MoonViT encoder.",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "moonshotai/kimi-vl-a3b-thinking",
            "supports_reasoning": true,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/optimus-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-10T13:30:19+00:00",
            "hf_updated_at": null,
            "name": "Optimus Alpha",
            "short_name": "Optimus Alpha",
            "author": "openrouter",
            "description": "This is a cloaked model provided to the community to gather feedback. It's geared toward real world use cases, including programming.\n\n**Note:** All prompts and completions for this model are logged by the provider and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/optimus-alpha",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openrouter/quasar-alpha",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-04-02T20:46:49.278785+00:00",
            "hf_updated_at": null,
            "name": "Quasar Alpha",
            "short_name": "Quasar Alpha",
            "author": "openrouter",
            "description": "This is a cloaked model provided to the community to gather feedback. It’s a powerful, all-purpose model supporting long-context tasks, including code generation.\n\n**Note:** All prompts and completions for this model are logged by the provider  and may be used to improve the model.",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "image",
                "text"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openrouter/quasar-alpha",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "bytedance-research/ui-tars-72b",
            "hf_slug": "bytedance-research/UI-TARS-72B-DPO",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-26T20:14:25.673407+00:00",
            "hf_updated_at": null,
            "name": "Bytedance: UI-TARS 72B ",
            "short_name": "UI-TARS 72B ",
            "author": "bytedance-research",
            "description": "UI-TARS 72B is an open-source multimodal AI model designed specifically for automating browser and desktop tasks through visual interaction and control. The model is built with a specialized vision architecture enabling accurate interpretation and manipulation of on-screen visual data. It supports automation tasks within web browsers as well as desktop applications, including Microsoft Office and VS Code.\n\nCore capabilities include intelligent screen detection, predictive action modeling, and efficient handling of repetitive interactions. UI-TARS employs supervised fine-tuning (SFT) tailored explicitly for computer control scenarios. It can be deployed locally or accessed via Hugging Face for demonstration purposes. Intended use cases encompass workflow automation, task scripting, and interactive desktop control applications.",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "bytedance-research/ui-tars-72b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "qwen/qwen2.5-vl-3b-instruct",
            "hf_slug": "Qwen/Qwen2.5-VL-3B-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-26T18:42:53.41832+00:00",
            "hf_updated_at": null,
            "name": "Qwen: Qwen2.5 VL 3B Instruct",
            "short_name": "Qwen2.5 VL 3B Instruct",
            "author": "qwen",
            "description": "Qwen2.5 VL 3B is a multimodal LLM from the Qwen Team with the following key enhancements:\n\n- SoTA understanding of images of various resolution & ratio: Qwen2.5-VL achieves state-of-the-art performance on visual understanding benchmarks, including MathVista, DocVQA, RealWorldQA, MTVQA, etc.\n\n- Agent that can operate your mobiles, robots, etc.: with the abilities of complex reasoning and decision making, Qwen2.5-VL can be integrated with devices like mobile phones, robots, etc., for automatic operation based on visual environment and text instructions.\n\n- Multilingual Support: to serve global users, besides English and Chinese, Qwen2.5-VL now supports the understanding of texts in different languages inside images, including most European languages, Japanese, Korean, Arabic, Vietnamese, etc.\n\nFor more details, see this [blog post](https://qwenlm.github.io/blog/qwen2-vl/) and [GitHub repo](https://github.com/QwenLM/Qwen2-VL).\n\nUsage of this model is subject to [Tongyi Qianwen LICENSE AGREEMENT](https://huggingface.co/Qwen/Qwen1.5-110B-Chat/blob/main/LICENSE).",
            "model_version_group_id": null,
            "context_length": 64000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Qwen",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "qwen/qwen2.5-vl-3b-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-2.5-pro-exp-03-25",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-25T17:01:39.919989+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 2.5 Pro Experimental",
            "short_name": "Gemini 2.5 Pro Experimental",
            "author": "google",
            "description": "This model has been deprecated by Google in favor of the (paid Preview model)[google/gemini-2.5-pro-preview]\n \nGemini 2.5 Pro is Google’s state-of-the-art AI model designed for advanced reasoning, coding, mathematics, and scientific tasks. It employs “thinking” capabilities, enabling it to reason through responses with enhanced accuracy and nuanced context handling. Gemini 2.5 Pro achieves top-tier performance on multiple benchmarks, including first-place positioning on the LMArena leaderboard, reflecting superior human-preference alignment and complex problem-solving abilities.",
            "model_version_group_id": null,
            "context_length": 1048576,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "This model has been deprecated by Google. Please switch to the [paid Gemini 2.5 Pro Preview endpoint](/google/gemini-2.5-pro-preview). ",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-2.5-pro-exp-03-25",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemma-3-1b-it",
            "hf_slug": "google/gemma-3-1b-it",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-14T14:45:56.842499+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemma 3 1B",
            "short_name": "Gemma 3 1B",
            "author": "google",
            "description": "Gemma 3 1B is the smallest of the new Gemma 3 family. It handles context windows up to 32k tokens, understands over 140 languages, and offers improved math, reasoning, and chat capabilities, including structured outputs and function calling. Note: Gemma 3 1B is not multimodal. For the smallest multimodal Gemma 3 model, please see [Gemma 3 4B](google/gemma-3-4b-it)",
            "model_version_group_id": "c99b277a-cfaf-4e93-9360-8a79cfa2b2c4",
            "context_length": 32000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": "gemma",
            "default_system": null,
            "default_stops": [
                "<start_of_turn>",
                "<end_of_turn>",
                "<eos>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemma-3-1b-it",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "microsoft/phi-4-multimodal-instruct",
            "hf_slug": "microsoft/Phi-4-multimodal-instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-03-08T01:11:24.652063+00:00",
            "hf_updated_at": null,
            "name": "Microsoft: Phi 4 Multimodal Instruct",
            "short_name": "Phi 4 Multimodal Instruct",
            "author": "microsoft",
            "description": "Phi-4 Multimodal Instruct is a versatile 5.6B parameter foundation model that combines advanced reasoning and instruction-following capabilities across both text and visual inputs, providing accurate text outputs. The unified architecture enables efficient, low-latency inference, suitable for edge and mobile deployments. Phi-4 Multimodal Instruct supports text inputs in multiple languages including Arabic, Chinese, English, French, German, Japanese, Spanish, and more, with visual input optimized primarily for English. It delivers impressive performance on multimodal tasks involving mathematical, scientific, and document reasoning, providing developers and enterprises a powerful yet compact model for sophisticated interactive applications. For more information, see the [Phi-4 Multimodal blog post](https://azure.microsoft.com/en-us/blog/empowering-innovation-the-next-generation-of-the-phi-family/).\n",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Other",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "microsoft/phi-4-multimodal-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openai/gpt-4.5-preview",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2025-02-27T20:23:30.841555+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4.5 (Preview)",
            "short_name": "GPT-4.5 (Preview)",
            "author": "openai",
            "description": "GPT-4.5 (Preview) is a research preview of OpenAI’s latest language model, designed to advance capabilities in reasoning, creativity, and multi-turn conversation. It builds on previous iterations with improvements in world knowledge, contextual coherence, and the ability to follow user intent more effectively.\n\nThe model demonstrates enhanced performance in tasks that require open-ended thinking, problem-solving, and communication. Early testing suggests it is better at generating nuanced responses, maintaining long-context coherence, and reducing hallucinations compared to earlier versions.\n\nThis research preview is intended to help evaluate GPT-4.5’s strengths and limitations in real-world use cases as OpenAI continues to refine and develop future models. Read more at the [blog post here.](https://openai.com/index/introducing-gpt-4-5/)",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4.5-preview-2025-02-27",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "x-ai/grok-2-vision-1212",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-12-15T04:35:38.489105+00:00",
            "hf_updated_at": null,
            "name": "xAI: Grok 2 Vision 1212",
            "short_name": "Grok 2 Vision 1212",
            "author": "x-ai",
            "description": "Grok 2 Vision 1212 advances image-based AI with stronger visual comprehension, refined instruction-following, and multilingual support. From object recognition to style analysis, it empowers developers to build more intuitive, visually aware applications. Its enhanced steerability and reasoning establish a robust foundation for next-generation image solutions.\n\nTo read more about this model, check out [xAI's announcement](https://x.ai/blog/grok-1212).",
            "model_version_group_id": null,
            "context_length": 32768,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Grok",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "x-ai/grok-2-vision-1212",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-exp-1121",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-21T19:18:45.23737+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini Experimental 1121",
            "short_name": "Gemini Experimental 1121",
            "author": "google",
            "description": "Experimental release (November 21st, 2024) of Gemini.",
            "model_version_group_id": null,
            "context_length": 40960,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-exp-1121",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "x-ai/grok-vision-beta",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-19T00:37:04.585936+00:00",
            "hf_updated_at": null,
            "name": "xAI: Grok Vision Beta",
            "short_name": "Grok Vision Beta",
            "author": "x-ai",
            "description": "Grok Vision Beta is xAI's experimental language model with vision capability.\n\n",
            "model_version_group_id": null,
            "context_length": 8192,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Grok",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "x-ai/grok-vision-beta",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-exp-1114",
            "hf_slug": "",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-15T23:52:20.203831+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini Experimental 1114",
            "short_name": "Gemini Experimental 1114",
            "author": "google",
            "description": "Gemini 11-14 (2024) experimental model features \"quality\" improvements.",
            "model_version_group_id": null,
            "context_length": 40960,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-exp-1114",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "anthropic/claude-3.5-haiku-20241022",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-11-04T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.5 Haiku (2024-10-22)",
            "short_name": "Claude 3.5 Haiku (2024-10-22)",
            "author": "anthropic",
            "description": "Claude 3.5 Haiku features enhancements across all skill sets including coding, tool use, and reasoning. As the fastest model in the Anthropic lineup, it offers rapid response times suitable for applications that require high interactivity and low latency, such as user-facing chatbots and on-the-fly code completions. It also excels in specialized tasks like data extraction and real-time content moderation, making it a versatile tool for a broad range of industries.\n\nIt does not support image inputs.\n\nSee the launch announcement and benchmark results [here](https://www.anthropic.com/news/3-5-models-and-computer-use)",
            "model_version_group_id": "028ec497-a034-40fd-81fe-f51d0a0c640c",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-5-haiku-20241022",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-flash-1.5-8b",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-10-03T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 1.5 Flash 8B",
            "short_name": "Gemini 1.5 Flash 8B",
            "author": "google",
            "description": "Gemini Flash 1.5 8B is optimized for speed and efficiency, offering enhanced performance in small prompt tasks like chat, transcription, and translation. With reduced latency, it is highly effective for real-time and large-scale operations. This model focuses on cost-effective solutions while maintaining high-quality results.\n\n[Click here to learn more about this model](https://developers.googleblog.com/en/gemini-15-flash-8b-is-now-generally-available-for-use/).\n\nUsage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).",
            "model_version_group_id": "3a412ab9-b077-48de-884c-90843f7abbf2",
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-flash-1.5-8b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "meta-llama/llama-3.2-90b-vision-instruct",
            "hf_slug": "meta-llama/Llama-3.2-90B-Vision-Instruct",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-09-25T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Meta: Llama 3.2 90B Vision Instruct",
            "short_name": "Llama 3.2 90B Vision Instruct",
            "author": "meta-llama",
            "description": "The Llama 90B Vision model is a top-tier, 90-billion-parameter multimodal model designed for the most challenging visual reasoning and language tasks. It offers unparalleled accuracy in image captioning, visual question answering, and advanced image-text comprehension. Pre-trained on vast multimodal datasets and fine-tuned with human feedback, the Llama 90B Vision is engineered to handle the most demanding image-based AI tasks.\n\nThis model is perfect for industries requiring cutting-edge multimodal AI capabilities, particularly those dealing with complex, real-time visual and textual analysis.\n\nClick here for the [original model card](https://github.com/meta-llama/llama-models/blob/main/models/llama3_2/MODEL_CARD_VISION.md).\n\nUsage of this model is subject to [Meta's Acceptable Use Policy](https://www.llama.com/llama3/use-policy/).",
            "model_version_group_id": null,
            "context_length": 131072,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama3",
            "instruct_type": "llama3",
            "default_system": null,
            "default_stops": [
                "<|eot_id|>",
                "<|end_of_text|>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "meta-llama/llama-3.2-90b-vision-instruct",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": true,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-flash-1.5-exp",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-28T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 1.5 Flash Experimental",
            "short_name": "Gemini 1.5 Flash Experimental",
            "author": "google",
            "description": "Gemini 1.5 Flash Experimental is an experimental version of the [Gemini 1.5 Flash](/models/google/gemini-flash-1.5) model.\n\nUsage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).\n\n#multimodal\n\nNote: This model is experimental and not suited for production use-cases. It may be removed or redirected to another model in the future.",
            "model_version_group_id": "86ec374b-de4b-4920-a960-94f25078e303",
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-flash-1.5-exp",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "01-ai/yi-vision",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-02T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "01.AI: Yi Vision",
            "short_name": "Yi Vision",
            "author": "01-ai",
            "description": "The Yi Vision is a complex visual task models provide high-performance understanding and analysis capabilities based on multiple images.\n\nIt's ideal for scenarios that require analysis and interpretation of images and charts, such as image question answering, chart understanding, OCR, visual reasoning, education, research report understanding, or multilingual document reading.",
            "model_version_group_id": null,
            "context_length": 16384,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Yi",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "01-ai/yi-vision",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-pro-1.5-exp",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-08-01T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 1.5 Pro Experimental",
            "short_name": "Gemini 1.5 Pro Experimental",
            "author": "google",
            "description": "Gemini 1.5 Pro Experimental is a bleeding-edge version of the [Gemini 1.5 Pro](/models/google/gemini-pro-1.5) model. Because it's currently experimental, it will be **heavily rate-limited** by Google.\n\nUsage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-pro-1.5-exp",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "anthropic/claude-3.5-sonnet-20240620",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-06-20T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3.5 Sonnet (2024-06-20)",
            "short_name": "Claude 3.5 Sonnet (2024-06-20)",
            "author": "anthropic",
            "description": "Claude 3.5 Sonnet delivers better-than-Opus capabilities, faster-than-Sonnet speeds, at the same Sonnet prices. Sonnet is particularly good at:\n\n- Coding: Autonomously writes, edits, and runs code with reasoning and troubleshooting\n- Data science: Augments human data science expertise; navigates unstructured data while using multiple tools for insights\n- Visual processing: excelling at interpreting charts, graphs, and images, accurately transcribing text to derive insights beyond just the text alone\n- Agentic tasks: exceptional tool use, making it great at agentic tasks (i.e. complex, multi-step problem solving tasks that require engaging with other systems)\n\nFor the latest version (2024-10-23), check out [Claude 3.5 Sonnet](/anthropic/claude-3.5-sonnet).\n\n#multimodal",
            "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image",
                "file"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3.5-sonnet-20240620",
            "supports_reasoning": false,
            "reasoning_config": {
                "start_token": null,
                "end_token": null,
                "system_prompt": null
            },
            "features": {
                "reasoning_config": {
                    "start_token": null,
                    "end_token": null,
                    "system_prompt": null
                }
            },
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-flash-1.5",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-05-14T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 1.5 Flash ",
            "short_name": "Gemini 1.5 Flash ",
            "author": "google",
            "description": "Gemini 1.5 Flash is a foundation model that performs well at a variety of multimodal tasks such as visual understanding, classification, summarization, and creating content from image, audio and video. It's adept at processing visual and text inputs such as photographs, documents, infographics, and screenshots.\n\nGemini 1.5 Flash is designed for high-volume, high-frequency tasks where cost and latency matter. On most common tasks, Flash achieves comparable quality to other Gemini Pro models at a significantly reduced cost. Flash is well-suited for applications like chat assistants and on-demand content generation where speed and scale matter.\n\nUsage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).\n\n#multimodal",
            "model_version_group_id": "86ec374b-de4b-4920-a960-94f25078e303",
            "context_length": 1000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-flash-1.5",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "liuhaotian/llava-yi-34b",
            "hf_slug": "liuhaotian/llava-v1.6-34b",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-05-11T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "LLaVA v1.6 34B",
            "short_name": "LLaVA v1.6 34B",
            "author": "liuhaotian",
            "description": "LLaVA Yi 34B is an open-source model trained by fine-tuning LLM on multimodal instruction-following data. It is an auto-regressive language model, based on the transformer architecture. Base LLM: [NousResearch/Nous-Hermes-2-Yi-34B](/models/nousresearch/nous-hermes-yi-34b)\n\nIt was trained in December 2023.",
            "model_version_group_id": null,
            "context_length": 4096,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Yi",
            "instruct_type": "chatml",
            "default_system": null,
            "default_stops": [
                "<|im_start|>",
                "<|im_end|>",
                "<|endoftext|>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "liuhaotian/llava-yi-34b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "fireworks/firellava-13b",
            "hf_slug": "fireworks-ai/FireLLaVA-13b",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-04-26T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Fireworks: FireLLaVA 13B",
            "short_name": "FireLLaVA 13B",
            "author": "fireworks",
            "description": "A blazing fast vision-language model, FireLLaVA quickly understands both text and images. It achieves impressive chat skills in tests, and was designed to mimic multimodal GPT-4.\n\nThe first commercially permissive open source LLaVA model, trained entirely on open source LLM generated instruction following data.",
            "model_version_group_id": null,
            "context_length": 4096,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama2",
            "instruct_type": "vicuna",
            "default_system": null,
            "default_stops": [
                "USER:",
                "</s>"
            ],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "fireworks/firellava-13b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "google/gemini-pro-1.5",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-04-09T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Google: Gemini 1.5 Pro",
            "short_name": "Gemini 1.5 Pro",
            "author": "google",
            "description": "Google's latest multimodal model, supports image and video[0] in text or chat prompts.\n\nOptimized for language tasks including:\n\n- Code generation\n- Text generation\n- Text editing\n- Problem solving\n- Recommendations\n- Information extraction\n- Data extraction or generation\n- AI agents\n\nUsage of Gemini is subject to Google's [Gemini Terms of Use](https://ai.google.dev/terms).\n\n* [0]: Video input is not available through OpenRouter at this time.",
            "model_version_group_id": null,
            "context_length": 2000000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Gemini",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": "",
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "google/gemini-pro-1.5",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "anthropic/claude-3-sonnet",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-03-05T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3 Sonnet",
            "short_name": "Claude 3 Sonnet",
            "author": "anthropic",
            "description": "Claude 3 Sonnet is an ideal balance of intelligence and speed for enterprise workloads. Maximum utility at a lower price, dependable, balanced for scaled deployments.\n\nSee the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)\n\n#multimodal",
            "model_version_group_id": "30636d20-cda3-4a59-aa0c-1a5b6efba072",
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-sonnet",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "anthropic/claude-3-opus",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2024-03-05T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Anthropic: Claude 3 Opus",
            "short_name": "Claude 3 Opus",
            "author": "anthropic",
            "description": "Claude 3 Opus is Anthropic's most powerful model for highly complex tasks. It boasts top-level performance, intelligence, fluency, and understanding.\n\nSee the launch announcement and benchmark results [here](https://www.anthropic.com/news/claude-3-family)\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 200000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Claude",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "anthropic/claude-3-opus",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "nousresearch/nous-hermes-2-vision-7b",
            "hf_slug": "NousResearch/Nous-Hermes-2-Vision-Alpha",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2023-12-07T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "Nous: Hermes 2 Vision 7B (alpha)",
            "short_name": "Hermes 2 Vision 7B (alpha)",
            "author": "nousresearch",
            "description": "This vision-language model builds on innovations from the popular [OpenHermes-2.5](/models/teknium/openhermes-2.5-mistral-7b) model, by Teknium. It adds vision support, and is trained on a custom dataset enriched with function calling\n\nThis project is led by [qnguyen3](https://twitter.com/stablequan) and [teknium](https://twitter.com/Teknium1).\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 4096,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Mistral",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "nousresearch/nous-hermes-2-vision-7b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "liuhaotian/llava-13b",
            "hf_slug": "liuhaotian/llava-v1.6-vicuna-13b",
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2023-11-16T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "LLaVA 13B",
            "short_name": "LLaVA 13B",
            "author": "liuhaotian",
            "description": "LLaVA is a large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding, achieving impressive chat capabilities and setting a new state-of-the-art accuracy on Science QA.\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 2048,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "Llama2",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "liuhaotian/llava-13b",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        },
        {
            "slug": "openai/gpt-4-vision-preview",
            "hf_slug": null,
            "updated_at": "2025-11-10T16:00:38.246665+00:00",
            "created_at": "2023-11-13T00:00:00+00:00",
            "hf_updated_at": null,
            "name": "OpenAI: GPT-4 Vision",
            "short_name": "GPT-4 Vision",
            "author": "openai",
            "description": "Ability to understand images, in addition to all other [GPT-4 Turbo capabilties](/models/openai/gpt-4-turbo). Training data: up to Apr 2023.\n\n**Note:** heavily rate limited by OpenAI while in preview.\n\n#multimodal",
            "model_version_group_id": null,
            "context_length": 128000,
            "input_modalities": [
                "text",
                "image"
            ],
            "output_modalities": [
                "text"
            ],
            "has_text_output": true,
            "group": "GPT",
            "instruct_type": null,
            "default_system": null,
            "default_stops": [],
            "hidden": false,
            "router": null,
            "warning_message": null,
            "promotion_message": null,
            "routing_error_message": null,
            "permaslug": "openai/gpt-4-vision-preview",
            "supports_reasoning": false,
            "reasoning_config": null,
            "features": {},
            "default_parameters": {},
            "default_order": [],
            "quick_start_example_type": null,
            "is_trainable_text": null,
            "is_trainable_image": null,
            "endpoint": null
        }
    ],
    "analytics": {
        "baai/bge-large-en-v1.5-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baai/bge-large-en-v1.5-20251117",
            "variant": "standard",
            "variant_permaslug": "baai/bge-large-en-v1.5-20251117",
            "count": 56000,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 301743491,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4.7-20251222": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.7-20251222",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.7-20251222",
            "count": 7326994,
            "total_completion_tokens": 7166727805,
            "total_prompt_tokens": 124679568471,
            "total_native_tokens_reasoning": 3472150501,
            "num_media_prompt": 3960,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 66105749567,
            "total_tool_calls": 3844651,
            "requests_with_tool_call_errors": 106939
        },
        "openai/gpt-4o-audio-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-audio-preview",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-audio-preview",
            "count": 27582,
            "total_completion_tokens": 4801902,
            "total_prompt_tokens": 12966368,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 26322,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 181,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-r1-distill-qwen-32b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-r1-distill-qwen-32b",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-r1-distill-qwen-32b",
            "count": 315466,
            "total_completion_tokens": 123379010,
            "total_prompt_tokens": 262042012,
            "total_native_tokens_reasoning": 125713604,
            "num_media_prompt": 26,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthropic/claude-4.5-haiku-20251001": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4.5-haiku-20251001",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4.5-haiku-20251001",
            "count": 10568707,
            "total_completion_tokens": 4894010141,
            "total_prompt_tokens": 95650710853,
            "total_native_tokens_reasoning": 351130316,
            "num_media_prompt": 605539,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 39504635529,
            "total_tool_calls": 3583893,
            "requests_with_tool_call_errors": 93524
        },
        "thenlper/gte-base-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thenlper/gte-base-20251117",
            "variant": "standard",
            "variant_permaslug": "thenlper/gte-base-20251117",
            "count": 268509,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 517139623,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-embedding-001": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-embedding-001",
            "variant": "standard",
            "variant_permaslug": "google/gemini-embedding-001",
            "count": 3125195,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 11491693627,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "tencent/hunyuan-a13b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tencent/hunyuan-a13b-instruct",
            "variant": "standard",
            "variant_permaslug": "tencent/hunyuan-a13b-instruct",
            "count": 17731,
            "total_completion_tokens": 3593634,
            "total_prompt_tokens": 23816463,
            "total_native_tokens_reasoning": 45339,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/ministral-8b-2512": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/ministral-8b-2512",
            "variant": "standard",
            "variant_permaslug": "mistralai/ministral-8b-2512",
            "count": 682571,
            "total_completion_tokens": 94416421,
            "total_prompt_tokens": 766270291,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 13776,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 8805,
            "requests_with_tool_call_errors": 286
        },
        "deepseek/deepseek-chat-v3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-chat-v3",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-chat-v3",
            "count": 5933001,
            "total_completion_tokens": 1027859492,
            "total_prompt_tokens": 9444356305,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 192,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 491471211,
            "total_tool_calls": 163068,
            "requests_with_tool_call_errors": 2485
        },
        "perplexity/sonar-pro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "perplexity/sonar-pro",
            "variant": "standard",
            "variant_permaslug": "perplexity/sonar-pro",
            "count": 313682,
            "total_completion_tokens": 141896142,
            "total_prompt_tokens": 628573035,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1739,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nvidia/nemotron-nano-9b-v2": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-nano-9b-v2",
            "variant": "standard",
            "variant_permaslug": "nvidia/nemotron-nano-9b-v2",
            "count": 234059,
            "total_completion_tokens": 237424934,
            "total_prompt_tokens": 1851261229,
            "total_native_tokens_reasoning": 146735698,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 9503,
            "requests_with_tool_call_errors": 64
        },
        "bytedance-seed/seedream-4.5-20251203": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "bytedance-seed/seedream-4.5-20251203",
            "variant": "standard",
            "variant_permaslug": "bytedance-seed/seedream-4.5-20251203",
            "count": 144847,
            "total_completion_tokens": 604736225,
            "total_prompt_tokens": 359909974,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 200249,
            "num_media_completion": 144847,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-2.0-flash-lite-001": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.0-flash-lite-001",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.0-flash-lite-001",
            "count": 22917372,
            "total_completion_tokens": 4336482928,
            "total_prompt_tokens": 31347706424,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 4095938,
            "num_media_completion": 0,
            "num_audio_prompt": 8060,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 994113,
            "requests_with_tool_call_errors": 50641
        },
        "tngtech/tng-r1t-chimera": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/tng-r1t-chimera",
            "variant": "standard",
            "variant_permaslug": "tngtech/tng-r1t-chimera",
            "count": 6734,
            "total_completion_tokens": 4003602,
            "total_prompt_tokens": 28843712,
            "total_native_tokens_reasoning": 2828318,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5687040,
            "total_tool_calls": 14,
            "requests_with_tool_call_errors": 0
        },
        "minimax/minimax-01": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "minimax/minimax-01",
            "variant": "standard",
            "variant_permaslug": "minimax/minimax-01",
            "count": 426369,
            "total_completion_tokens": 45176314,
            "total_prompt_tokens": 995697421,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1538,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-2.5-pro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-pro",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-pro",
            "count": 10780156,
            "total_completion_tokens": 18953499128,
            "total_prompt_tokens": 122564258747,
            "total_native_tokens_reasoning": 10863268000,
            "num_media_prompt": 1617577,
            "num_media_completion": 0,
            "num_audio_prompt": 42784,
            "total_native_tokens_cached": 41631826713,
            "total_tool_calls": 449386,
            "requests_with_tool_call_errors": 16005
        },
        "mistralai/devstral-medium-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/devstral-medium-2507",
            "variant": "standard",
            "variant_permaslug": "mistralai/devstral-medium-2507",
            "count": 10817,
            "total_completion_tokens": 1161667,
            "total_prompt_tokens": 58111545,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1099,
            "requests_with_tool_call_errors": 175
        },
        "meta-llama/llama-3-8b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3-8b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3-8b-instruct",
            "count": 10071240,
            "total_completion_tokens": 209321216,
            "total_prompt_tokens": 5640372687,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 230,
            "requests_with_tool_call_errors": 49
        },
        "qwen/qwen3-next-80b-a3b-thinking-2509": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-next-80b-a3b-thinking-2509",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-next-80b-a3b-thinking-2509",
            "count": 298687,
            "total_completion_tokens": 1377894120,
            "total_prompt_tokens": 872215138,
            "total_native_tokens_reasoning": 1220871412,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2269434,
            "total_tool_calls": 11836,
            "requests_with_tool_call_errors": 205
        },
        "openai/gpt-oss-120b:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-120b",
            "variant": "free",
            "variant_permaslug": "openai/gpt-oss-120b:free",
            "count": 297335,
            "total_completion_tokens": 219162308,
            "total_prompt_tokens": 2552257624,
            "total_native_tokens_reasoning": 135565268,
            "num_media_prompt": 2,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 48563,
            "requests_with_tool_call_errors": 9997
        },
        "minimax/minimax-m1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "minimax/minimax-m1",
            "variant": "standard",
            "variant_permaslug": "minimax/minimax-m1",
            "count": 7817,
            "total_completion_tokens": 7106799,
            "total_prompt_tokens": 139459466,
            "total_native_tokens_reasoning": 4700939,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1516,
            "requests_with_tool_call_errors": 110
        },
        "prime-intellect/intellect-3-20251126": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "prime-intellect/intellect-3-20251126",
            "variant": "standard",
            "variant_permaslug": "prime-intellect/intellect-3-20251126",
            "count": 12187,
            "total_completion_tokens": 28105469,
            "total_prompt_tokens": 27679118,
            "total_native_tokens_reasoning": 16803717,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 4392032,
            "total_tool_calls": 697,
            "requests_with_tool_call_errors": 3
        },
        "qwen/qwen3-30b-a3b-thinking-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-30b-a3b-thinking-2507",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-30b-a3b-thinking-2507",
            "count": 152838,
            "total_completion_tokens": 220747983,
            "total_prompt_tokens": 815517449,
            "total_native_tokens_reasoning": 207872997,
            "num_media_prompt": 6,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 16807,
            "requests_with_tool_call_errors": 4428
        },
        "amazon/nova-pro-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "amazon/nova-pro-v1",
            "variant": "standard",
            "variant_permaslug": "amazon/nova-pro-v1",
            "count": 32946,
            "total_completion_tokens": 4291169,
            "total_prompt_tokens": 31785345,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 8986,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 174,
            "requests_with_tool_call_errors": 12
        },
        "anthropic/claude-3-7-sonnet-20250219:thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-3-7-sonnet-20250219",
            "variant": "thinking",
            "variant_permaslug": "anthropic/claude-3-7-sonnet-20250219:thinking",
            "count": 124765,
            "total_completion_tokens": 197876448,
            "total_prompt_tokens": 2247362567,
            "total_native_tokens_reasoning": 107544503,
            "num_media_prompt": 19249,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 845269929,
            "total_tool_calls": 31038,
            "requests_with_tool_call_errors": 1135
        },
        "qwen/qwen-plus-2025-01-25": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-plus-2025-01-25",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-plus-2025-01-25",
            "count": 33043,
            "total_completion_tokens": 9475756,
            "total_prompt_tokens": 93280663,
            "total_native_tokens_reasoning": 16527,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 7807593,
            "total_tool_calls": 630,
            "requests_with_tool_call_errors": 98
        },
        "bytedance/ui-tars-1.5-7b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "bytedance/ui-tars-1.5-7b",
            "variant": "standard",
            "variant_permaslug": "bytedance/ui-tars-1.5-7b",
            "count": 51511,
            "total_completion_tokens": 2232961,
            "total_prompt_tokens": 125770709,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 136687,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 38059216,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "meta-llama/llama-4-maverick-17b-128e-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-4-maverick-17b-128e-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-4-maverick-17b-128e-instruct",
            "count": 10143224,
            "total_completion_tokens": 1032604550,
            "total_prompt_tokens": 20252517533,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1598470,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 756278012,
            "total_tool_calls": 229109,
            "requests_with_tool_call_errors": 4230
        },
        "deepcogito/cogito-v2-preview-llama-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepcogito/cogito-v2-preview-llama-70b",
            "variant": "standard",
            "variant_permaslug": "deepcogito/cogito-v2-preview-llama-70b",
            "count": 3870,
            "total_completion_tokens": 548889,
            "total_prompt_tokens": 4287286,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 28,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-2-9b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-2-9b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-2-9b-it",
            "count": 1694384,
            "total_completion_tokens": 502347769,
            "total_prompt_tokens": 1202088087,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "relace/relace-apply-3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "relace/relace-apply-3",
            "variant": "standard",
            "variant_permaslug": "relace/relace-apply-3",
            "count": 21942,
            "total_completion_tokens": 43565758,
            "total_prompt_tokens": 65298540,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-embed-2312": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-embed-2312",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-embed-2312",
            "count": 115832,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 164760373,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-large-2407": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-large-2407",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-large-2407",
            "count": 8885,
            "total_completion_tokens": 3880628,
            "total_prompt_tokens": 23365163,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 773,
            "requests_with_tool_call_errors": 50
        },
        "openai/gpt-oss-safeguard-20b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-safeguard-20b",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-oss-safeguard-20b",
            "count": 1740019,
            "total_completion_tokens": 916063158,
            "total_prompt_tokens": 4979040258,
            "total_native_tokens_reasoning": 684413109,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3801686784,
            "total_tool_calls": 51543,
            "requests_with_tool_call_errors": 374
        },
        "mistralai/devstral-2512:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/devstral-2512",
            "variant": "free",
            "variant_permaslug": "mistralai/devstral-2512:free",
            "count": 10594999,
            "total_completion_tokens": 4598306315,
            "total_prompt_tokens": 146943045358,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2724884,
            "requests_with_tool_call_errors": 165205
        },
        "mistralai/pixtral-large-2411": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/pixtral-large-2411",
            "variant": "standard",
            "variant_permaslug": "mistralai/pixtral-large-2411",
            "count": 17079,
            "total_completion_tokens": 3658461,
            "total_prompt_tokens": 47146237,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 13665,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 425,
            "requests_with_tool_call_errors": 72
        },
        "openai/o4-mini-high-2025-04-16": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o4-mini-high-2025-04-16",
            "variant": "standard",
            "variant_permaslug": "openai/o4-mini-high-2025-04-16",
            "count": 91184,
            "total_completion_tokens": 122735450,
            "total_prompt_tokens": 376252306,
            "total_native_tokens_reasoning": 102812504,
            "num_media_prompt": 8373,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 139692928,
            "total_tool_calls": 4915,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4o-mini-2024-07-18": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-mini-2024-07-18",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-mini-2024-07-18",
            "count": 3162539,
            "total_completion_tokens": 421374822,
            "total_prompt_tokens": 7606086792,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 12664,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3048499200,
            "total_tool_calls": 108896,
            "requests_with_tool_call_errors": 127
        },
        "allenai/olmo-3-7b-think-20251121": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/olmo-3-7b-think-20251121",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-3-7b-think-20251121",
            "count": 27677,
            "total_completion_tokens": 58928656,
            "total_prompt_tokens": 18987653,
            "total_native_tokens_reasoning": 70320406,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3380192,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4.5v": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.5v",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.5v",
            "count": 31164,
            "total_completion_tokens": 16135432,
            "total_prompt_tokens": 73146472,
            "total_native_tokens_reasoning": 8783618,
            "num_media_prompt": 118474,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 10110739,
            "total_tool_calls": 1124,
            "requests_with_tool_call_errors": 189
        },
        "gryphe/mythomax-l2-13b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "gryphe/mythomax-l2-13b",
            "variant": "standard",
            "variant_permaslug": "gryphe/mythomax-l2-13b",
            "count": 1506570,
            "total_completion_tokens": 219510857,
            "total_prompt_tokens": 1553012977,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-3-pro-preview-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-3-pro-preview-20251117",
            "variant": "standard",
            "variant_permaslug": "google/gemini-3-pro-preview-20251117",
            "count": 9892425,
            "total_completion_tokens": 21414757024,
            "total_prompt_tokens": 146558026906,
            "total_native_tokens_reasoning": 14414102833,
            "num_media_prompt": 4162447,
            "num_media_completion": 0,
            "num_audio_prompt": 511519,
            "total_native_tokens_cached": 80549468622,
            "total_tool_calls": 1375732,
            "requests_with_tool_call_errors": 32236
        },
        "perplexity/sonar": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "perplexity/sonar",
            "variant": "standard",
            "variant_permaslug": "perplexity/sonar",
            "count": 798796,
            "total_completion_tokens": 299240117,
            "total_prompt_tokens": 664100180,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 6773,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-r1-0528": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-r1-0528",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-r1-0528",
            "count": 1544153,
            "total_completion_tokens": 2215709216,
            "total_prompt_tokens": 12164290190,
            "total_native_tokens_reasoning": 1558355699,
            "num_media_prompt": 2447,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2515918238,
            "total_tool_calls": 52994,
            "requests_with_tool_call_errors": 761
        },
        "xiaomi/mimo-v2-flash-20251210": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "xiaomi/mimo-v2-flash-20251210",
            "variant": "standard",
            "variant_permaslug": "xiaomi/mimo-v2-flash-20251210",
            "count": 1943166,
            "total_completion_tokens": 740454249,
            "total_prompt_tokens": 11455424408,
            "total_native_tokens_reasoning": 143206691,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 6032144183,
            "total_tool_calls": 181852,
            "requests_with_tool_call_errors": 7767
        },
        "qwen/qwen3-next-80b-a3b-instruct-2509": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-next-80b-a3b-instruct-2509",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-next-80b-a3b-instruct-2509",
            "count": 2876915,
            "total_completion_tokens": 673532132,
            "total_prompt_tokens": 17875297548,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 168,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1217351630,
            "total_tool_calls": 194121,
            "requests_with_tool_call_errors": 15257
        },
        "qwen/qwen-plus-2025-07-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-plus-2025-07-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-plus-2025-07-28",
            "count": 22195,
            "total_completion_tokens": 13045146,
            "total_prompt_tokens": 170367803,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 8889,
            "requests_with_tool_call_errors": 398
        },
        "meta-llama/llama-3.1-70b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.1-70b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.1-70b-instruct",
            "count": 4364390,
            "total_completion_tokens": 418065223,
            "total_prompt_tokens": 4559441228,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 4,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 10253,
            "requests_with_tool_call_errors": 772
        },
        "meta-llama/llama-3-70b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3-70b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3-70b-instruct",
            "count": 1599367,
            "total_completion_tokens": 49533185,
            "total_prompt_tokens": 1053324356,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 3,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-7b-instruct-v0.3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-7b-instruct-v0.3",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-7b-instruct-v0.3",
            "count": 383910,
            "total_completion_tokens": 18806873,
            "total_prompt_tokens": 124936558,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen-turbo-2024-11-01": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-turbo-2024-11-01",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-turbo-2024-11-01",
            "count": 910687,
            "total_completion_tokens": 195574768,
            "total_prompt_tokens": 2076465032,
            "total_native_tokens_reasoning": 16492,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 237985366,
            "total_tool_calls": 25415,
            "requests_with_tool_call_errors": 273
        },
        "meituan/longcat-flash-chat": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meituan/longcat-flash-chat",
            "variant": "standard",
            "variant_permaslug": "meituan/longcat-flash-chat",
            "count": 220789,
            "total_completion_tokens": 50544891,
            "total_prompt_tokens": 1092736265,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 577060608,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "switchpoint/router": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "switchpoint/router",
            "variant": "standard",
            "variant_permaslug": "switchpoint/router",
            "count": 2416,
            "total_completion_tokens": 1274731,
            "total_prompt_tokens": 4573203,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4.5-air": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.5-air",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.5-air",
            "count": 2316148,
            "total_completion_tokens": 566681876,
            "total_prompt_tokens": 8523603457,
            "total_native_tokens_reasoning": 254236178,
            "num_media_prompt": 1,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5103777316,
            "total_tool_calls": 151412,
            "requests_with_tool_call_errors": 13067
        },
        "google/gemini-2.5-flash-image": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-flash-image",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-flash-image",
            "count": 1458384,
            "total_completion_tokens": 1371494036,
            "total_prompt_tokens": 1512274934,
            "total_native_tokens_reasoning": 10891,
            "num_media_prompt": 1368784,
            "num_media_completion": 1023950,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4.6-20251208": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.6-20251208",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.6-20251208",
            "count": 250922,
            "total_completion_tokens": 758698311,
            "total_prompt_tokens": 2234777448,
            "total_native_tokens_reasoning": 565917377,
            "num_media_prompt": 223729,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 345750388,
            "total_tool_calls": 42018,
            "requests_with_tool_call_errors": 2397
        },
        "openai/gpt-5-nano-2025-08-07": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-nano-2025-08-07",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-nano-2025-08-07",
            "count": 8533756,
            "total_completion_tokens": 9637117127,
            "total_prompt_tokens": 28156498975,
            "total_native_tokens_reasoning": 8546398027,
            "num_media_prompt": 563845,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5781763200,
            "total_tool_calls": 1779796,
            "requests_with_tool_call_errors": 4144
        },
        "perplexity/sonar-pro-search": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "perplexity/sonar-pro-search",
            "variant": "standard",
            "variant_permaslug": "perplexity/sonar-pro-search",
            "count": 80370,
            "total_completion_tokens": 39446810,
            "total_prompt_tokens": 135073279,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1339,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1706,
            "requests_with_tool_call_errors": 0
        },
        "neversleep/noromaid-20b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "neversleep/noromaid-20b",
            "variant": "standard",
            "variant_permaslug": "neversleep/noromaid-20b",
            "count": 16906,
            "total_completion_tokens": 2357472,
            "total_prompt_tokens": 25556092,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-3-27b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-27b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-3-27b-it",
            "count": 13041622,
            "total_completion_tokens": 2041183774,
            "total_prompt_tokens": 20217477100,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 2806874,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2003308696,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-chat-v3.1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-chat-v3.1",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-chat-v3.1",
            "count": 26139768,
            "total_completion_tokens": 4343426603,
            "total_prompt_tokens": 95339386393,
            "total_native_tokens_reasoning": 702763319,
            "num_media_prompt": 385,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 10730007416,
            "total_tool_calls": 228597,
            "requests_with_tool_call_errors": 6087
        },
        "deepseek/deepseek-v3.2-20251201": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-v3.2-20251201",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-v3.2-20251201",
            "count": 53257850,
            "total_completion_tokens": 23649787150,
            "total_prompt_tokens": 416145678347,
            "total_native_tokens_reasoning": 5367372095,
            "num_media_prompt": 5308,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 174575670000,
            "total_tool_calls": 1700424,
            "requests_with_tool_call_errors": 41664
        },
        "qwen/qwen3-32b-04-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-32b-04-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-32b-04-28",
            "count": 11727702,
            "total_completion_tokens": 2547491846,
            "total_prompt_tokens": 12551192732,
            "total_native_tokens_reasoning": 1809460224,
            "num_media_prompt": 3,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2461644792,
            "total_tool_calls": 260352,
            "requests_with_tool_call_errors": 7057
        },
        "mistralai/ministral-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/ministral-8b",
            "variant": "standard",
            "variant_permaslug": "mistralai/ministral-8b",
            "count": 1361613,
            "total_completion_tokens": 371260724,
            "total_prompt_tokens": 581306189,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 13760,
            "requests_with_tool_call_errors": 307
        },
        "mistralai/mistral-saba-2502": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-saba-2502",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-saba-2502",
            "count": 29670,
            "total_completion_tokens": 638776,
            "total_prompt_tokens": 4152071,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 20,
            "requests_with_tool_call_errors": 0
        },
        "openai/o3-2025-04-16": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o3-2025-04-16",
            "variant": "standard",
            "variant_permaslug": "openai/o3-2025-04-16",
            "count": 148689,
            "total_completion_tokens": 135006853,
            "total_prompt_tokens": 762496785,
            "total_native_tokens_reasoning": 83438014,
            "num_media_prompt": 78466,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 341476096,
            "total_tool_calls": 15237,
            "requests_with_tool_call_errors": 1
        },
        "qwen/qwen3-coder-480b-a35b-07-25:exacto": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-480b-a35b-07-25",
            "variant": "exacto",
            "variant_permaslug": "qwen/qwen3-coder-480b-a35b-07-25:exacto",
            "count": 30683,
            "total_completion_tokens": 8788690,
            "total_prompt_tokens": 1445637919,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 918901615,
            "total_tool_calls": 21596,
            "requests_with_tool_call_errors": 661
        },
        "raifle/sorcererlm-8x22b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "raifle/sorcererlm-8x22b",
            "variant": "standard",
            "variant_permaslug": "raifle/sorcererlm-8x22b",
            "count": 2899,
            "total_completion_tokens": 898820,
            "total_prompt_tokens": 7968231,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5.1-codex-20251113": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.1-codex-20251113",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.1-codex-20251113",
            "count": 121428,
            "total_completion_tokens": 71681309,
            "total_prompt_tokens": 3793123607,
            "total_native_tokens_reasoning": 43627205,
            "num_media_prompt": 19149,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3163285504,
            "total_tool_calls": 57820,
            "requests_with_tool_call_errors": 444
        },
        "deepcogito/cogito-v2-preview-llama-405b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepcogito/cogito-v2-preview-llama-405b",
            "variant": "standard",
            "variant_permaslug": "deepcogito/cogito-v2-preview-llama-405b",
            "count": 2896,
            "total_completion_tokens": 567975,
            "total_prompt_tokens": 5169281,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 321,
            "requests_with_tool_call_errors": 5
        },
        "amazon/nova-lite-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "amazon/nova-lite-v1",
            "variant": "standard",
            "variant_permaslug": "amazon/nova-lite-v1",
            "count": 380831,
            "total_completion_tokens": 7336424,
            "total_prompt_tokens": 248864490,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 323472,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1157,
            "requests_with_tool_call_errors": 21
        },
        "ai21/jamba-mini-1.7": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "ai21/jamba-mini-1.7",
            "variant": "standard",
            "variant_permaslug": "ai21/jamba-mini-1.7",
            "count": 6254,
            "total_completion_tokens": 1827673,
            "total_prompt_tokens": 14898287,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 264,
            "requests_with_tool_call_errors": 117
        },
        "nvidia/llama-3.1-nemotron-ultra-253b-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/llama-3.1-nemotron-ultra-253b-v1",
            "variant": "standard",
            "variant_permaslug": "nvidia/llama-3.1-nemotron-ultra-253b-v1",
            "count": 4442794,
            "total_completion_tokens": 39267636,
            "total_prompt_tokens": 2880404878,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "moonshotai/kimi-dev-72b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "moonshotai/kimi-dev-72b",
            "variant": "standard",
            "variant_permaslug": "moonshotai/kimi-dev-72b",
            "count": 2682,
            "total_completion_tokens": 5278023,
            "total_prompt_tokens": 5963342,
            "total_native_tokens_reasoning": 3441842,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepcogito/cogito-v2.1-671b-20251118": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepcogito/cogito-v2.1-671b-20251118",
            "variant": "standard",
            "variant_permaslug": "deepcogito/cogito-v2.1-671b-20251118",
            "count": 35018,
            "total_completion_tokens": 4644141,
            "total_prompt_tokens": 99001779,
            "total_native_tokens_reasoning": 1003632,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "allenai/olmo-3.1-32b-instruct-20251215": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/olmo-3.1-32b-instruct-20251215",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-3.1-32b-instruct-20251215",
            "count": 75062,
            "total_completion_tokens": 56402666,
            "total_prompt_tokens": 156057705,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 113,
            "requests_with_tool_call_errors": 7
        },
        "mistralai/codestral-embed-2505": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/codestral-embed-2505",
            "variant": "standard",
            "variant_permaslug": "mistralai/codestral-embed-2505",
            "count": 139439,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 483559519,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5-codex": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-codex",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-codex",
            "count": 41915,
            "total_completion_tokens": 44116692,
            "total_prompt_tokens": 1753290451,
            "total_native_tokens_reasoning": 32906737,
            "num_media_prompt": 9662,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1444822784,
            "total_tool_calls": 23684,
            "requests_with_tool_call_errors": 229
        },
        "qwen/qwen3-coder-flash": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-flash",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-coder-flash",
            "count": 29226,
            "total_completion_tokens": 9814216,
            "total_prompt_tokens": 184805618,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 4868,
            "requests_with_tool_call_errors": 340
        },
        "mistralai/ministral-14b-2512": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/ministral-14b-2512",
            "variant": "standard",
            "variant_permaslug": "mistralai/ministral-14b-2512",
            "count": 962263,
            "total_completion_tokens": 118344319,
            "total_prompt_tokens": 1920892986,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 61496,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 50716,
            "requests_with_tool_call_errors": 691
        },
        "openai/gpt-3.5-turbo-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-3.5-turbo-instruct",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-3.5-turbo-instruct",
            "count": 35555,
            "total_completion_tokens": 5557395,
            "total_prompt_tokens": 15509656,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "cohere/command-r-plus-08-2024": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "cohere/command-r-plus-08-2024",
            "variant": "standard",
            "variant_permaslug": "cohere/command-r-plus-08-2024",
            "count": 17400,
            "total_completion_tokens": 3685981,
            "total_prompt_tokens": 30974067,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2003,
            "requests_with_tool_call_errors": 242
        },
        "baidu/ernie-4.5-300b-a47b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baidu/ernie-4.5-300b-a47b",
            "variant": "standard",
            "variant_permaslug": "baidu/ernie-4.5-300b-a47b",
            "count": 109163,
            "total_completion_tokens": 27477499,
            "total_prompt_tokens": 205335482,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 13336128,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/text-embedding-3-small": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/text-embedding-3-small",
            "variant": "standard",
            "variant_permaslug": "openai/text-embedding-3-small",
            "count": 17518036,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 29941259162,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/o3-deep-research-2025-06-26": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o3-deep-research-2025-06-26",
            "variant": "standard",
            "variant_permaslug": "openai/o3-deep-research-2025-06-26",
            "count": 3777,
            "total_completion_tokens": 37509753,
            "total_prompt_tokens": 62160506,
            "total_native_tokens_reasoning": 31903648,
            "num_media_prompt": 309,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1920000,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "baidu/ernie-4.5-vl-424b-a47b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baidu/ernie-4.5-vl-424b-a47b",
            "variant": "standard",
            "variant_permaslug": "baidu/ernie-4.5-vl-424b-a47b",
            "count": 5888,
            "total_completion_tokens": 3564971,
            "total_prompt_tokens": 21391641,
            "total_native_tokens_reasoning": 381414,
            "num_media_prompt": 873,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "black-forest-labs/flux.2-klein-4b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "black-forest-labs/flux.2-klein-4b",
            "variant": "standard",
            "variant_permaslug": "black-forest-labs/flux.2-klein-4b",
            "count": 27218,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 6058023,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 8371,
            "num_media_completion": 27218,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sentence-transformers/all-minilm-l12-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sentence-transformers/all-minilm-l12-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "sentence-transformers/all-minilm-l12-v2-20251117",
            "count": 9467527,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 1237609904,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nvidia/nemotron-3-nano-30b-a3b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-3-nano-30b-a3b",
            "variant": "standard",
            "variant_permaslug": "nvidia/nemotron-3-nano-30b-a3b",
            "count": 577192,
            "total_completion_tokens": 2241294227,
            "total_prompt_tokens": 1840432830,
            "total_native_tokens_reasoning": 2159825592,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 23473,
            "requests_with_tool_call_errors": 7385
        },
        "thenlper/gte-large-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thenlper/gte-large-20251117",
            "variant": "standard",
            "variant_permaslug": "thenlper/gte-large-20251117",
            "count": 61854,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 58099045,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nvidia/nemotron-3-nano-30b-a3b:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-3-nano-30b-a3b",
            "variant": "free",
            "variant_permaslug": "nvidia/nemotron-3-nano-30b-a3b:free",
            "count": 465379,
            "total_completion_tokens": 1023767338,
            "total_prompt_tokens": 3230621601,
            "total_native_tokens_reasoning": 794532679,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 54361,
            "requests_with_tool_call_errors": 13555
        },
        "qwen/qwq-32b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwq-32b",
            "variant": "standard",
            "variant_permaslug": "qwen/qwq-32b",
            "count": 106911,
            "total_completion_tokens": 152561647,
            "total_prompt_tokens": 211161725,
            "total_native_tokens_reasoning": 140650447,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 100,
            "requests_with_tool_call_errors": 9
        },
        "x-ai/grok-code-fast-1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-code-fast-1",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-code-fast-1",
            "count": 15899673,
            "total_completion_tokens": 26696679793,
            "total_prompt_tokens": 567580333280,
            "total_native_tokens_reasoning": 19832616079,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 434330497856,
            "total_tool_calls": 5451422,
            "requests_with_tool_call_errors": 15042
        },
        "meta-llama/llama-guard-3-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-guard-3-8b",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-guard-3-8b",
            "count": 60527,
            "total_completion_tokens": 110777100,
            "total_prompt_tokens": 13096421,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "baidu/ernie-4.5-21b-a3b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baidu/ernie-4.5-21b-a3b",
            "variant": "standard",
            "variant_permaslug": "baidu/ernie-4.5-21b-a3b",
            "count": 182894,
            "total_completion_tokens": 11371707,
            "total_prompt_tokens": 94912075,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sentence-transformers/all-mpnet-base-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sentence-transformers/all-mpnet-base-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "sentence-transformers/all-mpnet-base-v2-20251117",
            "count": 2058,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 2718315,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-coder-480b-a35b-07-25": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-480b-a35b-07-25",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-coder-480b-a35b-07-25",
            "count": 6335868,
            "total_completion_tokens": 2228665815,
            "total_prompt_tokens": 107754969823,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 241,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 12119976176,
            "total_tool_calls": 367692,
            "requests_with_tool_call_errors": 59710
        },
        "openai/gpt-5-pro-2025-10-06": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-pro-2025-10-06",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-pro-2025-10-06",
            "count": 6193,
            "total_completion_tokens": 15668074,
            "total_prompt_tokens": 37522362,
            "total_native_tokens_reasoning": 12954829,
            "num_media_prompt": 1220,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 246,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4o-search-preview-2025-03-11": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-search-preview-2025-03-11",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-search-preview-2025-03-11",
            "count": 47133,
            "total_completion_tokens": 17262691,
            "total_prompt_tokens": 31468892,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-30b-a3b-04-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-30b-a3b-04-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-30b-a3b-04-28",
            "count": 1401176,
            "total_completion_tokens": 994521415,
            "total_prompt_tokens": 3193991037,
            "total_native_tokens_reasoning": 987782488,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 110250995,
            "total_tool_calls": 16598,
            "requests_with_tool_call_errors": 10709
        },
        "thedrummer/unslopnemo-12b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thedrummer/unslopnemo-12b",
            "variant": "standard",
            "variant_permaslug": "thedrummer/unslopnemo-12b",
            "count": 450702,
            "total_completion_tokens": 75652110,
            "total_prompt_tokens": 1408710952,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "x-ai/grok-4.1-fast": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-4.1-fast",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-4.1-fast",
            "count": 47427569,
            "total_completion_tokens": 38002522893,
            "total_prompt_tokens": 271402744172,
            "total_native_tokens_reasoning": 27479133279,
            "num_media_prompt": 8396324,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 88719842273,
            "total_tool_calls": 4813231,
            "requests_with_tool_call_errors": 52286
        },
        "openai/gpt-4o-2024-05-13": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-2024-05-13",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-2024-05-13",
            "count": 39639,
            "total_completion_tokens": 11613112,
            "total_prompt_tokens": 39084844,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 849,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 731008,
            "total_tool_calls": 5314,
            "requests_with_tool_call_errors": 251
        },
        "nousresearch/hermes-2-pro-llama-3-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-2-pro-llama-3-8b",
            "variant": "standard",
            "variant_permaslug": "nousresearch/hermes-2-pro-llama-3-8b",
            "count": 97934,
            "total_completion_tokens": 5888875,
            "total_prompt_tokens": 59774444,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/voxtral-small-24b-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/voxtral-small-24b-2507",
            "variant": "standard",
            "variant_permaslug": "mistralai/voxtral-small-24b-2507",
            "count": 75705,
            "total_completion_tokens": 4766524,
            "total_prompt_tokens": 33785457,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 10673,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 628,
            "requests_with_tool_call_errors": 1
        },
        "google/gemma-3-27b-it:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-27b-it",
            "variant": "free",
            "variant_permaslug": "google/gemma-3-27b-it:free",
            "count": 726513,
            "total_completion_tokens": 569119463,
            "total_prompt_tokens": 3308238335,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 91438,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1334,
            "requests_with_tool_call_errors": 126
        },
        "ai21/jamba-large-1.7": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "ai21/jamba-large-1.7",
            "variant": "standard",
            "variant_permaslug": "ai21/jamba-large-1.7",
            "count": 10327,
            "total_completion_tokens": 4614615,
            "total_prompt_tokens": 34193371,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 28,
            "requests_with_tool_call_errors": 7
        },
        "inflection/inflection-3-productivity": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "inflection/inflection-3-productivity",
            "variant": "standard",
            "variant_permaslug": "inflection/inflection-3-productivity",
            "count": 2514,
            "total_completion_tokens": 519207,
            "total_prompt_tokens": 1525486,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "meta-llama/llama-guard-4-12b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-guard-4-12b",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-guard-4-12b",
            "count": 3002198,
            "total_completion_tokens": 11260246,
            "total_prompt_tokens": 1239841940,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1794,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/o1-pro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o1-pro",
            "variant": "standard",
            "variant_permaslug": "openai/o1-pro",
            "count": 1317,
            "total_completion_tokens": 1115072,
            "total_prompt_tokens": 2128699,
            "total_native_tokens_reasoning": 727296,
            "num_media_prompt": 181,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-4b-04-28:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-4b-04-28",
            "variant": "free",
            "variant_permaslug": "qwen/qwen3-4b-04-28:free",
            "count": 30271,
            "total_completion_tokens": 38967228,
            "total_prompt_tokens": 48283796,
            "total_native_tokens_reasoning": 33277948,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 455,
            "requests_with_tool_call_errors": 308
        },
        "neversleep/llama-3.1-lumimaid-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "neversleep/llama-3.1-lumimaid-8b",
            "variant": "standard",
            "variant_permaslug": "neversleep/llama-3.1-lumimaid-8b",
            "count": 47779,
            "total_completion_tokens": 6420163,
            "total_prompt_tokens": 100259159,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "minimax/minimax-m2-her-20260123": {
            "date": "2026-01-24 00:00:00",
            "model_permaslug": "minimax/minimax-m2-her-20260123",
            "variant": "standard",
            "variant_permaslug": "minimax/minimax-m2-her-20260123",
            "count": 40722,
            "total_completion_tokens": 11868646,
            "total_prompt_tokens": 120384653,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4o:extended": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o",
            "variant": "extended",
            "variant_permaslug": "openai/gpt-4o:extended",
            "count": 2052,
            "total_completion_tokens": 818727,
            "total_prompt_tokens": 14652854,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 100,
            "requests_with_tool_call_errors": 21
        },
        "qwen/qwen-vl-plus": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-vl-plus",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-vl-plus",
            "count": 41749,
            "total_completion_tokens": 3907581,
            "total_prompt_tokens": 66157285,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 35807,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "amazon/nova-premier-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "amazon/nova-premier-v1",
            "variant": "standard",
            "variant_permaslug": "amazon/nova-premier-v1",
            "count": 11532,
            "total_completion_tokens": 1430151,
            "total_prompt_tokens": 30905804,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 11744,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 293,
            "requests_with_tool_call_errors": 21
        },
        "x-ai/grok-3-mini": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-3-mini",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-3-mini",
            "count": 3810063,
            "total_completion_tokens": 3035518513,
            "total_prompt_tokens": 7221862269,
            "total_native_tokens_reasoning": 2458013955,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2064734279,
            "total_tool_calls": 64796,
            "requests_with_tool_call_errors": 21484
        },
        "openai/gpt-audio": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-audio",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-audio",
            "count": 1005,
            "total_completion_tokens": 536578,
            "total_prompt_tokens": 1395530,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 1011,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4.1-2025-04-14": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4.1-2025-04-14",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4.1-2025-04-14",
            "count": 7844751,
            "total_completion_tokens": 1306013515,
            "total_prompt_tokens": 31722949437,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 534024,
            "num_media_completion": 2,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 14270786560,
            "total_tool_calls": 752355,
            "requests_with_tool_call_errors": 5668
        },
        "inception/mercury": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "inception/mercury",
            "variant": "standard",
            "variant_permaslug": "inception/mercury",
            "count": 24524,
            "total_completion_tokens": 5079353,
            "total_prompt_tokens": 24509510,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 143,
            "requests_with_tool_call_errors": 20
        },
        "nvidia/llama-3.1-nemotron-70b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/llama-3.1-nemotron-70b-instruct",
            "variant": "standard",
            "variant_permaslug": "nvidia/llama-3.1-nemotron-70b-instruct",
            "count": 19588,
            "total_completion_tokens": 7099164,
            "total_prompt_tokens": 51722141,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 507,
            "requests_with_tool_call_errors": 228
        },
        "qwen/qwen3-vl-30b-a3b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-30b-a3b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-30b-a3b-instruct",
            "count": 1531426,
            "total_completion_tokens": 259572632,
            "total_prompt_tokens": 4500935545,
            "total_native_tokens_reasoning": 81,
            "num_media_prompt": 2125835,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 693451868,
            "total_tool_calls": 70104,
            "requests_with_tool_call_errors": 1227
        },
        "baidu/ernie-4.5-vl-28b-a3b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baidu/ernie-4.5-vl-28b-a3b",
            "variant": "standard",
            "variant_permaslug": "baidu/ernie-4.5-vl-28b-a3b",
            "count": 3540,
            "total_completion_tokens": 1793889,
            "total_prompt_tokens": 3050807,
            "total_native_tokens_reasoning": 39313,
            "num_media_prompt": 2055,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "microsoft/wizardlm-2-8x22b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "microsoft/wizardlm-2-8x22b",
            "variant": "standard",
            "variant_permaslug": "microsoft/wizardlm-2-8x22b",
            "count": 578837,
            "total_completion_tokens": 112454946,
            "total_prompt_tokens": 1147142220,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-v3.2-speciale-20251201": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-v3.2-speciale-20251201",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-v3.2-speciale-20251201",
            "count": 180829,
            "total_completion_tokens": 930417214,
            "total_prompt_tokens": 890055823,
            "total_native_tokens_reasoning": 864858200,
            "num_media_prompt": 127,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 242214592,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "alfredpros/codellama-7b-instruct-solidity": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "alfredpros/codellama-7b-instruct-solidity",
            "variant": "standard",
            "variant_permaslug": "alfredpros/codellama-7b-instruct-solidity",
            "count": 9786,
            "total_completion_tokens": 4178045,
            "total_prompt_tokens": 1819048,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "essentialai/rnj-1-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "essentialai/rnj-1-instruct",
            "variant": "standard",
            "variant_permaslug": "essentialai/rnj-1-instruct",
            "count": 11787,
            "total_completion_tokens": 1520226,
            "total_prompt_tokens": 12267248,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-oss-20b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-20b",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-oss-20b",
            "count": 19312303,
            "total_completion_tokens": 12715219060,
            "total_prompt_tokens": 42136401057,
            "total_native_tokens_reasoning": 10020222255,
            "num_media_prompt": 209,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 12706507541,
            "total_tool_calls": 383362,
            "requests_with_tool_call_errors": 76770
        },
        "minimax/minimax-m2.1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "minimax/minimax-m2.1",
            "variant": "standard",
            "variant_permaslug": "minimax/minimax-m2.1",
            "count": 3526547,
            "total_completion_tokens": 2435110684,
            "total_prompt_tokens": 116402426791,
            "total_native_tokens_reasoning": 1116173114,
            "num_media_prompt": 434,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 89048390158,
            "total_tool_calls": 2029625,
            "requests_with_tool_call_errors": 69110
        },
        "openai/gpt-4o-mini": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-mini",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-mini",
            "count": 60680673,
            "total_completion_tokens": 6360988566,
            "total_prompt_tokens": 138793367698,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1357134,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 34998984576,
            "total_tool_calls": 3056398,
            "requests_with_tool_call_errors": 110056
        },
        "openai/gpt-4o-2024-11-20": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-2024-11-20",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-2024-11-20",
            "count": 612052,
            "total_completion_tokens": 102512202,
            "total_prompt_tokens": 999436113,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 100897,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 206370176,
            "total_tool_calls": 15821,
            "requests_with_tool_call_errors": 377
        },
        "morph/morph-v3-large": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "morph/morph-v3-large",
            "variant": "standard",
            "variant_permaslug": "morph/morph-v3-large",
            "count": 102228,
            "total_completion_tokens": 432132667,
            "total_prompt_tokens": 489091349,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "moonshotai/kimi-k2-thinking-20251106": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "moonshotai/kimi-k2-thinking-20251106",
            "variant": "standard",
            "variant_permaslug": "moonshotai/kimi-k2-thinking-20251106",
            "count": 1396962,
            "total_completion_tokens": 2116423704,
            "total_prompt_tokens": 20993230600,
            "total_native_tokens_reasoning": 1653928358,
            "num_media_prompt": 3519,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 11084168483,
            "total_tool_calls": 482265,
            "requests_with_tool_call_errors": 9383
        },
        "nousresearch/deephermes-3-mistral-24b-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/deephermes-3-mistral-24b-preview",
            "variant": "standard",
            "variant_permaslug": "nousresearch/deephermes-3-mistral-24b-preview",
            "count": 4473,
            "total_completion_tokens": 942124,
            "total_prompt_tokens": 12119545,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2636638,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "meta-llama/llama-4-scout-17b-16e-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-4-scout-17b-16e-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-4-scout-17b-16e-instruct",
            "count": 4002437,
            "total_completion_tokens": 473428859,
            "total_prompt_tokens": 7644298987,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 2095725,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 8233,
            "requests_with_tool_call_errors": 117
        },
        "mistralai/mistral-nemo": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-nemo",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-nemo",
            "count": 25092923,
            "total_completion_tokens": 3172232567,
            "total_prompt_tokens": 73938925717,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1205,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3532856591,
            "total_tool_calls": 25369,
            "requests_with_tool_call_errors": 121
        },
        "arcee-ai/trinity-mini-20251201:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "arcee-ai/trinity-mini-20251201",
            "variant": "free",
            "variant_permaslug": "arcee-ai/trinity-mini-20251201:free",
            "count": 108476,
            "total_completion_tokens": 163583893,
            "total_prompt_tokens": 480310583,
            "total_native_tokens_reasoning": 124197785,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 4354,
            "requests_with_tool_call_errors": 1385
        },
        "google/gemini-2.5-flash-preview-09-2025": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-flash-preview-09-2025",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-flash-preview-09-2025",
            "count": 982226,
            "total_completion_tokens": 491908325,
            "total_prompt_tokens": 10463861887,
            "total_native_tokens_reasoning": 113833818,
            "num_media_prompt": 102932,
            "num_media_completion": 0,
            "num_audio_prompt": 375,
            "total_native_tokens_cached": 4625613140,
            "total_tool_calls": 99897,
            "requests_with_tool_call_errors": 3203
        },
        "qwen/qwen3-coder-480b-a35b-07-25:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-480b-a35b-07-25",
            "variant": "free",
            "variant_permaslug": "qwen/qwen3-coder-480b-a35b-07-25:free",
            "count": 149972,
            "total_completion_tokens": 88429107,
            "total_prompt_tokens": 4081024124,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 43797,
            "requests_with_tool_call_errors": 1491
        },
        "inflection/inflection-3-pi": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "inflection/inflection-3-pi",
            "variant": "standard",
            "variant_permaslug": "inflection/inflection-3-pi",
            "count": 22821,
            "total_completion_tokens": 555932,
            "total_prompt_tokens": 2391856,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "thedrummer/rocinante-12b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thedrummer/rocinante-12b",
            "variant": "standard",
            "variant_permaslug": "thedrummer/rocinante-12b",
            "count": 485782,
            "total_completion_tokens": 135881553,
            "total_prompt_tokens": 825514993,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "intfloat/multilingual-e5-large-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "intfloat/multilingual-e5-large-20251117",
            "variant": "standard",
            "variant_permaslug": "intfloat/multilingual-e5-large-20251117",
            "count": 1223709,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 351916702,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "morph/morph-v3-fast": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "morph/morph-v3-fast",
            "variant": "standard",
            "variant_permaslug": "morph/morph-v3-fast",
            "count": 9863,
            "total_completion_tokens": 47105360,
            "total_prompt_tokens": 47515524,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "liquid/lfm-2.5-1.2b-thinking-20260120:free": {
            "date": "2026-01-20 00:00:00",
            "model_permaslug": "liquid/lfm-2.5-1.2b-thinking-20260120",
            "variant": "free",
            "variant_permaslug": "liquid/lfm-2.5-1.2b-thinking-20260120:free",
            "count": 60889,
            "total_completion_tokens": 74178052,
            "total_prompt_tokens": 157185295,
            "total_native_tokens_reasoning": 67559769,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "tngtech/deepseek-r1t2-chimera": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/deepseek-r1t2-chimera",
            "variant": "standard",
            "variant_permaslug": "tngtech/deepseek-r1t2-chimera",
            "count": 914190,
            "total_completion_tokens": 436390509,
            "total_prompt_tokens": 4558361985,
            "total_native_tokens_reasoning": 648503925,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 513858944,
            "total_tool_calls": 241,
            "requests_with_tool_call_errors": 5
        },
        "deepseek/deepseek-v3.1-terminus": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-v3.1-terminus",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-v3.1-terminus",
            "count": 2407143,
            "total_completion_tokens": 1226306945,
            "total_prompt_tokens": 12330540601,
            "total_native_tokens_reasoning": 456697957,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 875479848,
            "total_tool_calls": 95994,
            "requests_with_tool_call_errors": 3228
        },
        "x-ai/grok-3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-3",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-3",
            "count": 410928,
            "total_completion_tokens": 145880736,
            "total_prompt_tokens": 1430128861,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 283069230,
            "total_tool_calls": 6474,
            "requests_with_tool_call_errors": 23
        },
        "amazon/nova-micro-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "amazon/nova-micro-v1",
            "variant": "standard",
            "variant_permaslug": "amazon/nova-micro-v1",
            "count": 1631001,
            "total_completion_tokens": 406537118,
            "total_prompt_tokens": 4269168968,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 378,
            "requests_with_tool_call_errors": 46
        },
        "perplexity/sonar-deep-research": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "perplexity/sonar-deep-research",
            "variant": "standard",
            "variant_permaslug": "perplexity/sonar-deep-research",
            "count": 13917,
            "total_completion_tokens": 3419854140,
            "total_prompt_tokens": 52769030,
            "total_native_tokens_reasoning": 3336125169,
            "num_media_prompt": 55,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-2.5-flash": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-flash",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-flash",
            "count": 115785936,
            "total_completion_tokens": 32611605879,
            "total_prompt_tokens": 373321024571,
            "total_native_tokens_reasoning": 4462350310,
            "num_media_prompt": 23460483,
            "num_media_completion": 0,
            "num_audio_prompt": 228520,
            "total_native_tokens_cached": 95919357244,
            "total_tool_calls": 10388484,
            "requests_with_tool_call_errors": 197257
        },
        "allenai/olmo-3-7b-instruct-20251121": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/olmo-3-7b-instruct-20251121",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-3-7b-instruct-20251121",
            "count": 31889,
            "total_completion_tokens": 4109996,
            "total_prompt_tokens": 34795445,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5825520,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "meta-llama/llama-3.2-1b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.2-1b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.2-1b-instruct",
            "count": 75992,
            "total_completion_tokens": 48745808,
            "total_prompt_tokens": 32523389,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sao10k/l3.1-70b-hanami-x1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sao10k/l3.1-70b-hanami-x1",
            "variant": "standard",
            "variant_permaslug": "sao10k/l3.1-70b-hanami-x1",
            "count": 3046,
            "total_completion_tokens": 781790,
            "total_prompt_tokens": 3683174,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-3n-e4b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3n-e4b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-3n-e4b-it",
            "count": 1548728,
            "total_completion_tokens": 96473759,
            "total_prompt_tokens": 418274605,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 11,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-coder-plus": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-plus",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-coder-plus",
            "count": 41916,
            "total_completion_tokens": 14190066,
            "total_prompt_tokens": 523823636,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 12076,
            "requests_with_tool_call_errors": 571
        },
        "inception/mercury-coder-small-beta": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "inception/mercury-coder-small-beta",
            "variant": "standard",
            "variant_permaslug": "inception/mercury-coder-small-beta",
            "count": 12809,
            "total_completion_tokens": 18097310,
            "total_prompt_tokens": 44407937,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 341,
            "requests_with_tool_call_errors": 83
        },
        "opengvlab/internvl3-78b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "opengvlab/internvl3-78b",
            "variant": "standard",
            "variant_permaslug": "opengvlab/internvl3-78b",
            "count": 439907,
            "total_completion_tokens": 11242917,
            "total_prompt_tokens": 237294717,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 43777,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 90987104,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthropic/claude-4-sonnet-20250522": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4-sonnet-20250522",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4-sonnet-20250522",
            "count": 4473746,
            "total_completion_tokens": 2981170223,
            "total_prompt_tokens": 48009673174,
            "total_native_tokens_reasoning": 49199513,
            "num_media_prompt": 383372,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 22743990787,
            "total_tool_calls": 725864,
            "requests_with_tool_call_errors": 17083
        },
        "meta-llama/llama-3.1-8b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.1-8b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.1-8b-instruct",
            "count": 32859297,
            "total_completion_tokens": 2367797022,
            "total_prompt_tokens": 26505562786,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 48,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 6979016576,
            "total_tool_calls": 738993,
            "requests_with_tool_call_errors": 7838
        },
        "cohere/command-a-03-2025": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "cohere/command-a-03-2025",
            "variant": "standard",
            "variant_permaslug": "cohere/command-a-03-2025",
            "count": 9318,
            "total_completion_tokens": 2341154,
            "total_prompt_tokens": 13450745,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-3.5-turbo-0613": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-3.5-turbo-0613",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-3.5-turbo-0613",
            "count": 71223,
            "total_completion_tokens": 17493137,
            "total_prompt_tokens": 20673462,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 229248,
            "total_tool_calls": 62,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-2.0-flash-exp:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.0-flash-exp",
            "variant": "free",
            "variant_permaslug": "google/gemini-2.0-flash-exp:free",
            "count": 182702,
            "total_completion_tokens": 78877919,
            "total_prompt_tokens": 1294295802,
            "total_native_tokens_reasoning": 1,
            "num_media_prompt": 64243,
            "num_media_completion": 541,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 6257,
            "requests_with_tool_call_errors": 605
        },
        "qwen/qwen2.5-vl-72b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen2.5-vl-72b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen2.5-vl-72b-instruct",
            "count": 1106859,
            "total_completion_tokens": 139119314,
            "total_prompt_tokens": 2674424670,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1311297,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 207595840,
            "total_tool_calls": 90,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-small-3.1-24b-instruct-2503:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
            "variant": "free",
            "variant_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503:free",
            "count": 45848,
            "total_completion_tokens": 21706501,
            "total_prompt_tokens": 149500868,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 787,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 205,
            "requests_with_tool_call_errors": 205
        },
        "mistralai/mistral-medium-3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-medium-3",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-medium-3",
            "count": 68864,
            "total_completion_tokens": 53579248,
            "total_prompt_tokens": 722558562,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 925,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 501,
            "requests_with_tool_call_errors": 23
        },
        "openai/gpt-4-turbo": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4-turbo",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4-turbo",
            "count": 62782,
            "total_completion_tokens": 15096715,
            "total_prompt_tokens": 148424003,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 24741,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 3647,
            "requests_with_tool_call_errors": 204
        },
        "qwen/qwen3-vl-32b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-32b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-32b-instruct",
            "count": 146066,
            "total_completion_tokens": 114466340,
            "total_prompt_tokens": 354130396,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 166599,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-v3.2-exp": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-v3.2-exp",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-v3.2-exp",
            "count": 3610632,
            "total_completion_tokens": 1640237768,
            "total_prompt_tokens": 19119441936,
            "total_native_tokens_reasoning": 496727268,
            "num_media_prompt": 2422,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 740679616,
            "total_tool_calls": 537819,
            "requests_with_tool_call_errors": 7073
        },
        "openai/gpt-5.2-pro-20251211": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.2-pro-20251211",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.2-pro-20251211",
            "count": 111026,
            "total_completion_tokens": 212193122,
            "total_prompt_tokens": 2062310256,
            "total_native_tokens_reasoning": 144353142,
            "num_media_prompt": 51709,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 13346,
            "requests_with_tool_call_errors": 234
        },
        "z-ai/glm-4.5": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.5",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.5",
            "count": 483671,
            "total_completion_tokens": 494396061,
            "total_prompt_tokens": 4495392820,
            "total_native_tokens_reasoning": 382434383,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3261340260,
            "total_tool_calls": 186815,
            "requests_with_tool_call_errors": 56210
        },
        "minimax/minimax-m2": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "minimax/minimax-m2",
            "variant": "standard",
            "variant_permaslug": "minimax/minimax-m2",
            "count": 569359,
            "total_completion_tokens": 288164974,
            "total_prompt_tokens": 13223292344,
            "total_native_tokens_reasoning": 204961516,
            "num_media_prompt": 320,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5209906073,
            "total_tool_calls": 299239,
            "requests_with_tool_call_errors": 17438
        },
        "thedrummer/cydonia-24b-v4.1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thedrummer/cydonia-24b-v4.1",
            "variant": "standard",
            "variant_permaslug": "thedrummer/cydonia-24b-v4.1",
            "count": 178970,
            "total_completion_tokens": 48528779,
            "total_prompt_tokens": 974524827,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 637825792,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-tiny": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-tiny",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-tiny",
            "count": 3166286,
            "total_completion_tokens": 44993440,
            "total_prompt_tokens": 1478147544,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-embedding-4b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-embedding-4b",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-embedding-4b",
            "count": 3065377,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 1333957295,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-small-creative-20251216": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-small-creative-20251216",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-small-creative-20251216",
            "count": 771570,
            "total_completion_tokens": 321148319,
            "total_prompt_tokens": 3750591514,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 14750,
            "requests_with_tool_call_errors": 1151
        },
        "openai/gpt-oss-120b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-120b",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-oss-120b",
            "count": 61918702,
            "total_completion_tokens": 32739021051,
            "total_prompt_tokens": 243369618486,
            "total_native_tokens_reasoning": 13933748855,
            "num_media_prompt": 2192,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 41773390730,
            "total_tool_calls": 978567,
            "requests_with_tool_call_errors": 93678
        },
        "openai/gpt-5-image": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-image",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-image",
            "count": 14952,
            "total_completion_tokens": 63900324,
            "total_prompt_tokens": 51058716,
            "total_native_tokens_reasoning": 20173151,
            "num_media_prompt": 16762,
            "num_media_completion": 8705,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 4415744,
            "total_tool_calls": 92,
            "requests_with_tool_call_errors": 1
        },
        "anthropic/claude-4.1-opus-20250805": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4.1-opus-20250805",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4.1-opus-20250805",
            "count": 104379,
            "total_completion_tokens": 59742156,
            "total_prompt_tokens": 1226252147,
            "total_native_tokens_reasoning": 7069461,
            "num_media_prompt": 11178,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 327534743,
            "total_tool_calls": 10941,
            "requests_with_tool_call_errors": 165
        },
        "z-ai/glm-4.5-air:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.5-air",
            "variant": "free",
            "variant_permaslug": "z-ai/glm-4.5-air:free",
            "count": 1773597,
            "total_completion_tokens": 1511322639,
            "total_prompt_tokens": 21983748101,
            "total_native_tokens_reasoning": 763641378,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 11929038042,
            "total_tool_calls": 256023,
            "requests_with_tool_call_errors": 22197
        },
        "google/gemini-3-flash-preview-20251217": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-3-flash-preview-20251217",
            "variant": "standard",
            "variant_permaslug": "google/gemini-3-flash-preview-20251217",
            "count": 74003236,
            "total_completion_tokens": 33872964299,
            "total_prompt_tokens": 557730950089,
            "total_native_tokens_reasoning": 7798049552,
            "num_media_prompt": 18896703,
            "num_media_completion": 0,
            "num_audio_prompt": 419881,
            "total_native_tokens_cached": 231981520427,
            "total_tool_calls": 14944012,
            "requests_with_tool_call_errors": 254550
        },
        "undi95/remm-slerp-l2-13b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "undi95/remm-slerp-l2-13b",
            "variant": "standard",
            "variant_permaslug": "undi95/remm-slerp-l2-13b",
            "count": 182287,
            "total_completion_tokens": 18421400,
            "total_prompt_tokens": 272887760,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "relace/relace-search-20251208": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "relace/relace-search-20251208",
            "variant": "standard",
            "variant_permaslug": "relace/relace-search-20251208",
            "count": 24404,
            "total_completion_tokens": 1409292,
            "total_prompt_tokens": 14521163,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 376,
            "requests_with_tool_call_errors": 10
        },
        "openai/gpt-5-image-mini": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-image-mini",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-image-mini",
            "count": 54241,
            "total_completion_tokens": 125008706,
            "total_prompt_tokens": 112078812,
            "total_native_tokens_reasoning": 46416933,
            "num_media_prompt": 39835,
            "num_media_completion": 14279,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 6076544,
            "total_tool_calls": 59,
            "requests_with_tool_call_errors": 3
        },
        "deepseek/deepseek-v3.1-terminus:exacto": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-v3.1-terminus",
            "variant": "exacto",
            "variant_permaslug": "deepseek/deepseek-v3.1-terminus:exacto",
            "count": 276181,
            "total_completion_tokens": 140441832,
            "total_prompt_tokens": 2646441579,
            "total_native_tokens_reasoning": 22626243,
            "num_media_prompt": 26,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 89932428,
            "total_tool_calls": 36181,
            "requests_with_tool_call_errors": 1571
        },
        "openai/gpt-5.2-20251211": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.2-20251211",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.2-20251211",
            "count": 7661946,
            "total_completion_tokens": 7080958767,
            "total_prompt_tokens": 96972656070,
            "total_native_tokens_reasoning": 4026126811,
            "num_media_prompt": 1321717,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 54688884864,
            "total_tool_calls": 2093266,
            "requests_with_tool_call_errors": 10048
        },
        "writer/palmyra-x5-20250428": {
            "date": "2026-01-21 00:00:00",
            "model_permaslug": "writer/palmyra-x5-20250428",
            "variant": "standard",
            "variant_permaslug": "writer/palmyra-x5-20250428",
            "count": 22260,
            "total_completion_tokens": 13458218,
            "total_prompt_tokens": 214539884,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4-32b-0414": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4-32b-0414",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4-32b-0414",
            "count": 16399297,
            "total_completion_tokens": 125023141,
            "total_prompt_tokens": 5542380209,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 49,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 9904,
            "requests_with_tool_call_errors": 18
        },
        "sourceful/riverflow-v2-max-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sourceful/riverflow-v2-max-preview",
            "variant": "standard",
            "variant_permaslug": "sourceful/riverflow-v2-max-preview",
            "count": 2805,
            "total_completion_tokens": 11710875,
            "total_prompt_tokens": 8019702,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 3141,
            "num_media_completion": 2805,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/devstral-2512": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/devstral-2512",
            "variant": "standard",
            "variant_permaslug": "mistralai/devstral-2512",
            "count": 341621,
            "total_completion_tokens": 102754367,
            "total_prompt_tokens": 3451339635,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2705307824,
            "total_tool_calls": 14494,
            "requests_with_tool_call_errors": 383
        },
        "anthropic/claude-3-haiku": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-3-haiku",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-3-haiku",
            "count": 1830991,
            "total_completion_tokens": 378758962,
            "total_prompt_tokens": 2429285955,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 41423,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 112997293,
            "total_tool_calls": 137916,
            "requests_with_tool_call_errors": 3247
        },
        "nvidia/nemotron-nano-12b-v2-vl:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-nano-12b-v2-vl",
            "variant": "free",
            "variant_permaslug": "nvidia/nemotron-nano-12b-v2-vl:free",
            "count": 89427,
            "total_completion_tokens": 109140367,
            "total_prompt_tokens": 352717588,
            "total_native_tokens_reasoning": 81088126,
            "num_media_prompt": 49683,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1198,
            "requests_with_tool_call_errors": 569
        },
        "bytedance-seed/seed-1.6-20250625": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "bytedance-seed/seed-1.6-20250625",
            "variant": "standard",
            "variant_permaslug": "bytedance-seed/seed-1.6-20250625",
            "count": 1953211,
            "total_completion_tokens": 758325790,
            "total_prompt_tokens": 9583367290,
            "total_native_tokens_reasoning": 529830307,
            "num_media_prompt": 1898597,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2713,
            "requests_with_tool_call_errors": 80
        },
        "openai/gpt-3.5-turbo": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-3.5-turbo",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-3.5-turbo",
            "count": 674562,
            "total_completion_tokens": 103912194,
            "total_prompt_tokens": 472478631,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 16655,
            "requests_with_tool_call_errors": 929
        },
        "tngtech/deepseek-r1t-chimera:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/deepseek-r1t-chimera",
            "variant": "free",
            "variant_permaslug": "tngtech/deepseek-r1t-chimera:free",
            "count": 2216079,
            "total_completion_tokens": 1296023240,
            "total_prompt_tokens": 24526317860,
            "total_native_tokens_reasoning": 25951771,
            "num_media_prompt": 99,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5155309829,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen-2.5-7b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-2.5-7b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-2.5-7b-instruct",
            "count": 5445718,
            "total_completion_tokens": 845301347,
            "total_prompt_tokens": 5055046507,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1143,
            "requests_with_tool_call_errors": 187
        },
        "openai/gpt-5-2025-08-07": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-2025-08-07",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-2025-08-07",
            "count": 2830941,
            "total_completion_tokens": 3818817390,
            "total_prompt_tokens": 27987719813,
            "total_native_tokens_reasoning": 3052967172,
            "num_media_prompt": 7145576,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 13494982272,
            "total_tool_calls": 670869,
            "requests_with_tool_call_errors": 3925
        },
        "qwen/qwen3-coder-30b-a3b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-coder-30b-a3b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-coder-30b-a3b-instruct",
            "count": 698464,
            "total_completion_tokens": 231072212,
            "total_prompt_tokens": 3614654628,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 196460,
            "requests_with_tool_call_errors": 71456
        },
        "qwen/qwen-2.5-72b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-2.5-72b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-2.5-72b-instruct",
            "count": 2513332,
            "total_completion_tokens": 202680254,
            "total_prompt_tokens": 2512435745,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 4,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 57271519,
            "total_tool_calls": 26022,
            "requests_with_tool_call_errors": 463
        },
        "meta-llama/llama-3.2-3b-instruct:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.2-3b-instruct",
            "variant": "free",
            "variant_permaslug": "meta-llama/llama-3.2-3b-instruct:free",
            "count": 75948,
            "total_completion_tokens": 16885186,
            "total_prompt_tokens": 72099472,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4.1-mini-2025-04-14": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4.1-mini-2025-04-14",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4.1-mini-2025-04-14",
            "count": 24327807,
            "total_completion_tokens": 4068177973,
            "total_prompt_tokens": 50078864170,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 2969440,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 12610175616,
            "total_tool_calls": 2294321,
            "requests_with_tool_call_errors": 12164
        },
        "meta-llama/llama-guard-2-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-guard-2-8b",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-guard-2-8b",
            "count": 56266,
            "total_completion_tokens": 96360,
            "total_prompt_tokens": 771577,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "eleutherai/llemma_7b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "eleutherai/llemma_7b",
            "variant": "standard",
            "variant_permaslug": "eleutherai/llemma_7b",
            "count": 1033,
            "total_completion_tokens": 1468344,
            "total_prompt_tokens": 493084,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/o1-2024-12-17": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o1-2024-12-17",
            "variant": "standard",
            "variant_permaslug": "openai/o1-2024-12-17",
            "count": 7565,
            "total_completion_tokens": 19949444,
            "total_prompt_tokens": 108413923,
            "total_native_tokens_reasoning": 16314752,
            "num_media_prompt": 585,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 73294720,
            "total_tool_calls": 224,
            "requests_with_tool_call_errors": 0
        },
        "nousresearch/hermes-4-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-4-70b",
            "variant": "standard",
            "variant_permaslug": "nousresearch/hermes-4-70b",
            "count": 307624,
            "total_completion_tokens": 55744604,
            "total_prompt_tokens": 1379930871,
            "total_native_tokens_reasoning": 984015,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 139212784,
            "total_tool_calls": 422,
            "requests_with_tool_call_errors": 4
        },
        "qwen/qwen-plus-2025-07-28:thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-plus-2025-07-28",
            "variant": "thinking",
            "variant_permaslug": "qwen/qwen-plus-2025-07-28:thinking",
            "count": 3125,
            "total_completion_tokens": 5867030,
            "total_prompt_tokens": 19394762,
            "total_native_tokens_reasoning": 4300735,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 390,
            "requests_with_tool_call_errors": 2
        },
        "bytedance-seed/seed-1.6-flash-20250625": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "bytedance-seed/seed-1.6-flash-20250625",
            "variant": "standard",
            "variant_permaslug": "bytedance-seed/seed-1.6-flash-20250625",
            "count": 232087,
            "total_completion_tokens": 243753976,
            "total_prompt_tokens": 662542096,
            "total_native_tokens_reasoning": 183485749,
            "num_media_prompt": 145834,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 5248,
            "requests_with_tool_call_errors": 464
        },
        "meta-llama/llama-3.3-70b-instruct:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.3-70b-instruct",
            "variant": "free",
            "variant_permaslug": "meta-llama/llama-3.3-70b-instruct:free",
            "count": 1060390,
            "total_completion_tokens": 518883679,
            "total_prompt_tokens": 3896419811,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 11,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 9431,
            "requests_with_tool_call_errors": 3658
        },
        "intfloat/e5-base-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "intfloat/e5-base-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "intfloat/e5-base-v2-20251117",
            "count": 21742,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 120121303,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "alibaba/tongyi-deepresearch-30b-a3b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "alibaba/tongyi-deepresearch-30b-a3b",
            "variant": "standard",
            "variant_permaslug": "alibaba/tongyi-deepresearch-30b-a3b",
            "count": 236834,
            "total_completion_tokens": 159388547,
            "total_prompt_tokens": 2997498734,
            "total_native_tokens_reasoning": 120512990,
            "num_media_prompt": 173,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1932252627,
            "total_tool_calls": 4531,
            "requests_with_tool_call_errors": 1278
        },
        "openai/o4-mini-2025-04-16": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o4-mini-2025-04-16",
            "variant": "standard",
            "variant_permaslug": "openai/o4-mini-2025-04-16",
            "count": 327193,
            "total_completion_tokens": 318907346,
            "total_prompt_tokens": 1421212071,
            "total_native_tokens_reasoning": 258876792,
            "num_media_prompt": 107216,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 508844672,
            "total_tool_calls": 28437,
            "requests_with_tool_call_errors": 13
        },
        "baai/bge-m3-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baai/bge-m3-20251117",
            "variant": "standard",
            "variant_permaslug": "baai/bge-m3-20251117",
            "count": 2023152,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 2243444441,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sentence-transformers/all-minilm-l6-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sentence-transformers/all-minilm-l6-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "sentence-transformers/all-minilm-l6-v2-20251117",
            "count": 1034419,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 510912366,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "intfloat/e5-large-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "intfloat/e5-large-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "intfloat/e5-large-v2-20251117",
            "count": 87715,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 173189236,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-max": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-max",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-max",
            "count": 267185,
            "total_completion_tokens": 99759200,
            "total_prompt_tokens": 1672265257,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 155,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 45959,
            "requests_with_tool_call_errors": 949
        },
        "liquid/lfm-2.2-6b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "liquid/lfm-2.2-6b",
            "variant": "standard",
            "variant_permaslug": "liquid/lfm-2.2-6b",
            "count": 570850,
            "total_completion_tokens": 24984489,
            "total_prompt_tokens": 129744763,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-oss-20b:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-20b",
            "variant": "free",
            "variant_permaslug": "openai/gpt-oss-20b:free",
            "count": 145945,
            "total_completion_tokens": 147121633,
            "total_prompt_tokens": 651986603,
            "total_native_tokens_reasoning": 117888105,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 11581,
            "requests_with_tool_call_errors": 1157
        },
        "google/gemini-3-pro-image-preview-20251120": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-3-pro-image-preview-20251120",
            "variant": "standard",
            "variant_permaslug": "google/gemini-3-pro-image-preview-20251120",
            "count": 2037408,
            "total_completion_tokens": 2871158702,
            "total_prompt_tokens": 2794742882,
            "total_native_tokens_reasoning": 633048425,
            "num_media_prompt": 2690156,
            "num_media_completion": 2415325,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 14718890,
            "total_tool_calls": 214,
            "requests_with_tool_call_errors": 214
        },
        "nvidia/llama-3.3-nemotron-super-49b-v1.5": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
            "variant": "standard",
            "variant_permaslug": "nvidia/llama-3.3-nemotron-super-49b-v1.5",
            "count": 74333,
            "total_completion_tokens": 77139766,
            "total_prompt_tokens": 524614552,
            "total_native_tokens_reasoning": 70163431,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2306,
            "requests_with_tool_call_errors": 51
        },
        "qwen/qwen3-30b-a3b-instruct-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-30b-a3b-instruct-2507",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-30b-a3b-instruct-2507",
            "count": 2063244,
            "total_completion_tokens": 834251470,
            "total_prompt_tokens": 7368588974,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1224026004,
            "total_tool_calls": 30764,
            "requests_with_tool_call_errors": 2349
        },
        "allenai/molmo-2-8b-20260109:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/molmo-2-8b-20260109",
            "variant": "free",
            "variant_permaslug": "allenai/molmo-2-8b-20260109:free",
            "count": 127448,
            "total_completion_tokens": 37719244,
            "total_prompt_tokens": 289344552,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 45806,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-235b-a22b-thinking-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-235b-a22b-thinking-2507",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-235b-a22b-thinking-2507",
            "count": 574641,
            "total_completion_tokens": 810562842,
            "total_prompt_tokens": 2424528103,
            "total_native_tokens_reasoning": 656760281,
            "num_media_prompt": 15,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 449322789,
            "total_tool_calls": 73531,
            "requests_with_tool_call_errors": 16746
        },
        "mistralai/mistral-large-2512": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-large-2512",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-large-2512",
            "count": 1184978,
            "total_completion_tokens": 334998151,
            "total_prompt_tokens": 3961659617,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 91815,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 171074,
            "requests_with_tool_call_errors": 1924
        },
        "openai/o3-mini-2025-01-31": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o3-mini-2025-01-31",
            "variant": "standard",
            "variant_permaslug": "openai/o3-mini-2025-01-31",
            "count": 308328,
            "total_completion_tokens": 478951917,
            "total_prompt_tokens": 914607310,
            "total_native_tokens_reasoning": 353225920,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 323890048,
            "total_tool_calls": 2383,
            "requests_with_tool_call_errors": 41
        },
        "cohere/command-r7b-12-2024": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "cohere/command-r7b-12-2024",
            "variant": "standard",
            "variant_permaslug": "cohere/command-r7b-12-2024",
            "count": 1803098,
            "total_completion_tokens": 193474379,
            "total_prompt_tokens": 8891742751,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "allenai/olmo-3.1-32b-think-20251215": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/olmo-3.1-32b-think-20251215",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-3.1-32b-think-20251215",
            "count": 45650,
            "total_completion_tokens": 150533469,
            "total_prompt_tokens": 255774740,
            "total_native_tokens_reasoning": 131134929,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 52961424,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "z-ai/glm-4.6": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.6",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.6",
            "count": 2197581,
            "total_completion_tokens": 1222724976,
            "total_prompt_tokens": 21446182073,
            "total_native_tokens_reasoning": 577591342,
            "num_media_prompt": 619,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 9314347785,
            "total_tool_calls": 278257,
            "requests_with_tool_call_errors": 46725
        },
        "tngtech/deepseek-r1t-chimera": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/deepseek-r1t-chimera",
            "variant": "standard",
            "variant_permaslug": "tngtech/deepseek-r1t-chimera",
            "count": 263909,
            "total_completion_tokens": 35306418,
            "total_prompt_tokens": 1622203375,
            "total_native_tokens_reasoning": 63773,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 345665658,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-3-4b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-4b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-3-4b-it",
            "count": 24773822,
            "total_completion_tokens": 751915995,
            "total_prompt_tokens": 1675871487,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 73222,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 262326656,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nvidia/nemotron-nano-12b-v2-vl": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-nano-12b-v2-vl",
            "variant": "standard",
            "variant_permaslug": "nvidia/nemotron-nano-12b-v2-vl",
            "count": 18716,
            "total_completion_tokens": 12551625,
            "total_prompt_tokens": 44388396,
            "total_native_tokens_reasoning": 10692719,
            "num_media_prompt": 15800,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepseek/deepseek-r1-0528:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-r1-0528",
            "variant": "free",
            "variant_permaslug": "deepseek/deepseek-r1-0528:free",
            "count": 1846716,
            "total_completion_tokens": 1452388540,
            "total_prompt_tokens": 12305184584,
            "total_native_tokens_reasoning": 984705588,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3506951461,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-7b-instruct-v0.2": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-7b-instruct-v0.2",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-7b-instruct-v0.2",
            "count": 150723,
            "total_completion_tokens": 6322315,
            "total_prompt_tokens": 35927934,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "tngtech/deepseek-r1t2-chimera:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/deepseek-r1t2-chimera",
            "variant": "free",
            "variant_permaslug": "tngtech/deepseek-r1t2-chimera:free",
            "count": 9630252,
            "total_completion_tokens": 8662919705,
            "total_prompt_tokens": 91499670433,
            "total_native_tokens_reasoning": 4908855415,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 10961445632,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5.2-chat-20251211": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.2-chat-20251211",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.2-chat-20251211",
            "count": 1781502,
            "total_completion_tokens": 533931783,
            "total_prompt_tokens": 7823169333,
            "total_native_tokens_reasoning": 126747456,
            "num_media_prompt": 662583,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3667900288,
            "total_tool_calls": 70523,
            "requests_with_tool_call_errors": 1272
        },
        "sentence-transformers/multi-qa-mpnet-base-dot-v1-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sentence-transformers/multi-qa-mpnet-base-dot-v1-20251117",
            "variant": "standard",
            "variant_permaslug": "sentence-transformers/multi-qa-mpnet-base-dot-v1-20251117",
            "count": 34496,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 64365618,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-large": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-large",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-large",
            "count": 109155,
            "total_completion_tokens": 25331326,
            "total_prompt_tokens": 448581208,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 2442,
            "requests_with_tool_call_errors": 28
        },
        "qwen/qwen3-8b-04-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-8b-04-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-8b-04-28",
            "count": 1083088,
            "total_completion_tokens": 1302577216,
            "total_prompt_tokens": 1510351462,
            "total_native_tokens_reasoning": 1130728655,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 366149808,
            "total_tool_calls": 10884,
            "requests_with_tool_call_errors": 225
        },
        "tngtech/tng-r1t-chimera:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "tngtech/tng-r1t-chimera",
            "variant": "free",
            "variant_permaslug": "tngtech/tng-r1t-chimera:free",
            "count": 727919,
            "total_completion_tokens": 571752368,
            "total_prompt_tokens": 7849838046,
            "total_native_tokens_reasoning": 351126255,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1461032576,
            "total_tool_calls": 5974,
            "requests_with_tool_call_errors": 355
        },
        "liquid/lfm2-8b-a1b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "liquid/lfm2-8b-a1b",
            "variant": "standard",
            "variant_permaslug": "liquid/lfm2-8b-a1b",
            "count": 66606,
            "total_completion_tokens": 6376575,
            "total_prompt_tokens": 48372223,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "x-ai/grok-4-07-09": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-4-07-09",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-4-07-09",
            "count": 692491,
            "total_completion_tokens": 1156269714,
            "total_prompt_tokens": 4570323962,
            "total_native_tokens_reasoning": 837979893,
            "num_media_prompt": 200193,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2163902788,
            "total_tool_calls": 73817,
            "requests_with_tool_call_errors": 2060
        },
        "google/gemma-3-4b-it:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-4b-it",
            "variant": "free",
            "variant_permaslug": "google/gemma-3-4b-it:free",
            "count": 54683,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 48827034,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 57435,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sao10k/l3-lunaris-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sao10k/l3-lunaris-8b",
            "variant": "standard",
            "variant_permaslug": "sao10k/l3-lunaris-8b",
            "count": 2450856,
            "total_completion_tokens": 516022859,
            "total_prompt_tokens": 6360572820,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "venice/uncensored:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "venice/uncensored",
            "variant": "free",
            "variant_permaslug": "venice/uncensored:free",
            "count": 143030,
            "total_completion_tokens": 59610815,
            "total_prompt_tokens": 380872557,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "perplexity/sonar-reasoning-pro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "perplexity/sonar-reasoning-pro",
            "variant": "standard",
            "variant_permaslug": "perplexity/sonar-reasoning-pro",
            "count": 37766,
            "total_completion_tokens": 42295554,
            "total_prompt_tokens": 106684128,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 787,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-embedding-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-embedding-8b",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-embedding-8b",
            "count": 13466551,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 21635509665,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthracite-org/magnum-v4-72b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthracite-org/magnum-v4-72b",
            "variant": "standard",
            "variant_permaslug": "anthracite-org/magnum-v4-72b",
            "count": 21113,
            "total_completion_tokens": 3540860,
            "total_prompt_tokens": 45799893,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-vl-30b-a3b-thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-30b-a3b-thinking",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-30b-a3b-thinking",
            "count": 21696,
            "total_completion_tokens": 50113408,
            "total_prompt_tokens": 74105043,
            "total_native_tokens_reasoning": 42125107,
            "num_media_prompt": 23614,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1510,
            "requests_with_tool_call_errors": 128
        },
        "mistralai/mistral-small-24b-instruct-2501": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-small-24b-instruct-2501",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-small-24b-instruct-2501",
            "count": 6960859,
            "total_completion_tokens": 1225370908,
            "total_prompt_tokens": 14255863011,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 59745005,
            "total_tool_calls": 1131,
            "requests_with_tool_call_errors": 159
        },
        "z-ai/glm-4.6:exacto": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.6",
            "variant": "exacto",
            "variant_permaslug": "z-ai/glm-4.6:exacto",
            "count": 46944,
            "total_completion_tokens": 24832165,
            "total_prompt_tokens": 601696080,
            "total_native_tokens_reasoning": 15036207,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 289442169,
            "total_tool_calls": 15527,
            "requests_with_tool_call_errors": 4019
        },
        "alpindale/goliath-120b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "alpindale/goliath-120b",
            "variant": "standard",
            "variant_permaslug": "alpindale/goliath-120b",
            "count": 3858,
            "total_completion_tokens": 1106171,
            "total_prompt_tokens": 3636492,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 2,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/pixtral-12b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/pixtral-12b",
            "variant": "standard",
            "variant_permaslug": "mistralai/pixtral-12b",
            "count": 132130,
            "total_completion_tokens": 9452448,
            "total_prompt_tokens": 65159498,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 58379,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 57,
            "requests_with_tool_call_errors": 8
        },
        "qwen/qwen3-vl-8b-thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-8b-thinking",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-8b-thinking",
            "count": 9516,
            "total_completion_tokens": 46908484,
            "total_prompt_tokens": 47136515,
            "total_native_tokens_reasoning": 43226360,
            "num_media_prompt": 19536,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 178,
            "requests_with_tool_call_errors": 39
        },
        "openai/gpt-5.1-codex-mini-20251113": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.1-codex-mini-20251113",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.1-codex-mini-20251113",
            "count": 186557,
            "total_completion_tokens": 164996341,
            "total_prompt_tokens": 4691133466,
            "total_native_tokens_reasoning": 123890587,
            "num_media_prompt": 19093,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3905151488,
            "total_tool_calls": 77815,
            "requests_with_tool_call_errors": 430
        },
        "meta-llama/llama-3.1-405b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.1-405b",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.1-405b",
            "count": 10499,
            "total_completion_tokens": 3652834,
            "total_prompt_tokens": 56848,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nousresearch/hermes-3-llama-3.1-405b:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-3-llama-3.1-405b",
            "variant": "free",
            "variant_permaslug": "nousresearch/hermes-3-llama-3.1-405b:free",
            "count": 60782,
            "total_completion_tokens": 11984095,
            "total_prompt_tokens": 312277154,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-medium-3.1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-medium-3.1",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-medium-3.1",
            "count": 390184,
            "total_completion_tokens": 184880154,
            "total_prompt_tokens": 3874645996,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 20110,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 17651,
            "requests_with_tool_call_errors": 1506
        },
        "google/gemini-2.0-flash-001": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.0-flash-001",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.0-flash-001",
            "count": 136992641,
            "total_completion_tokens": 17924314182,
            "total_prompt_tokens": 158559212770,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 12036456,
            "num_media_completion": 0,
            "num_audio_prompt": 47410,
            "total_native_tokens_cached": 998000777,
            "total_tool_calls": 1693902,
            "requests_with_tool_call_errors": 13063
        },
        "deepseek/deepseek-r1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-r1",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-r1",
            "count": 779151,
            "total_completion_tokens": 1077354518,
            "total_prompt_tokens": 3152973582,
            "total_native_tokens_reasoning": 585244280,
            "num_media_prompt": 124,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 10581056,
            "total_tool_calls": 30082,
            "requests_with_tool_call_errors": 1045
        },
        "qwen/qwen3-vl-8b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-8b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-8b-instruct",
            "count": 7781731,
            "total_completion_tokens": 1421861558,
            "total_prompt_tokens": 8594391654,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 7434328,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 160562528,
            "total_tool_calls": 86278,
            "requests_with_tool_call_errors": 3374
        },
        "mistralai/mistral-7b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-7b-instruct",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-7b-instruct",
            "count": 511372,
            "total_completion_tokens": 73436658,
            "total_prompt_tokens": 485394721,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthropic/claude-4.5-sonnet-20250929": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4.5-sonnet-20250929",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4.5-sonnet-20250929",
            "count": 23485779,
            "total_completion_tokens": 12344009204,
            "total_prompt_tokens": 781245834164,
            "total_native_tokens_reasoning": 509278025,
            "num_media_prompt": 6006596,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 507231193823,
            "total_tool_calls": 9001911,
            "requests_with_tool_call_errors": 221803
        },
        "qwen/qwen2.5-vl-32b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen2.5-vl-32b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen2.5-vl-32b-instruct",
            "count": 645588,
            "total_completion_tokens": 89811420,
            "total_prompt_tokens": 1986167487,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 557308,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 84296080,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "ibm-granite/granite-4.0-h-micro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "ibm-granite/granite-4.0-h-micro",
            "variant": "standard",
            "variant_permaslug": "ibm-granite/granite-4.0-h-micro",
            "count": 402059,
            "total_completion_tokens": 48029034,
            "total_prompt_tokens": 655467559,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-audio-mini": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-audio-mini",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-audio-mini",
            "count": 4688,
            "total_completion_tokens": 2428037,
            "total_prompt_tokens": 2105169,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 1958,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mixtral-8x7b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mixtral-8x7b-instruct",
            "variant": "standard",
            "variant_permaslug": "mistralai/mixtral-8x7b-instruct",
            "count": 8090801,
            "total_completion_tokens": 2324745397,
            "total_prompt_tokens": 1691311580,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 6,
            "requests_with_tool_call_errors": 4
        },
        "google/gemma-3-12b-it:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-12b-it",
            "variant": "free",
            "variant_permaslug": "google/gemma-3-12b-it:free",
            "count": 66238,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 54791449,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 34318,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "allenai/olmo-2-0325-32b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "allenai/olmo-2-0325-32b-instruct",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-2-0325-32b-instruct",
            "count": 119,
            "total_completion_tokens": 17925,
            "total_prompt_tokens": 166416,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "aion-labs/aion-1.0-mini": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "aion-labs/aion-1.0-mini",
            "variant": "standard",
            "variant_permaslug": "aion-labs/aion-1.0-mini",
            "count": 1749,
            "total_completion_tokens": 690580,
            "total_prompt_tokens": 2297110,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4o-2024-08-06": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-2024-08-06",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-2024-08-06",
            "count": 278969,
            "total_completion_tokens": 32496053,
            "total_prompt_tokens": 338646842,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 19647,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 83269120,
            "total_tool_calls": 3489,
            "requests_with_tool_call_errors": 447
        },
        "mistralai/codestral-2508": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/codestral-2508",
            "variant": "standard",
            "variant_permaslug": "mistralai/codestral-2508",
            "count": 2232296,
            "total_completion_tokens": 336877942,
            "total_prompt_tokens": 3384393093,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1960,
            "requests_with_tool_call_errors": 57
        },
        "google/gemini-2.5-flash-lite": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-flash-lite",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-flash-lite",
            "count": 103426441,
            "total_completion_tokens": 31659875717,
            "total_prompt_tokens": 260309030001,
            "total_native_tokens_reasoning": 1608199600,
            "num_media_prompt": 212189808,
            "num_media_completion": 0,
            "num_audio_prompt": 23226,
            "total_native_tokens_cached": 41116052668,
            "total_tool_calls": 2281661,
            "requests_with_tool_call_errors": 171902
        },
        "openai/o3-pro-2025-06-10": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o3-pro-2025-06-10",
            "variant": "standard",
            "variant_permaslug": "openai/o3-pro-2025-06-10",
            "count": 3337,
            "total_completion_tokens": 2054818,
            "total_prompt_tokens": 15243698,
            "total_native_tokens_reasoning": 1054189,
            "num_media_prompt": 208,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1459,
            "requests_with_tool_call_errors": 0
        },
        "sentence-transformers/paraphrase-minilm-l6-v2-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sentence-transformers/paraphrase-minilm-l6-v2-20251117",
            "variant": "standard",
            "variant_permaslug": "sentence-transformers/paraphrase-minilm-l6-v2-20251117",
            "count": 20601,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 76404005,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mistral-large-2411": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-large-2411",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-large-2411",
            "count": 69392,
            "total_completion_tokens": 20364448,
            "total_prompt_tokens": 250051299,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1567,
            "requests_with_tool_call_errors": 30
        },
        "openai/gpt-4-1106-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4-1106-preview",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4-1106-preview",
            "count": 29639,
            "total_completion_tokens": 3002692,
            "total_prompt_tokens": 19826741,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 8832,
            "requests_with_tool_call_errors": 4
        },
        "moonshotai/kimi-k2-0905": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "moonshotai/kimi-k2-0905",
            "variant": "standard",
            "variant_permaslug": "moonshotai/kimi-k2-0905",
            "count": 11476713,
            "total_completion_tokens": 1649528478,
            "total_prompt_tokens": 26469505503,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 344,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3829086178,
            "total_tool_calls": 74087,
            "requests_with_tool_call_errors": 1219
        },
        "openai/gpt-4": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4",
            "count": 136521,
            "total_completion_tokens": 14150269,
            "total_prompt_tokens": 140665510,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1395584,
            "total_tool_calls": 3478,
            "requests_with_tool_call_errors": 212
        },
        "mistralai/ministral-3b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/ministral-3b",
            "variant": "standard",
            "variant_permaslug": "mistralai/ministral-3b",
            "count": 6329793,
            "total_completion_tokens": 312850241,
            "total_prompt_tokens": 4947849276,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 146,
            "requests_with_tool_call_errors": 8
        },
        "qwen/qwen-max-2025-01-25": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-max-2025-01-25",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-max-2025-01-25",
            "count": 60834,
            "total_completion_tokens": 10322415,
            "total_prompt_tokens": 107420863,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 629504,
            "total_tool_calls": 2245,
            "requests_with_tool_call_errors": 81
        },
        "anthropic/claude-3-5-haiku": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-3-5-haiku",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-3-5-haiku",
            "count": 4618564,
            "total_completion_tokens": 551549329,
            "total_prompt_tokens": 9445989016,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 42768,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1200291032,
            "total_tool_calls": 124276,
            "requests_with_tool_call_errors": 2694
        },
        "google/gemma-3n-e2b-it:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3n-e2b-it",
            "variant": "free",
            "variant_permaslug": "google/gemma-3n-e2b-it:free",
            "count": 100981,
            "total_completion_tokens": 34038123,
            "total_prompt_tokens": 19350483,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 8,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4-0314": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4-0314",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4-0314",
            "count": 1639,
            "total_completion_tokens": 361835,
            "total_prompt_tokens": 806148,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sao10k/l3-euryale-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sao10k/l3-euryale-70b",
            "variant": "standard",
            "variant_permaslug": "sao10k/l3-euryale-70b",
            "count": 25751,
            "total_completion_tokens": 7455897,
            "total_prompt_tokens": 30895033,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "baidu/ernie-4.5-21b-a3b-thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baidu/ernie-4.5-21b-a3b-thinking",
            "variant": "standard",
            "variant_permaslug": "baidu/ernie-4.5-21b-a3b-thinking",
            "count": 6119,
            "total_completion_tokens": 13871945,
            "total_prompt_tokens": 17060944,
            "total_native_tokens_reasoning": 11987443,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nex-agi/deepseek-v3.1-nex-n1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nex-agi/deepseek-v3.1-nex-n1",
            "variant": "standard",
            "variant_permaslug": "nex-agi/deepseek-v3.1-nex-n1",
            "count": 237341,
            "total_completion_tokens": 143737138,
            "total_prompt_tokens": 3172479375,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 205,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 6124,
            "requests_with_tool_call_errors": 186
        },
        "qwen/qwen3-235b-a22b-07-25": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-235b-a22b-07-25",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-235b-a22b-07-25",
            "count": 27738550,
            "total_completion_tokens": 5143603685,
            "total_prompt_tokens": 65756794705,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 350,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 15195637496,
            "total_tool_calls": 376745,
            "requests_with_tool_call_errors": 10763
        },
        "nousresearch/hermes-4-405b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-4-405b",
            "variant": "standard",
            "variant_permaslug": "nousresearch/hermes-4-405b",
            "count": 100190,
            "total_completion_tokens": 18994938,
            "total_prompt_tokens": 418466375,
            "total_native_tokens_reasoning": 1800661,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-3n-e4b-it:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3n-e4b-it",
            "variant": "free",
            "variant_permaslug": "google/gemma-3n-e4b-it:free",
            "count": 26921,
            "total_completion_tokens": 7602874,
            "total_prompt_tokens": 14573881,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthropic/claude-3.5-sonnet": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-3.5-sonnet",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-3.5-sonnet",
            "count": 1163025,
            "total_completion_tokens": 319390574,
            "total_prompt_tokens": 4403983689,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 85333,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1195679087,
            "total_tool_calls": 73869,
            "requests_with_tool_call_errors": 3326
        },
        "openai/gpt-4o-mini-search-preview-2025-03-11": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o-mini-search-preview-2025-03-11",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o-mini-search-preview-2025-03-11",
            "count": 76615,
            "total_completion_tokens": 65653693,
            "total_prompt_tokens": 43376909,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mancer/weaver": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mancer/weaver",
            "variant": "standard",
            "variant_permaslug": "mancer/weaver",
            "count": 3285,
            "total_completion_tokens": 1488561,
            "total_prompt_tokens": 2836050,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "deepcogito/cogito-v2-preview-llama-109b-moe": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepcogito/cogito-v2-preview-llama-109b-moe",
            "variant": "standard",
            "variant_permaslug": "deepcogito/cogito-v2-preview-llama-109b-moe",
            "count": 10123,
            "total_completion_tokens": 1154296,
            "total_prompt_tokens": 32992630,
            "total_native_tokens_reasoning": 174120,
            "num_media_prompt": 11384,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 7,
            "requests_with_tool_call_errors": 0
        },
        "nousresearch/hermes-3-llama-3.1-405b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-3-llama-3.1-405b",
            "variant": "standard",
            "variant_permaslug": "nousresearch/hermes-3-llama-3.1-405b",
            "count": 412952,
            "total_completion_tokens": 115254765,
            "total_prompt_tokens": 850007155,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nvidia/nemotron-nano-9b-v2:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nvidia/nemotron-nano-9b-v2",
            "variant": "free",
            "variant_permaslug": "nvidia/nemotron-nano-9b-v2:free",
            "count": 75121,
            "total_completion_tokens": 76730359,
            "total_prompt_tokens": 283722712,
            "total_native_tokens_reasoning": 51109614,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 3452,
            "requests_with_tool_call_errors": 587
        },
        "qwen/qwen3-next-80b-a3b-instruct-2509:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-next-80b-a3b-instruct-2509",
            "variant": "free",
            "variant_permaslug": "qwen/qwen3-next-80b-a3b-instruct-2509:free",
            "count": 57796,
            "total_completion_tokens": 21857390,
            "total_prompt_tokens": 563875735,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 4455,
            "requests_with_tool_call_errors": 532
        },
        "moonshotai/kimi-k2-0905:exacto": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "moonshotai/kimi-k2-0905",
            "variant": "exacto",
            "variant_permaslug": "moonshotai/kimi-k2-0905:exacto",
            "count": 723895,
            "total_completion_tokens": 213242986,
            "total_prompt_tokens": 1141531777,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 701288253,
            "total_tool_calls": 14413,
            "requests_with_tool_call_errors": 121
        },
        "deepseek/deepseek-chat-v3-0324": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-chat-v3-0324",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-chat-v3-0324",
            "count": 27919785,
            "total_completion_tokens": 5316434896,
            "total_prompt_tokens": 107114035100,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 254,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 7243824223,
            "total_tool_calls": 35501,
            "requests_with_tool_call_errors": 2224
        },
        "openai/gpt-3.5-turbo-16k": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-3.5-turbo-16k",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-3.5-turbo-16k",
            "count": 41646,
            "total_completion_tokens": 6041361,
            "total_prompt_tokens": 40272129,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 12065,
            "requests_with_tool_call_errors": 77
        },
        "anthropic/claude-3-7-sonnet-20250219": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-3-7-sonnet-20250219",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-3-7-sonnet-20250219",
            "count": 2926565,
            "total_completion_tokens": 1391260505,
            "total_prompt_tokens": 27324106988,
            "total_native_tokens_reasoning": 13691552,
            "num_media_prompt": 222530,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 8427258210,
            "total_tool_calls": 181055,
            "requests_with_tool_call_errors": 4546
        },
        "openai/chatgpt-4o-latest": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/chatgpt-4o-latest",
            "variant": "standard",
            "variant_permaslug": "openai/chatgpt-4o-latest",
            "count": 415332,
            "total_completion_tokens": 108526462,
            "total_prompt_tokens": 1339527331,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 107281,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "meta-llama/llama-3.2-3b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.2-3b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.2-3b-instruct",
            "count": 7385388,
            "total_completion_tokens": 1935843119,
            "total_prompt_tokens": 6590530751,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen-2-vl-7b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-2-vl-7b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-2-vl-7b-instruct",
            "count": 305972,
            "total_completion_tokens": 28945407,
            "total_prompt_tokens": 259862256,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 274682,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/text-embedding-3-large": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/text-embedding-3-large",
            "variant": "standard",
            "variant_permaslug": "openai/text-embedding-3-large",
            "count": 5340977,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 4071224619,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "moonshotai/kimi-k2": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "moonshotai/kimi-k2",
            "variant": "standard",
            "variant_permaslug": "moonshotai/kimi-k2",
            "count": 1103050,
            "total_completion_tokens": 221770044,
            "total_prompt_tokens": 3212174918,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 11,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1618420451,
            "total_tool_calls": 43497,
            "requests_with_tool_call_errors": 618
        },
        "thedrummer/skyfall-36b-v2": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "thedrummer/skyfall-36b-v2",
            "variant": "standard",
            "variant_permaslug": "thedrummer/skyfall-36b-v2",
            "count": 372206,
            "total_completion_tokens": 114033104,
            "total_prompt_tokens": 1133099759,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 681424848,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "x-ai/grok-4-fast": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "x-ai/grok-4-fast",
            "variant": "standard",
            "variant_permaslug": "x-ai/grok-4-fast",
            "count": 30662938,
            "total_completion_tokens": 26956873712,
            "total_prompt_tokens": 139154030110,
            "total_native_tokens_reasoning": 14821789705,
            "num_media_prompt": 2345367,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 31193574569,
            "total_tool_calls": 722986,
            "requests_with_tool_call_errors": 1470
        },
        "openai/gpt-5.1-20251113": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.1-20251113",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.1-20251113",
            "count": 2665874,
            "total_completion_tokens": 3226437362,
            "total_prompt_tokens": 22140881048,
            "total_native_tokens_reasoning": 1928406314,
            "num_media_prompt": 1407067,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 7851680896,
            "total_tool_calls": 221243,
            "requests_with_tool_call_errors": 4487
        },
        "openai/gpt-4o": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4o",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4o",
            "count": 7199508,
            "total_completion_tokens": 921141443,
            "total_prompt_tokens": 12678725365,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 861698,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 3747912448,
            "total_tool_calls": 487300,
            "requests_with_tool_call_errors": 12787
        },
        "baai/bge-base-en-v1.5-20251117": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "baai/bge-base-en-v1.5-20251117",
            "variant": "standard",
            "variant_permaslug": "baai/bge-base-en-v1.5-20251117",
            "count": 12236,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 26346034,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4.1-nano-2025-04-14": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4.1-nano-2025-04-14",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4.1-nano-2025-04-14",
            "count": 9125773,
            "total_completion_tokens": 1703784493,
            "total_prompt_tokens": 21456674991,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 379033,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 8451233280,
            "total_tool_calls": 596142,
            "requests_with_tool_call_errors": 528
        },
        "qwen/qwen3-vl-235b-a22b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-235b-a22b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-235b-a22b-instruct",
            "count": 5690091,
            "total_completion_tokens": 1299636708,
            "total_prompt_tokens": 18280770584,
            "total_native_tokens_reasoning": 21140,
            "num_media_prompt": 13103591,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1989233920,
            "total_tool_calls": 44191,
            "requests_with_tool_call_errors": 29236
        },
        "deepseek/deepseek-r1-distill-llama-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "deepseek/deepseek-r1-distill-llama-70b",
            "variant": "standard",
            "variant_permaslug": "deepseek/deepseek-r1-distill-llama-70b",
            "count": 634067,
            "total_completion_tokens": 285712742,
            "total_prompt_tokens": 1136603945,
            "total_native_tokens_reasoning": 261923111,
            "num_media_prompt": 193,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 308541240,
            "total_tool_calls": 1,
            "requests_with_tool_call_errors": 0
        },
        "xiaomi/mimo-v2-flash-20251210:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "xiaomi/mimo-v2-flash-20251210",
            "variant": "free",
            "variant_permaslug": "xiaomi/mimo-v2-flash-20251210:free",
            "count": 83499620,
            "total_completion_tokens": 92858868926,
            "total_prompt_tokens": 533854603083,
            "total_native_tokens_reasoning": 46324822231,
            "num_media_prompt": 1744,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 140015164033,
            "total_tool_calls": 2701216,
            "requests_with_tool_call_errors": 92915
        },
        "openai/gpt-5-mini-2025-08-07": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-mini-2025-08-07",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-mini-2025-08-07",
            "count": 17378914,
            "total_completion_tokens": 13324307036,
            "total_prompt_tokens": 88844254326,
            "total_native_tokens_reasoning": 9028918766,
            "num_media_prompt": 13994234,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 28117811840,
            "total_tool_calls": 2659700,
            "requests_with_tool_call_errors": 18771
        },
        "qwen/qwen-vl-max-2025-01-25": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-vl-max-2025-01-25",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-vl-max-2025-01-25",
            "count": 20268,
            "total_completion_tokens": 4466962,
            "total_prompt_tokens": 235783583,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 121122,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 63,
            "requests_with_tool_call_errors": 21
        },
        "meta-llama/llama-3.1-405b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.1-405b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.1-405b-instruct",
            "count": 184805,
            "total_completion_tokens": 35772350,
            "total_prompt_tokens": 572213457,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1317,
            "requests_with_tool_call_errors": 59
        },
        "aion-labs/aion-rp-llama-3.1-8b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "aion-labs/aion-rp-llama-3.1-8b",
            "variant": "standard",
            "variant_permaslug": "aion-labs/aion-rp-llama-3.1-8b",
            "count": 26823,
            "total_completion_tokens": 4683828,
            "total_prompt_tokens": 349601833,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5-chat-2025-08-07": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5-chat-2025-08-07",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5-chat-2025-08-07",
            "count": 2409983,
            "total_completion_tokens": 550313101,
            "total_prompt_tokens": 11178088280,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 369029,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 5831974400,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-4-turbo-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-4-turbo-preview",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-4-turbo-preview",
            "count": 19959,
            "total_completion_tokens": 3213959,
            "total_prompt_tokens": 19615720,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 170,
            "requests_with_tool_call_errors": 0
        },
        "google/gemma-2-27b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-2-27b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-2-27b-it",
            "count": 74530,
            "total_completion_tokens": 9125901,
            "total_prompt_tokens": 58902539,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 175,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-oss-120b:exacto": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-oss-120b",
            "variant": "exacto",
            "variant_permaslug": "openai/gpt-oss-120b:exacto",
            "count": 2692561,
            "total_completion_tokens": 1828286490,
            "total_prompt_tokens": 7133026725,
            "total_native_tokens_reasoning": 927237119,
            "num_media_prompt": 1,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 572126490,
            "total_tool_calls": 296243,
            "requests_with_tool_call_errors": 48531
        },
        "qwen/qwen3-14b-04-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-14b-04-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-14b-04-28",
            "count": 2087055,
            "total_completion_tokens": 1058081808,
            "total_prompt_tokens": 3127643260,
            "total_native_tokens_reasoning": 330399419,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1251873947,
            "total_tool_calls": 54443,
            "requests_with_tool_call_errors": 1324
        },
        "meta-llama/llama-3.3-70b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.3-70b-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.3-70b-instruct",
            "count": 21786809,
            "total_completion_tokens": 1828166814,
            "total_prompt_tokens": 22315968072,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 18,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 6834020500,
            "total_tool_calls": 304243,
            "requests_with_tool_call_errors": 160710
        },
        "arcee-ai/trinity-mini-20251201": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "arcee-ai/trinity-mini-20251201",
            "variant": "standard",
            "variant_permaslug": "arcee-ai/trinity-mini-20251201",
            "count": 54526,
            "total_completion_tokens": 51385937,
            "total_prompt_tokens": 39113112,
            "total_native_tokens_reasoning": 48019429,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 133,
            "requests_with_tool_call_errors": 30
        },
        "qwen/qwen2.5-coder-7b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen2.5-coder-7b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen2.5-coder-7b-instruct",
            "count": 22439,
            "total_completion_tokens": 19962041,
            "total_prompt_tokens": 18486034,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen-2.5-coder-32b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-2.5-coder-32b-instruct",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen-2.5-coder-32b-instruct",
            "count": 570734,
            "total_completion_tokens": 51384294,
            "total_prompt_tokens": 726253531,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 170517439,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sourceful/riverflow-v2-standard-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sourceful/riverflow-v2-standard-preview",
            "variant": "standard",
            "variant_permaslug": "sourceful/riverflow-v2-standard-preview",
            "count": 3311,
            "total_completion_tokens": 13823425,
            "total_prompt_tokens": 7310731,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 2927,
            "num_media_completion": 3311,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "nousresearch/hermes-3-llama-3.1-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "nousresearch/hermes-3-llama-3.1-70b",
            "variant": "standard",
            "variant_permaslug": "nousresearch/hermes-3-llama-3.1-70b",
            "count": 244353,
            "total_completion_tokens": 51376380,
            "total_prompt_tokens": 382266971,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "mistralai/mixtral-8x22b-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mixtral-8x22b-instruct",
            "variant": "standard",
            "variant_permaslug": "mistralai/mixtral-8x22b-instruct",
            "count": 72106,
            "total_completion_tokens": 13138001,
            "total_prompt_tokens": 111588907,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 299,
            "requests_with_tool_call_errors": 37
        },
        "mistralai/devstral-small-2507": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/devstral-small-2507",
            "variant": "standard",
            "variant_permaslug": "mistralai/devstral-small-2507",
            "count": 594211,
            "total_completion_tokens": 83734614,
            "total_prompt_tokens": 2264919430,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 6007,
            "requests_with_tool_call_errors": 27
        },
        "mistralai/mistral-7b-instruct-v0.1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-7b-instruct-v0.1",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-7b-instruct-v0.1",
            "count": 39132,
            "total_completion_tokens": 5984144,
            "total_prompt_tokens": 9952537,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/o3-mini-high-2025-01-31": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o3-mini-high-2025-01-31",
            "variant": "standard",
            "variant_permaslug": "openai/o3-mini-high-2025-01-31",
            "count": 139048,
            "total_completion_tokens": 154918975,
            "total_prompt_tokens": 4333351095,
            "total_native_tokens_reasoning": 145036096,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 675452544,
            "total_tool_calls": 233,
            "requests_with_tool_call_errors": 0
        },
        "black-forest-labs/flux.2-pro": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "black-forest-labs/flux.2-pro",
            "variant": "standard",
            "variant_permaslug": "black-forest-labs/flux.2-pro",
            "count": 13472,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 2992990,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 7743,
            "num_media_completion": 13472,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5.1-codex-max-20251204": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.1-codex-max-20251204",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.1-codex-max-20251204",
            "count": 60407,
            "total_completion_tokens": 44722195,
            "total_prompt_tokens": 1961313486,
            "total_native_tokens_reasoning": 25283813,
            "num_media_prompt": 7886,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1476752384,
            "total_tool_calls": 38777,
            "requests_with_tool_call_errors": 201
        },
        "black-forest-labs/flux.2-flex": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "black-forest-labs/flux.2-flex",
            "variant": "standard",
            "variant_permaslug": "black-forest-labs/flux.2-flex",
            "count": 1677,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 418879,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1022,
            "num_media_completion": 1677,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "google/gemini-2.5-flash-lite-preview-09-2025": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemini-2.5-flash-lite-preview-09-2025",
            "variant": "standard",
            "variant_permaslug": "google/gemini-2.5-flash-lite-preview-09-2025",
            "count": 18586530,
            "total_completion_tokens": 8480917247,
            "total_prompt_tokens": 53881010810,
            "total_native_tokens_reasoning": 1758499158,
            "num_media_prompt": 6065107,
            "num_media_completion": 0,
            "num_audio_prompt": 746913,
            "total_native_tokens_cached": 14868768460,
            "total_tool_calls": 358965,
            "requests_with_tool_call_errors": 3287
        },
        "mistralai/mistral-small-3.2-24b-instruct-2506": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-small-3.2-24b-instruct-2506",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-small-3.2-24b-instruct-2506",
            "count": 5934281,
            "total_completion_tokens": 3148093352,
            "total_prompt_tokens": 23268604466,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 470463,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 4753085600,
            "total_tool_calls": 87588,
            "requests_with_tool_call_errors": 13017
        },
        "black-forest-labs/flux.2-max": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "black-forest-labs/flux.2-max",
            "variant": "standard",
            "variant_permaslug": "black-forest-labs/flux.2-max",
            "count": 4396,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 1235436,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 3251,
            "num_media_completion": 4396,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sao10k/l3.1-euryale-70b": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sao10k/l3.1-euryale-70b",
            "variant": "standard",
            "variant_permaslug": "sao10k/l3.1-euryale-70b",
            "count": 145937,
            "total_completion_tokens": 20145246,
            "total_prompt_tokens": 427655177,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/o4-mini-deep-research-2025-06-26": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/o4-mini-deep-research-2025-06-26",
            "variant": "standard",
            "variant_permaslug": "openai/o4-mini-deep-research-2025-06-26",
            "count": 3748,
            "total_completion_tokens": 44484465,
            "total_prompt_tokens": 118312484,
            "total_native_tokens_reasoning": 40540192,
            "num_media_prompt": 473,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 2013184,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "aion-labs/aion-1.0": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "aion-labs/aion-1.0",
            "variant": "standard",
            "variant_permaslug": "aion-labs/aion-1.0",
            "count": 35452,
            "total_completion_tokens": 68886741,
            "total_prompt_tokens": 395143297,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sao10k/l3.3-euryale-70b-v2.3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sao10k/l3.3-euryale-70b-v2.3",
            "variant": "standard",
            "variant_permaslug": "sao10k/l3.3-euryale-70b-v2.3",
            "count": 231760,
            "total_completion_tokens": 22652991,
            "total_prompt_tokens": 378865067,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "kwaipilot/kat-coder-pro-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "kwaipilot/kat-coder-pro-v1",
            "variant": "standard",
            "variant_permaslug": "kwaipilot/kat-coder-pro-v1",
            "count": 105142,
            "total_completion_tokens": 46987910,
            "total_prompt_tokens": 1789650757,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1560217657,
            "total_tool_calls": 19079,
            "requests_with_tool_call_errors": 4136
        },
        "cohere/command-r-08-2024": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "cohere/command-r-08-2024",
            "variant": "standard",
            "variant_permaslug": "cohere/command-r-08-2024",
            "count": 120705,
            "total_completion_tokens": 11081999,
            "total_prompt_tokens": 89475364,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 155,
            "requests_with_tool_call_errors": 3
        },
        "liquid/lfm-2.5-1.2b-instruct-20260120:free": {
            "date": "2026-01-20 00:00:00",
            "model_permaslug": "liquid/lfm-2.5-1.2b-instruct-20260120",
            "variant": "free",
            "variant_permaslug": "liquid/lfm-2.5-1.2b-instruct-20260120:free",
            "count": 56136,
            "total_completion_tokens": 9170936,
            "total_prompt_tokens": 107868868,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "sourceful/riverflow-v2-fast-preview": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "sourceful/riverflow-v2-fast-preview",
            "variant": "standard",
            "variant_permaslug": "sourceful/riverflow-v2-fast-preview",
            "count": 1820,
            "total_completion_tokens": 7598500,
            "total_prompt_tokens": 3182118,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1413,
            "num_media_completion": 1820,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen3-vl-235b-a22b-thinking": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-vl-235b-a22b-thinking",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-vl-235b-a22b-thinking",
            "count": 406676,
            "total_completion_tokens": 1112760537,
            "total_prompt_tokens": 783612967,
            "total_native_tokens_reasoning": 938936885,
            "num_media_prompt": 426919,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 27,
            "requests_with_tool_call_errors": 3
        },
        "mistralai/mistral-small-3.1-24b-instruct-2503": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
            "variant": "standard",
            "variant_permaslug": "mistralai/mistral-small-3.1-24b-instruct-2503",
            "count": 682972,
            "total_completion_tokens": 88256527,
            "total_prompt_tokens": 824409062,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 1598,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 55064647,
            "total_tool_calls": 1,
            "requests_with_tool_call_errors": 0
        },
        "stepfun-ai/step3": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "stepfun-ai/step3",
            "variant": "standard",
            "variant_permaslug": "stepfun-ai/step3",
            "count": 2168,
            "total_completion_tokens": 3765435,
            "total_prompt_tokens": 4323362,
            "total_native_tokens_reasoning": 2620503,
            "num_media_prompt": 803,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 3,
            "requests_with_tool_call_errors": 1
        },
        "z-ai/glm-4.7-flash-20260119": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "z-ai/glm-4.7-flash-20260119",
            "variant": "standard",
            "variant_permaslug": "z-ai/glm-4.7-flash-20260119",
            "count": 391103,
            "total_completion_tokens": 503788659,
            "total_prompt_tokens": 3886937150,
            "total_native_tokens_reasoning": 385546998,
            "num_media_prompt": 675,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 938865656,
            "total_tool_calls": 69581,
            "requests_with_tool_call_errors": 5346
        },
        "meta-llama/llama-3.2-11b-vision-instruct": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "meta-llama/llama-3.2-11b-vision-instruct",
            "variant": "standard",
            "variant_permaslug": "meta-llama/llama-3.2-11b-vision-instruct",
            "count": 783918,
            "total_completion_tokens": 59546211,
            "total_prompt_tokens": 3423065046,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 763954,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "microsoft/phi-4": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "microsoft/phi-4",
            "variant": "standard",
            "variant_permaslug": "microsoft/phi-4",
            "count": 2800573,
            "total_completion_tokens": 67183370,
            "total_prompt_tokens": 807060229,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "anthropic/claude-4.5-opus-20251124": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4.5-opus-20251124",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4.5-opus-20251124",
            "count": 10493841,
            "total_completion_tokens": 6854303978,
            "total_prompt_tokens": 390764902861,
            "total_native_tokens_reasoning": 581240085,
            "num_media_prompt": 10425135,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 239903108464,
            "total_tool_calls": 5755981,
            "requests_with_tool_call_errors": 150431
        },
        "mistralai/ministral-3b-2512": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "mistralai/ministral-3b-2512",
            "variant": "standard",
            "variant_permaslug": "mistralai/ministral-3b-2512",
            "count": 941810,
            "total_completion_tokens": 244855602,
            "total_prompt_tokens": 685990433,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 8774,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 1098,
            "requests_with_tool_call_errors": 76
        },
        "openai/text-embedding-ada-002": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/text-embedding-ada-002",
            "variant": "standard",
            "variant_permaslug": "openai/text-embedding-ada-002",
            "count": 1773891,
            "total_completion_tokens": 0,
            "total_prompt_tokens": 2744825472,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "openai/gpt-5.1-chat-20251113": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.1-chat-20251113",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.1-chat-20251113",
            "count": 516153,
            "total_completion_tokens": 83117350,
            "total_prompt_tokens": 2437443388,
            "total_native_tokens_reasoning": 8020224,
            "num_media_prompt": 144230,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 947214976,
            "total_tool_calls": 31605,
            "requests_with_tool_call_errors": 24
        },
        "amazon/nova-2-lite-v1": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "amazon/nova-2-lite-v1",
            "variant": "standard",
            "variant_permaslug": "amazon/nova-2-lite-v1",
            "count": 59703,
            "total_completion_tokens": 61390805,
            "total_prompt_tokens": 182561972,
            "total_native_tokens_reasoning": 10674,
            "num_media_prompt": 22469,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 5016,
            "requests_with_tool_call_errors": 5
        },
        "anthropic/claude-4-opus-20250522": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "anthropic/claude-4-opus-20250522",
            "variant": "standard",
            "variant_permaslug": "anthropic/claude-4-opus-20250522",
            "count": 99754,
            "total_completion_tokens": 51593532,
            "total_prompt_tokens": 1235228141,
            "total_native_tokens_reasoning": 1243573,
            "num_media_prompt": 11030,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 520152888,
            "total_tool_calls": 22752,
            "requests_with_tool_call_errors": 331
        },
        "qwen/qwen3-235b-a22b-04-28": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen3-235b-a22b-04-28",
            "variant": "standard",
            "variant_permaslug": "qwen/qwen3-235b-a22b-04-28",
            "count": 664448,
            "total_completion_tokens": 584861886,
            "total_prompt_tokens": 1872359913,
            "total_native_tokens_reasoning": 435221401,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 424807100,
            "total_tool_calls": 10029,
            "requests_with_tool_call_errors": 148
        },
        "openai/gpt-5.2-codex-20260114": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "openai/gpt-5.2-codex-20260114",
            "variant": "standard",
            "variant_permaslug": "openai/gpt-5.2-codex-20260114",
            "count": 867597,
            "total_completion_tokens": 976412353,
            "total_prompt_tokens": 43360971481,
            "total_native_tokens_reasoning": 651711042,
            "num_media_prompt": 230805,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 35740070400,
            "total_tool_calls": 556537,
            "requests_with_tool_call_errors": 4408
        },
        "google/gemma-3-12b-it": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "google/gemma-3-12b-it",
            "variant": "standard",
            "variant_permaslug": "google/gemma-3-12b-it",
            "count": 8397216,
            "total_completion_tokens": 1393883939,
            "total_prompt_tokens": 6848742766,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 746128,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1140641131,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "qwen/qwen-2-vl-7b-instruct:free": {
            "date": "2026-01-19 00:00:00",
            "model_permaslug": "qwen/qwen-2-vl-7b-instruct",
            "variant": "free",
            "variant_permaslug": "qwen/qwen-2-vl-7b-instruct:free",
            "count": 51618,
            "total_completion_tokens": 15733701,
            "total_prompt_tokens": 160992730,
            "total_native_tokens_reasoning": 0,
            "num_media_prompt": 39114,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 0,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        },
        "allenai/olmo-3-32b-think-20251121": {
            "date": "2026-01-20 00:00:00",
            "model_permaslug": "allenai/olmo-3-32b-think-20251121",
            "variant": "standard",
            "variant_permaslug": "allenai/olmo-3-32b-think-20251121",
            "count": 2,
            "total_completion_tokens": 1175,
            "total_prompt_tokens": 1288,
            "total_native_tokens_reasoning": 1323,
            "num_media_prompt": 0,
            "num_media_completion": 0,
            "num_audio_prompt": 0,
            "total_native_tokens_cached": 1280,
            "total_tool_calls": 0,
            "requests_with_tool_call_errors": 0
        }
    },
    "categories": {
        "x-ai/grok-code-fast-1": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-code-fast-1",
                "category": "programming",
                "count": 10836,
                "total_prompt_tokens": 531133745,
                "total_completion_tokens": 5665781,
                "volume": 3.5350348246,
                "rank": 1
            }
        ],
        "google/gemini-2.5-flash": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "legal",
                "count": 7008,
                "total_prompt_tokens": 38636587,
                "total_completion_tokens": 1352649,
                "volume": 13.476538740833334,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "health",
                "count": 3920,
                "total_prompt_tokens": 8406078,
                "total_completion_tokens": 949371,
                "volume": 3.5860605543,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "academia",
                "count": 7371,
                "total_prompt_tokens": 13342756,
                "total_completion_tokens": 2101928,
                "volume": 7.608459497666667,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "marketing/seo",
                "count": 768,
                "total_prompt_tokens": 3001599,
                "total_completion_tokens": 369433,
                "volume": 1.37687878,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "trivia",
                "count": 1121,
                "total_prompt_tokens": 1170020,
                "total_completion_tokens": 82831,
                "volume": 0.3562632706666667,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "marketing",
                "count": 2101,
                "total_prompt_tokens": 6826805,
                "total_completion_tokens": 945513,
                "volume": 3.4052504572,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "science",
                "count": 8539,
                "total_prompt_tokens": 29778965,
                "total_completion_tokens": 2507316,
                "volume": 12.478750967766667,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "roleplay",
                "count": 13043,
                "total_prompt_tokens": 80049644,
                "total_completion_tokens": 4300091,
                "volume": 25.597364748133334,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "finance",
                "count": 4283,
                "total_prompt_tokens": 13330084,
                "total_completion_tokens": 1235691,
                "volume": 4.560706761466666,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "technology",
                "count": 15530,
                "total_prompt_tokens": 49818555,
                "total_completion_tokens": 3253293,
                "volume": 17.849434636999998,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash",
                "category": "translation",
                "count": 5708,
                "total_prompt_tokens": 8180159,
                "total_completion_tokens": 818147,
                "volume": 3.362067071,
                "rank": 6
            }
        ],
        "openai/gpt-oss-120b": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "translation",
                "count": 43949,
                "total_prompt_tokens": 46903567,
                "total_completion_tokens": 15150366,
                "volume": 1.29545287424,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "trivia",
                "count": 744,
                "total_prompt_tokens": 1635428,
                "total_completion_tokens": 370527,
                "volume": 0.0520163832,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "finance",
                "count": 2467,
                "total_prompt_tokens": 17372657,
                "total_completion_tokens": 1564553,
                "volume": 3.40829904244,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "legal",
                "count": 2180,
                "total_prompt_tokens": 14313450,
                "total_completion_tokens": 803310,
                "volume": 2.0643605301999997,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "marketing",
                "count": 1416,
                "total_prompt_tokens": 9217422,
                "total_completion_tokens": 1435333,
                "volume": 0.42303750005,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "academia",
                "count": 10785,
                "total_prompt_tokens": 7751331,
                "total_completion_tokens": 2010781,
                "volume": 0.65319241523,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "science",
                "count": 3714,
                "total_prompt_tokens": 19163898,
                "total_completion_tokens": 2395485,
                "volume": 3.55779855165,
                "rank": 8
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-120b",
                "category": "technology",
                "count": 6058,
                "total_prompt_tokens": 35136008,
                "total_completion_tokens": 4671065,
                "volume": 5.57806890951,
                "rank": 9
            }
        ],
        "google/gemini-3-flash-preview-20251217": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "health",
                "count": 3124,
                "total_prompt_tokens": 11738693,
                "total_completion_tokens": 1832928,
                "volume": 10.594289208500001,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "finance",
                "count": 3791,
                "total_prompt_tokens": 22809969,
                "total_completion_tokens": 1140177,
                "volume": 9.9780890215,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "technology",
                "count": 13378,
                "total_prompt_tokens": 119941389,
                "total_completion_tokens": 4115561,
                "volume": 52.79453034583333,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "programming",
                "count": 9684,
                "total_prompt_tokens": 244232887,
                "total_completion_tokens": 3362604,
                "volume": 34.280786395,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "academia",
                "count": 4949,
                "total_prompt_tokens": 10603509,
                "total_completion_tokens": 3881727,
                "volume": 18.143410949,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "science",
                "count": 6993,
                "total_prompt_tokens": 46459659,
                "total_completion_tokens": 2309513,
                "volume": 26.611923623166668,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "legal",
                "count": 2161,
                "total_prompt_tokens": 5267428,
                "total_completion_tokens": 540977,
                "volume": 4.59874074,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "trivia",
                "count": 602,
                "total_prompt_tokens": 1061500,
                "total_completion_tokens": 112671,
                "volume": 0.74280744,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "translation",
                "count": 6648,
                "total_prompt_tokens": 10962479,
                "total_completion_tokens": 1464967,
                "volume": 7.920350073,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "marketing",
                "count": 1177,
                "total_prompt_tokens": 3392588,
                "total_completion_tokens": 331680,
                "volume": 2.0894731898333334,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-flash-preview-20251217",
                "category": "roleplay",
                "count": 7599,
                "total_prompt_tokens": 56120704,
                "total_completion_tokens": 2970028,
                "volume": 26.75196715066667,
                "rank": 8
            }
        ],
        "x-ai/grok-4.1-fast": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "trivia",
                "count": 1015,
                "total_prompt_tokens": 1891019,
                "total_completion_tokens": 237321,
                "volume": 0.691084712,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "roleplay",
                "count": 11716,
                "total_prompt_tokens": 93141347,
                "total_completion_tokens": 4738511,
                "volume": 11.2644881925,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "marketing",
                "count": 1137,
                "total_prompt_tokens": 5695128,
                "total_completion_tokens": 787523,
                "volume": 1.842000172,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "science",
                "count": 5103,
                "total_prompt_tokens": 25233712,
                "total_completion_tokens": 1614711,
                "volume": 5.229664069,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "technology",
                "count": 5860,
                "total_prompt_tokens": 45123767,
                "total_completion_tokens": 2051482,
                "volume": 9.6054095765,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "health",
                "count": 433,
                "total_prompt_tokens": 3899145,
                "total_completion_tokens": 346844,
                "volume": 1.158146058,
                "rank": 8
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "legal",
                "count": 392,
                "total_prompt_tokens": 3200474,
                "total_completion_tokens": 209423,
                "volume": 0.922147195,
                "rank": 9
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "finance",
                "count": 2190,
                "total_prompt_tokens": 11119589,
                "total_completion_tokens": 758446,
                "volume": 4.3694143875,
                "rank": 9
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4.1-fast",
                "category": "translation",
                "count": 1797,
                "total_prompt_tokens": 2182858,
                "total_completion_tokens": 465645,
                "volume": 0.813118916,
                "rank": 9
            }
        ],
        "xiaomi/mimo-v2-flash-20251210:free": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "marketing",
                "count": 1272,
                "total_prompt_tokens": 66919804,
                "total_completion_tokens": 585052,
                "volume": 0,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "academia",
                "count": 4181,
                "total_prompt_tokens": 10009895,
                "total_completion_tokens": 32336029,
                "volume": 0.1,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "science",
                "count": 24083,
                "total_prompt_tokens": 114486859,
                "total_completion_tokens": 53325428,
                "volume": 0.06,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "technology",
                "count": 15335,
                "total_prompt_tokens": 169831265,
                "total_completion_tokens": 12225969,
                "volume": 0.1,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "roleplay",
                "count": 11866,
                "total_prompt_tokens": 147487589,
                "total_completion_tokens": 8563346,
                "volume": 0.1,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "marketing/seo",
                "count": 2090,
                "total_prompt_tokens": 5320314,
                "total_completion_tokens": 3194864,
                "volume": 0,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "legal",
                "count": 773,
                "total_prompt_tokens": 5020299,
                "total_completion_tokens": 1662541,
                "volume": 0,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "finance",
                "count": 2717,
                "total_prompt_tokens": 15341092,
                "total_completion_tokens": 1247697,
                "volume": 0.12,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "programming",
                "count": 20036,
                "total_prompt_tokens": 129182027,
                "total_completion_tokens": 14373249,
                "volume": 0.08,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "xiaomi/mimo-v2-flash-20251210:free",
                "category": "translation",
                "count": 2337,
                "total_prompt_tokens": 3678570,
                "total_completion_tokens": 2361201,
                "volume": 0,
                "rank": 7
            }
        ],
        "deepseek/deepseek-v3.2-20251201": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-v3.2-20251201",
                "category": "roleplay",
                "count": 27446,
                "total_prompt_tokens": 345459113,
                "total_completion_tokens": 12965361,
                "volume": 33.532336778310004,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-v3.2-20251201",
                "category": "academia",
                "count": 1325,
                "total_prompt_tokens": 7576854,
                "total_completion_tokens": 2135178,
                "volume": 2.64958215181,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-v3.2-20251201",
                "category": "programming",
                "count": 5521,
                "total_prompt_tokens": 72255007,
                "total_completion_tokens": 3243899,
                "volume": 17.03625339718,
                "rank": 9
            }
        ],
        "anthropic/claude-4.5-sonnet-20250929": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "technology",
                "count": 6664,
                "total_prompt_tokens": 352763361,
                "total_completion_tokens": 2402697,
                "volume": 227.956396639,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "programming",
                "count": 6564,
                "total_prompt_tokens": 293890452,
                "total_completion_tokens": 3101214,
                "volume": 442.8547804285,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "science",
                "count": 2134,
                "total_prompt_tokens": 62510757,
                "total_completion_tokens": 855040,
                "volume": 139.5991539595,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "health",
                "count": 467,
                "total_prompt_tokens": 5607919,
                "total_completion_tokens": 222504,
                "volume": 24.1709653185,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "marketing",
                "count": 187,
                "total_prompt_tokens": 2971866,
                "total_completion_tokens": 96519,
                "volume": 11.1058761635,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "academia",
                "count": 737,
                "total_prompt_tokens": 6184279,
                "total_completion_tokens": 335053,
                "volume": 23.17357555,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-sonnet-20250929",
                "category": "marketing/seo",
                "count": 324,
                "total_prompt_tokens": 883787,
                "total_completion_tokens": 84515,
                "volume": 4.4639487,
                "rank": 10
            }
        ],
        "x-ai/grok-4-fast": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4-fast",
                "category": "marketing/seo",
                "count": 3379,
                "total_prompt_tokens": 14025501,
                "total_completion_tokens": 4645751,
                "volume": 7.4791038835000005,
                "rank": 1
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "x-ai/grok-4-fast",
                "category": "legal",
                "count": 70,
                "total_prompt_tokens": 4384559,
                "total_completion_tokens": 97836,
                "volume": 1.7034889340000001,
                "rank": 7
            }
        ],
        "meta-llama/llama-3.1-8b-instruct": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "meta-llama/llama-3.1-8b-instruct",
                "category": "translation",
                "count": 11865,
                "total_prompt_tokens": 13137000,
                "total_completion_tokens": 669287,
                "volume": 0.8780004331,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "meta-llama/llama-3.1-8b-instruct",
                "category": "trivia",
                "count": 1804,
                "total_prompt_tokens": 639350,
                "total_completion_tokens": 6200,
                "volume": 0.018702475,
                "rank": 7
            }
        ],
        "google/gemini-2.5-flash-lite": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "marketing",
                "count": 5138,
                "total_prompt_tokens": 19811003,
                "total_completion_tokens": 1550916,
                "volume": 1.294499445,
                "rank": 2
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "technology",
                "count": 15532,
                "total_prompt_tokens": 86937346,
                "total_completion_tokens": 8144806,
                "volume": 4.953564093433333,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "translation",
                "count": 9568,
                "total_prompt_tokens": 9797985,
                "total_completion_tokens": 2853191,
                "volume": 1.96591817301,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "legal",
                "count": 1631,
                "total_prompt_tokens": 4395949,
                "total_completion_tokens": 435010,
                "volume": 0.724170027,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "health",
                "count": 3795,
                "total_prompt_tokens": 3335379,
                "total_completion_tokens": 1003887,
                "volume": 0.8050978128,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "academia",
                "count": 1612,
                "total_prompt_tokens": 3753502,
                "total_completion_tokens": 1173738,
                "volume": 0.9613857419,
                "rank": 8
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "marketing/seo",
                "count": 543,
                "total_prompt_tokens": 909103,
                "total_completion_tokens": 94926,
                "volume": 0.1285888524,
                "rank": 9
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "science",
                "count": 7270,
                "total_prompt_tokens": 13589676,
                "total_completion_tokens": 2063695,
                "volume": 2.110919856,
                "rank": 9
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "trivia",
                "count": 543,
                "total_prompt_tokens": 531346,
                "total_completion_tokens": 53508,
                "volume": 0.0630259303,
                "rank": 10
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "finance",
                "count": 5482,
                "total_prompt_tokens": 7165441,
                "total_completion_tokens": 638545,
                "volume": 1.0517388072,
                "rank": 10
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite",
                "category": "roleplay",
                "count": 21035,
                "total_prompt_tokens": 48354219,
                "total_completion_tokens": 1130199,
                "volume": 4.3890588916999995,
                "rank": 10
            }
        ],
        "openai/gpt-4o-mini": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4o-mini",
                "category": "finance",
                "count": 2223,
                "total_prompt_tokens": 16924600,
                "total_completion_tokens": 306443,
                "volume": 2.780786855,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4o-mini",
                "category": "trivia",
                "count": 1433,
                "total_prompt_tokens": 1543771,
                "total_completion_tokens": 16635,
                "volume": 0.17132043900000002,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4o-mini",
                "category": "science",
                "count": 5641,
                "total_prompt_tokens": 23735619,
                "total_completion_tokens": 704597,
                "volume": 4.037689341,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4o-mini",
                "category": "translation",
                "count": 9736,
                "total_prompt_tokens": 2746528,
                "total_completion_tokens": 475198,
                "volume": 0.6885863495,
                "rank": 8
            }
        ],
        "google/gemini-2.0-flash-001": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.0-flash-001",
                "category": "translation",
                "count": 22926,
                "total_prompt_tokens": 11087168,
                "total_completion_tokens": 1622898,
                "volume": 1.862434215,
                "rank": 3
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.0-flash-001",
                "category": "academia",
                "count": 2513,
                "total_prompt_tokens": 7466194,
                "total_completion_tokens": 1841887,
                "volume": 1.342845945,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.0-flash-001",
                "category": "trivia",
                "count": 516,
                "total_prompt_tokens": 665320,
                "total_completion_tokens": 57882,
                "volume": 0.113648232,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.0-flash-001",
                "category": "roleplay",
                "count": 67719,
                "total_prompt_tokens": 43658450,
                "total_completion_tokens": 7086464,
                "volume": 7.0095375933333335,
                "rank": 9
            }
        ],
        "tngtech/deepseek-r1t2-chimera:free": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "tngtech/deepseek-r1t2-chimera:free",
                "category": "roleplay",
                "count": 9190,
                "total_prompt_tokens": 95442040,
                "total_completion_tokens": 7646977,
                "volume": 0.12,
                "rank": 3
            }
        ],
        "anthropic/claude-4.5-haiku-20251001": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-haiku-20251001",
                "category": "health",
                "count": 262,
                "total_prompt_tokens": 4557388,
                "total_completion_tokens": 215336,
                "volume": 6.7674549299999995,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-haiku-20251001",
                "category": "science",
                "count": 1066,
                "total_prompt_tokens": 13496493,
                "total_completion_tokens": 450995,
                "volume": 13.7007391425,
                "rank": 10
            }
        ],
        "anthropic/claude-4.5-opus-20251124": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-opus-20251124",
                "category": "programming",
                "count": 5210,
                "total_prompt_tokens": 228257655,
                "total_completion_tokens": 2318898,
                "volume": 497.071782615,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-opus-20251124",
                "category": "science",
                "count": 1324,
                "total_prompt_tokens": 30815590,
                "total_completion_tokens": 649554,
                "volume": 92.5945990625,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4.5-opus-20251124",
                "category": "technology",
                "count": 3258,
                "total_prompt_tokens": 92579477,
                "total_completion_tokens": 1201066,
                "volume": 280.19274504,
                "rank": 5
            }
        ],
        "openai/gpt-4.1-nano-2025-04-14": [
            {
                "id": 0,
                "date": "2026-01-24",
                "model": "openai/gpt-4.1-nano-2025-04-14",
                "category": "marketing/seo",
                "count": 908,
                "total_prompt_tokens": 2155843,
                "total_completion_tokens": 961508,
                "volume": 0.51574823,
                "rank": 4
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4.1-nano-2025-04-14",
                "category": "finance",
                "count": 1959,
                "total_prompt_tokens": 12503739,
                "total_completion_tokens": 86411,
                "volume": 0.596097646,
                "rank": 8
            }
        ],
        "openai/gpt-5-mini-2025-08-07": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-5-mini-2025-08-07",
                "category": "finance",
                "count": 2817,
                "total_prompt_tokens": 15176992,
                "total_completion_tokens": 1237641,
                "volume": 7.2602494455,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-5-mini-2025-08-07",
                "category": "marketing/seo",
                "count": 525,
                "total_prompt_tokens": 1106759,
                "total_completion_tokens": 279745,
                "volume": 1.41557525,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-5-mini-2025-08-07",
                "category": "technology",
                "count": 3278,
                "total_prompt_tokens": 40591099,
                "total_completion_tokens": 1601342,
                "volume": 12.391080005000001,
                "rank": 8
            }
        ],
        "deepseek/deepseek-chat-v3-0324": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-chat-v3-0324",
                "category": "health",
                "count": 558,
                "total_prompt_tokens": 4308758,
                "total_completion_tokens": 299797,
                "volume": 1.3899661247,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-chat-v3-0324",
                "category": "roleplay",
                "count": 14708,
                "total_prompt_tokens": 79061746,
                "total_completion_tokens": 3325115,
                "volume": 26.21701005124,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-chat-v3-0324",
                "category": "trivia",
                "count": 403,
                "total_prompt_tokens": 555811,
                "total_completion_tokens": 38385,
                "volume": 0.1966826763,
                "rank": 9
            }
        ],
        "google/gemini-2.5-flash-lite-preview-09-2025": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite-preview-09-2025",
                "category": "legal",
                "count": 1076,
                "total_prompt_tokens": 5233542,
                "total_completion_tokens": 140817,
                "volume": 0.535424877,
                "rank": 5
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-flash-lite-preview-09-2025",
                "category": "health",
                "count": 2233,
                "total_prompt_tokens": 3815757,
                "total_completion_tokens": 424381,
                "volume": 0.5059171771000001,
                "rank": 9
            }
        ],
        "mistralai/mistral-small-24b-instruct-2501": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "mistralai/mistral-small-24b-instruct-2501",
                "category": "marketing/seo",
                "count": 3227,
                "total_prompt_tokens": 1646000,
                "total_completion_tokens": 153600,
                "volume": 0.15526883,
                "rank": 5
            }
        ],
        "anthropic/claude-4-sonnet-20250522": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "anthropic/claude-4-sonnet-20250522",
                "category": "health",
                "count": 1008,
                "total_prompt_tokens": 3654025,
                "total_completion_tokens": 897830,
                "volume": 28.639203039999998,
                "rank": 6
            }
        ],
        "openai/gpt-4.1-mini-2025-04-14": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4.1-mini-2025-04-14",
                "category": "marketing/seo",
                "count": 177,
                "total_prompt_tokens": 1637555,
                "total_completion_tokens": 56395,
                "volume": 0.46711184399999994,
                "rank": 6
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-4.1-mini-2025-04-14",
                "category": "translation",
                "count": 4681,
                "total_prompt_tokens": 1943692,
                "total_completion_tokens": 432633,
                "volume": 1.446540652,
                "rank": 10
            }
        ],
        "mistralai/devstral-2512:free": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "mistralai/devstral-2512:free",
                "category": "programming",
                "count": 2916,
                "total_prompt_tokens": 119421491,
                "total_completion_tokens": 1476345,
                "volume": 0.06,
                "rank": 6
            }
        ],
        "minimax/minimax-m2.1": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "minimax/minimax-m2.1",
                "category": "programming",
                "count": 2277,
                "total_prompt_tokens": 103670532,
                "total_completion_tokens": 1221384,
                "volume": 5.0084127714,
                "rank": 7
            }
        ],
        "deepseek/deepseek-chat-v3.1": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-chat-v3.1",
                "category": "roleplay",
                "count": 14823,
                "total_prompt_tokens": 61299217,
                "total_completion_tokens": 1521221,
                "volume": 17.4936888335,
                "rank": 7
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "deepseek/deepseek-chat-v3.1",
                "category": "finance",
                "count": 697,
                "total_prompt_tokens": 12385381,
                "total_completion_tokens": 1316875,
                "volume": 3.709949474,
                "rank": 7
            }
        ],
        "openai/gpt-5.1-20251113": [
            {
                "id": 0,
                "date": "2026-01-24",
                "model": "openai/gpt-5.1-20251113",
                "category": "marketing/seo",
                "count": 31,
                "total_prompt_tokens": 1101866,
                "total_completion_tokens": 22637,
                "volume": 1.6054705,
                "rank": 8
            }
        ],
        "google/gemma-3-12b-it": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemma-3-12b-it",
                "category": "legal",
                "count": 733,
                "total_prompt_tokens": 3536254,
                "total_completion_tokens": 764721,
                "volume": 0.42422915879999995,
                "rank": 8
            }
        ],
        "z-ai/glm-4.6": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "z-ai/glm-4.6",
                "category": "trivia",
                "count": 32,
                "total_prompt_tokens": 611200,
                "total_completion_tokens": 2650,
                "volume": 0.094958016,
                "rank": 8
            }
        ],
        "z-ai/glm-4.7-20251222": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "z-ai/glm-4.7-20251222",
                "category": "programming",
                "count": 3469,
                "total_prompt_tokens": 93287542,
                "total_completion_tokens": 3634332,
                "volume": 48.25153520348,
                "rank": 8
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "z-ai/glm-4.7-20251222",
                "category": "technology",
                "count": 1401,
                "total_prompt_tokens": 36004408,
                "total_completion_tokens": 1451833,
                "volume": 23.15973101437,
                "rank": 10
            }
        ],
        "qwen/qwen3-30b-a3b-04-28": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "qwen/qwen3-30b-a3b-04-28",
                "category": "marketing",
                "count": 948,
                "total_prompt_tokens": 2102350,
                "total_completion_tokens": 726050,
                "volume": 0.48477359,
                "rank": 8
            }
        ],
        "google/gemini-3-pro-preview-20251117": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-pro-preview-20251117",
                "category": "marketing",
                "count": 77,
                "total_prompt_tokens": 2226575,
                "total_completion_tokens": 87360,
                "volume": 4.43219952,
                "rank": 9
            },
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-3-pro-preview-20251117",
                "category": "programming",
                "count": 2091,
                "total_prompt_tokens": 60974690,
                "total_completion_tokens": 2248711,
                "volume": 95.426867561,
                "rank": 10
            }
        ],
        "openai/gpt-5.2-20251211": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-5.2-20251211",
                "category": "academia",
                "count": 1625,
                "total_prompt_tokens": 4304664,
                "total_completion_tokens": 351223,
                "volume": 16.587270996,
                "rank": 9
            }
        ],
        "google/gemini-2.5-pro": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "google/gemini-2.5-pro",
                "category": "academia",
                "count": 342,
                "total_prompt_tokens": 3960607,
                "total_completion_tokens": 673794,
                "volume": 14.30496995,
                "rank": 10
            }
        ],
        "openai/gpt-oss-20b": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "openai/gpt-oss-20b",
                "category": "marketing",
                "count": 220,
                "total_prompt_tokens": 1838140,
                "total_completion_tokens": 209244,
                "volume": 0.13806193565,
                "rank": 10
            }
        ],
        "qwen/qwen3-embedding-8b": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "qwen/qwen3-embedding-8b",
                "category": "legal",
                "count": 233,
                "total_prompt_tokens": 2744490,
                "total_completion_tokens": 0,
                "volume": 0.03424931,
                "rank": 10
            }
        ],
        "meta-llama/llama-3-8b-instruct": [
            {
                "id": 0,
                "date": "2026-01-25",
                "model": "meta-llama/llama-3-8b-instruct",
                "category": "health",
                "count": 908,
                "total_prompt_tokens": 3823250,
                "total_completion_tokens": 9200,
                "volume": 0.02727106,
                "rank": 10
            }
        ]
    }
}