{
"title": "agent.openrouter.ProviderQuantization",
"description": "Model quantization levels for provider filtering.\n\nQuantization reduces model precision to decrease memory usage and\nincrease inference speed, potentially at the cost of output quality.",
"anyOf": [
{
"title": "Int4",
"description": "4-bit integer quantization.",
"type": "string",
"enum": [
"int4"
]
},
{
"title": "Int8",
"description": "8-bit integer quantization.",
"type": "string",
"enum": [
"int8"
]
},
{
"title": "Fp4",
"description": "4-bit floating point quantization.",
"type": "string",
"enum": [
"fp4"
]
},
{
"title": "Fp6",
"description": "6-bit floating point quantization.",
"type": "string",
"enum": [
"fp6"
]
},
{
"title": "Fp8",
"description": "8-bit floating point quantization.",
"type": "string",
"enum": [
"fp8"
]
},
{
"title": "Fp16",
"description": "16-bit floating point (half precision).",
"type": "string",
"enum": [
"fp16"
]
},
{
"title": "Bf16",
"description": "16-bit brain floating point.",
"type": "string",
"enum": [
"bf16"
]
},
{
"title": "Fp32",
"description": "32-bit floating point (full precision).",
"type": "string",
"enum": [
"fp32"
]
},
{
"title": "Unknown",
"description": "Unknown quantization level.",
"type": "string",
"enum": [
"unknown"
]
}
]
}