objectiveai-sdk 2.0.8

{
  "title": "agent.openrouter.ProviderQuantization",
  "description": "Model quantization levels for provider filtering.\n\nQuantization reduces model precision to decrease memory usage and increase inference speed, potentially at the cost of output quality.",
  "anyOf": [
    {
      "title": "Int4",
      "description": "4-bit integer quantization.",
      "type": "string",
      "enum": [
        "int4"
      ]
    },
    {
      "title": "Int8",
      "description": "8-bit integer quantization.",
      "type": "string",
      "enum": [
        "int8"
      ]
    },
    {
      "title": "Fp4",
      "description": "4-bit floating point quantization.",
      "type": "string",
      "enum": [
        "fp4"
      ]
    },
    {
      "title": "Fp6",
      "description": "6-bit floating point quantization.",
      "type": "string",
      "enum": [
        "fp6"
      ]
    },
    {
      "title": "Fp8",
      "description": "8-bit floating point quantization.",
      "type": "string",
      "enum": [
        "fp8"
      ]
    },
    {
      "title": "Fp16",
      "description": "16-bit floating point (half precision).",
      "type": "string",
      "enum": [
        "fp16"
      ]
    },
    {
      "title": "Bf16",
      "description": "16-bit brain floating point (bfloat16).",
      "type": "string",
      "enum": [
        "bf16"
      ]
    },
    {
      "title": "Fp32",
      "description": "32-bit floating point (full precision).",
      "type": "string",
      "enum": [
        "fp32"
      ]
    },
    {
      "title": "Unknown",
      "description": "Unknown quantization level.",
      "type": "string",
      "enum": [
        "unknown"
      ]
    }
  ]
}