{
  "name": "AI Gateway",
  "version": "2.0.0",
  "auth": {
    "header": "Authorization: Bearer <key> 或 x-api-key: <key>",
    "note": "/ 和 /health 无需认证，其他端点均需认证"
  },
  "services": [
    {
      "name": "LLM + Vision (exo 集群)",
      "desc": "大语言模型 + 多模态视觉理解，4台 Mac Studio 分布式集群",
      "backend": "exo (MLX tensor parallelism + Thunderbolt 5 RDMA)",
      "api_formats": [
        "OpenAI Chat Completions: POST /v1/chat/completions",
        "OpenAI Responses API:    POST /v1/responses",
        "Claude Messages API:     POST /v1/messages (x-api-key 认证)",
        "Ollama API:              POST /ollama/api/chat"
      ],
      "models": ["mlx-community/Qwen3.5-397B-A17B-8bit"],
      "capabilities": [
        "文本对话、推理、代码生成",
        "图片理解、OCR、文档分析 (原生多模态，content 传 image_url)",
        "PDF 理解 (dashboard 支持)",
        "Thinking 模式开关 (enable_thinking 参数)",
        "Tool Calling / Function Calling",
        "图片生成 (需服务端启用 EXO_ENABLE_IMAGE_MODELS=true)"
      ],
      "other_endpoints": [
        "GET  /v1/models             - 可用模型列表",
        "POST /v1/images/generations  - 图片生成",
        "POST /v1/images/edits        - 图片编辑"
      ],
      "examples": {
        "text_chat": "curl -X POST https://ai.im.app/v1/chat/completions -H \"Authorization: Bearer <key>\" -H \"Content-Type: application/json\" -d '{\"model\":\"mlx-community/Qwen3.5-397B-A17B-8bit\",\"messages\":[{\"role\":\"user\",\"content\":\"hello\"}]}'",
        "vision": "curl -X POST https://ai.im.app/v1/chat/completions -H \"Authorization: Bearer <key>\" -H \"Content-Type: application/json\" -d '{\"model\":\"mlx-community/Qwen3.5-397B-A17B-8bit\",\"messages\":[{\"role\":\"user\",\"content\":[{\"type\":\"text\",\"text\":\"描述这张图片\"},{\"type\":\"image_url\",\"image_url\":{\"url\":\"data:image/jpeg;base64,...\"}}]}]}'",
        "no_thinking": "curl -X POST https://ai.im.app/v1/chat/completions -H \"Authorization: Bearer <key>\" -H \"Content-Type: application/json\" -d '{\"model\":\"mlx-community/Qwen3.5-397B-A17B-8bit\",\"messages\":[{\"role\":\"user\",\"content\":\"hello\"}],\"enable_thinking\":false}'"
      }
    },
    {
      "name": "ASR 语音识别 (Qwen3-ASR)",
      "desc": "语音转文字，支持中文(含22种方言)、英日韩法德等30+种语言",
      "backend": "mlx-qwen3-asr (4 节点 least_conn 负载均衡)",
      "api_format": "OpenAI Audio API: POST /v1/audio/transcriptions",
      "models": ["Qwen/Qwen3-ASR-1.7B"],
      "request_format": "multipart/form-data，file 字段上传音频文件",
      "supported_formats": "wav, mp3, m4a, flac, ogg 等",
      "examples": {
        "curl": "curl -X POST https://ai.im.app/v1/audio/transcriptions -H \"Authorization: Bearer <key>\" -F \"file=@audio.wav\" -F \"model=Qwen/Qwen3-ASR-1.7B\"",
        "openai_sdk": "from openai import OpenAI; client = OpenAI(api_key=\"<key>\", base_url=\"https://ai.im.app/v1\"); result = client.audio.transcriptions.create(model=\"Qwen/Qwen3-ASR-1.7B\", file=open(\"audio.wav\",\"rb\")); print(result.text)"
      }
    }
  ]
}
