zai.json

  1{
  2  "name": "Z.AI",
  3  "id": "zai",
  4  "api_key": "$ZAI_API_KEY",
  5  "api_endpoint": "https://api.z.ai/api/coding/paas/v4",
  6  "type": "openai-compat",
  7  "default_large_model_id": "glm-4.7",
  8  "default_small_model_id": "glm-4.7-flash",
  9  "models": [
 10    {
 11      "id": "glm-5.1",
 12      "name": "GLM-5.1",
 13      "cost_per_1m_in": 1.0,
 14      "cost_per_1m_out": 3.2,
 15      "cost_per_1m_in_cached": 0.2,
 16      "context_window": 204800,
 17      "default_max_tokens": 65536,
 18      "can_reason": true,
 19      "supports_attachments": false
 20    },
 21    {
 22      "id": "glm-5-turbo",
 23      "name": "GLM-5-Turbo",
 24      "cost_per_1m_in": 1.2,
 25      "cost_per_1m_out": 4.0,
 26      "cost_per_1m_in_cached": 0.24,
 27      "context_window": 200000,
 28      "default_max_tokens": 128000,
 29      "can_reason": true,
 30      "supports_attachments": false
 31    },
 32    {
 33      "id": "glm-5",
 34      "name": "GLM-5",
 35      "cost_per_1m_in": 1.0,
 36      "cost_per_1m_out": 3.2,
 37      "cost_per_1m_in_cached": 0.2,
 38      "context_window": 204800,
 39      "default_max_tokens": 65536,
 40      "can_reason": true,
 41      "supports_attachments": false
 42    },
 43    {
 44      "id": "glm-4.7",
 45      "name": "GLM-4.7",
 46      "cost_per_1m_in": 0.42,
 47      "cost_per_1m_out": 2.2,
 48      "cost_per_1m_in_cached": 0.11,
 49      "context_window": 204800,
 50      "default_max_tokens": 98000,
 51      "can_reason": true,
 52      "supports_attachments": false
 53    },
 54    {
 55      "id": "glm-4.7-flash",
 56      "name": "GLM-4.7-Flash",
 57      "cost_per_1m_in": 0.07,
 58      "cost_per_1m_out": 0.4,
 59      "cost_per_1m_in_cached": 0.01,
 60      "context_window": 200000,
 61      "default_max_tokens": 65550,
 62      "can_reason": true,
 63      "supports_attachments": false
 64    },
 65    {
 66      "id": "glm-4.6",
 67      "name": "GLM-4.6",
 68      "cost_per_1m_in": 0.39,
 69      "cost_per_1m_out": 1.9,
 70      "cost_per_1m_in_cached": 0.11,
 71      "context_window": 204800,
 72      "default_max_tokens": 102400,
 73      "can_reason": true,
 74      "supports_attachments": false
 75    },
 76    {
 77      "id": "glm-4.6v",
 78      "name": "GLM-4.6V",
 79      "cost_per_1m_in": 0.3,
 80      "cost_per_1m_out": 0.9,
 81      "context_window": 131072,
 82      "default_max_tokens": 65536,
 83      "can_reason": true,
 84      "supports_attachments": true
 85    },
 86    {
 87      "id": "glm-4.5",
 88      "name": "GLM-4.5",
 89      "cost_per_1m_in": 0.6,
 90      "cost_per_1m_out": 2.2,
 91      "cost_per_1m_in_cached": 0.11,
 92      "context_window": 131072,
 93      "default_max_tokens": 49152,
 94      "can_reason": true,
 95      "supports_attachments": false
 96    },
 97    {
 98      "id": "glm-4.5-air",
 99      "name": "GLM-4.5-Air",
100      "cost_per_1m_in": 0.13,
101      "cost_per_1m_out": 0.85,
102      "cost_per_1m_in_cached": 0.03,
103      "context_window": 131072,
104      "default_max_tokens": 49152,
105      "can_reason": true,
106      "supports_attachments": false
107    },
108    {
109      "id": "glm-4.5v",
110      "name": "GLM-4.5V",
111      "cost_per_1m_in": 0.6,
112      "cost_per_1m_out": 1.8,
113      "cost_per_1m_in_cached": 0.11,
114      "context_window": 65536,
115      "default_max_tokens": 8192,
116      "can_reason": true,
117      "supports_attachments": true
118    }
119  ]
120}