models.json

  1{
  2	"providers": {
  3		"plexus": {
  4			"baseUrl": "http://100.77.116.78:4000/v1",
  5			"apiKey": "!fnox get PLEXUS_API_KEY",
  6			"api": "openai-completions",
  7			"models": [
  8				{
  9					"id": "claude-opus-4.6",
 10					"name": "Claude Opus 4.6",
 11					"reasoning": true,
 12					"input": ["text", "image"],
 13					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 14					"contextWindow": 200000,
 15					"maxTokens": 50000,
 16					"compat": {
 17						"supportsReasoningEffort": true,
 18						"supportsDeveloperRole": false
 19					}
 20				},
 21				{
 22					"id": "claude-sonnet-4.6",
 23					"name": "Claude Sonnet 4.6",
 24					"reasoning": true,
 25					"input": ["text", "image"],
 26					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 27					"contextWindow": 200000,
 28					"maxTokens": 50000,
 29					"compat": {
 30						"supportsReasoningEffort": true,
 31						"supportsDeveloperRole": false
 32					}
 33				},
 34				{
 35					"id": "gpt-5.4",
 36					"name": "GPT 5.4",
 37					"reasoning": true,
 38					"supportsReasoningEffort": true,
 39					"supportsDeveloperRole": false,
 40					"input": ["text", "image"],
 41					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 42					"contextWindow": 400000,
 43					"maxTokens": 128000
 44				},
 45				{
 46					"id": "gpt-5.3-codex",
 47					"name": "GPT 5.3 Codex",
 48					"reasoning": true,
 49					"input": ["text", "image"],
 50					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 51					"contextWindow": 400000,
 52					"maxTokens": 128000,
 53					"compat": {
 54						"supportsReasoningEffort": true,
 55						"supportsDeveloperRole": false
 56					}
 57				},
 58				{
 59					"id": "kimi-k2.5h",
 60					"name": "Kimi K2.5h",
 61					"reasoning": true,
 62					"input": ["text", "image"],
 63					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 64					"contextWindow": 262144,
 65					"maxTokens": 32768,
 66					"compat": {
 67						"supportsReasoningEffort": true,
 68						"supportsDeveloperRole": false
 69					}
 70				},
 71				{
 72					"id": "glm-5",
 73					"name": "GLM 5",
 74					"reasoning": true,
 75					"input": ["text"],
 76					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 77					"contextWindow": 202752,
 78					"maxTokens": 20275,
 79					"compat": {
 80						"supportsReasoningEffort": true,
 81						"supportsDeveloperRole": false
 82					}
 83				},
 84				{
 85					"id": "glm-4.7",
 86					"name": "GLM 4.7",
 87					"reasoning": true,
 88					"input": ["text"],
 89					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
 90					"contextWindow": 202752,
 91					"maxTokens": 20275,
 92					"compat": {
 93						"supportsReasoningEffort": true,
 94						"supportsDeveloperRole": false
 95					}
 96				},
 97				{
 98					"id": "minimax-m2.5",
 99					"name": "MiniMax M2.5",
100					"reasoning": true,
101					"input": ["text"],
102					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
103					"contextWindow": 196608,
104					"maxTokens": 19660,
105					"compat": {
106						"supportsReasoningEffort": true,
107						"supportsDeveloperRole": false
108					}
109				},
110				{
111					"id": "qwen3.5-397b-a17b",
112					"name": "Qwen3.5 397B A17B",
113					"reasoning": true,
114					"input": ["text"],
115					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
116					"contextWindow": 262144,
117					"maxTokens": 65536,
118					"compat": {
119						"supportsReasoningEffort": true,
120						"supportsDeveloperRole": false
121					}
122				},
123				{
124					"id": "gpt-oss-120b",
125					"name": "GPT OSS 120B",
126					"reasoning": true,
127					"input": ["text", "image"],
128					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
129					"contextWindow": 131072,
130					"maxTokens": 13107,
131					"compat": {
132						"supportsReasoningEffort": true,
133						"supportsDeveloperRole": false
134					}
135				},
136				{
137					"id": "diff-apply",
138					"name": "Diff Apply",
139					"reasoning": false,
140					"supportsDeveloperRole": false,
141					"input": ["text"],
142					"cost": { "input": 0, "output": 0, "cacheRead": 0, "cacheWrite": 0 },
143					"contextWindow": 256000,
144					"maxTokens": 64000
145				}
146			]
147		}
148	}
149}