Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 2 additions & 0 deletions packages/proxy/schema/index.ts
Original file line number Diff line number Diff line change
Expand Up @@ -605,6 +605,8 @@ export const AvailableEndpointTypes: { [name: string]: ModelEndpointType[] } = {
"moonshotai/Kimi-K2-Instruct": ["baseten"],
"deepseek-ai/DeepSeek-V3-0324": ["baseten"],
"publishers/moonshotai/models/kimi-k2.5": ["azure"],
"fireworks_ai/accounts/fireworks/models/glm-4p7": ["fireworks"],
"fireworks_ai/accounts/fireworks/models/qwen3-vl-30b-a3b-instruct": ["fireworks"]
};

export function getModelEndpointTypes(model: string): ModelEndpointType[] {
Expand Down
24 changes: 24 additions & 0 deletions packages/proxy/schema/model_list.json
Original file line number Diff line number Diff line change
Expand Up @@ -6496,5 +6496,29 @@
"displayName": "Kimi K2.5",
"max_input_tokens": 256000,
"max_output_tokens": 65535
},
"fireworks_ai/accounts/fireworks/models/glm-4p7": {
"format": "openai",
"flavor": "chat",
"input_cost_per_mil_tokens": 0.6,
"output_cost_per_mil_tokens": 2.2,
"displayName": "GLM-4.7",
"max_input_tokens": 200000,
"max_output_tokens": 128000,
"available_providers": [
"fireworks"
]
},
"fireworks_ai/accounts/fireworks/models/qwen3-vl-30b-a3b-instruct": {
Copy link
Copy Markdown

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

[P2] Register provider mapping for qwen3-vl model

This new model is added to `model_list.json` but not to `AvailableEndpointTypes`, so `getModelEndpointTypes()` falls back to `DefaultEndpointTypes["openai"]` (openai/azure) instead of fireworks. In the edge fallback path (when the `/api/secret` lookup fails), the auth token is then tagged with the wrong provider type, and requests for this model can be routed to the wrong endpoint or auth scheme. Please add `fireworks_ai/accounts/fireworks/models/qwen3-vl-30b-a3b-instruct` to `AvailableEndpointTypes`, like `glm-4p7`.

Useful? React with 👍 / 👎.

"format": "openai",
"flavor": "chat",
"input_cost_per_mil_tokens": 0.13,
"output_cost_per_mil_tokens": 0.52,
"displayName": "Qwen3 VL 30B A3B Instruct",
"max_input_tokens": 128000,
"max_output_tokens": 32000,
"available_providers": [
"fireworks"
]
}
}
Loading