@@ -21,6 +21,10 @@ class ModelPricing:
2121# Pricing per model ($/1M tokens). Keep in sync with infra pricing.
2222MODEL_PRICING : dict [str , ModelPricing ] = {
2323 # Qwen models
24+ "Qwen/Qwen3.5-4B" : ModelPricing (prefill = 0.22 , sample = 0.67 , train = 0.67 ),
25+ "Qwen/Qwen3.5-27B" : ModelPricing (prefill = 1.24 , sample = 3.73 , train = 3.73 ),
26+ "Qwen/Qwen3.5-35B-A3B" : ModelPricing (prefill = 0.36 , sample = 0.89 , train = 1.07 ),
27+ "Qwen/Qwen3.5-397B-A17B" : ModelPricing (prefill = 2.00 , sample = 5.00 , train = 6.00 ),
2428 "Qwen/Qwen3-4B-Instruct-2507" : ModelPricing (prefill = 0.07 , sample = 0.22 , train = 0.22 ),
2529 "Qwen/Qwen3-8B" : ModelPricing (prefill = 0.13 , sample = 0.40 , train = 0.40 ),
2630 "Qwen/Qwen3-8B-Base" : ModelPricing (prefill = 0.13 , sample = 0.40 , train = 0.40 ),
@@ -60,6 +64,7 @@ class ModelPricing:
6064 "openai/gpt-oss-20b" : ModelPricing (prefill = 0.12 , sample = 0.30 , train = 0.36 ),
6165 # Moonshot models
6266 "moonshotai/Kimi-K2-Thinking" : ModelPricing (prefill = 0.98 , sample = 2.44 , train = 2.93 ),
67+ "moonshotai/Kimi-K2.5" : ModelPricing (prefill = 1.47 , sample = 3.66 , train = 4.40 ),
6368}
6469
6570
0 commit comments