Skip to content

Commit 4d6a4e0

Browse files
committed
Add OpenRouter embedding models to catalog
- text-embedding-3-small via OpenRouter ($0.02/MTok) - text-embedding-3-large via OpenRouter ($0.13/MTok) - qwen3-embedding-8b ($0.01/MTok) - qwen3-embedding-4b ($0.02/MTok) Embedding catalog now has 11 models (was 7).
1 parent b88cfcf commit 4d6a4e0

2 files changed

Lines changed: 91 additions & 0 deletions

File tree

internal/ai/models/embedding_catalog.json

Lines changed: 68 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -117,5 +117,73 @@
117117
"provider": "cohere",
118118
"supportsDimCtrl": false,
119119
"supportsTaskType": true
120+
},
121+
{
122+
"api": "openai-embeddings",
123+
"baseUrl": "https://openrouter.ai/api/v1",
124+
"cost": {
125+
"perMTok": 0.02
126+
},
127+
"defaultDims": 1536,
128+
"id": "openai/text-embedding-3-small",
129+
"maxBatchSize": 2048,
130+
"maxDims": 1536,
131+
"maxInputTokens": 8192,
132+
"minDims": 256,
133+
"name": "Text Embedding 3 Small (OpenRouter)",
134+
"provider": "openrouter",
135+
"supportsDimCtrl": true,
136+
"supportsTaskType": false
137+
},
138+
{
139+
"api": "openai-embeddings",
140+
"baseUrl": "https://openrouter.ai/api/v1",
141+
"cost": {
142+
"perMTok": 0.13
143+
},
144+
"defaultDims": 3072,
145+
"id": "openai/text-embedding-3-large",
146+
"maxBatchSize": 2048,
147+
"maxDims": 3072,
148+
"maxInputTokens": 8192,
149+
"minDims": 256,
150+
"name": "Text Embedding 3 Large (OpenRouter)",
151+
"provider": "openrouter",
152+
"supportsDimCtrl": true,
153+
"supportsTaskType": false
154+
},
155+
{
156+
"api": "openai-embeddings",
157+
"baseUrl": "https://openrouter.ai/api/v1",
158+
"cost": {
159+
"perMTok": 0.01
160+
},
161+
"defaultDims": 1024,
162+
"id": "qwen/qwen3-embedding-8b",
163+
"maxBatchSize": 2048,
164+
"maxDims": 1024,
165+
"maxInputTokens": 32000,
166+
"minDims": 1024,
167+
"name": "Qwen3 Embedding 8B",
168+
"provider": "openrouter",
169+
"supportsDimCtrl": false,
170+
"supportsTaskType": false
171+
},
172+
{
173+
"api": "openai-embeddings",
174+
"baseUrl": "https://openrouter.ai/api/v1",
175+
"cost": {
176+
"perMTok": 0.02
177+
},
178+
"defaultDims": 1024,
179+
"id": "qwen/qwen3-embedding-4b",
180+
"maxBatchSize": 2048,
181+
"maxDims": 1024,
182+
"maxInputTokens": 32768,
183+
"minDims": 1024,
184+
"name": "Qwen3 Embedding 4B",
185+
"provider": "openrouter",
186+
"supportsDimCtrl": false,
187+
"supportsTaskType": false
120188
}
121189
]

scripts/update-model-catalog.py

Lines changed: 23 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -381,6 +381,29 @@ def embedding_model(id_, name, api, provider, base_url, max_input, default_dims,
381381
"cohere-embeddings", "cohere", "https://api.cohere.com/v2",
382382
512, 1024, 1024, 1024, 96, False, True, 0.1,
383383
),
384+
# OpenRouter embeddings -- source: https://openrouter.ai/models (embedding models)
385+
# OpenRouter uses OpenAI-compatible embeddings API at /api/v1/embeddings
386+
# Pricing is pass-through from underlying providers (no markup)
387+
embedding_model(
388+
"openai/text-embedding-3-small", "Text Embedding 3 Small (OpenRouter)",
389+
"openai-embeddings", "openrouter", "https://openrouter.ai/api/v1",
390+
8192, 1536, 1536, 256, 2048, True, False, 0.02,
391+
),
392+
embedding_model(
393+
"openai/text-embedding-3-large", "Text Embedding 3 Large (OpenRouter)",
394+
"openai-embeddings", "openrouter", "https://openrouter.ai/api/v1",
395+
8192, 3072, 3072, 256, 2048, True, False, 0.13,
396+
),
397+
embedding_model(
398+
"qwen/qwen3-embedding-8b", "Qwen3 Embedding 8B",
399+
"openai-embeddings", "openrouter", "https://openrouter.ai/api/v1",
400+
32000, 1024, 1024, 1024, 2048, False, False, 0.01,
401+
),
402+
embedding_model(
403+
"qwen/qwen3-embedding-4b", "Qwen3 Embedding 4B",
404+
"openai-embeddings", "openrouter", "https://openrouter.ai/api/v1",
405+
32768, 1024, 1024, 1024, 2048, False, False, 0.02,
406+
),
384407
]
385408

386409

0 commit comments

Comments
 (0)