@@ -65,6 +65,8 @@ pub enum EmbeddingModel {
65
65
GTELargeENV15Q ,
66
66
/// Qdrant/clip-ViT-B-32-text
67
67
ClipVitB32 ,
68
+ /// jinaai/jina-embeddings-v2-base-code
69
+ JinaEmbeddingsV2BaseCode ,
68
70
}
69
71
70
72
/// Centralized function to initialize the models map.
@@ -76,62 +78,71 @@ fn init_models_map() -> HashMap<EmbeddingModel, ModelInfo<EmbeddingModel>> {
76
78
description: String :: from( "Sentence Transformer model, MiniLM-L6-v2" ) ,
77
79
model_code: String :: from( "Qdrant/all-MiniLM-L6-v2-onnx" ) ,
78
80
model_file: String :: from( "model.onnx" ) ,
81
+ additional_files: Vec :: new( ) ,
79
82
} ,
80
83
ModelInfo {
81
84
model: EmbeddingModel :: AllMiniLML6V2Q ,
82
85
dim: 384 ,
83
86
description: String :: from( "Quantized Sentence Transformer model, MiniLM-L6-v2" ) ,
84
87
model_code: String :: from( "Xenova/all-MiniLM-L6-v2" ) ,
85
88
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
89
+ additional_files: Vec :: new( ) ,
86
90
} ,
87
91
ModelInfo {
88
92
model: EmbeddingModel :: AllMiniLML12V2 ,
89
93
dim: 384 ,
90
94
description: String :: from( "Sentence Transformer model, MiniLM-L12-v2" ) ,
91
95
model_code: String :: from( "Xenova/all-MiniLM-L12-v2" ) ,
92
96
model_file: String :: from( "onnx/model.onnx" ) ,
97
+ additional_files: Vec :: new( ) ,
93
98
} ,
94
99
ModelInfo {
95
100
model: EmbeddingModel :: AllMiniLML12V2Q ,
96
101
dim: 384 ,
97
102
description: String :: from( "Quantized Sentence Transformer model, MiniLM-L12-v2" ) ,
98
103
model_code: String :: from( "Xenova/all-MiniLM-L12-v2" ) ,
99
104
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
105
+ additional_files: Vec :: new( ) ,
100
106
} ,
101
107
ModelInfo {
102
108
model: EmbeddingModel :: BGEBaseENV15 ,
103
109
dim: 768 ,
104
110
description: String :: from( "v1.5 release of the base English model" ) ,
105
111
model_code: String :: from( "Xenova/bge-base-en-v1.5" ) ,
106
112
model_file: String :: from( "onnx/model.onnx" ) ,
113
+ additional_files: Vec :: new( ) ,
107
114
} ,
108
115
ModelInfo {
109
116
model: EmbeddingModel :: BGEBaseENV15Q ,
110
117
dim: 768 ,
111
118
// Quantized counterpart of BGEBaseENV15: same 768-dim base-sized model, not the large one.
description: String :: from( "Quantized v1.5 release of the base English model" ) ,
112
119
model_code: String :: from( "Qdrant/bge-base-en-v1.5-onnx-Q" ) ,
113
120
model_file: String :: from( "model_optimized.onnx" ) ,
121
+ additional_files: Vec :: new( ) ,
114
122
} ,
115
123
ModelInfo {
116
124
model: EmbeddingModel :: BGELargeENV15 ,
117
125
dim: 1024 ,
118
126
description: String :: from( "v1.5 release of the large English model" ) ,
119
127
model_code: String :: from( "Xenova/bge-large-en-v1.5" ) ,
120
128
model_file: String :: from( "onnx/model.onnx" ) ,
129
+ additional_files: Vec :: new( ) ,
121
130
} ,
122
131
ModelInfo {
123
132
model: EmbeddingModel :: BGELargeENV15Q ,
124
133
dim: 1024 ,
125
134
description: String :: from( "Quantized v1.5 release of the large English model" ) ,
126
135
model_code: String :: from( "Qdrant/bge-large-en-v1.5-onnx-Q" ) ,
127
136
model_file: String :: from( "model_optimized.onnx" ) ,
137
+ additional_files: Vec :: new( ) ,
128
138
} ,
129
139
ModelInfo {
130
140
model: EmbeddingModel :: BGESmallENV15 ,
131
141
dim: 384 ,
132
142
description: String :: from( "v1.5 release of the fast and default English model" ) ,
133
143
model_code: String :: from( "Xenova/bge-small-en-v1.5" ) ,
134
144
model_file: String :: from( "onnx/model.onnx" ) ,
145
+ additional_files: Vec :: new( ) ,
135
146
} ,
136
147
ModelInfo {
137
148
model: EmbeddingModel :: BGESmallENV15Q ,
@@ -141,20 +152,23 @@ fn init_models_map() -> HashMap<EmbeddingModel, ModelInfo<EmbeddingModel>> {
141
152
) ,
142
153
model_code: String :: from( "Qdrant/bge-small-en-v1.5-onnx-Q" ) ,
143
154
model_file: String :: from( "model_optimized.onnx" ) ,
155
+ additional_files: Vec :: new( ) ,
144
156
} ,
145
157
ModelInfo {
146
158
model: EmbeddingModel :: NomicEmbedTextV1 ,
147
159
dim: 768 ,
148
160
description: String :: from( "8192 context length english model" ) ,
149
161
model_code: String :: from( "nomic-ai/nomic-embed-text-v1" ) ,
150
162
model_file: String :: from( "onnx/model.onnx" ) ,
163
+ additional_files: Vec :: new( ) ,
151
164
} ,
152
165
ModelInfo {
153
166
model: EmbeddingModel :: NomicEmbedTextV15 ,
154
167
dim: 768 ,
155
168
description: String :: from( "v1.5 release of the 8192 context length english model" ) ,
156
169
model_code: String :: from( "nomic-ai/nomic-embed-text-v1.5" ) ,
157
170
model_file: String :: from( "onnx/model.onnx" ) ,
171
+ additional_files: Vec :: new( ) ,
158
172
} ,
159
173
ModelInfo {
160
174
model: EmbeddingModel :: NomicEmbedTextV15Q ,
@@ -164,20 +178,23 @@ fn init_models_map() -> HashMap<EmbeddingModel, ModelInfo<EmbeddingModel>> {
164
178
) ,
165
179
model_code: String :: from( "nomic-ai/nomic-embed-text-v1.5" ) ,
166
180
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
181
+ additional_files: Vec :: new( ) ,
167
182
} ,
168
183
ModelInfo {
169
184
model: EmbeddingModel :: ParaphraseMLMiniLML12V2Q ,
170
185
dim: 384 ,
171
186
description: String :: from( "Quantized Multi-lingual model" ) ,
172
187
model_code: String :: from( "Qdrant/paraphrase-multilingual-MiniLM-L12-v2-onnx-Q" ) ,
173
188
model_file: String :: from( "model_optimized.onnx" ) ,
189
+ additional_files: Vec :: new( ) ,
174
190
} ,
175
191
ModelInfo {
176
192
model: EmbeddingModel :: ParaphraseMLMiniLML12V2 ,
177
193
dim: 384 ,
178
194
description: String :: from( "Multi-lingual model" ) ,
179
195
model_code: String :: from( "Xenova/paraphrase-multilingual-MiniLM-L12-v2" ) ,
180
196
model_file: String :: from( "onnx/model.onnx" ) ,
197
+ additional_files: Vec :: new( ) ,
181
198
} ,
182
199
ModelInfo {
183
200
model: EmbeddingModel :: ParaphraseMLMpnetBaseV2 ,
@@ -187,83 +204,103 @@ fn init_models_map() -> HashMap<EmbeddingModel, ModelInfo<EmbeddingModel>> {
187
204
) ,
188
205
model_code: String :: from( "Xenova/paraphrase-multilingual-mpnet-base-v2" ) ,
189
206
model_file: String :: from( "onnx/model.onnx" ) ,
207
+ additional_files: Vec :: new( ) ,
190
208
} ,
191
209
ModelInfo {
192
210
model: EmbeddingModel :: BGESmallZHV15 ,
193
211
dim: 512 ,
194
212
description: String :: from( "v1.5 release of the small Chinese model" ) ,
195
213
model_code: String :: from( "Xenova/bge-small-zh-v1.5" ) ,
196
214
model_file: String :: from( "onnx/model.onnx" ) ,
215
+ additional_files: Vec :: new( ) ,
197
216
} ,
198
217
ModelInfo {
199
218
model: EmbeddingModel :: MultilingualE5Small ,
200
219
dim: 384 ,
201
220
description: String :: from( "Small model of multilingual E5 Text Embeddings" ) ,
202
221
model_code: String :: from( "intfloat/multilingual-e5-small" ) ,
203
222
model_file: String :: from( "onnx/model.onnx" ) ,
223
+ additional_files: Vec :: new( ) ,
204
224
} ,
205
225
ModelInfo {
206
226
model: EmbeddingModel :: MultilingualE5Base ,
207
227
dim: 768 ,
208
228
description: String :: from( "Base model of multilingual E5 Text Embeddings" ) ,
209
229
model_code: String :: from( "intfloat/multilingual-e5-base" ) ,
210
230
model_file: String :: from( "onnx/model.onnx" ) ,
231
+ additional_files: Vec :: new( ) ,
211
232
} ,
212
233
ModelInfo {
213
234
model: EmbeddingModel :: MultilingualE5Large ,
214
235
dim: 1024 ,
215
236
description: String :: from( "Large model of multilingual E5 Text Embeddings" ) ,
216
237
model_code: String :: from( "Qdrant/multilingual-e5-large-onnx" ) ,
217
238
model_file: String :: from( "model.onnx" ) ,
239
+ additional_files: vec![ "model.onnx_data" . to_string( ) ] ,
218
240
} ,
219
241
ModelInfo {
220
242
model: EmbeddingModel :: MxbaiEmbedLargeV1 ,
221
243
dim: 1024 ,
222
244
description: String :: from( "Large English embedding model from MixedBreed.ai" ) ,
223
245
model_code: String :: from( "mixedbread-ai/mxbai-embed-large-v1" ) ,
224
246
model_file: String :: from( "onnx/model.onnx" ) ,
247
+ additional_files: Vec :: new( ) ,
225
248
} ,
226
249
ModelInfo {
227
250
model: EmbeddingModel :: MxbaiEmbedLargeV1Q ,
228
251
dim: 1024 ,
229
252
description: String :: from( "Quantized Large English embedding model from MixedBreed.ai" ) ,
230
253
model_code: String :: from( "mixedbread-ai/mxbai-embed-large-v1" ) ,
231
254
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
255
+ additional_files: Vec :: new( ) ,
232
256
} ,
233
257
ModelInfo {
234
258
model: EmbeddingModel :: GTEBaseENV15 ,
235
259
dim: 768 ,
236
260
description: String :: from( "Large multilingual embedding model from Alibaba" ) ,
237
261
model_code: String :: from( "Alibaba-NLP/gte-base-en-v1.5" ) ,
238
262
model_file: String :: from( "onnx/model.onnx" ) ,
263
+ additional_files: Vec :: new( ) ,
239
264
} ,
240
265
ModelInfo {
241
266
model: EmbeddingModel :: GTEBaseENV15Q ,
242
267
dim: 768 ,
243
268
description: String :: from( "Quantized Large multilingual embedding model from Alibaba" ) ,
244
269
model_code: String :: from( "Alibaba-NLP/gte-base-en-v1.5" ) ,
245
270
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
271
+ additional_files: Vec :: new( ) ,
246
272
} ,
247
273
ModelInfo {
248
274
model: EmbeddingModel :: GTELargeENV15 ,
249
275
dim: 1024 ,
250
276
description: String :: from( "Large multilingual embedding model from Alibaba" ) ,
251
277
model_code: String :: from( "Alibaba-NLP/gte-large-en-v1.5" ) ,
252
278
model_file: String :: from( "onnx/model.onnx" ) ,
279
+ additional_files: Vec :: new( ) ,
253
280
} ,
254
281
ModelInfo {
255
282
model: EmbeddingModel :: GTELargeENV15Q ,
256
283
dim: 1024 ,
257
284
description: String :: from( "Quantized Large multilingual embedding model from Alibaba" ) ,
258
285
model_code: String :: from( "Alibaba-NLP/gte-large-en-v1.5" ) ,
259
286
model_file: String :: from( "onnx/model_quantized.onnx" ) ,
287
+ additional_files: Vec :: new( ) ,
260
288
} ,
261
289
ModelInfo {
262
290
model: EmbeddingModel :: ClipVitB32 ,
263
291
dim: 512 ,
264
292
description: String :: from( "CLIP text encoder based on ViT-B/32" ) ,
265
293
model_code: String :: from( "Qdrant/clip-ViT-B-32-text" ) ,
266
294
model_file: String :: from( "model.onnx" ) ,
295
+ additional_files: Vec :: new( ) ,
296
+ } ,
297
+ ModelInfo {
298
+ model: EmbeddingModel :: JinaEmbeddingsV2BaseCode ,
299
+ dim: 768 ,
300
+ description: String :: from( "Jina embeddings v2 base code" ) ,
301
+ model_code: String :: from( "jinaai/jina-embeddings-v2-base-code" ) ,
302
+ model_file: String :: from( "onnx/model.onnx" ) ,
303
+ additional_files: Vec :: new( ) ,
267
304
} ,
268
305
] ;
269
306
@@ -338,6 +375,8 @@ impl EmbeddingModel {
338
375
EmbeddingModel :: GTELargeENV15Q => Some ( Pooling :: Cls ) ,
339
376
340
377
EmbeddingModel :: ClipVitB32 => Some ( Pooling :: Mean ) ,
378
+
379
+ EmbeddingModel :: JinaEmbeddingsV2BaseCode => Some ( Pooling :: Mean ) ,
341
380
}
342
381
}
343
382
0 commit comments