@@ -54,14 +54,25 @@ def __init__(
54
54
55
55
def compile(self):
    """Create the language-model infer request if missing, then prepare the text-embeddings request.

    When ``self._compile_only`` is set, the infer request is created
    directly from ``self.model`` (presumably an already-compiled model --
    confirm against the loader). Otherwise the model is first compiled via
    ``self._compile_model`` for ``self._device`` with ``self.ov_config`` and
    ``self.model_save_dir``.
    """
    request_missing = self.request is None
    if request_missing and self._compile_only:
        self.request = self.model.create_infer_request()
    elif request_missing:
        logger.info(f"Compiling the Language model to {self._device} ...")
        compiled_model = self._compile_model(
            self.model, self._device, self.ov_config, self.model_save_dir
        )
        self.request = compiled_model.create_infer_request()
    # NOTE(review): assumed to run unconditionally (the callee has its own
    # "already set" guard) -- confirm against the original indentation.
    self._compile_text_emb()
60
65
61
66
def _compile_text_emb(self):
    """Populate ``self.text_emb_request`` if it has not been set yet.

    In compile-only mode ``self.text_emb_model`` is used as the request
    as-is (presumably it is already a compiled model -- confirm against the
    loader). Otherwise it is compiled via ``self._compile_model`` for
    ``self._device`` with ``self.ov_config`` and ``self.model_save_dir``.

    The "Compiling ..." message is logged exactly once, and only when a
    compilation actually takes place.
    """
    if self.text_emb_request is not None:
        return
    if self._compile_only:
        # Nothing is compiled on this path, so no "Compiling ..." log.
        self.text_emb_request = self.text_emb_model
        return
    logger.info(f"Compiling the Text embeddings model to {self._device} ...")
    self.text_emb_request = self._compile_model(
        self.text_emb_model, self._device, self.ov_config, self.model_save_dir
    )
65
76
66
77
def clear_requests (self ):
67
78
if self ._compile_only :
@@ -263,11 +274,11 @@ def __init__(
263
274
self .lm_model ,
264
275
self .text_embdings_model ,
265
276
config = config ,
266
- deivce = device ,
277
+ device = device ,
267
278
ov_config = ov_config ,
268
279
model_save_dir = model_save_dir ,
269
280
quantization_config = quantization_config ,
270
- compile = not self ._compile_only ,
281
+ compile = self ._compile_only ,
271
282
compile_only = self ._compile_only ,
272
283
)
273
284
self .vision_embeddings = OVVisionEmbedding (self .vision_embeddings_model , self )
@@ -308,7 +319,7 @@ def _save_pretrained(self, save_directory: Union[str, Path]):
308
319
dst_file_names = [
309
320
"openvino_language_model.xml" ,
310
321
"openvino_text_embeddings_model.xml" ,
311
- "openvino_vision_embeddings .xml" ,
322
+ "openvino_vision_embeddings_model .xml" ,
312
323
]
313
324
for part in self .additional_parts :
314
325
model = getattr (self , f"{ part } _model" , None )
0 commit comments