Skip to content

Commit ba70ef1

Browse files
Update DQ query
1 parent db0fb9a commit ba70ef1

File tree

1 file changed

+3
-7
lines changed

1 file changed

+3
-7
lines changed

src/cpp/src/llm_pipeline_static.cpp

Lines changed: 3 additions & 7 deletions
Original file line number | Diff line number | Diff line change
@@ -475,13 +475,7 @@ std::optional<NPUDesc> extract_npu_descriptor(ov::Core& core) {
475475
}
476476
const auto arch = core.get_property("NPU", ov::device::architecture);
477477
const auto max_tiles = core.get_property("NPU", ov::intel_npu::max_tiles);
478-
479-
bool compiler_dq = false;
480-
const auto device_caps = core.get_property("NPU", ov::device::capabilities);
481-
if (std::find(device_caps.begin(), device_caps.end(),
482-
"COMPILER_DYNAMIC_QUANTIZATION") != device_caps.end()) {
483-
compiler_dq = true;
484-
}
478+
const auto compiler_dq = core.get_property("NPU", ov::intel_npu::compiler_dynamic_quantization);
485479
return std::make_optional(NPUDesc{arch, max_tiles, compiler_dq});
486480
}
487481

@@ -526,6 +520,7 @@ ov::AnyMap get_default_prefill_config(const std::shared_ptr<ov::Model>& model,
526520
}
527521
if (npudesc.has_value() && npudesc->compiler_dq) {
528522
config.emplace("NPUW_DQ_FULL", "NO");
523+
config.emplace("NPU_COMPILATION_MODE_PARAMS", "enable-weights-dynamic-dequantization=true");
529524
}
530525
return config;
531526
}
@@ -547,6 +542,7 @@ ov::AnyMap get_default_generate_config(const std::shared_ptr<ov::Model>& model,
547542
}
548543
if (npudesc.has_value() && npudesc->compiler_dq) {
549544
config.emplace("NPUW_DQ_FULL", "NO");
545+
config.emplace("NPU_COMPILATION_MODE_PARAMS", "enable-weights-dynamic-dequantization=true");
550546
}
551547
return config;
552548
}

0 commit comments

Comments
 (0)