From dcf82afc6f8e4a124fd26eefad56ea0fa65ef54c Mon Sep 17 00:00:00 2001
From: Lyalyushkin Nikolay
Date: Wed, 28 Feb 2024 17:51:39 +0100
Subject: [PATCH] Add default quantization int4 config for Mixtral-8x7B (#576)

---
 optimum/intel/openvino/configuration.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/optimum/intel/openvino/configuration.py b/optimum/intel/openvino/configuration.py
index 6611e5d0dd..9f3e3a06ca 100644
--- a/optimum/intel/openvino/configuration.py
+++ b/optimum/intel/openvino/configuration.py
@@ -96,6 +96,7 @@
     "openlm-research/open_llama_3b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
     "tiiuae/falcon-7b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
     "psmathur/orca_mini_3b": {"bits": 4, "sym": True, "group_size": 64, "all_layers": True},
+    "mistralai/Mixtral-8x7B-v0.1": {"bits": 4, "sym": True, "group_size": 128, "ratio": 0.8},
 }