Skip to content

Commit abfb4f4

Browse files
authored
Added compression configs for Llama-3.1-8B and Llama-3.1-8B-Instruct. (#904)
* Added compression configs for Llama-3.1-8B and Llama-3.1-8B-Instruct.
* Removed unverified parameters.
1 parent c9629e8 commit abfb4f4

File tree

1 file changed

+4
-4
lines changed

1 file changed

+4
-4
lines changed

optimum/intel/openvino/configuration.py

Lines changed: 4 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -164,19 +164,19 @@ class OVQuantizationMethod(str, Enum):
164164
"dataset": "wikitext2",
165165
"scale_estimation": True,
166166
},
167-
"meta-llama/Meta-Llama-3-8B-Instruct": {
167+
"meta-llama/Meta-Llama-3.1-8B-Instruct": {
168168
"bits": 4,
169169
"sym": False,
170170
"group_size": 64,
171-
"ratio": 0.9,
171+
"ratio": 0.8,
172172
"dataset": "wikitext2",
173173
"scale_estimation": True,
174174
},
175-
"meta-llama/Meta-Llama-3-8B": {
175+
"meta-llama/Meta-Llama-3.1-8B": {
176176
"bits": 4,
177177
"sym": False,
178178
"group_size": 64,
179-
"ratio": 0.9,
179+
"ratio": 0.8,
180180
"dataset": "wikitext2",
181181
"scale_estimation": True,
182182
},

0 commit comments

Comments
 (0)