Add INT4 weight-compression config for the Mixtral model (mixtral-8x7b-v0.1)

openvinotoolkit · eaidova · Feb 28, 2024 · Feb 28, 2024 · Feb 28, 2024 · 3bdff2d91e698968674db5eb60d3f779441faf3f
commit 3bdff2d91e698968674db5eb60d3f779441faf3f
diff --git a/llm_bench/python/utils/nncf_utils.py b/llm_bench/python/utils/nncf_utils.py
@@ -47,4 +47,5 @@ def get_compressed_path(output_dir: str, base_precision, option: str):
     "open-llama-3b": {"mode": nncf.CompressWeightsMode.INT4_SYM, "group_size": 64, "all_layers": True},
     "falcon-7b-instruct": {"mode": nncf.CompressWeightsMode.INT4_SYM, "group_size": 64, "all_layers": True},
     "orca-mini-3b": {"mode": nncf.CompressWeightsMode.INT4_SYM, "group_size": 64, "all_layers": True},
+    "mixtral-8x7b-v0.1": {"mode": nncf.CompressWeightsMode.INT4_SYM, "group_size": 128, "ratio": 0.8},
 }