From 58e08898e9aed181e4fdda9dc506a30e91b1ada6 Mon Sep 17 00:00:00 2001 From: SharkyKZ Date: Sat, 1 Nov 2025 11:06:35 +0000 Subject: [PATCH] Fix int8 check --- gradio-app/app.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/gradio-app/app.py b/gradio-app/app.py index d50843f..f14dffd 100644 --- a/gradio-app/app.py +++ b/gradio-app/app.py @@ -322,7 +322,7 @@ def load_model(quant: str, status: gr.HTML | None = None): print(f"[WARN] Liger kernel could not be applied: {e}") else: from transformers import BitsAndBytesConfig - if quant == "8bit": + if quant == "int8": qnt_config = BitsAndBytesConfig( load_in_8bit=True, llm_int8_skip_modules=["vision_tower", "multi_modal_projector"], # Transformer's Siglip implementation has bugs when quantized, so skip those. @@ -824,4 +824,4 @@ def collate_fn(batch: list[tuple[Path, Image.Image, str, str] | None], *, proces if __name__ == "__main__": print_system_info() - demo.launch() \ No newline at end of file + demo.launch()