Image generation: add torchao quantization (supports torch.compile)

2026-04-04 14:17:28 +00:00 · 2025-12-02 14:22:51 -08:00 · 2025-12-02 14:22:51 -08:00 · 9448bf1caa
commit 9448bf1caa
parent 97281ff831
12 changed files with 40 additions and 6 deletions
--- a/modules/ui_image_generation.py
+++ b/modules/ui_image_generation.py
@@ -473,9 +473,9 @@ def create_ui():
                            with gr.Column():
                                shared.gradio['image_quant'] = gr.Dropdown(
                                    label='Quantization',
-                                    choices=['none', 'bnb-8bit', 'bnb-4bit'],
+                                    choices=['none', 'bnb-8bit', 'bnb-4bit', 'torchao-int8wo', 'torchao-fp4', 'torchao-float8wo'],
                                    value=shared.settings['image_quant'],
-                                    info='Quantization method for reduced VRAM usage. Quanto supports lower precisions (2-bit, 4-bit, 8-bit).'
+                                    info='BnB: bitsandbytes quantization. torchao: int8wo, fp4, float8wo.'
                                )

                                shared.gradio['image_dtype'] = gr.Dropdown(