Add --no_xformers and --no_sdpa flags for ExllamaV2

This commit is contained in:
oobabooga 2024-07-11 15:47:37 -07:00
parent 512b311137
commit e436d69e2b
6 changed files with 15 additions and 1 deletion

View file

@@ -85,6 +85,8 @@ def list_model_elements():
'disable_exllamav2',
'cfg_cache',
'no_flash_attn',
'no_xformers',
'no_sdpa',
'num_experts_per_token',
'cache_8bit',
'cache_4bit',