mirror of
https://github.com/oobabooga/text-generation-webui.git
synced 2026-04-09 00:23:38 +00:00
ExLlamaV2: Add speculative decoding (#6899)
This commit is contained in:
parent
8f2493cc60
commit
ae1fe87365
2 changed files with 53 additions and 2 deletions
|
|
@ -25,7 +25,7 @@ loaders_and_params = OrderedDict({
|
|||
'gpu_layers_draft',
|
||||
'device_draft',
|
||||
'ctx_size_draft',
|
||||
'speculative_decoding_accordion'
|
||||
'speculative_decoding_accordion',
|
||||
],
|
||||
'Transformers': [
|
||||
'gpu_split',
|
||||
|
|
@ -82,6 +82,9 @@ loaders_and_params = OrderedDict({
|
|||
'no_xformers',
|
||||
'no_sdpa',
|
||||
'exllamav2_info',
|
||||
'model_draft',
|
||||
'ctx_size_draft',
|
||||
'speculative_decoding_accordion',
|
||||
],
|
||||
'HQQ': [
|
||||
'hqq_backend',
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue