Bump llama-cpp-python to 0.2.83, add back tensorcore wheels

Also add back the progress bar patch
This commit is contained in:
oobabooga 2024-07-22 18:05:11 -07:00
parent 11bbf71aa5
commit aa809e420e
13 changed files with 109 additions and 45 deletions

View file

@@ -46,6 +46,7 @@ loaders_and_params = OrderedDict({
'numa',
'no_offload_kqv',
'row_split',
'tensorcores',
'flash_attn',
'streaming_llm',
'attention_sink_size',
@@ -72,6 +73,7 @@ loaders_and_params = OrderedDict({
'logits_all',
'no_offload_kqv',
'row_split',
'tensorcores',
'flash_attn',
'streaming_llm',
'attention_sink_size',