Add back my llama-cpp-python wheels, bump to 0.2.65 (#5964)

This commit is contained in:
oobabooga 2024-04-30 09:11:31 -03:00 committed by GitHub
parent 5770e06c48
commit 51fb766bea
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
18 changed files with 330 additions and 56 deletions

View file

@ -114,6 +114,7 @@ group.add_argument('--quant_type', type=str, default='nf4', help='quant_type for
# llama.cpp
group = parser.add_argument_group('llama.cpp')
group.add_argument('--tensorcores', action='store_true', help='Use llama-cpp-python compiled with tensor cores support. This increases performance on RTX cards. NVIDIA only.')
group.add_argument('--n_ctx', type=int, default=2048, help='Size of the prompt context.')
group.add_argument('--threads', type=int, default=0, help='Number of threads to use.')
group.add_argument('--threads-batch', type=int, default=0, help='Number of threads to use for batches/prompt processing.')
@ -204,8 +205,7 @@ group = parser.add_argument_group('Multimodal')
group.add_argument('--multimodal-pipeline', type=str, default=None, help='The multimodal pipeline to use. Examples: llava-7b, llava-13b.')
# Deprecated parameters
group = parser.add_argument_group('Deprecated')
group.add_argument('--tensorcores', action='store_true', help='DEPRECATED')
# group = parser.add_argument_group('Deprecated')
args = parser.parse_args()
args_defaults = parser.parse_args([])
@ -215,7 +215,7 @@ for arg in sys.argv[1:]:
if hasattr(args, arg):
provided_arguments.append(arg)
deprecated_args = ['tensorcores']
deprecated_args = []
def do_cmd_flags_warnings():