Update TensorRT-LLM to v1.1.0

This commit is contained in:
oobabooga 2026-03-05 09:32:28 -03:00
parent 69fa4dd0b1
commit 268cc3f100
3 changed files with 13 additions and 32 deletions

View file

@@ -142,7 +142,7 @@ group.add_argument('--num_experts_per_token', type=int, default=2, metavar='N',
# TensorRT-LLM
group = parser.add_argument_group('TensorRT-LLM')
-group.add_argument('--cpp-runner', action='store_true', help='Use the ModelRunnerCpp runner, which is faster than the default ModelRunner but doesn\'t support streaming yet.')
+group.add_argument('--cpp-runner', action='store_true', help='Use the ModelRunnerCpp runner, which is faster than the default ModelRunner.')
# RoPE
group = parser.add_argument_group('RoPE')