Skip to content

Commit 5aec7af

Browse files
authored
TensorRT-LLM v0.18.2 release (#3611)
1 parent 62f3c95 commit 5aec7af

File tree

54 files changed

+146
-77
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

54 files changed

+146
-77
lines changed

README.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
9f9942768fd5b0cf5ed19860ad539dc9 libtensorrt_llm_ucx_wrapper.so
2-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
2+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:e015c5cab637202b76f6ccd2d59b1427dc739f10321996a003230ba32814c08b
2+
oid sha256:ee2a324ae76a843823d1d82686bb495d097367e1c3a41aa9596fd0d2ba3fadae
33
size 8408224
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:1205f8fe60cc657645441c14c304888ad7cd68bc4cd1fabd10931a719560a42a
2+
oid sha256:4fcd95de792c72a38d4c1e76a4e714a2c69ffc25f03172075efb432e40ec29cd
33
size 8374456
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
e383212a40dca932c7b77bf4544dab80 libtensorrt_llm_ucx_wrapper.so
2-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
2+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:e2fbf80d02c115b9eeb2c18d24e3cb55f0c5404eba563591abeab7d223518df6
2+
oid sha256:6fd8ea50100bbbdc9d1d52d4b7e9a82f01583884eeb4d2703d537b6785c63ea7
33
size 3102764
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:27f9acc83aa72979834cc8c216cf06e6ab4e9b10a7d1c9928bac3721fef037bd
2+
oid sha256:cd30000142d1256991fa27644d86dcd12a4c017eab9345a88ac705914aba8d11
33
size 3145744
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1-
61ab1a6d4c62ee2a648f6daa5083c4de libtensorrt_llm_executor_static.a
2-
2f2bc67944c45ce0965704da43c9b1c4 libtensorrt_llm_executor_static.pre_cxx11.a
3-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
1+
1146671822817c690387dc77d775b8c7 libtensorrt_llm_executor_static.a
2+
8f7cb0047a0c2690497a97911a60ed6d libtensorrt_llm_executor_static.pre_cxx11.a
3+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:ae603dd0c585a7ee601fb6816ac2cdde674d5c49b96c7dce88de2bc67ea727bc
2+
oid sha256:22951d2bb0e5da2a1eb20ae0eb74690ddd57e7f1dd9545762eed1e0f468dd4a5
33
size 3457520
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:7adc486890442df336e145b0ccf982bc733f1a9cc8116f7ce56f1769cf7b1154
2+
oid sha256:0c13a28fc903da20aad74aeb1c3d04a3b1bf91421fdbe85a16b3552b3e7e431b
33
size 3448406
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1-
e5da8cc2936606dfb49f4417d6961060 libtensorrt_llm_executor_static.a
2-
ad5dfb89c2d719d99d67346828e92e25 libtensorrt_llm_executor_static.pre_cxx11.a
3-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
1+
34a5173ddebafd3f1621af2717a92f54 libtensorrt_llm_executor_static.a
2+
34eacc123dc995815fbd1e68ec98f78b libtensorrt_llm_executor_static.pre_cxx11.a
3+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
f3143205203b038b9dca6dd32cf02f59 libtensorrt_llm_nvrtc_wrapper.so
2-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
2+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
770ca93818f3f04837a67353e3f71fbc libtensorrt_llm_nvrtc_wrapper.so
2-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
2+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
6bf0ba4e9b8b1152a21316243d30bec6 libtensorrt_llm_internal_cutlass_kernels_static.a
22
96f8a359c84a78ba415f4d98ef1c4e1d libtensorrt_llm_internal_cutlass_kernels_static.pre_cxx11.a
3-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
3+
edf502396e4443f284a5fae6044402478cf457c1 commit
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:0b0f621e74dd506e49acd027dc09e9d2a3a6e0117ca0af68254841c02fb9c1dd
3-
size 68126454
2+
oid sha256:447838fe5c798098410a2cfed027aa38df847da2f725b9b8ccec57e73a1e194a
3+
size 68114502
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
version https://git-lfs.github.com/spec/v1
2-
oid sha256:8448e105a5002148083bacc6c5066e017719ccd532c021f4c821df74fa0b763f
3-
size 68295728
2+
oid sha256:42b88e56cee5b9b81a66836add80ba79819afa24cbfd72140f4d62a244e3f960
3+
size 68295696
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1-
0b3322f5047dd4ee549211c2d15483c4 libtensorrt_llm_internal_cutlass_kernels_static.a
2-
502d4901fad6e648b8858051017c4cf2 libtensorrt_llm_internal_cutlass_kernels_static.pre_cxx11.a
3-
d2efc6043262c896e262e8d8b97055af0f1f8b47 commit
1+
4de75ffa1ff225422ba27f367175448f libtensorrt_llm_internal_cutlass_kernels_static.a
2+
e91d6c762f26c0b158eba8f376914e6e libtensorrt_llm_internal_cutlass_kernels_static.pre_cxx11.a
3+
edf502396e4443f284a5fae6044402478cf457c1 commit

docs/source/release-notes.md

+6

examples/baichuan/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.15.0
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/bloom/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/chatglm/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
protobuf

examples/commandr/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets==2.14.6
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/dbrx/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/deepseek_v1/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.6
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/draft_target_model/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
sentencepiece>=0.1.99

examples/eagle/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
SentencePiece~=0.1.99

examples/falcon/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
transformers>=4.31.0
33
datasets~=2.14.5
44
evaluate~=0.4.1

examples/gemma/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
# WAR the new posting of "nvidia-cudnn-cu12~=9.0".
33
# "jax[cuda12_pip]~=0.4.19" specifies "nvidia-cudnn-cu12>=8.9" but actually requires "nvidia-cudnn-cu12~=8.9".
44
nvidia-cudnn-cu12~=8.9; platform_machine == "x86_64"
5-
tensorrt_llm==0.18.1
5+
tensorrt_llm==0.18.2
66
flax~=0.8.0
77
# jax[cuda12_pip]~=0.4.19; platform_system != "Windows"
88
jax~=0.4.19; platform_system == "Windows"

examples/gpt/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/gptj/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/gptneox/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
evaluate~=0.4.1

examples/grok/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
-f https://storage.googleapis.com/jax-releases/jax_cuda_releases.html
2-
tensorrt_llm==0.18.1
2+
tensorrt_llm==0.18.2
33
datasets==2.14.6
44
evaluate~=0.4.1
55
rouge_score~=0.1.2

examples/internlm/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets==2.14.5
33
rouge_score~=0.1.2
44
sentencepiece>=0.1.99

examples/jais/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/llama/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
transformers>=4.43.0
33
datasets==2.14.6
44
evaluate~=0.4.1

examples/lookahead/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
sentencepiece>=0.1.99

examples/mamba/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
transformers>=4.39.0
33
datasets~=2.14.5
44
evaluate

examples/medusa/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
sentencepiece>=0.1.99

examples/mixtral/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
transformers==4.38.2
33
accelerate==0.25.0

examples/mpt/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/nemotron/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
nemo-toolkit[all]==2.0.0rc1
33
megatron-core==0.8.0
44
datasets~=2.14.5

examples/opt/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/phi/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/prompt_lookup/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
--extra-index-url https://pypi.nvidia.com
2-
tensorrt_llm==0.18.1
2+
tensorrt_llm==0.18.2
33
datasets~=2.14.5
44
rouge_score~=0.1.2
55
sentencepiece~=0.1.99

examples/quantization/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets>=2.14.4
33
nemo-toolkit[all]==2.0.0rc1
44
rouge_score~=0.1.2

examples/qwen/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.16.0
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/qwenvl/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.16.0
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/recurrentgemma/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
git+https://github.com/google-deepmind/recurrentgemma.git@8a32e365
33
flax>=0.8.2
44
jax~=0.4.23

examples/redrafter/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.14.5
33
rouge_score~=0.1.2
44
sentencepiece>=0.1.99

examples/skywork/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets~=2.16.1
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/smaug/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
datasets==2.14.6
33
evaluate~=0.4.1
44
rouge_score~=0.1.2

examples/whisper/requirements.txt

+1-1
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
tensorrt_llm==0.18.1
1+
tensorrt_llm==0.18.2
22
tiktoken
33
datasets
44
kaldialign

0 commit comments

Comments
 (0)