We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 50379d0 commit 87dd01a · Copy full SHA for 87dd01a
4 files changed
README.md
@@ -10,7 +10,7 @@ state-of-the-art optimizations to perform inference efficiently on NVIDIA GPUs.<
10
[](https://www.python.org/downloads/release/python-31012/)
11
[](https://developer.nvidia.com/cuda-downloads)
12
[](https://pytorch.org)
13
-[](https://github.com/NVIDIA/TensorRT-LLM/blob/main/tensorrt_llm/version.py)
+[](https://github.com/NVIDIA/TensorRT-LLM/blob/main/tensorrt_llm/version.py)
14
[](https://github.com/NVIDIA/TensorRT-LLM/blob/main/LICENSE)
15
16
[Architecture](https://nvidia.github.io/TensorRT-LLM/developer-guide/overview.html) | [Performance](https://nvidia.github.io/TensorRT-LLM/developer-guide/perf-overview.html) | [Examples](https://nvidia.github.io/TensorRT-LLM/quick-start-guide.html) | [Documentation](https://nvidia.github.io/TensorRT-LLM/) | [Roadmap](https://github.com/NVIDIA/TensorRT-LLM/issues?q=is%3Aissue%20state%3Aopen%20label%3Aroadmap)
examples/constraints.txt
@@ -1,3 +1,3 @@
1
-tensorrt_llm==1.2.0rc6.post2
+tensorrt_llm==1.2.0rc6.post4
2
evaluate~=0.4.1
3
rouge_score~=0.1.2
jenkins/L0_Test.groovy
@@ -2944,8 +2944,8 @@ def launchTestJobs(pipeline, testFilter)
2944
"DGX_H100-4_GPUs-PyTorch-Others-1": ["dgx-h100-x4-oci", "l0_dgx_h100", 1, 1, 4],
2945
"B300-PyTorch-1": ["b300-single", "l0_b300", 1, 1],
2946
"DGX_B200-4_GPUs-PyTorch-1": ["b200-x4", "l0_dgx_b200", 1, 1, 4],
2947
- "DGX_B200-4_GPUs-PyTorch-Ray-1": ["b200-x4-lbd", "l0_dgx_b200", 1, 1, 4, 1, true],
2948
- "DGX_B200-8_GPUs-PyTorch-1": ["b200-x8-lbd", "l0_dgx_b200", 1, 1, 8, 1, true],
+ "DGX_B200-4_GPUs-PyTorch-Ray-1": ["b200-x4", "l0_dgx_b200", 1, 1, 4, 1, true],
+ "DGX_B200-8_GPUs-PyTorch-1": ["b200-x8", "l0_dgx_b200", 1, 1, 8, 1, true],
2949
"DGX_B200-4_GPUs-PyTorch-Post-Merge-1": ["b200-trtllm", "l0_dgx_b200", 1, 2, 4, 1, true],
2950
"DGX_B200-4_GPUs-PyTorch-Post-Merge-2": ["b200-trtllm", "l0_dgx_b200", 2, 2, 4, 1, true],
2951
"DGX_B300-4_GPUs-PyTorch-Post-Merge-1": ["b300-x4", "l0_dgx_b300", 1, 2, 4],
tensorrt_llm/version.py
@@ -12,4 +12,4 @@
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
-__version__ = "1.2.0rc6.post2"
+__version__ = "1.2.0rc6.post4"
0 commit comments