Skip to content

Commit c75b5fc

Browse files
committed
[None][fix] Address DSv4 primitive review comments
Signed-off-by: Mingyang Hao <200044211+mingyangHao@users.noreply.github.com>
1 parent 0f3020e commit c75b5fc

15 files changed

Lines changed: 32 additions & 18 deletions

File tree

cpp/tensorrt_llm/CMakeLists.txt

Lines changed: 3 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -200,11 +200,13 @@ set(TRTLLM_LINK_LIBS
200200
layers_src
201201
runtime_src
202202
testing_src
203-
mhcKernels_src
204203
compressorKernels_src
205204
userbuffers_src
206205
${DECODER_SHARED_TARGET_0}
207206
${DECODER_SHARED_TARGET_1})
207+
if(BUILD_DEEP_GEMM)
208+
set(TRTLLM_LINK_LIBS ${TRTLLM_LINK_LIBS} mhcKernels_src)
209+
endif()
208210
if(USING_OSS_CUTLASS_LOW_LATENCY_GEMM)
209211
set(TRTLLM_LINK_LIBS ${TRTLLM_LINK_LIBS} low_latency_gemm_src)
210212
message(STATUS "USING_OSS_CUTLASS_LOW_LATENCY_GEMM")

cpp/tensorrt_llm/kernels/CMakeLists.txt

Lines changed: 5 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -30,7 +30,11 @@ add_subdirectory(dsv3MinLatencyKernels)
3030
add_subdirectory(causalConv1d)
3131
add_subdirectory(fusedGatedRMSNormQuant)
3232
add_subdirectory(mamba2MTPSSMCache)
33-
add_subdirectory(mhcKernels)
33+
# The mHC fused MMA path depends on DeepGEMM helper headers, which are only
34+
# fetched when BUILD_DEEP_GEMM is enabled.
35+
if(BUILD_DEEP_GEMM)
36+
add_subdirectory(mhcKernels)
37+
endif()
3438
add_subdirectory(compressorKernels)
3539

3640
file(GLOB_RECURSE SRC_CPP *.cpp)

cpp/tensorrt_llm/kernels/compressorKernels/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#
2-
# SPDX-FileCopyrightText: Copyright (c) 1993-2026 NVIDIA CORPORATION &
3-
# AFFILIATES. All rights reserved. SPDX-License-Identifier: Apache-2.0
2+
# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
3+
# All rights reserved. SPDX-License-Identifier: Apache-2.0
44
#
55
# Licensed under the Apache License, Version 2.0 (the "License"); you may not
66
# use this file except in compliance with the License. You may obtain a copy of

cpp/tensorrt_llm/kernels/compressorKernels/compressorKernels.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

cpp/tensorrt_llm/kernels/compressorKernels/compressorKernels.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

cpp/tensorrt_llm/kernels/mhcKernels/CMakeLists.txt

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#
2-
# SPDX-FileCopyrightText: Copyright (c) 1993-2026 NVIDIA CORPORATION &
3-
# AFFILIATES. All rights reserved. SPDX-License-Identifier: Apache-2.0
2+
# SPDX-FileCopyrightText: Copyright (c) 2026 NVIDIA CORPORATION & AFFILIATES.
3+
# All rights reserved. SPDX-License-Identifier: Apache-2.0
44
#
55
# Licensed under the Apache License, Version 2.0 (the "License"); you may not
66
# use this file except in compliance with the License. You may obtain a copy of

cpp/tensorrt_llm/kernels/mhcKernels/fused_tf32_pmap_gemm.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

cpp/tensorrt_llm/kernels/mhcKernels/mhcFusedHcKernel.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

cpp/tensorrt_llm/kernels/mhcKernels/mhcKernels.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

cpp/tensorrt_llm/kernels/mhcKernels/mhcKernels.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
/*
2-
* Copyright (c) 2022-2026, NVIDIA CORPORATION. All rights reserved.
2+
* Copyright (c) 2026, NVIDIA CORPORATION. All rights reserved.
33
*
44
* Licensed under the Apache License, Version 2.0 (the "License");
55
* you may not use this file except in compliance with the License.

0 commit comments

Comments (0)