Skip to content

Commit fa3a233

Browse files
authored
Merge pull request #1130 from InfiniTensor/issue/1129
issue/1129 - fix dtype generalization and unused variables
2 parents 6e88052 + de07226 commit fa3a233

2 files changed

Lines changed: 2 additions & 2 deletions

File tree

src/infiniop/ops/huber_loss/nvidia/huber_loss_nvidia.cu

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -105,7 +105,7 @@ infiniStatus_t Descriptor::calculate(
105 105
launch_kernel<half>(output, input, target, workspace, _info, stream);
106 106
break;
107 107
case INFINI_DTYPE_BF16:
108 -
launch_kernel<nv_bfloat16>(output, input, target, workspace, _info, stream);
108 +
launch_kernel<cuda_bfloat16>(output, input, target, workspace, _info, stream);
109 109
break;
110 110
case INFINI_DTYPE_F32:
111 111
launch_kernel<float>(output, input, target, workspace, _info, stream);

src/infiniop/ops/kthvalue/cuda/kernel.cuh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -115,7 +115,7 @@ __global__ void kthvalue_kernel(
115 115
for (unsigned int size = 2; size <= power_of_2_dim; size <<= 1) {
116 116
// Bitonic Merge
117 117
// dir: 升序或降序交替,构造双调序列
118 -
bool dir = (tid & (size / 2)) == 0;
118 +
// bool dir = (tid & (size / 2)) == 0;
119 119

120 120
// 这里的逻辑稍微复杂,为了简单和稳定,我们使用全升序排序逻辑
121 121
// 标准 Bitonic Sort 代码如下:

0 commit comments

Comments
 (0)