Skip to content

Commit 99442a9

Browse files
committed
Cleanup.
1 parent 6a8402d commit 99442a9

3 files changed

Lines changed: 3 additions & 19 deletions

File tree

GPU/Common/GPUCommonAlgorithm.h

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -422,7 +422,7 @@ GPUdi() T warp_broadcast_FUNC(T v, int32_t i)
422422
#endif
423423
}
424424

425-
[[nodiscard]] GPUdi() bool work_group_any(bool pred, int32_t &smemBcast)
425+
[[nodiscard]] GPUdi() bool work_group_any(bool pred)
426426
{
427427
return __syncthreads_or(pred);
428428
}

GPU/GPUTracking/TPCClusterFinder/GPUTPCCFCheckPadBaseline.cxx

Lines changed: 2 additions & 16 deletions
Original file line number | Diff line number | Diff line change
@@ -97,11 +97,6 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
9797

9898
HipTailRange activeHIPTail{-1, -1};
9999

100-
if (iThread == 0) {
101-
smem.bcast = 0;
102-
}
103-
GPUbarrier();
104-
105100
const int16_t iPadOffset = iThread % MaxNPadsPerRow;
106101
const int16_t iTimeOffset = iThread / MaxNPadsPerRow;
107102
const int16_t iPadHandle = iThread;
@@ -119,13 +114,7 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
119114
const Charge ql = iTimeLoad < lastTB && iPadOffset < rowinfo.nPads ? chargeMap[pos].unpack() : 0;
120115
smem.charges[iTimeOffset][iPadOffset] = ql;
121116

122-
const bool hasHIPTrigger = work_group_any(ql == MaxADC, smem.bcast);
123-
// bool hasHIPTrigger = false;
124-
// if (t % (NumOfCachedTBs * 100) == 0) {
125-
// hasHIPTrigger = work_group_any(ql == MaxADC);
126-
// } else {
127-
// GPUbarrier();
128-
// }
117+
const bool hasHIPTrigger = work_group_any(ql == MaxADC);
129118

130119
acc.HIPtb = -1;
131120

@@ -152,9 +141,6 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
152141

153142
}
154143

155-
if (iThread == 0) {
156-
smem.bcast = 0;
157-
}
158144
GPUbarrier();
159145

160146
if (hasHIPTrigger) [[unlikely]] {
@@ -237,7 +223,7 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
237223
// Call `work_group_any` here, instead of always counting.
238224
// This is important as `work_group_count` is a lot slower
239225
// and has a lot of overhead if no HIPs were found.
240-
const bool anyCloseTail = work_group_any(shouldCloseTail, smem.bcast);
226+
const bool anyCloseTail = work_group_any(shouldCloseTail);
241227

242228
if (anyCloseTail) {
243229

GPU/GPUTracking/TPCClusterFinder/GPUTPCCFCheckPadBaseline.h

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -77,8 +77,6 @@ class GPUTPCCFCheckPadBaseline : public GPUKernelTemplate
7777
HipTailRange tails[MaxNPadsPerRow];
7878
uint8_t tailsClosedPad[MaxNPadsPerRow];
7979
HipTailRange tailsClosed[MaxNPadsPerRow];
80-
81-
int32_t bcast;
8280
};
8381

8482
// Accumulated values from scanning cached charges in a pad

0 commit comments

Comments
 (0)