@@ -97,11 +97,6 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
9797
9898 HipTailRange activeHIPTail{-1 , -1 };
9999
100- if (iThread == 0 ) {
101- smem.bcast = 0 ;
102- }
103- GPUbarrier ();
104-
105100 const int16_t iPadOffset = iThread % MaxNPadsPerRow;
106101 const int16_t iTimeOffset = iThread / MaxNPadsPerRow;
107102 const int16_t iPadHandle = iThread;
@@ -119,13 +114,7 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
119114 const Charge ql = iTimeLoad < lastTB && iPadOffset < rowinfo.nPads ? chargeMap[pos].unpack () : 0 ;
120115 smem.charges [iTimeOffset][iPadOffset] = ql;
121116
122- const bool hasHIPTrigger = work_group_any (ql == MaxADC, smem.bcast );
123- // bool hasHIPTrigger = false;
124- // if (t % (NumOfCachedTBs * 100) == 0) {
125- // hasHIPTrigger = work_group_any(ql == MaxADC);
126- // } else {
127- // GPUbarrier();
128- // }
117+ const bool hasHIPTrigger = work_group_any (ql == MaxADC);
129118
130119 acc.HIPtb = -1 ;
131120
@@ -152,9 +141,6 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
152141
153142 }
154143
155- if (iThread == 0 ) {
156- smem.bcast = 0 ;
157- }
158144 GPUbarrier ();
159145
160146 if (hasHIPTrigger) [[unlikely]] {
@@ -237,7 +223,7 @@ GPUd() void GPUTPCCFCheckPadBaseline::CheckBaselineGPU(int32_t nBlocks, int32_t
237223 // Call `work_group_any` here, instead of always counting.
238224 // This is important as `work_group_count` is a lot slower
239225 // and has a lot of overhead if no HIPs were found.
240- const bool anyCloseTail = work_group_any (shouldCloseTail, smem. bcast );
226+ const bool anyCloseTail = work_group_any (shouldCloseTail);
241227
242228 if (anyCloseTail) {
243229
0 commit comments