Skip to content

Commit 2c15d78

Browse files
Optimal tuned parameters for AMD-W7000
1 parent 8a4f86f commit 2c15d78

1 file changed

Lines changed: 53 additions & 3 deletions

File tree

GPU/GPUTracking/Definitions/GPUDefParametersDefaults.h

Lines changed: 53 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -87,17 +87,67 @@
8787
#define GPUCA_PAR_COMP_GATHER_KERNEL 4
8888
#define GPUCA_PAR_COMP_GATHER_MODE 3
8989
#elif defined(GPUCA_GPUTYPE_W7900)
90+
#define GPUCA_WARP_SIZE 32
91+
#define GPUCA_THREAD_COUNT_DEFAULT 256
92+
#define GPUCA_LB_GPUTPCNeighboursFinder 256
93+
#define GPUCA_LB_GPUTPCNeighboursCleaner 256
94+
#define GPUCA_LB_GPUTPCStartHitsFinder 256
95+
#define GPUCA_LB_GPUTPCStartHitsSorter 256
96+
#define GPUCA_LB_GPUTPCTrackletConstructor 256
97+
#define GPUCA_LB_GPUTPCTrackletSelector 256
98+
#define GPUCA_LB_GPUTPCExtrapolationTracking 256
99+
#define GPUCA_LB_GPUTPCCreateTrackingData 256
100+
#define GPUCA_LB_GPUTPCGMMergerTrackFit 256
101+
#define GPUCA_LB_GPUTPCGMMergerFollowLoopers 256
102+
#define GPUCA_LB_GPUTPCGMMergerUnpackResetIds 256
103+
#define GPUCA_LB_GPUTPCGMMergerSectorRefit 256
104+
#define GPUCA_LB_GPUTPCGMMergerUnpackGlobal 256
105+
#define GPUCA_LB_GPUTPCGMMergerResolve_step0 256
106+
#define GPUCA_LB_GPUTPCGMMergerResolve_step1 256
107+
#define GPUCA_LB_GPUTPCGMMergerResolve_step2 256
108+
#define GPUCA_LB_GPUTPCGMMergerResolve_step3 256
109+
#define GPUCA_LB_GPUTPCGMMergerResolve_step4 256
110+
#define GPUCA_LB_GPUTPCGMMergerClearLinks 256
111+
#define GPUCA_LB_GPUTPCGMMergerMergeWithinPrepare 256
112+
#define GPUCA_LB_GPUTPCGMMergerMergeSectorsPrepare 256
113+
#define GPUCA_LB_GPUTPCGMMergerMergeBorders_step0 256
114+
#define GPUCA_LB_GPUTPCGMMergerMergeBorders_step2 256
115+
#define GPUCA_LB_GPUTPCGMMergerMergeCE 256
116+
#define GPUCA_LB_GPUTPCGMMergerLinkExtrapolatedTracks 256
117+
#define GPUCA_LB_GPUTPCGMMergerCollect 256
118+
#define GPUCA_LB_GPUTPCGMMergerSortTracksPrepare 256
119+
#define GPUCA_LB_GPUTPCGMMergerPrepareClusters_step0 256
120+
#define GPUCA_LB_GPUTPCGMMergerPrepareClusters_step1 256
121+
#define GPUCA_LB_GPUTPCGMMergerPrepareClusters_step2 256
122+
#define GPUCA_LB_GPUTPCCompressionKernels_step0attached 256
123+
#define GPUCA_LB_GPUTPCCompressionKernels_step1unattached 256
124+
#define GPUCA_LB_GPUTPCDecompressionKernels_step0attached 256
125+
#define GPUCA_LB_GPUTPCDecompressionKernels_step1unattached 256
126+
#define GPUCA_LB_GPUTPCCFCheckPadBaseline 64
127+
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillIndexMap 512
128+
#define GPUCA_LB_GPUTPCCFChargeMapFiller_fillFromDigits 512
129+
#define GPUCA_LB_GPUTPCCFChargeMapFiller_findFragmentStart 512
130+
#define GPUCA_LB_GPUTPCCFPeakFinder 512
131+
#define GPUCA_LB_GPUTPCCFDeconvolution 512
132+
#define GPUCA_LB_GPUTPCCFClusterizer 512
133+
#define GPUCA_LB_GPUTPCCFDecodeZS 128, 4
134+
#define GPUCA_LB_GPUTPCCFDecodeZSLink 32
135+
#define GPUCA_LB_GPUTPCCFDecodeZSDenseLink 32
136+
#define GPUCA_LB_GPUTPCCFGather 1024, 1
90137
#define GPUCA_PAR_NEIGHBOURS_FINDER_MAX_NNEIGHUP 5
138+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_GLOBAL 4
139+
#define GPUCA_PAR_NEIGHBOURS_FINDER_UNROLL_SHARED 1
91140
#define GPUCA_PAR_TRACKLET_SELECTOR_HITS_REG_SIZE 20
92141
#define GPUCA_PAR_ALTERNATE_BORDER_SORT 1
93142
#define GPUCA_PAR_SORT_BEFORE_FIT 1
94143
#define GPUCA_PAR_MERGER_SPLIT_LOOP_INTERPOLATION 1
95144
#define GPUCA_PAR_NO_ATOMIC_PRECHECK 1
96-
#define GPUCA_PAR_DEDX_STORAGE_TYPE uint16_t
97-
#define GPUCA_PAR_MERGER_INTERPOLATION_ERROR_TYPE half
98145
#define GPUCA_PAR_COMP_GATHER_KERNEL 4
99146
#define GPUCA_PAR_COMP_GATHER_MODE 3
100-
// Use default settings below
147+
#define GPUCA_PAR_SORT_STARTHITS 1
148+
#define GPUCA_PAR_CF_SCAN_WORKGROUP_SIZE 512
149+
#define GPUCA_PAR_DEDX_STORAGE_TYPE uint16_t
150+
#define GPUCA_PAR_MERGER_INTERPOLATION_ERROR_TYPE half
101151
#elif defined(GPUCA_GPUTYPE_VEGA)
102152
#define GPUCA_WARP_SIZE 64
103153
#define GPUCA_THREAD_COUNT_DEFAULT 256

0 commit comments

Comments (0)