@@ -79,9 +79,6 @@ __global__ void fillFvalue(const real *csrFvalue, uint numCsr, const uint *preRo
7979 atomicAdd (newCsrFeaLen + (firstPartId + 1 ) * numFea + feaId, 1 );
8080 newCsrLen[basePos + numCsrCurPart] = csrLen;
8181 }
82- // if(0.369250 == temp){
83- // printf("csr len of 0.369250 is %d and %d; old len=%d, csrId=%d\n", newCsrLen[basePos], newCsrLen[basePos + numCsrCurPart], oldCsrLen[csrId], csrId);
84- // }
8582}
8683
8784__global__ void newCsrLenFvalue (const int *preFvalueInsId, int numFeaValue, const int *pInsId2Nid, int maxNid,
@@ -101,10 +98,7 @@ __global__ void newCsrLenFvalue(const int *preFvalueInsId, int numFeaValue, cons
10198 RangeBinarySearch (gTid , eachCsrStart, numCsr, csrId);
10299 CONCHECKER (csrId < numCsr);
103100 __syncthreads ();
104- // first csrId
105- // if(gTid >= numFeaValue && tid == 0){
106- // printf("oh shitt####################################################\n");
107- // }
101+
108102 if (tid == 0 )
109103 firstCsrId = csrId;
110104 __syncthreads ();
@@ -115,30 +109,16 @@ __global__ void newCsrLenFvalue(const int *preFvalueInsId, int numFeaValue, cons
115109 int insId = preFvalueInsId[gTid ];// insId is not -1, as preFvalueInsId is dense.
116110 int pid = pInsId2Nid[insId] - maxNid - 1 ;// mapping to new node
117111
118- // if(csrId == 2809992 && csrFvalue[csrId] == 0.369250){
119- // printf("gpu pid=%d, insId=%d, csrfvalue=%f, left_fv=%f, right_fv=%f, gTid=%d, blkid=%d\n",
120- // pid, insId, csrFvalue[csrId], csrFvalue[csrId - 1], csrFvalue[csrId + 1], gTid, blockIdx.y * gridDim.x + blockIdx.x);
121- // }
122-
123112 csrId2Pid[csrId] = pid < 0 ? LARGE_1B_UCHAR : pid;
124113 if (pid >= 0 && pid % 2 == 0 ){// not leaf node and it's first part.
125114 uint counterOffset = csrId - firstCsrId;
126- // if(305030 == csrId || 478798 == csrId){
127- // printf("first csr id=%d, csrId=%d\n", firstCsrId, csrId);
128- // }
115+
129116 __threadfence ();
130117 uint orgValue = atomicAdd (csrCounter + counterOffset, 1 );
131- // if(csrFvalue[csrId] == 0.369250){
132- // printf("gpu pid=%d, insId=%d, csrfvalue=%f, firstCsrId=%d, cntOffset=%d, orgValue=%d, cnt=%d\n",
133- // pid, insId, csrFvalue[csrId], firstCsrId, counterOffset, orgValue, csrCounter[counterOffset]);
134- // }
135118 }
136119 }
137120
138121 __syncthreads ();
139- // if(blockIdx.y * gridDim.x + blockIdx.x == 2216293 && tid == 95){
140- // printf("###################################################################### cnt=%d\n", csrCounter[tid]);
141- // }
142122 // compute len of each csr
143123 if (csrCounter[tid] > 0 ){
144124 uint numCsrCurPart;
@@ -149,9 +129,6 @@ __global__ void newCsrLenFvalue(const int *preFvalueInsId, int numFeaValue, cons
149129 numCsrPrePartsAhead, posInPart, numCsrCurPart, feaId);
150130
151131 atomicAdd (csrNewLen + numCsrPrePartsAhead * 2 + posInPart, csrCounter[tid]);
152- // if(blockIdx.y * gridDim.x + blockIdx.x == 2216293 && tid == 95){
153- // printf("csrNewLen=%d, numcsrPrePartAhead=%d, posInPart=%d, cnt=%d\n", csrNewLen[numCsrPrePartsAhead * 2 + posInPart], numCsrPrePartsAhead, posInPart, csrCounter[tid]);
154- // }
155132 }
156133}
157134
0 commit comments