Skip to content

Commit 207ba9c

Browse files
committed
Fixing one memory issue. Segfault / memory leak persists
1 parent c03a60e commit 207ba9c

File tree

4 files changed

+5
-2
lines changed

4 files changed

+5
-2
lines changed

GPU/GPUTracking/Global/GPUChainTrackingClusterizer.cxx

Lines changed: 2 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -893,6 +893,7 @@ int32_t GPUChainTracking::RunTPCClusterizer(bool synchronizeOutput)
893893
clustererNN.nnClusterizerElementSize = ((2 * nn_settings.nnClusterizerSizeInputRow + 1) * (2 * nn_settings.nnClusterizerSizeInputPad + 1) * (2 * nn_settings.nnClusterizerSizeInputTime + 1)) + (nn_settings.nnClusterizerAddIndexData ? 3 : 0);
894894
clustererNN.nnClusterizerBatchedMode = nn_settings.nnClusterizerBatchedMode;
895895
clustererNN.nnClusterizerBoundaryFillValue = nn_settings.nnClusterizerBoundaryFillValue;
896+
clustererNN.nnClusterizerTotalClusters = clusterer.mPmemory->counters.nClusters;
896897
if (nn_settings.nnClusterizerVerbosity < 0) {
897898
clustererNN.nnClusterizerVerbosity = nn_settings.nnInferenceVerbosity;
898899
} else {
@@ -962,7 +963,7 @@ int32_t GPUChainTracking::RunTPCClusterizer(bool synchronizeOutput)
962963
time_clusterizer += std::chrono::duration_cast<std::chrono::nanoseconds>(stop1 - start1).count() / 1e9;
963964

964965
if (clustererNN.nnClusterizerVerbosity < 3) {
965-
LOG(info) << "[NN CF] Apply NN (fragment " << fragment.index << ", lane: " << lane << ", slice: " << iSector << "): filling data " << time_fill << "s ; clusterizer: " << time_clusterizer << "s ; " << clusterer.mPmemory->counters.nClusters << " clusters --> " << clusterer.mPmemory->counters.nClusters / (time_fill + time_clusterizer) << " clusters/s";
966+
LOG(info) << "[NN CF] Apply NN (fragment " << fragment.index << ", lane: " << lane << ", sector: " << iSector << "): filling data " << time_fill << "s ; clusterizer: " << time_clusterizer << "s ; " << clusterer.mPmemory->counters.nClusters << " clusters --> " << clusterer.mPmemory->counters.nClusters / (time_fill + time_clusterizer) << " clusters/s";
966967
}
967968
#else
968969
GPUFatal("Project not compiled with neural network clusterization. Aborting.");

GPU/GPUTracking/TPCClusterFinder/GPUTPCNNClusterizer.cxx

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -32,7 +32,7 @@ void* GPUTPCNNClusterizer::setIOPointers(void* mem)
3232
computePointerWithAlignment(mem, peakPositions, nnClusterizerBatchedMode);
3333
computePointerWithAlignment(mem, clusterFlags, 2 * nnClusterizerBatchedMode);
3434
computePointerWithAlignment(mem, centralCharges, nnClusterizerBatchedMode);
35-
computePointerWithAlignment(mem, outputDataClass, nnClusterizerBatchedMode);
35+
computePointerWithAlignment(mem, outputDataClass, nnClusterizerTotalClusters);
3636
if (nnClusterizerModelClassNumOutputNodes > 0) {
3737
computePointerWithAlignment(mem, modelProbabilities, nnClusterizerBatchedMode * nnClusterizerModelClassNumOutputNodes);
3838
}

GPU/GPUTracking/TPCClusterFinder/GPUTPCNNClusterizer.h

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -46,6 +46,7 @@ class GPUTPCNNClusterizer : public GPUProcessor
4646
bool nnSigmoidTrafoClassThreshold = 1;
4747
int nnClusterizerUseCfRegression = 0;
4848
int nnClusterizerBatchedMode = 1;
49+
int nnClusterizerTotalClusters = 1;
4950
int nnClusterizerVerbosity = 0;
5051
int nnClusterizerBoundaryFillValue = -1;
5152
int nnClusterizerDumpDigits = 0;

GPU/GPUTracking/TPCClusterFinder/GPUTPCNNClusterizerKernels.cxx

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -143,6 +143,7 @@ GPUd() void GPUTPCNNClusterizerKernels::fillInputData(int32_t nBlocks, int32_t n
143143

144144
clustererNN.peakPositions[glo_idx] = peak;
145145
clustererNN.centralCharges[glo_idx] = central_charge;
146+
clustererNN.outputDataClass[glo_idx + batchStart] = -1;
146147

147148
int row_offset = GPUTPCNNClusterizerKernels::rowOffset(row, clustererNN.nnClusterizerSizeInputRow);
148149
#ifndef GPUCA_GPUCODE

0 commit comments

Comments
 (0)