Skip to content

Commit

Permalink
remove unnecessary allocations in HistogramSumReducer (#6132)
Browse files (browse the repository at this point in the history)
  • Loading branch information
jameslamb committed Oct 9, 2023
1 parent f901f47 commit ad02551
Showing 1 changed file with 2 additions and 4 deletions.
6 changes: 2 additions & 4 deletions include/LightGBM/bin.h
Original file line number Diff line number Diff line change
Expand Up @@ -63,8 +63,7 @@ inline static void Int32HistogramSumReducer(const char* src, char* dst, int type
const int64_t* src_ptr = reinterpret_cast<const int64_t*>(src);
int64_t* dst_ptr = reinterpret_cast<int64_t*>(dst);
const comm_size_t steps = (len + (type_size * 2) - 1) / (type_size * 2);
- const int num_threads = OMP_NUM_THREADS();
- #pragma omp parallel for schedule(static) num_threads(num_threads)
+ #pragma omp parallel for schedule(static) num_threads(OMP_NUM_THREADS())
for (comm_size_t i = 0; i < steps; ++i) {
dst_ptr[i] += src_ptr[i];
}
Expand All @@ -74,8 +73,7 @@ inline static void Int16HistogramSumReducer(const char* src, char* dst, int type
const int32_t* src_ptr = reinterpret_cast<const int32_t*>(src);
int32_t* dst_ptr = reinterpret_cast<int32_t*>(dst);
const comm_size_t steps = (len + (type_size * 2) - 1) / (type_size * 2);
- const int num_threads = OMP_NUM_THREADS();
- #pragma omp parallel for schedule(static) num_threads(num_threads)
+ #pragma omp parallel for schedule(static) num_threads(OMP_NUM_THREADS())
for (comm_size_t i = 0; i < steps; ++i) {
dst_ptr[i] += src_ptr[i];
}
Expand Down

0 comments on commit ad02551

Please sign in to comment.