From 82d734f7a3b6f08813a9ad6272aa026779c88975 Mon Sep 17 00:00:00 2001 From: Tom Tromey Date: Sun, 23 May 2021 09:04:27 -0600 Subject: Add batching parameter to parallel_for_each parallel_for_each currently requires each thread to process at least 10 elements. However, when indexing, it's fine for a thread to handle just a single CU. This patch parameterizes this, and updates the one user. --- gdb/minsyms.c | 4 ++-- gdb/unittests/parallel-for-selftests.c | 2 +- gdbsupport/parallel-for.h | 18 ++++++++++++------ 3 files changed, 15 insertions(+), 9 deletions(-) diff --git a/gdb/minsyms.c b/gdb/minsyms.c index f1c2890..cbd0ad2 100644 --- a/gdb/minsyms.c +++ b/gdb/minsyms.c @@ -1460,8 +1460,8 @@ minimal_symbol_reader::install () std::vector hash_values (mcount); msymbols = m_objfile->per_bfd->msymbols.get (); - gdb::parallel_for_each - (&msymbols[0], &msymbols[mcount], + /* Arbitrarily require at least 10 elements in a thread. */ + gdb::parallel_for_each (10, &msymbols[0], &msymbols[mcount], [&] (minimal_symbol *start, minimal_symbol *end) { for (minimal_symbol *msym = start; msym < end; ++msym) diff --git a/gdb/unittests/parallel-for-selftests.c b/gdb/unittests/parallel-for-selftests.c index adfc82f..e0c07e5 100644 --- a/gdb/unittests/parallel-for-selftests.c +++ b/gdb/unittests/parallel-for-selftests.c @@ -52,7 +52,7 @@ test (int n_threads) #define NUMBER 10000 std::atomic counter (0); - gdb::parallel_for_each (0, NUMBER, + gdb::parallel_for_each (1, 0, NUMBER, [&] (int start, int end) { counter += end - start; diff --git a/gdbsupport/parallel-for.h b/gdbsupport/parallel-for.h index 915814e..811ffd6 100644 --- a/gdbsupport/parallel-for.h +++ b/gdbsupport/parallel-for.h @@ -32,11 +32,16 @@ namespace gdb This approach was chosen over having the callback work on single items because it makes it simple for the caller to do - once-per-subrange initialization and destruction. */ + once-per-subrange initialization and destruction. 
+ + The parameter N says how batching ought to be done -- there will be + at least N elements processed per thread. Setting N to 0 is not + allowed. */ template<class RandomIt, class RangeFunction> void -parallel_for_each (RandomIt first, RandomIt last, RangeFunction callback) +parallel_for_each (unsigned n, RandomIt first, RandomIt last, + RangeFunction callback) { /* So we can use a local array below. */ const size_t local_max = 16; @@ -48,10 +53,11 @@ parallel_for_each (RandomIt first, RandomIt last, RangeFunction callback) size_t n_elements = last - first; if (n_threads > 1) { - /* Arbitrarily require that there should be at least 10 elements - in a thread. */ - if (n_elements / n_threads < 10) - n_threads = std::max (n_elements / 10, (size_t) 1); + /* Require that there should be at least N elements in a + thread. */ + gdb_assert (n > 0); + if (n_elements / n_threads < n) + n_threads = std::max (n_elements / n, (size_t) 1); size_t elts_per_thread = n_elements / n_threads; n_actual_threads = n_threads - 1; for (int i = 0; i < n_actual_threads; ++i) -- cgit v1.1