[1166] | 1 | // -*- C++ -*-
|
---|
| 2 |
|
---|
| 3 | // Copyright (C) 2007-2021 Free Software Foundation, Inc.
|
---|
| 4 | //
|
---|
| 5 | // This file is part of the GNU ISO C++ Library. This library is free
|
---|
| 6 | // software; you can redistribute it and/or modify it under the terms
|
---|
| 7 | // of the GNU General Public License as published by the Free Software
|
---|
| 8 | // Foundation; either version 3, or (at your option) any later
|
---|
| 9 | // version.
|
---|
| 10 |
|
---|
| 11 | // This library is distributed in the hope that it will be useful, but
|
---|
| 12 | // WITHOUT ANY WARRANTY; without even the implied warranty of
|
---|
| 13 | // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
---|
| 14 | // General Public License for more details.
|
---|
| 15 |
|
---|
| 16 | // Under Section 7 of GPL version 3, you are granted additional
|
---|
| 17 | // permissions described in the GCC Runtime Library Exception, version
|
---|
| 18 | // 3.1, as published by the Free Software Foundation.
|
---|
| 19 |
|
---|
| 20 | // You should have received a copy of the GNU General Public License and
|
---|
| 21 | // a copy of the GCC Runtime Library Exception along with this program;
|
---|
| 22 | // see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
|
---|
| 23 | // <http://www.gnu.org/licenses/>.
|
---|
| 24 |
|
---|
| 25 | /** @file parallel/find.h
|
---|
| 26 | * @brief Parallel implementation base for std::find(), std::equal()
|
---|
| 27 | * and related functions.
|
---|
| 28 | * This file is a GNU parallel extension to the Standard C++ Library.
|
---|
| 29 | */
|
---|
| 30 |
|
---|
| 31 | // Written by Felix Putze and Johannes Singler.
|
---|
| 32 |
|
---|
| 33 | #ifndef _GLIBCXX_PARALLEL_FIND_H
|
---|
| 34 | #define _GLIBCXX_PARALLEL_FIND_H 1
|
---|
| 35 |
|
---|
| 36 | #include <bits/stl_algobase.h>
|
---|
| 37 |
|
---|
| 38 | #include <parallel/features.h>
|
---|
| 39 | #include <parallel/parallel.h>
|
---|
| 40 | #include <parallel/compatibility.h>
|
---|
| 41 | #include <parallel/equally_split.h>
|
---|
| 42 |
|
---|
| 43 | namespace __gnu_parallel
|
---|
| 44 | {
|
---|
| 45 | /**
|
---|
| 46 | * @brief Parallel std::find, switch for different algorithms.
|
---|
| 47 | * @param __begin1 Begin iterator of first sequence.
|
---|
| 48 | * @param __end1 End iterator of first sequence.
|
---|
| 49 | * @param __begin2 Begin iterator of second sequence. Must have same
|
---|
| 50 | * length as first sequence.
|
---|
| 51 | * @param __pred Find predicate.
|
---|
| 52 | * @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
|
---|
| 53 | * @return Place of finding in both sequences.
|
---|
| 54 | */
|
---|
| 55 | template<typename _RAIter1,
|
---|
| 56 | typename _RAIter2,
|
---|
| 57 | typename _Pred,
|
---|
| 58 | typename _Selector>
|
---|
| 59 | inline std::pair<_RAIter1, _RAIter2>
|
---|
| 60 | __find_template(_RAIter1 __begin1, _RAIter1 __end1,
|
---|
| 61 | _RAIter2 __begin2, _Pred __pred, _Selector __selector)
|
---|
| 62 | {
|
---|
| 63 | switch (_Settings::get().find_algorithm)
|
---|
| 64 | {
|
---|
| 65 | case GROWING_BLOCKS:
|
---|
| 66 | return __find_template(__begin1, __end1, __begin2, __pred,
|
---|
| 67 | __selector, growing_blocks_tag());
|
---|
| 68 | case CONSTANT_SIZE_BLOCKS:
|
---|
| 69 | return __find_template(__begin1, __end1, __begin2, __pred,
|
---|
| 70 | __selector, constant_size_blocks_tag());
|
---|
| 71 | case EQUAL_SPLIT:
|
---|
| 72 | return __find_template(__begin1, __end1, __begin2, __pred,
|
---|
| 73 | __selector, equal_split_tag());
|
---|
| 74 | default:
|
---|
| 75 | _GLIBCXX_PARALLEL_ASSERT(false);
|
---|
| 76 | return std::make_pair(__begin1, __begin2);
|
---|
| 77 | }
|
---|
| 78 | }
|
---|
| 79 |
|
---|
| 80 | #if _GLIBCXX_FIND_EQUAL_SPLIT
|
---|
| 81 |
|
---|
| 82 | /**
|
---|
| 83 | * @brief Parallel std::find, equal splitting variant.
|
---|
| 84 | * @param __begin1 Begin iterator of first sequence.
|
---|
| 85 | * @param __end1 End iterator of first sequence.
|
---|
| 86 | * @param __begin2 Begin iterator of second sequence. Second __sequence
|
---|
| 87 | * must have same length as first sequence.
|
---|
| 88 | * @param __pred Find predicate.
|
---|
| 89 | * @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
|
---|
| 90 | * @return Place of finding in both sequences.
|
---|
| 91 | */
|
---|
| 92 | template<typename _RAIter1,
|
---|
| 93 | typename _RAIter2,
|
---|
| 94 | typename _Pred,
|
---|
| 95 | typename _Selector>
|
---|
| 96 | std::pair<_RAIter1, _RAIter2>
|
---|
| 97 | __find_template(_RAIter1 __begin1, _RAIter1 __end1,
|
---|
| 98 | _RAIter2 __begin2, _Pred __pred,
|
---|
| 99 | _Selector __selector, equal_split_tag)
|
---|
| 100 | {
|
---|
| 101 | _GLIBCXX_CALL(__end1 - __begin1)
|
---|
| 102 |
|
---|
| 103 | typedef std::iterator_traits<_RAIter1> _TraitsType;
|
---|
| 104 | typedef typename _TraitsType::difference_type _DifferenceType;
|
---|
| 105 | typedef typename _TraitsType::value_type _ValueType;
|
---|
| 106 |
|
---|
| 107 | _DifferenceType __length = __end1 - __begin1;
|
---|
| 108 | _DifferenceType __result = __length;
|
---|
| 109 | _DifferenceType* __borders;
|
---|
| 110 |
|
---|
| 111 | omp_lock_t __result_lock;
|
---|
| 112 | omp_init_lock(&__result_lock);
|
---|
| 113 |
|
---|
| 114 | _ThreadIndex __num_threads = __get_max_threads();
|
---|
| 115 | # pragma omp parallel num_threads(__num_threads)
|
---|
| 116 | {
|
---|
| 117 | # pragma omp single
|
---|
| 118 | {
|
---|
| 119 | __num_threads = omp_get_num_threads();
|
---|
| 120 | __borders = new _DifferenceType[__num_threads + 1];
|
---|
| 121 | __equally_split(__length, __num_threads, __borders);
|
---|
| 122 | } //single
|
---|
| 123 |
|
---|
| 124 | _ThreadIndex __iam = omp_get_thread_num();
|
---|
| 125 | _DifferenceType __start = __borders[__iam],
|
---|
| 126 | __stop = __borders[__iam + 1];
|
---|
| 127 |
|
---|
| 128 | _RAIter1 __i1 = __begin1 + __start;
|
---|
| 129 | _RAIter2 __i2 = __begin2 + __start;
|
---|
| 130 | for (_DifferenceType __pos = __start; __pos < __stop; ++__pos)
|
---|
| 131 | {
|
---|
| 132 | # pragma omp flush(__result)
|
---|
| 133 | // Result has been set to something lower.
|
---|
| 134 | if (__result < __pos)
|
---|
| 135 | break;
|
---|
| 136 |
|
---|
| 137 | if (__selector(__i1, __i2, __pred))
|
---|
| 138 | {
|
---|
| 139 | omp_set_lock(&__result_lock);
|
---|
| 140 | if (__pos < __result)
|
---|
| 141 | __result = __pos;
|
---|
| 142 | omp_unset_lock(&__result_lock);
|
---|
| 143 | break;
|
---|
| 144 | }
|
---|
| 145 | ++__i1;
|
---|
| 146 | ++__i2;
|
---|
| 147 | }
|
---|
| 148 | } //parallel
|
---|
| 149 |
|
---|
| 150 | omp_destroy_lock(&__result_lock);
|
---|
| 151 | delete[] __borders;
|
---|
| 152 |
|
---|
| 153 | return std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
|
---|
| 154 | __begin2 + __result);
|
---|
| 155 | }
|
---|
| 156 |
|
---|
| 157 | #endif
|
---|
| 158 |
|
---|
| 159 | #if _GLIBCXX_FIND_GROWING_BLOCKS
|
---|
| 160 |
|
---|
| 161 | /**
|
---|
| 162 | * @brief Parallel std::find, growing block size variant.
|
---|
| 163 | * @param __begin1 Begin iterator of first sequence.
|
---|
| 164 | * @param __end1 End iterator of first sequence.
|
---|
| 165 | * @param __begin2 Begin iterator of second sequence. Second __sequence
|
---|
| 166 | * must have same length as first sequence.
|
---|
| 167 | * @param __pred Find predicate.
|
---|
| 168 | * @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
|
---|
| 169 | * @return Place of finding in both sequences.
|
---|
| 170 | * @see __gnu_parallel::_Settings::find_sequential_search_size
|
---|
| 171 | * @see __gnu_parallel::_Settings::find_scale_factor
|
---|
| 172 | *
|
---|
| 173 | * There are two main differences between the growing blocks and
|
---|
| 174 | * the constant-size blocks variants.
|
---|
| 175 | * 1. For GB, the block size grows; for CSB, the block size is fixed.
|
---|
| 176 | * 2. For GB, the blocks are allocated dynamically;
|
---|
| 177 | * for CSB, the blocks are allocated in a predetermined manner,
|
---|
| 178 | * namely spacial round-robin.
|
---|
| 179 | */
|
---|
| 180 | template<typename _RAIter1,
|
---|
| 181 | typename _RAIter2,
|
---|
| 182 | typename _Pred,
|
---|
| 183 | typename _Selector>
|
---|
| 184 | std::pair<_RAIter1, _RAIter2>
|
---|
| 185 | __find_template(_RAIter1 __begin1, _RAIter1 __end1,
|
---|
| 186 | _RAIter2 __begin2, _Pred __pred, _Selector __selector,
|
---|
| 187 | growing_blocks_tag)
|
---|
| 188 | {
|
---|
| 189 | _GLIBCXX_CALL(__end1 - __begin1)
|
---|
| 190 |
|
---|
| 191 | typedef std::iterator_traits<_RAIter1> _TraitsType;
|
---|
| 192 | typedef typename _TraitsType::difference_type _DifferenceType;
|
---|
| 193 | typedef typename _TraitsType::value_type _ValueType;
|
---|
| 194 |
|
---|
| 195 | const _Settings& __s = _Settings::get();
|
---|
| 196 |
|
---|
| 197 | _DifferenceType __length = __end1 - __begin1;
|
---|
| 198 |
|
---|
| 199 | _DifferenceType
|
---|
| 200 | __sequential_search_size = std::min<_DifferenceType>
|
---|
| 201 | (__length, __s.find_sequential_search_size);
|
---|
| 202 |
|
---|
| 203 | // Try it sequentially first.
|
---|
| 204 | std::pair<_RAIter1, _RAIter2>
|
---|
| 205 | __find_seq_result = __selector._M_sequential_algorithm
|
---|
| 206 | (__begin1, __begin1 + __sequential_search_size,
|
---|
| 207 | __begin2, __pred);
|
---|
| 208 |
|
---|
| 209 | if (__find_seq_result.first != (__begin1 + __sequential_search_size))
|
---|
| 210 | return __find_seq_result;
|
---|
| 211 |
|
---|
| 212 | // Index of beginning of next free block (after sequential find).
|
---|
| 213 | _DifferenceType __next_block_start = __sequential_search_size;
|
---|
| 214 | _DifferenceType __result = __length;
|
---|
| 215 |
|
---|
| 216 | omp_lock_t __result_lock;
|
---|
| 217 | omp_init_lock(&__result_lock);
|
---|
| 218 |
|
---|
| 219 | const float __scale_factor = __s.find_scale_factor;
|
---|
| 220 |
|
---|
| 221 | _ThreadIndex __num_threads = __get_max_threads();
|
---|
| 222 | # pragma omp parallel shared(__result) num_threads(__num_threads)
|
---|
| 223 | {
|
---|
| 224 | # pragma omp single
|
---|
| 225 | __num_threads = omp_get_num_threads();
|
---|
| 226 |
|
---|
| 227 | // Not within first __k elements -> start parallel.
|
---|
| 228 | _ThreadIndex __iam = omp_get_thread_num();
|
---|
| 229 |
|
---|
| 230 | _DifferenceType __block_size =
|
---|
| 231 | std::max<_DifferenceType>(1, __scale_factor * __next_block_start);
|
---|
| 232 | _DifferenceType __start = __fetch_and_add<_DifferenceType>
|
---|
| 233 | (&__next_block_start, __block_size);
|
---|
| 234 |
|
---|
| 235 | // Get new block, update pointer to next block.
|
---|
| 236 | _DifferenceType __stop =
|
---|
| 237 | std::min<_DifferenceType>(__length, __start + __block_size);
|
---|
| 238 |
|
---|
| 239 | std::pair<_RAIter1, _RAIter2> __local_result;
|
---|
| 240 |
|
---|
| 241 | while (__start < __length)
|
---|
| 242 | {
|
---|
| 243 | # pragma omp flush(__result)
|
---|
| 244 | // Get new value of result.
|
---|
| 245 | if (__result < __start)
|
---|
| 246 | {
|
---|
| 247 | // No chance to find first element.
|
---|
| 248 | break;
|
---|
| 249 | }
|
---|
| 250 |
|
---|
| 251 | __local_result = __selector._M_sequential_algorithm
|
---|
| 252 | (__begin1 + __start, __begin1 + __stop,
|
---|
| 253 | __begin2 + __start, __pred);
|
---|
| 254 |
|
---|
| 255 | if (__local_result.first != (__begin1 + __stop))
|
---|
| 256 | {
|
---|
| 257 | omp_set_lock(&__result_lock);
|
---|
| 258 | if ((__local_result.first - __begin1) < __result)
|
---|
| 259 | {
|
---|
| 260 | __result = __local_result.first - __begin1;
|
---|
| 261 |
|
---|
| 262 | // Result cannot be in future blocks, stop algorithm.
|
---|
| 263 | __fetch_and_add<_DifferenceType>(&__next_block_start,
|
---|
| 264 | __length);
|
---|
| 265 | }
|
---|
| 266 | omp_unset_lock(&__result_lock);
|
---|
| 267 | }
|
---|
| 268 |
|
---|
| 269 | _DifferenceType __block_size =
|
---|
| 270 | std::max<_DifferenceType>(1, __scale_factor * __next_block_start);
|
---|
| 271 |
|
---|
| 272 | // Get new block, update pointer to next block.
|
---|
| 273 | __start = __fetch_and_add<_DifferenceType>(&__next_block_start,
|
---|
| 274 | __block_size);
|
---|
| 275 | __stop =
|
---|
| 276 | std::min<_DifferenceType>(__length, __start + __block_size);
|
---|
| 277 | }
|
---|
| 278 | } //parallel
|
---|
| 279 |
|
---|
| 280 | omp_destroy_lock(&__result_lock);
|
---|
| 281 |
|
---|
| 282 | // Return iterator on found element.
|
---|
| 283 | return
|
---|
| 284 | std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
|
---|
| 285 | __begin2 + __result);
|
---|
| 286 | }
|
---|
| 287 |
|
---|
| 288 | #endif
|
---|
| 289 |
|
---|
| 290 | #if _GLIBCXX_FIND_CONSTANT_SIZE_BLOCKS
|
---|
| 291 |
|
---|
| 292 | /**
|
---|
| 293 | * @brief Parallel std::find, constant block size variant.
|
---|
| 294 | * @param __begin1 Begin iterator of first sequence.
|
---|
| 295 | * @param __end1 End iterator of first sequence.
|
---|
| 296 | * @param __begin2 Begin iterator of second sequence. Second __sequence
|
---|
| 297 | * must have same length as first sequence.
|
---|
| 298 | * @param __pred Find predicate.
|
---|
| 299 | * @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
|
---|
| 300 | * @return Place of finding in both sequences.
|
---|
| 301 | * @see __gnu_parallel::_Settings::find_sequential_search_size
|
---|
| 302 | * @see __gnu_parallel::_Settings::find_block_size
|
---|
| 303 | * There are two main differences between the growing blocks and the
|
---|
| 304 | * constant-size blocks variants.
|
---|
| 305 | * 1. For GB, the block size grows; for CSB, the block size is fixed.
|
---|
| 306 | * 2. For GB, the blocks are allocated dynamically; for CSB, the
|
---|
| 307 | * blocks are allocated in a predetermined manner, namely spacial
|
---|
| 308 | * round-robin.
|
---|
| 309 | */
|
---|
| 310 | template<typename _RAIter1,
|
---|
| 311 | typename _RAIter2,
|
---|
| 312 | typename _Pred,
|
---|
| 313 | typename _Selector>
|
---|
| 314 | std::pair<_RAIter1, _RAIter2>
|
---|
| 315 | __find_template(_RAIter1 __begin1, _RAIter1 __end1,
|
---|
| 316 | _RAIter2 __begin2, _Pred __pred, _Selector __selector,
|
---|
| 317 | constant_size_blocks_tag)
|
---|
| 318 | {
|
---|
| 319 | _GLIBCXX_CALL(__end1 - __begin1)
|
---|
| 320 | typedef std::iterator_traits<_RAIter1> _TraitsType;
|
---|
| 321 | typedef typename _TraitsType::difference_type _DifferenceType;
|
---|
| 322 | typedef typename _TraitsType::value_type _ValueType;
|
---|
| 323 |
|
---|
| 324 | const _Settings& __s = _Settings::get();
|
---|
| 325 |
|
---|
| 326 | _DifferenceType __length = __end1 - __begin1;
|
---|
| 327 |
|
---|
| 328 | _DifferenceType __sequential_search_size = std::min<_DifferenceType>
|
---|
| 329 | (__length, __s.find_sequential_search_size);
|
---|
| 330 |
|
---|
| 331 | // Try it sequentially first.
|
---|
| 332 | std::pair<_RAIter1, _RAIter2>
|
---|
| 333 | __find_seq_result = __selector._M_sequential_algorithm
|
---|
| 334 | (__begin1, __begin1 + __sequential_search_size, __begin2, __pred);
|
---|
| 335 |
|
---|
| 336 | if (__find_seq_result.first != (__begin1 + __sequential_search_size))
|
---|
| 337 | return __find_seq_result;
|
---|
| 338 |
|
---|
| 339 | _DifferenceType __result = __length;
|
---|
| 340 | omp_lock_t __result_lock;
|
---|
| 341 | omp_init_lock(&__result_lock);
|
---|
| 342 |
|
---|
| 343 | // Not within first __sequential_search_size elements -> start parallel.
|
---|
| 344 |
|
---|
| 345 | _ThreadIndex __num_threads = __get_max_threads();
|
---|
| 346 | # pragma omp parallel shared(__result) num_threads(__num_threads)
|
---|
| 347 | {
|
---|
| 348 | # pragma omp single
|
---|
| 349 | __num_threads = omp_get_num_threads();
|
---|
| 350 |
|
---|
| 351 | _ThreadIndex __iam = omp_get_thread_num();
|
---|
| 352 | _DifferenceType __block_size = __s.find_initial_block_size;
|
---|
| 353 |
|
---|
| 354 | // First element of thread's current iteration.
|
---|
| 355 | _DifferenceType __iteration_start = __sequential_search_size;
|
---|
| 356 |
|
---|
| 357 | // Where to work (initialization).
|
---|
| 358 | _DifferenceType __start = __iteration_start + __iam * __block_size;
|
---|
| 359 | _DifferenceType __stop = std::min<_DifferenceType>(__length,
|
---|
| 360 | __start
|
---|
| 361 | + __block_size);
|
---|
| 362 |
|
---|
| 363 | std::pair<_RAIter1, _RAIter2> __local_result;
|
---|
| 364 |
|
---|
| 365 | while (__start < __length)
|
---|
| 366 | {
|
---|
| 367 | // Get new value of result.
|
---|
| 368 | # pragma omp flush(__result)
|
---|
| 369 | // No chance to find first element.
|
---|
| 370 | if (__result < __start)
|
---|
| 371 | break;
|
---|
| 372 |
|
---|
| 373 | __local_result = __selector._M_sequential_algorithm
|
---|
| 374 | (__begin1 + __start, __begin1 + __stop,
|
---|
| 375 | __begin2 + __start, __pred);
|
---|
| 376 |
|
---|
| 377 | if (__local_result.first != (__begin1 + __stop))
|
---|
| 378 | {
|
---|
| 379 | omp_set_lock(&__result_lock);
|
---|
| 380 | if ((__local_result.first - __begin1) < __result)
|
---|
| 381 | __result = __local_result.first - __begin1;
|
---|
| 382 | omp_unset_lock(&__result_lock);
|
---|
| 383 | // Will not find better value in its interval.
|
---|
| 384 | break;
|
---|
| 385 | }
|
---|
| 386 |
|
---|
| 387 | __iteration_start += __num_threads * __block_size;
|
---|
| 388 |
|
---|
| 389 | // Where to work.
|
---|
| 390 | __start = __iteration_start + __iam * __block_size;
|
---|
| 391 | __stop = std::min<_DifferenceType>(__length,
|
---|
| 392 | __start + __block_size);
|
---|
| 393 | }
|
---|
| 394 | } //parallel
|
---|
| 395 |
|
---|
| 396 | omp_destroy_lock(&__result_lock);
|
---|
| 397 |
|
---|
| 398 | // Return iterator on found element.
|
---|
| 399 | return std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
|
---|
| 400 | __begin2 + __result);
|
---|
| 401 | }
|
---|
| 402 | #endif
|
---|
| 403 | } // end namespace
|
---|
| 404 |
|
---|
| 405 | #endif /* _GLIBCXX_PARALLEL_FIND_H */
|
---|