• Home
  • History
  • Annotate
  • Line#
  • Navigate
  • Raw
  • Download
  • only in /asuswrt-rt-n18u-9.0.0.4.380.2695/release/src-rt-6.x.4708/toolchains/hndtools-armeabi-2013.11/arm-none-eabi/include/c++/4.8.1/parallel/
1// -*- C++ -*-
2
3// Copyright (C) 2007-2013 Free Software Foundation, Inc.
4//
5// This file is part of the GNU ISO C++ Library.  This library is free
6// software; you can redistribute it and/or modify it under the terms
7// of the GNU General Public License as published by the Free Software
8// Foundation; either version 3, or (at your option) any later
9// version.
10
11// This library is distributed in the hope that it will be useful, but
12// WITHOUT ANY WARRANTY; without even the implied warranty of
13// MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
14// General Public License for more details.
15
16// Under Section 7 of GPL version 3, you are granted additional
17// permissions described in the GCC Runtime Library Exception, version
18// 3.1, as published by the Free Software Foundation.
19
20// You should have received a copy of the GNU General Public License and
21// a copy of the GCC Runtime Library Exception along with this program;
22// see the files COPYING3 and COPYING.RUNTIME respectively.  If not, see
23// <http://www.gnu.org/licenses/>.
24
25/** @file parallel/find.h
26 *  @brief Parallel implementation base for std::find(), std::equal()
27 *  and related functions.
28 *  This file is a GNU parallel extension to the Standard C++ Library.
29 */
30
31// Written by Felix Putze and Johannes Singler.
32
33#ifndef _GLIBCXX_PARALLEL_FIND_H
34#define _GLIBCXX_PARALLEL_FIND_H 1
35
36#include <bits/stl_algobase.h>
37
38#include <parallel/features.h>
39#include <parallel/parallel.h>
40#include <parallel/compatibility.h>
41#include <parallel/equally_split.h>
42
43namespace __gnu_parallel
44{
45  /**
46   *  @brief Parallel std::find, switch for different algorithms.
47   *  @param __begin1 Begin iterator of first sequence.
48   *  @param __end1 End iterator of first sequence.
49   *  @param __begin2 Begin iterator of second sequence. Must have same
50   *  length as first sequence.
51   *  @param __pred Find predicate.
52   *  @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
53   *  @return Place of finding in both sequences.
54   */
55  template<typename _RAIter1,
56	   typename _RAIter2,
57	   typename _Pred,
58           typename _Selector>
59    inline std::pair<_RAIter1, _RAIter2>
60    __find_template(_RAIter1 __begin1, _RAIter1 __end1,
61		    _RAIter2 __begin2, _Pred __pred, _Selector __selector)
62    {
63      switch (_Settings::get().find_algorithm)
64	{
65	case GROWING_BLOCKS:
66          return __find_template(__begin1, __end1, __begin2, __pred,
67				 __selector, growing_blocks_tag());
68	case CONSTANT_SIZE_BLOCKS:
69          return __find_template(__begin1, __end1, __begin2, __pred,
70				 __selector, constant_size_blocks_tag());
71	case EQUAL_SPLIT:
72          return __find_template(__begin1, __end1, __begin2, __pred,
73				 __selector, equal_split_tag());
74	default:
75          _GLIBCXX_PARALLEL_ASSERT(false);
76          return std::make_pair(__begin1, __begin2);
77	}
78    }
79
80#if _GLIBCXX_FIND_EQUAL_SPLIT
81
82  /**
83   *  @brief Parallel std::find, equal splitting variant.
84   *  @param __begin1 Begin iterator of first sequence.
85   *  @param __end1 End iterator of first sequence.
86   *  @param __begin2 Begin iterator of second sequence. Second __sequence
87   *  must have same length as first sequence.
88   *  @param __pred Find predicate.
89   *  @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
90   *  @return Place of finding in both sequences.
91   */
92  template<typename _RAIter1,
93           typename _RAIter2,
94           typename _Pred,
95           typename _Selector>
96    std::pair<_RAIter1, _RAIter2>
97    __find_template(_RAIter1 __begin1, _RAIter1 __end1,
98		    _RAIter2 __begin2, _Pred __pred,
99		    _Selector __selector, equal_split_tag)
100    {
101      _GLIBCXX_CALL(__end1 - __begin1)
102
103      typedef std::iterator_traits<_RAIter1> _TraitsType;
104      typedef typename _TraitsType::difference_type _DifferenceType;
105      typedef typename _TraitsType::value_type _ValueType;
106
107      _DifferenceType __length = __end1 - __begin1;
108      _DifferenceType __result = __length;
109      _DifferenceType* __borders;
110
111      omp_lock_t __result_lock;
112      omp_init_lock(&__result_lock);
113
114      _ThreadIndex __num_threads = __get_max_threads();
115#     pragma omp parallel num_threads(__num_threads)
116      {
117#     pragma omp single
118	{
119	  __num_threads = omp_get_num_threads();
120	  __borders = new _DifferenceType[__num_threads + 1];
121	  __equally_split(__length, __num_threads, __borders);
122	} //single
123
124	_ThreadIndex __iam = omp_get_thread_num();
125	_DifferenceType __start = __borders[__iam],
126	                 __stop = __borders[__iam + 1];
127
128	_RAIter1 __i1 = __begin1 + __start;
129	_RAIter2 __i2 = __begin2 + __start;
130	for (_DifferenceType __pos = __start; __pos < __stop; ++__pos)
131	  {
132#           pragma omp flush(__result)
133	    // Result has been set to something lower.
134	    if (__result < __pos)
135	      break;
136
137	    if (__selector(__i1, __i2, __pred))
138	      {
139		omp_set_lock(&__result_lock);
140		if (__pos < __result)
141		  __result = __pos;
142		omp_unset_lock(&__result_lock);
143		break;
144	      }
145	    ++__i1;
146	    ++__i2;
147	  }
148      } //parallel
149
150      omp_destroy_lock(&__result_lock);
151      delete[] __borders;
152
153      return std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
154					   __begin2 + __result);
155    }
156
157#endif
158
159#if _GLIBCXX_FIND_GROWING_BLOCKS
160
161  /**
162   *  @brief Parallel std::find, growing block size variant.
163   *  @param __begin1 Begin iterator of first sequence.
164   *  @param __end1 End iterator of first sequence.
165   *  @param __begin2 Begin iterator of second sequence. Second __sequence
166   *  must have same length as first sequence.
167   *  @param __pred Find predicate.
168   *  @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
169   *  @return Place of finding in both sequences.
170   *  @see __gnu_parallel::_Settings::find_sequential_search_size
171   *  @see __gnu_parallel::_Settings::find_scale_factor
172   *
173   *  There are two main differences between the growing blocks and
174   *  the constant-size blocks variants.
175   *  1. For GB, the block size grows; for CSB, the block size is fixed.
176   *  2. For GB, the blocks are allocated dynamically;
177   *     for CSB, the blocks are allocated in a predetermined manner,
178   *     namely spacial round-robin.
179   */
180  template<typename _RAIter1,
181           typename _RAIter2,
182           typename _Pred,
183           typename _Selector>
184    std::pair<_RAIter1, _RAIter2>
185    __find_template(_RAIter1 __begin1, _RAIter1 __end1,
186		    _RAIter2 __begin2, _Pred __pred, _Selector __selector,
187		    growing_blocks_tag)
188    {
189      _GLIBCXX_CALL(__end1 - __begin1)
190
191      typedef std::iterator_traits<_RAIter1> _TraitsType;
192      typedef typename _TraitsType::difference_type _DifferenceType;
193      typedef typename _TraitsType::value_type _ValueType;
194
195      const _Settings& __s = _Settings::get();
196
197      _DifferenceType __length = __end1 - __begin1;
198
199      _DifferenceType
200	__sequential_search_size = std::min<_DifferenceType>
201	(__length, __s.find_sequential_search_size);
202
203      // Try it sequentially first.
204      std::pair<_RAIter1, _RAIter2>
205	__find_seq_result = __selector._M_sequential_algorithm
206	(__begin1, __begin1 + __sequential_search_size,
207	 __begin2, __pred);
208
209      if (__find_seq_result.first != (__begin1 + __sequential_search_size))
210	return __find_seq_result;
211
212      // Index of beginning of next free block (after sequential find).
213      _DifferenceType __next_block_start = __sequential_search_size;
214      _DifferenceType __result = __length;
215
216      omp_lock_t __result_lock;
217      omp_init_lock(&__result_lock);
218
219      const float __scale_factor = __s.find_scale_factor;
220
221      _ThreadIndex __num_threads = __get_max_threads();
222#     pragma omp parallel shared(__result) num_threads(__num_threads)
223      {
224#       pragma omp single
225	__num_threads = omp_get_num_threads();
226
227	// Not within first __k elements -> start parallel.
228	_ThreadIndex __iam = omp_get_thread_num();
229
230	_DifferenceType __block_size =
231	  std::max<_DifferenceType>(1, __scale_factor * __next_block_start);
232	_DifferenceType __start = __fetch_and_add<_DifferenceType>
233	  (&__next_block_start, __block_size);
234
235	// Get new block, update pointer to next block.
236	_DifferenceType __stop =
237	  std::min<_DifferenceType>(__length, __start + __block_size);
238
239	std::pair<_RAIter1, _RAIter2> __local_result;
240
241	while (__start < __length)
242	  {
243#           pragma omp flush(__result)
244	    // Get new value of result.
245	    if (__result < __start)
246	      {
247		// No chance to find first element.
248		break;
249	      }
250
251	    __local_result = __selector._M_sequential_algorithm
252	      (__begin1 + __start, __begin1 + __stop,
253	       __begin2 + __start, __pred);
254
255	    if (__local_result.first != (__begin1 + __stop))
256	      {
257		omp_set_lock(&__result_lock);
258		if ((__local_result.first - __begin1) < __result)
259		  {
260		    __result = __local_result.first - __begin1;
261
262		    // Result cannot be in future blocks, stop algorithm.
263		    __fetch_and_add<_DifferenceType>(&__next_block_start,
264						     __length);
265		  }
266		omp_unset_lock(&__result_lock);
267	      }
268
269	    _DifferenceType __block_size =
270	     std::max<_DifferenceType>(1, __scale_factor * __next_block_start);
271
272	    // Get new block, update pointer to next block.
273	    __start = __fetch_and_add<_DifferenceType>(&__next_block_start,
274						       __block_size);
275	    __stop =
276	      std::min<_DifferenceType>(__length, __start + __block_size);
277	  }
278      } //parallel
279
280      omp_destroy_lock(&__result_lock);
281
282      // Return iterator on found element.
283      return
284	std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
285				      __begin2 + __result);
286    }
287
288#endif
289
290#if _GLIBCXX_FIND_CONSTANT_SIZE_BLOCKS
291
292  /**
293   *   @brief Parallel std::find, constant block size variant.
294   *  @param __begin1 Begin iterator of first sequence.
295   *  @param __end1 End iterator of first sequence.
296   *  @param __begin2 Begin iterator of second sequence. Second __sequence
297   *  must have same length as first sequence.
298   *  @param __pred Find predicate.
299   *  @param __selector _Functionality (e. g. std::find_if(), std::equal(),...)
300   *  @return Place of finding in both sequences.
301   *  @see __gnu_parallel::_Settings::find_sequential_search_size
302   *  @see __gnu_parallel::_Settings::find_block_size
303   *  There are two main differences between the growing blocks and the
304   *  constant-size blocks variants.
305   *  1. For GB, the block size grows; for CSB, the block size is fixed.
306   *  2. For GB, the blocks are allocated dynamically; for CSB, the
307   *  blocks are allocated in a predetermined manner, namely spacial
308   *  round-robin.
309   */
310  template<typename _RAIter1,
311           typename _RAIter2,
312           typename _Pred,
313           typename _Selector>
314    std::pair<_RAIter1, _RAIter2>
315    __find_template(_RAIter1 __begin1, _RAIter1 __end1,
316                  _RAIter2 __begin2, _Pred __pred, _Selector __selector,
317                  constant_size_blocks_tag)
318    {
319      _GLIBCXX_CALL(__end1 - __begin1)
320      typedef std::iterator_traits<_RAIter1> _TraitsType;
321      typedef typename _TraitsType::difference_type _DifferenceType;
322      typedef typename _TraitsType::value_type _ValueType;
323
324      const _Settings& __s = _Settings::get();
325
326      _DifferenceType __length = __end1 - __begin1;
327
328      _DifferenceType __sequential_search_size = std::min<_DifferenceType>
329	(__length, __s.find_sequential_search_size);
330
331      // Try it sequentially first.
332      std::pair<_RAIter1, _RAIter2>
333	__find_seq_result = __selector._M_sequential_algorithm
334	(__begin1, __begin1 + __sequential_search_size, __begin2, __pred);
335
336      if (__find_seq_result.first != (__begin1 + __sequential_search_size))
337	return __find_seq_result;
338
339      _DifferenceType __result = __length;
340      omp_lock_t __result_lock;
341      omp_init_lock(&__result_lock);
342
343      // Not within first __sequential_search_size elements -> start parallel.
344
345      _ThreadIndex __num_threads = __get_max_threads();
346#     pragma omp parallel shared(__result) num_threads(__num_threads)
347      {
348#       pragma omp single
349	__num_threads = omp_get_num_threads();
350
351	_ThreadIndex __iam = omp_get_thread_num();
352	_DifferenceType __block_size = __s.find_initial_block_size;
353
354	// First element of thread's current iteration.
355	_DifferenceType __iteration_start = __sequential_search_size;
356
357	// Where to work (initialization).
358	_DifferenceType __start = __iteration_start + __iam * __block_size;
359	_DifferenceType __stop = std::min<_DifferenceType>(__length,
360							   __start
361							   + __block_size);
362
363	std::pair<_RAIter1, _RAIter2> __local_result;
364
365	while (__start < __length)
366	  {
367	    // Get new value of result.
368#           pragma omp flush(__result)
369	    // No chance to find first element.
370	    if (__result < __start)
371	      break;
372
373	    __local_result = __selector._M_sequential_algorithm
374	      (__begin1 + __start, __begin1 + __stop,
375	       __begin2 + __start, __pred);
376
377	    if (__local_result.first != (__begin1 + __stop))
378	      {
379		omp_set_lock(&__result_lock);
380		if ((__local_result.first - __begin1) < __result)
381		  __result = __local_result.first - __begin1;
382		omp_unset_lock(&__result_lock);
383		// Will not find better value in its interval.
384		break;
385	      }
386
387	    __iteration_start += __num_threads * __block_size;
388
389	    // Where to work.
390	    __start = __iteration_start + __iam * __block_size;
391	    __stop = std::min<_DifferenceType>(__length,
392					       __start + __block_size);
393	  }
394      } //parallel
395
396      omp_destroy_lock(&__result_lock);
397
398      // Return iterator on found element.
399      return std::pair<_RAIter1, _RAIter2>(__begin1 + __result,
400					   __begin2 + __result);
401    }
402#endif
403} // end namespace
404
405#endif /* _GLIBCXX_PARALLEL_FIND_H */
406