97 lines
		
	
	
		
			3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
		
		
			
		
	
	
			97 lines
		
	
	
		
			3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
|   | /*
 | ||
|  |  * Copyright (c) 2003, 2007-14 Matteo Frigo | ||
|  |  * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology | ||
|  |  * | ||
|  |  * This program is free software; you can redistribute it and/or modify | ||
|  |  * it under the terms of the GNU General Public License as published by | ||
|  |  * the Free Software Foundation; either version 2 of the License, or | ||
|  |  * (at your option) any later version. | ||
|  |  * | ||
|  |  * This program is distributed in the hope that it will be useful, | ||
|  |  * but WITHOUT ANY WARRANTY; without even the implied warranty of | ||
|  |  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the | ||
|  |  * GNU General Public License for more details. | ||
|  |  * | ||
|  |  * You should have received a copy of the GNU General Public License | ||
|  |  * along with this program; if not, write to the Free Software | ||
|  |  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA | ||
|  |  * | ||
|  |  */ | ||
|  | 
 | ||
|  | /* openmp.c: thread spawning via OpenMP  */ | ||
|  | 
 | ||
|  | #include "threads/threads.h"
 | ||
|  | 
 | ||
|  | #if !defined(_OPENMP)
 | ||
|  | #error OpenMP enabled but not using an OpenMP compiler
 | ||
|  | #endif
 | ||
|  | 
 | ||
|  | int X(ithreads_init)(void) | ||
|  | { | ||
|  |      return 0; /* no error */ | ||
|  | } | ||
|  | 
 | ||
|  | /* Distribute a loop from 0 to loopmax-1 over nthreads threads.
 | ||
|  |    proc(d) is called to execute a block of iterations from d->min | ||
|  |    to d->max-1.  d->thr_num indicate the number of the thread | ||
|  |    that is executing proc (from 0 to nthreads-1), and d->data is | ||
|  |    the same as the data parameter passed to X(spawn_loop). | ||
|  | 
 | ||
|  |    This function returns only after all the threads have completed. */ | ||
|  | void X(spawn_loop)(int loopmax, int nthr, spawn_function proc, void *data) | ||
|  | { | ||
|  |      int block_size; | ||
|  |      spawn_data d; | ||
|  |      int i; | ||
|  | 
 | ||
|  |      A(loopmax >= 0); | ||
|  |      A(nthr > 0); | ||
|  |      A(proc); | ||
|  | 
 | ||
|  |      if (!loopmax) return; | ||
|  | 
 | ||
|  |      /* Choose the block size and number of threads in order to (1)
 | ||
|  |         minimize the critical path and (2) use the fewest threads that | ||
|  |         achieve the same critical path (to minimize overhead). | ||
|  |         e.g. if loopmax is 5 and nthr is 4, we should use only 3 | ||
|  |         threads with block sizes of 2, 2, and 1. */ | ||
|  |      block_size = (loopmax + nthr - 1) / nthr; | ||
|  |      nthr = (loopmax + block_size - 1) / block_size; | ||
|  | 
 | ||
|  |      if (X(spawnloop_callback)) { /* user-defined spawnloop backend */ | ||
|  |           spawn_data *sdata; | ||
|  |           STACK_MALLOC(spawn_data *, sdata, sizeof(spawn_data) * nthr); | ||
|  |           for (i = 0; i < nthr; ++i) { | ||
|  |                spawn_data *d = &sdata[i]; | ||
|  |                d->max = (d->min = i * block_size) + block_size; | ||
|  |                if (d->max > loopmax) | ||
|  |                     d->max = loopmax; | ||
|  |                d->thr_num = i; | ||
|  |                d->data = data; | ||
|  |           } | ||
|  |           X(spawnloop_callback)(proc, sdata, sizeof(spawn_data), nthr, X(spawnloop_callback_data)); | ||
|  |           STACK_FREE(sdata); | ||
|  |           return; | ||
|  |      } | ||
|  | 
 | ||
|  | #pragma omp parallel for private(d)
 | ||
|  |      for (i = 0; i < nthr; ++i) { | ||
|  | 	  d.max = (d.min = i * block_size) + block_size; | ||
|  | 	  if (d.max > loopmax) | ||
|  | 	       d.max = loopmax; | ||
|  | 	  d.thr_num = i; | ||
|  | 	  d.data = data; | ||
|  | 	  proc(&d); | ||
|  |      } | ||
|  | } | ||
|  | 
 | ||
|  | void X(threads_cleanup)(void) | ||
|  | { | ||
|  | } | ||
|  | 
 | ||
|  | /* FIXME [Matteo Frigo 2015-05-25] What does "thread-safe"
 | ||
|  |    mean for openmp? */ | ||
|  | void X(threads_register_planner_hooks)(void) | ||
|  | { | ||
|  | } |