97 lines
		
	
	
		
			3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			97 lines
		
	
	
		
			3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/*
 | 
						|
 * Copyright (c) 2003, 2007-14 Matteo Frigo
 | 
						|
 * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 | 
						|
 *
 | 
						|
 * This program is free software; you can redistribute it and/or modify
 | 
						|
 * it under the terms of the GNU General Public License as published by
 | 
						|
 * the Free Software Foundation; either version 2 of the License, or
 | 
						|
 * (at your option) any later version.
 | 
						|
 *
 | 
						|
 * This program is distributed in the hope that it will be useful,
 | 
						|
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | 
						|
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | 
						|
 * GNU General Public License for more details.
 | 
						|
 *
 | 
						|
 * You should have received a copy of the GNU General Public License
 | 
						|
 * along with this program; if not, write to the Free Software
 | 
						|
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 | 
						|
 *
 | 
						|
 */
 | 
						|
 | 
						|
/* openmp.c: thread spawning via OpenMP  */
 | 
						|
 | 
						|
#include "threads/threads.h"
 | 
						|
 | 
						|
#if !defined(_OPENMP)
 | 
						|
#error OpenMP enabled but not using an OpenMP compiler
 | 
						|
#endif
 | 
						|
 | 
						|
int X(ithreads_init)(void)
 | 
						|
{
 | 
						|
     return 0; /* no error */
 | 
						|
}
 | 
						|
 | 
						|
/* Distribute a loop from 0 to loopmax-1 over nthreads threads.
 | 
						|
   proc(d) is called to execute a block of iterations from d->min
 | 
						|
   to d->max-1.  d->thr_num indicate the number of the thread
 | 
						|
   that is executing proc (from 0 to nthreads-1), and d->data is
 | 
						|
   the same as the data parameter passed to X(spawn_loop).
 | 
						|
 | 
						|
   This function returns only after all the threads have completed. */
 | 
						|
void X(spawn_loop)(int loopmax, int nthr, spawn_function proc, void *data)
 | 
						|
{
 | 
						|
     int block_size;
 | 
						|
     spawn_data d;
 | 
						|
     int i;
 | 
						|
 | 
						|
     A(loopmax >= 0);
 | 
						|
     A(nthr > 0);
 | 
						|
     A(proc);
 | 
						|
 | 
						|
     if (!loopmax) return;
 | 
						|
 | 
						|
     /* Choose the block size and number of threads in order to (1)
 | 
						|
        minimize the critical path and (2) use the fewest threads that
 | 
						|
        achieve the same critical path (to minimize overhead).
 | 
						|
        e.g. if loopmax is 5 and nthr is 4, we should use only 3
 | 
						|
        threads with block sizes of 2, 2, and 1. */
 | 
						|
     block_size = (loopmax + nthr - 1) / nthr;
 | 
						|
     nthr = (loopmax + block_size - 1) / block_size;
 | 
						|
 | 
						|
     if (X(spawnloop_callback)) { /* user-defined spawnloop backend */
 | 
						|
          spawn_data *sdata;
 | 
						|
          STACK_MALLOC(spawn_data *, sdata, sizeof(spawn_data) * nthr);
 | 
						|
          for (i = 0; i < nthr; ++i) {
 | 
						|
               spawn_data *d = &sdata[i];
 | 
						|
               d->max = (d->min = i * block_size) + block_size;
 | 
						|
               if (d->max > loopmax)
 | 
						|
                    d->max = loopmax;
 | 
						|
               d->thr_num = i;
 | 
						|
               d->data = data;
 | 
						|
          }
 | 
						|
          X(spawnloop_callback)(proc, sdata, sizeof(spawn_data), nthr, X(spawnloop_callback_data));
 | 
						|
          STACK_FREE(sdata);
 | 
						|
          return;
 | 
						|
     }
 | 
						|
 | 
						|
#pragma omp parallel for private(d)
 | 
						|
     for (i = 0; i < nthr; ++i) {
 | 
						|
	  d.max = (d.min = i * block_size) + block_size;
 | 
						|
	  if (d.max > loopmax)
 | 
						|
	       d.max = loopmax;
 | 
						|
	  d.thr_num = i;
 | 
						|
	  d.data = data;
 | 
						|
	  proc(&d);
 | 
						|
     }
 | 
						|
}
 | 
						|
 | 
						|
void X(threads_cleanup)(void)
 | 
						|
{
 | 
						|
}
 | 
						|
 | 
						|
/* FIXME [Matteo Frigo 2015-05-25] What does "thread-safe"
 | 
						|
   mean for openmp? */
 | 
						|
void X(threads_register_planner_hooks)(void)
 | 
						|
{
 | 
						|
}
 |