361 lines
		
	
	
		
			9.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			361 lines
		
	
	
		
			9.5 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /* Re-use libbench2 and the test program, but override bench_main so that
 | |
|    we can have different command-line syntax. */
 | |
| #include "libbench2/my-getopt.h"
 | |
| #include "libbench2/bench.h"
 | |
| 
 | |
| #include <stdio.h>
 | |
| #include <stdlib.h>
 | |
| #include <ctype.h>
 | |
| #include "api/fftw3.h"
 | |
| #include <string.h>
 | |
| #include <time.h>
 | |
| 
 | |
/* HAVE_SMP is defined when either threading configuration macro
   (HAVE_THREADS or HAVE_OPENMP) is defined.  In that case this file also
   uses the external flag threads_ok, which bench_main clears at startup
   and sets when the user passes -T. */
#if defined(HAVE_OPENMP) || defined(HAVE_THREADS)
#  define HAVE_SMP
extern int threads_ok;
#endif
 | |
| 
 | |
/* FFTW(name) expands to the FFTW API identifier for the precision selected
   at compile time: fftwf_name (BENCHFFT_SINGLE), fftwl_name
   (BENCHFFT_LDOUBLE), fftwq_name (BENCHFFT_QUAD), or fftw_name when none
   of those macros is defined. */
#define CONCAT(prefix, name) prefix ## name

#if defined(BENCHFFT_SINGLE)
#  define FFTW(x) CONCAT(fftwf_, x)
#elif defined(BENCHFFT_LDOUBLE)
#  define FFTW(x) CONCAT(fftwl_, x)
#elif defined(BENCHFFT_QUAD)
#  define FFTW(x) CONCAT(fftwq_, x)
#else
#  define FFTW(x) CONCAT(fftw_, x)
#endif
 | |
| 
 | |
/* Globals defined in bench.c that this front end reads or writes. */
extern unsigned the_flags;   /* planner flags; bench_main ORs FFTW_* bits in */
extern int usewisdom;        /* reset to 0 at the start of bench_main */
extern int nthreads;         /* thread count taken from the -T option */
 | |
| 
 | |
/* Empty stand-ins for the routines of the same name in hook.c; this tool
   supplies its own definitions that intentionally do nothing. */
void install_hook(void)
{
}

void uninstall_hook(void)
{
}
 | |
| 
 | |
| int verbose;
 | |
| 
 | |
| static void do_problem(bench_problem *p)
 | |
| {
 | |
|      if (verbose)
 | |
| 	  printf("Planning transform: %s\n", p->pstring);
 | |
|      /* BENCH_ASSERT(can_do(p)); */
 | |
|      problem_alloc(p);
 | |
|      setup(p);
 | |
|      done(p);
 | |
| }
 | |
| 
 | |
| static void add_problem(const char *pstring,
 | |
| 			bench_problem ***p, int *ip, int *np)
 | |
| {
 | |
|      if (*ip >= *np) {
 | |
| 	  *np = *np * 2 + 1;
 | |
| 	  *p = (bench_problem **) realloc(*p, sizeof(bench_problem *) * *np);
 | |
|      }
 | |
|      (*p)[(*ip)++] = problem_parse(pstring);
 | |
| }
 | |
| 
 | |
| static int sz(const bench_problem *p)
 | |
| {
 | |
|      return tensor_sz(p->sz) * tensor_sz(p->vecsz);
 | |
| }
 | |
| 
 | |
| static int prob_size_cmp(const void *p1_, const void *p2_)
 | |
| {
 | |
|      const bench_problem * const *p1 = (const bench_problem * const *) p1_;
 | |
|      const bench_problem * const *p2 = (const bench_problem * const *) p2_;
 | |
|      return (sz(*p1) - sz(*p2));
 | |
| }
 | |
| 
 | |
| static struct my_option options[] =
 | |
| {
 | |
|   {"help", NOARG, 'h'},
 | |
|   {"version", NOARG, 'V'},
 | |
|   {"verbose", NOARG, 'v'},
 | |
| 
 | |
|   {"canonical", NOARG, 'c'},
 | |
|   {"time-limit", REQARG, 't'},
 | |
| 
 | |
|   {"output-file", REQARG, 'o'},
 | |
| 
 | |
|   {"impatient", NOARG, 'i'},
 | |
|   {"measure", NOARG, 'm'},
 | |
|   {"estimate", NOARG, 'e'},
 | |
|   {"exhaustive", NOARG, 'x'},
 | |
| 
 | |
|   {"no-system-wisdom", NOARG, 'n'},
 | |
|   {"wisdom-file", REQARG, 'w'},
 | |
| 
 | |
| #ifdef HAVE_SMP
 | |
|   {"threads", REQARG, 'T'},
 | |
| #endif
 | |
| 
 | |
|   /* options to restrict configuration to rdft-only, etcetera? */
 | |
|   
 | |
|   {0, NOARG, 0}
 | |
| };
 | |
| 
 | |
/*
 * Write the usage summary to f.
 *
 *   f             stream that receives the text
 *   program_name  name substituted into the "Usage:" line
 *
 * The --threads line is only part of the text when HAVE_SMP is defined.
 */
static void help(FILE *f, const char *program_name)
{
     /* Everything after the "Usage:" line is fixed text with no
        conversion specifiers, so it can be written verbatim. */
     static const char details[] =
          "    Create wisdom (pre-planned/optimized transforms) for specified sizes,\n"
          "    writing wisdom to stdout (or to a file, using -o).\n"
          "\nOptions:\n"
          "                   -h, --help: print this help\n"
          "                -V, --version: print version/copyright info\n"
          "                -v, --verbose: verbose output\n"
          "              -c, --canonical: plan/optimize canonical set of sizes\n"
          "     -t <h>, --time-limit=<h>: time limit in hours (default: 0, no limit)\n"
          "  -o FILE, --output-file=FILE: output to FILE instead of stdout\n"
          "                -m, --measure: plan in MEASURE mode (PATIENT is default)\n"
          "               -e, --estimate: plan in ESTIMATE mode (not recommended)\n"
          "             -x, --exhaustive: plan in EXHAUSTIVE mode (may be slow)\n"
          "       -n, --no-system-wisdom: don't read /etc/fftw/ system wisdom file\n"
          "  -w FILE, --wisdom-file=FILE: read wisdom from FILE (stdin if -)\n"
#ifdef HAVE_SMP
          "            -T N, --threads=N: plan with N threads\n"
#endif
          "\nSize syntax: <type><inplace><direction><geometry>\n"
          "      <type> = c/r/k for complex/real(r2c,c2r)/r2r\n"
          "   <inplace> = i/o for in/out-of place\n"
          " <direction> = f/b for forward/backward, omitted for k transforms\n"
          "  <geometry> = <n1>[x<n2>[x...]], e.g. 10x12x14\n"
          "               -- for k transforms, after each dimension is a <kind>:\n"
          "                     <kind> = f/b/h/e00/e01/e10/e11/o00/o01/o10/o11\n"
          "                              for R2HC/HC2R/DHT/REDFT00/.../RODFT11\n";

     fprintf(f, "Usage: %s [options] [sizes]\n", program_name);
     fputs(details, f);
}
 | |
| 
 | |
/* Geometries planned by -c/--canonical: powers of two and ten up to 2^20
   (for now), followed by a selection of square 2-D and cubic 3-D sizes.
   bench_main prefixes each entry with a transform-type string. */
static char canonical_sizes[][32] = {
     /* 1-D, powers of two */
     "1", "2", "4", "8", "16", "32", "64", "128", "256", "512", "1024",
     "2048", "4096", "8192", "16384", "32768", "65536", "131072",
     "262144", "524288", "1048576",

     /* 1-D, powers of ten */
     "10", "100", "1000", "10000", "100000", "1000000",

     /* 2-D */
     "2x2", "4x4", "8x8", "10x10", "16x16", "32x32", "64x64", "100x100",
     "128x128", "256x256", "512x512", "1000x1000", "1024x1024",

     /* 3-D */
     "2x2x2", "4x4x4", "8x8x8", "10x10x10", "16x16x16", "32x32x32",
     "64x64x64", "100x100x100"
};
 | |
| 
 | |
/* Number of elements in a true array (not valid for pointers). */
#define NELEM(arr) (sizeof(arr) / sizeof((arr)[0]))
 | |
| 
 | |
| int bench_main(int argc, char *argv[])
 | |
| {
 | |
|      int c;
 | |
|      unsigned i;
 | |
|      int impatient = 0;
 | |
|      int system_wisdom = 1;
 | |
|      int canonical = 0;
 | |
|      double hours = 0;
 | |
|      FILE *output_file;
 | |
|      char *output_fname = 0;
 | |
|      bench_problem **problems = 0;
 | |
|      int nproblems = 0, iproblem = 0;
 | |
|      time_t begin;
 | |
| 
 | |
|      verbose = 0;
 | |
|      usewisdom = 0;
 | |
| 
 | |
|      bench_srand(1);
 | |
| #ifdef HAVE_SMP
 | |
|      /* do not configure FFTW with threads, unless the
 | |
| 	user requests -T */
 | |
|      threads_ok = 0;
 | |
| #endif
 | |
| 
 | |
|      while ((c = my_getopt(argc, argv, options)) != -1) {
 | |
| 	  switch (c) {
 | |
| 	      case 'h':
 | |
| 		   help(stdout, argv[0]);
 | |
| 		   exit(EXIT_SUCCESS);
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'V':
 | |
| 		   printf("fftw-wisdom tool for FFTW version " VERSION ".\n");
 | |
| 		   printf(
 | |
| "\n"
 | |
| "Copyright (c) 2003, 2007-14 Matteo Frigo\n"
 | |
| "Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology\n"
 | |
| "\n"
 | |
| "This program is free software; you can redistribute it and/or modify\n"
 | |
| "it under the terms of the GNU General Public License as published by\n"
 | |
| "the Free Software Foundation; either version 2 of the License, or\n"
 | |
| "(at your option) any later version.\n"
 | |
| "\n"
 | |
| "This program is distributed in the hope that it will be useful,\n"
 | |
| "but WITHOUT ANY WARRANTY; without even the implied warranty of\n"
 | |
| "MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the\n"
 | |
| "GNU General Public License for more details.\n"
 | |
| "\n"
 | |
| "You should have received a copy of the GNU General Public License\n"
 | |
| "along with this program; if not, write to the Free Software\n"
 | |
| "Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA\n"
 | |
| 			);
 | |
| 		   exit(EXIT_SUCCESS);
 | |
| 		   break;
 | |
| 		   
 | |
| 	      case 'v':
 | |
| 		   verbose = 1;
 | |
| 		   break;
 | |
| 		   
 | |
| 	      case 'c':
 | |
| 		   canonical = 1;
 | |
| 		   break;
 | |
| 
 | |
| 	      case 't':
 | |
| 		   hours = atof(my_optarg);
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'o':
 | |
| 		   if (output_fname)
 | |
| 			bench_free(output_fname);
 | |
| 		   
 | |
| 		   if (!strcmp(my_optarg, "-"))
 | |
| 			output_fname = 0;
 | |
| 		   else {
 | |
| 			output_fname = (char *) bench_malloc(sizeof(char) *
 | |
| 						    (strlen(my_optarg) + 1));
 | |
| 			strcpy(output_fname, my_optarg);
 | |
| 		   }
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'm':
 | |
| 	      case 'i':
 | |
| 		   impatient = 1;
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'e':
 | |
| 		   the_flags |= FFTW_ESTIMATE;
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'x':
 | |
| 		   the_flags |= FFTW_EXHAUSTIVE;
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'n':
 | |
| 		   system_wisdom = 0;
 | |
| 		   break;
 | |
| 
 | |
| 	      case 'w': {
 | |
| 		   FILE *w = stdin;
 | |
| 		   if (strcmp(my_optarg, "-") && !(w = fopen(my_optarg, "r"))) {
 | |
| 			fprintf(stderr,
 | |
| 				"fftw-wisdom: error opening \"%s\": ", my_optarg);
 | |
| 			perror("");
 | |
| 			exit(EXIT_FAILURE);
 | |
| 		   }
 | |
| 		   if (!FFTW(import_wisdom_from_file)(w)) {
 | |
| 			fprintf(stderr, "fftw_wisdom: error reading wisdom "
 | |
| 				"from \"%s\"\n", my_optarg);
 | |
| 			exit(EXIT_FAILURE);
 | |
| 		   }
 | |
| 		   if (w != stdin)
 | |
| 			fclose(w);
 | |
| 		   break;
 | |
| 	      }
 | |
| 
 | |
| #ifdef HAVE_SMP
 | |
| 	      case 'T':
 | |
| 		   nthreads = atoi(my_optarg);
 | |
| 		   if (nthreads < 1) nthreads = 1;
 | |
| 		   threads_ok = 1;
 | |
| 		   BENCH_ASSERT(FFTW(init_threads)());
 | |
| 		   break;
 | |
| #endif
 | |
| 
 | |
| 	      case '?':
 | |
| 		   /* `my_getopt' already printed an error message. */
 | |
| 		   cleanup();
 | |
| 		   return EXIT_FAILURE;
 | |
| 
 | |
| 	      default:
 | |
| 		   abort ();
 | |
| 	  }
 | |
|      }
 | |
| 
 | |
|      if (!impatient)
 | |
| 	  the_flags |= FFTW_PATIENT;
 | |
| 
 | |
|      if (system_wisdom)
 | |
| 	  if (!FFTW(import_system_wisdom)() && verbose)
 | |
| 	       fprintf(stderr, "fftw-wisdom: system-wisdom import failed\n");
 | |
| 
 | |
|      if (canonical) {
 | |
| 	  for (i = 0; i < NELEM(canonical_sizes); ++i) {
 | |
| 	       unsigned j;
 | |
| 	       char types[][8] = { 
 | |
| 		    "cof", "cob", "cif", "cib", "rof", "rob", "rif", "rib"
 | |
| 	       };
 | |
| 	       
 | |
| 	       for (j = 0; j < NELEM(types); ++j) {
 | |
| 		    char ps[64];
 | |
| 		    if (!strchr(canonical_sizes[i],'x')
 | |
| 			|| !strchr(types[j],'o')) {
 | |
| #ifdef HAVE_SNPRINTF
 | |
| 			 snprintf(ps, sizeof(ps), "%s%s", types[j], canonical_sizes[i]);
 | |
| #else
 | |
| 			 sprintf(ps, "%s%s", types[j], canonical_sizes[i]);
 | |
| #endif
 | |
| 			 add_problem(ps, &problems, &iproblem, &nproblems);
 | |
| 		    }
 | |
| 	       }
 | |
| 	  }
 | |
|      }
 | |
| 
 | |
|      while (my_optind < argc) {
 | |
| 	  if (!strcmp(argv[my_optind], "-")) {
 | |
| 	       char s[1025];
 | |
| 	       while (1 == fscanf(stdin, "%1024s", s))
 | |
| 		    add_problem(s, &problems, &iproblem, &nproblems);
 | |
| 	  }
 | |
| 	  else
 | |
| 	       add_problem(argv[my_optind], &problems, &iproblem, &nproblems);
 | |
| 	  ++my_optind;
 | |
|      }
 | |
| 
 | |
|      nproblems = iproblem;
 | |
|      qsort(problems, nproblems, sizeof(bench_problem *), prob_size_cmp);
 | |
| 
 | |
|      if (!output_fname)
 | |
| 	  output_file = stdout;
 | |
|      else
 | |
| 	  if (!(output_file = fopen(output_fname, "w"))) {
 | |
| 	       fprintf(stderr,
 | |
| 		       "fftw-wisdom: error creating \"%s\"", output_fname);
 | |
| 	       perror("");
 | |
| 	       exit(EXIT_FAILURE);
 | |
| 	  }
 | |
| 
 | |
|      begin = time((time_t*)0);
 | |
|      for (iproblem = 0; iproblem < nproblems; ++iproblem) {
 | |
| 	  if (hours <= 0
 | |
| 	      || hours > (time((time_t*)0) - begin) / 3600.0)
 | |
| 	       do_problem(problems[iproblem]);
 | |
| 	  problem_destroy(problems[iproblem]);
 | |
| 	  
 | |
|      }
 | |
|      free(problems);
 | |
|      
 | |
|      if (verbose && hours > 0
 | |
| 	 && hours < (time((time_t*)0) - begin) / 3600.0)
 | |
| 	  fprintf(stderr, "EXCEEDED TIME LIMIT OF %g HOURS.\n", hours);
 | |
| 
 | |
|      FFTW(export_wisdom_to_file)(output_file);
 | |
|      if (output_file != stdout)
 | |
| 	  fclose(output_file);
 | |
|      if (output_fname)
 | |
| 	  bench_free(output_fname);
 | |
| 
 | |
|      cleanup();
 | |
| 
 | |
|      return EXIT_SUCCESS;
 | |
| }
 | 
