257 lines
		
	
	
		
			5.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			257 lines
		
	
	
		
			5.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * Copyright (c) 2003, 2007-14 Matteo Frigo
 | |
|  * Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology
 | |
|  *
 | |
|  * This program is free software; you can redistribute it and/or modify
 | |
|  * it under the terms of the GNU General Public License as published by
 | |
|  * the Free Software Foundation; either version 2 of the License, or
 | |
|  * (at your option) any later version.
 | |
|  *
 | |
|  * This program is distributed in the hope that it will be useful,
 | |
|  * but WITHOUT ANY WARRANTY; without even the implied warranty of
 | |
|  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 | |
|  * GNU General Public License for more details.
 | |
|  *
 | |
|  * You should have received a copy of the GNU General Public License
 | |
|  * along with this program; if not, write to the Free Software
 | |
|  * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA  02110-1301  USA
 | |
|  *
 | |
|  */
 | |
| 
 | |
| 
 | |
| /* Twiddle manipulation */
 | |
| 
 | |
| #include "kernel/ifftw.h"
 | |
| #include <math.h>
 | |
| 
 | |
| #define HASHSZ 109
 | |
| 
 | |
| /* hash table of known twiddle factors */
 | |
| static twid *twlist[HASHSZ];
 | |
| 
 | |
| static INT hash(INT n, INT r)
 | |
| {
 | |
|      INT h = n * 17 + r;
 | |
| 
 | |
|      if (h < 0) h = -h;
 | |
| 
 | |
|      return (h % HASHSZ);
 | |
| }
 | |
| 
 | |
| static int equal_instr(const tw_instr *p, const tw_instr *q)
 | |
| {
 | |
|      if (p == q)
 | |
|           return 1;
 | |
| 
 | |
|      for (;; ++p, ++q) {
 | |
|           if (p->op != q->op)
 | |
| 	       return 0;
 | |
| 
 | |
| 	  switch (p->op) {
 | |
| 	      case TW_NEXT:
 | |
| 		   return (p->v == q->v); /* p->i is ignored */
 | |
| 
 | |
| 	      case TW_FULL:
 | |
| 	      case TW_HALF:
 | |
| 		   if (p->v != q->v) return 0; /* p->i is ignored */
 | |
| 		   break;
 | |
| 
 | |
| 	      default:
 | |
| 		   if (p->v != q->v || p->i != q->i) return 0;
 | |
| 		   break;
 | |
| 	  }
 | |
|      }
 | |
|      A(0 /* can't happen */);
 | |
| }
 | |
| 
 | |
| static int ok_twid(const twid *t, 
 | |
| 		   enum wakefulness wakefulness,
 | |
| 		   const tw_instr *q, INT n, INT r, INT m)
 | |
| {
 | |
|      return (wakefulness == t->wakefulness &&
 | |
| 	     n == t->n &&
 | |
| 	     r == t->r && 
 | |
| 	     m <= t->m && 
 | |
| 	     equal_instr(t->instr, q));
 | |
| }
 | |
| 
 | |
| static twid *lookup(enum wakefulness wakefulness,
 | |
| 		    const tw_instr *q, INT n, INT r, INT m)
 | |
| {
 | |
|      twid *p;
 | |
| 
 | |
|      for (p = twlist[hash(n,r)]; 
 | |
| 	  p && !ok_twid(p, wakefulness, q, n, r, m); 
 | |
| 	  p = p->cdr)
 | |
|           ;
 | |
|      return p;
 | |
| }
 | |
| 
 | |
| static INT twlen0(INT r, const tw_instr *p, INT *vl)
 | |
| {
 | |
|      INT ntwiddle = 0;
 | |
| 
 | |
|      /* compute length of bytecode program */
 | |
|      A(r > 0);
 | |
|      for ( ; p->op != TW_NEXT; ++p) {
 | |
| 	  switch (p->op) {
 | |
| 	      case TW_FULL:
 | |
| 		   ntwiddle += (r - 1) * 2;
 | |
| 		   break;
 | |
| 	      case TW_HALF:
 | |
| 		   ntwiddle += (r - 1);
 | |
| 		   break;
 | |
| 	      case TW_CEXP:
 | |
| 		   ntwiddle += 2;
 | |
| 		   break;
 | |
| 	      case TW_COS:
 | |
| 	      case TW_SIN:
 | |
| 		   ntwiddle += 1;
 | |
| 		   break;
 | |
| 	  }
 | |
|      }
 | |
| 
 | |
|      *vl = (INT)p->v;
 | |
|      return ntwiddle;
 | |
| }
 | |
| 
 | |
| INT X(twiddle_length)(INT r, const tw_instr *p)
 | |
| {
 | |
|      INT vl;
 | |
|      return twlen0(r, p, &vl);
 | |
| }
 | |
| 
 | |
| static R *compute(enum wakefulness wakefulness,
 | |
| 		  const tw_instr *instr, INT n, INT r, INT m)
 | |
| {
 | |
|      INT ntwiddle, j, vl;
 | |
|      R *W, *W0;
 | |
|      const tw_instr *p;
 | |
|      triggen *t = X(mktriggen)(wakefulness, n);
 | |
| 
 | |
|      p = instr;
 | |
|      ntwiddle = twlen0(r, p, &vl);
 | |
| 
 | |
|      A(m % vl == 0);
 | |
| 
 | |
|      W0 = W = (R *)MALLOC((ntwiddle * (m / vl)) * sizeof(R), TWIDDLES);
 | |
| 
 | |
|      for (j = 0; j < m; j += vl) {
 | |
|           for (p = instr; p->op != TW_NEXT; ++p) {
 | |
| 	       switch (p->op) {
 | |
| 		   case TW_FULL: {
 | |
| 			INT i;
 | |
| 			for (i = 1; i < r; ++i) {
 | |
| 			     A((j + (INT)p->v) * i < n);
 | |
| 			     A((j + (INT)p->v) * i > -n);
 | |
| 			     t->cexp(t, (j + (INT)p->v) * i, W);
 | |
| 			     W += 2;
 | |
| 			}
 | |
| 			break;
 | |
| 		   }
 | |
| 
 | |
| 		   case TW_HALF: {
 | |
| 			INT i;
 | |
| 			A((r % 2) == 1);
 | |
| 			for (i = 1; i + i < r; ++i) {
 | |
| 			     t->cexp(t, MULMOD(i, (j + (INT)p->v), n), W);
 | |
| 			     W += 2;
 | |
| 			}
 | |
| 			break;
 | |
| 		   }
 | |
| 
 | |
| 		   case TW_COS: {
 | |
| 			R d[2];
 | |
| 
 | |
| 			A((j + (INT)p->v) * p->i < n);
 | |
| 			A((j + (INT)p->v) * p->i > -n);
 | |
| 			t->cexp(t, (j + (INT)p->v) * (INT)p->i, d);
 | |
| 			*W++ = d[0];
 | |
| 			break;
 | |
| 		   }
 | |
| 
 | |
| 		   case TW_SIN: {
 | |
| 			R d[2];
 | |
| 
 | |
| 			A((j + (INT)p->v) * p->i < n);
 | |
| 			A((j + (INT)p->v) * p->i > -n);
 | |
| 			t->cexp(t, (j + (INT)p->v) * (INT)p->i, d);
 | |
| 			*W++ = d[1];
 | |
| 			break;
 | |
| 		   }
 | |
| 
 | |
| 		   case TW_CEXP:
 | |
| 			A((j + (INT)p->v) * p->i < n);
 | |
| 			A((j + (INT)p->v) * p->i > -n);
 | |
| 			t->cexp(t, (j + (INT)p->v) * (INT)p->i, W);
 | |
| 			W += 2;
 | |
| 			break;
 | |
| 	       }
 | |
| 	  }
 | |
|      }
 | |
| 
 | |
|      X(triggen_destroy)(t);
 | |
|      return W0;
 | |
| }
 | |
| 
 | |
| static void mktwiddle(enum wakefulness wakefulness,
 | |
| 		      twid **pp, const tw_instr *instr, INT n, INT r, INT m)
 | |
| {
 | |
|      twid *p;
 | |
|      INT h;
 | |
| 
 | |
|      if ((p = lookup(wakefulness, instr, n, r, m))) {
 | |
|           ++p->refcnt;
 | |
|      } else {
 | |
| 	  p = (twid *) MALLOC(sizeof(twid), TWIDDLES);
 | |
| 	  p->n = n;
 | |
| 	  p->r = r;
 | |
| 	  p->m = m;
 | |
| 	  p->instr = instr;
 | |
| 	  p->refcnt = 1;
 | |
| 	  p->wakefulness = wakefulness;
 | |
| 	  p->W = compute(wakefulness, instr, n, r, m);
 | |
| 
 | |
| 	  /* cons! onto twlist */
 | |
| 	  h = hash(n, r);
 | |
| 	  p->cdr = twlist[h];
 | |
| 	  twlist[h] = p;
 | |
|      }
 | |
| 
 | |
|      *pp = p;
 | |
| }
 | |
| 
 | |
| static void twiddle_destroy(twid **pp)
 | |
| {
 | |
|      twid *p = *pp;
 | |
|      twid **q;
 | |
| 
 | |
|      if ((--p->refcnt) == 0) {
 | |
| 	  /* remove p from twiddle list */
 | |
| 	  for (q = &twlist[hash(p->n, p->r)]; *q; q = &((*q)->cdr)) {
 | |
| 	       if (*q == p) {
 | |
| 		    *q = p->cdr;
 | |
| 		    X(ifree)(p->W);
 | |
| 		    X(ifree)(p);
 | |
| 		    *pp = 0;
 | |
| 		    return;
 | |
| 	       }
 | |
| 	  }
 | |
| 	  A(0 /* can't happen */ );
 | |
|      }
 | |
| }
 | |
| 
 | |
| 
 | |
| void X(twiddle_awake)(enum wakefulness wakefulness, twid **pp, 
 | |
| 		      const tw_instr *instr, INT n, INT r, INT m)
 | |
| {
 | |
|      switch (wakefulness) {
 | |
| 	 case SLEEPY: 
 | |
| 	      twiddle_destroy(pp);
 | |
| 	      break;
 | |
| 	 default:
 | |
| 	      mktwiddle(wakefulness, pp, instr, n, r, m);
 | |
| 	      break;
 | |
|      }
 | |
| }
 | 
