mirror of
https://github.com/tildearrow/furnace.git
synced 2024-12-04 18:27:25 +00:00
329 lines
7.5 KiB
C
329 lines
7.5 KiB
C
|
/*
|
||
|
* Copyright (c) 2001 Matteo Frigo
|
||
|
* Copyright (c) 2001 Massachusetts Institute of Technology
|
||
|
*
|
||
|
* This program is free software; you can redistribute it and/or modify
|
||
|
* it under the terms of the GNU General Public License as published by
|
||
|
* the Free Software Foundation; either version 2 of the License, or
|
||
|
* (at your option) any later version.
|
||
|
*
|
||
|
* This program is distributed in the hope that it will be useful,
|
||
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
||
|
* GNU General Public License for more details.
|
||
|
*
|
||
|
* You should have received a copy of the GNU General Public License
|
||
|
* along with this program; if not, write to the Free Software
|
||
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
||
|
*
|
||
|
*/
|
||
|
|
||
|
|
||
|
#include "config.h"
|
||
|
#include "libbench2/bench.h"
|
||
|
#include <stdio.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <string.h>
|
||
|
#include <ctype.h>
|
||
|
|
||
|
int always_pad_real = 0; /* by default, only pad in-place case */
|
||
|
|
||
|
typedef enum {
|
||
|
SAME, PADDED, HALFISH
|
||
|
} n_transform;
|
||
|
|
||
|
/* funny transformations for last dimension of PROBLEM_REAL */
|
||
|
static int transform_n(int n, n_transform nt)
|
||
|
{
|
||
|
switch (nt) {
|
||
|
case SAME: return n;
|
||
|
case PADDED: return 2*(n/2+1);
|
||
|
case HALFISH: return (n/2+1);
|
||
|
default: BENCH_ASSERT(0); return 0;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* do what I mean */
|
||
|
static bench_tensor *dwim(bench_tensor *t, bench_iodim **last_iodim,
|
||
|
n_transform nti, n_transform nto,
|
||
|
bench_iodim *dt)
|
||
|
{
|
||
|
int i;
|
||
|
bench_iodim *d, *d1;
|
||
|
|
||
|
if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 1)
|
||
|
return t;
|
||
|
|
||
|
i = t->rnk;
|
||
|
d1 = *last_iodim;
|
||
|
|
||
|
while (--i >= 0) {
|
||
|
d = t->dims + i;
|
||
|
if (!d->is)
|
||
|
d->is = d1->is * transform_n(d1->n, d1==dt ? nti : SAME);
|
||
|
if (!d->os)
|
||
|
d->os = d1->os * transform_n(d1->n, d1==dt ? nto : SAME);
|
||
|
d1 = d;
|
||
|
}
|
||
|
|
||
|
*last_iodim = d1;
|
||
|
return t;
|
||
|
}
|
||
|
|
||
|
static void transpose_tensor(bench_tensor *t)
|
||
|
{
|
||
|
if (!BENCH_FINITE_RNK(t->rnk) || t->rnk < 2)
|
||
|
return;
|
||
|
|
||
|
t->dims[0].os = t->dims[1].os;
|
||
|
t->dims[1].os = t->dims[0].os * t->dims[0].n;
|
||
|
}
|
||
|
|
||
|
static const char *parseint(const char *s, int *n)
|
||
|
{
|
||
|
int sign = 1;
|
||
|
|
||
|
*n = 0;
|
||
|
|
||
|
if (*s == '-') {
|
||
|
sign = -1;
|
||
|
++s;
|
||
|
} else if (*s == '+') {
|
||
|
sign = +1;
|
||
|
++s;
|
||
|
}
|
||
|
|
||
|
BENCH_ASSERT(isdigit(*s));
|
||
|
while (isdigit(*s)) {
|
||
|
*n = *n * 10 + (*s - '0');
|
||
|
++s;
|
||
|
}
|
||
|
|
||
|
*n *= sign;
|
||
|
|
||
|
if (*s == 'k' || *s == 'K') {
|
||
|
*n *= 1024;
|
||
|
++s;
|
||
|
}
|
||
|
|
||
|
if (*s == 'm' || *s == 'M') {
|
||
|
*n *= 1024 * 1024;
|
||
|
++s;
|
||
|
}
|
||
|
|
||
|
return s;
|
||
|
}
|
||
|
|
||
|
struct dimlist { bench_iodim car; r2r_kind_t k; struct dimlist *cdr; };
|
||
|
|
||
|
static const char *parsetensor(const char *s, bench_tensor **tp,
|
||
|
r2r_kind_t **k)
|
||
|
{
|
||
|
struct dimlist *l = 0, *m;
|
||
|
bench_tensor *t;
|
||
|
int rnk = 0;
|
||
|
|
||
|
L1:
|
||
|
m = (struct dimlist *)bench_malloc(sizeof(struct dimlist));
|
||
|
/* nconc onto l */
|
||
|
m->cdr = l; l = m;
|
||
|
++rnk;
|
||
|
|
||
|
s = parseint(s, &m->car.n);
|
||
|
|
||
|
if (*s == ':') {
|
||
|
/* read input stride */
|
||
|
++s;
|
||
|
s = parseint(s, &m->car.is);
|
||
|
if (*s == ':') {
|
||
|
/* read output stride */
|
||
|
++s;
|
||
|
s = parseint(s, &m->car.os);
|
||
|
} else {
|
||
|
/* default */
|
||
|
m->car.os = m->car.is;
|
||
|
}
|
||
|
} else {
|
||
|
m->car.is = 0;
|
||
|
m->car.os = 0;
|
||
|
}
|
||
|
|
||
|
if (*s == 'f' || *s == 'F') {
|
||
|
m->k = R2R_R2HC;
|
||
|
++s;
|
||
|
}
|
||
|
else if (*s == 'b' || *s == 'B') {
|
||
|
m->k = R2R_HC2R;
|
||
|
++s;
|
||
|
}
|
||
|
else if (*s == 'h' || *s == 'H') {
|
||
|
m->k = R2R_DHT;
|
||
|
++s;
|
||
|
}
|
||
|
else if (*s == 'e' || *s == 'E' || *s == 'o' || *s == 'O') {
|
||
|
char c = *(s++);
|
||
|
int ab;
|
||
|
|
||
|
s = parseint(s, &ab);
|
||
|
|
||
|
if (c == 'e' || c == 'E') {
|
||
|
if (ab == 0)
|
||
|
m->k = R2R_REDFT00;
|
||
|
else if (ab == 1)
|
||
|
m->k = R2R_REDFT01;
|
||
|
else if (ab == 10)
|
||
|
m->k = R2R_REDFT10;
|
||
|
else if (ab == 11)
|
||
|
m->k = R2R_REDFT11;
|
||
|
else
|
||
|
BENCH_ASSERT(0);
|
||
|
}
|
||
|
else {
|
||
|
if (ab == 0)
|
||
|
m->k = R2R_RODFT00;
|
||
|
else if (ab == 1)
|
||
|
m->k = R2R_RODFT01;
|
||
|
else if (ab == 10)
|
||
|
m->k = R2R_RODFT10;
|
||
|
else if (ab == 11)
|
||
|
m->k = R2R_RODFT11;
|
||
|
else
|
||
|
BENCH_ASSERT(0);
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
m->k = R2R_R2HC;
|
||
|
|
||
|
if (*s == 'x' || *s == 'X') {
|
||
|
++s;
|
||
|
goto L1;
|
||
|
}
|
||
|
|
||
|
/* now we have a dimlist. Build bench_tensor, etc. */
|
||
|
|
||
|
if (k && rnk > 0) {
|
||
|
int i;
|
||
|
*k = (r2r_kind_t *) bench_malloc(sizeof(r2r_kind_t) * rnk);
|
||
|
for (m = l, i = rnk - 1; i >= 0; --i, m = m->cdr) {
|
||
|
BENCH_ASSERT(m);
|
||
|
(*k)[i] = m->k;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
t = mktensor(rnk);
|
||
|
while (--rnk >= 0) {
|
||
|
bench_iodim *d = t->dims + rnk;
|
||
|
BENCH_ASSERT(l);
|
||
|
m = l; l = m->cdr;
|
||
|
d->n = m->car.n;
|
||
|
d->is = m->car.is;
|
||
|
d->os = m->car.os;
|
||
|
bench_free(m);
|
||
|
}
|
||
|
|
||
|
*tp = t;
|
||
|
return s;
|
||
|
}
|
||
|
|
||
|
/* parse a problem description, return a problem */
|
||
|
bench_problem *problem_parse(const char *s)
|
||
|
{
|
||
|
bench_problem *p;
|
||
|
bench_iodim last_iodim0 = {1,1,1}, *last_iodim = &last_iodim0;
|
||
|
bench_iodim *sz_last_iodim;
|
||
|
bench_tensor *sz;
|
||
|
n_transform nti = SAME, nto = SAME;
|
||
|
int transpose = 0;
|
||
|
|
||
|
p = (bench_problem *) bench_malloc(sizeof(bench_problem));
|
||
|
p->kind = PROBLEM_COMPLEX;
|
||
|
p->k = 0;
|
||
|
p->sign = -1;
|
||
|
p->in = p->out = 0;
|
||
|
p->inphys = p->outphys = 0;
|
||
|
p->iphyssz = p->ophyssz = 0;
|
||
|
p->in_place = 0;
|
||
|
p->destroy_input = 0;
|
||
|
p->split = 0;
|
||
|
p->userinfo = 0;
|
||
|
p->scrambled_in = p->scrambled_out = 0;
|
||
|
p->sz = p->vecsz = 0;
|
||
|
p->ini = p->outi = 0;
|
||
|
p->pstring = (char *) bench_malloc(sizeof(char) * (strlen(s) + 1));
|
||
|
strcpy(p->pstring, s);
|
||
|
|
||
|
L1:
|
||
|
switch (tolower(*s)) {
|
||
|
case 'i': p->in_place = 1; ++s; goto L1;
|
||
|
case 'o': p->in_place = 0; ++s; goto L1;
|
||
|
case 'd': p->destroy_input = 1; ++s; goto L1;
|
||
|
case '/': p->split = 1; ++s; goto L1;
|
||
|
case 'f':
|
||
|
case '-': p->sign = -1; ++s; goto L1;
|
||
|
case 'b':
|
||
|
case '+': p->sign = 1; ++s; goto L1;
|
||
|
case 'r': p->kind = PROBLEM_REAL; ++s; goto L1;
|
||
|
case 'c': p->kind = PROBLEM_COMPLEX; ++s; goto L1;
|
||
|
case 'k': p->kind = PROBLEM_R2R; ++s; goto L1;
|
||
|
case 't': transpose = 1; ++s; goto L1;
|
||
|
|
||
|
/* hack for MPI: */
|
||
|
case '[': p->scrambled_in = 1; ++s; goto L1;
|
||
|
case ']': p->scrambled_out = 1; ++s; goto L1;
|
||
|
|
||
|
default : ;
|
||
|
}
|
||
|
|
||
|
s = parsetensor(s, &sz, p->kind == PROBLEM_R2R ? &p->k : 0);
|
||
|
|
||
|
if (p->kind == PROBLEM_REAL) {
|
||
|
if (p->sign < 0) {
|
||
|
nti = p->in_place || always_pad_real ? PADDED : SAME;
|
||
|
nto = HALFISH;
|
||
|
}
|
||
|
else {
|
||
|
nti = HALFISH;
|
||
|
nto = p->in_place || always_pad_real ? PADDED : SAME;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
sz_last_iodim = sz->dims + sz->rnk - 1;
|
||
|
if (*s == '*') { /* "external" vector */
|
||
|
++s;
|
||
|
p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
|
||
|
s = parsetensor(s, &sz, 0);
|
||
|
p->vecsz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
|
||
|
} else if (*s == 'v' || *s == 'V') { /* "internal" vector */
|
||
|
bench_tensor *vecsz;
|
||
|
++s;
|
||
|
s = parsetensor(s, &vecsz, 0);
|
||
|
p->vecsz = dwim(vecsz, &last_iodim, nti, nto, sz_last_iodim);
|
||
|
p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
|
||
|
} else {
|
||
|
p->sz = dwim(sz, &last_iodim, nti, nto, sz_last_iodim);
|
||
|
p->vecsz = mktensor(0);
|
||
|
}
|
||
|
|
||
|
if (transpose) {
|
||
|
transpose_tensor(p->sz);
|
||
|
transpose_tensor(p->vecsz);
|
||
|
}
|
||
|
|
||
|
if (!p->in_place)
|
||
|
p->out = ((bench_real *) p->in) + (1 << 20); /* whatever */
|
||
|
|
||
|
BENCH_ASSERT(p->sz && p->vecsz);
|
||
|
BENCH_ASSERT(!*s);
|
||
|
return p;
|
||
|
}
|
||
|
|
||
|
void problem_destroy(bench_problem *p)
|
||
|
{
|
||
|
BENCH_ASSERT(p);
|
||
|
problem_free(p);
|
||
|
bench_free0(p->k);
|
||
|
bench_free0(p->pstring);
|
||
|
bench_free(p);
|
||
|
}
|
||
|
|