mirror of
https://github.com/tildearrow/furnace.git
synced 2024-11-18 02:25:11 +00:00
361 lines
9.5 KiB
C
361 lines
9.5 KiB
C
|
/* Re-use libbench2 and the test program, but override bench_main so that
|
||
|
we can have different command-line syntax. */
|
||
|
#include "libbench2/my-getopt.h"
|
||
|
#include "libbench2/bench.h"
|
||
|
|
||
|
#include <stdio.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <ctype.h>
|
||
|
#include "api/fftw3.h"
|
||
|
#include <string.h>
|
||
|
#include <time.h>
|
||
|
|
||
|
/* Multi-threaded planning is available when FFTW was configured with
   either threads or OpenMP.  threads_ok is defined outside this file;
   bench_main clears it and only sets it when the user passes -T. */
#if defined(HAVE_THREADS) || defined(HAVE_OPENMP)
#  define HAVE_SMP
   extern int threads_ok;
#endif

/* FFTW(name) pastes the precision-specific API prefix onto `name`,
   e.g. FFTW(import_system_wisdom) -> fftw_import_system_wisdom in the
   default (no BENCHFFT_* macro defined) configuration. */
#define CONCAT(prefix, name) prefix ## name

#if defined(BENCHFFT_SINGLE)
#  define FFTW(x) CONCAT(fftwf_, x)
#elif defined(BENCHFFT_LDOUBLE)
#  define FFTW(x) CONCAT(fftwl_, x)
#elif defined(BENCHFFT_QUAD)
#  define FFTW(x) CONCAT(fftwq_, x)
#else
#  define FFTW(x) CONCAT(fftw_, x)
#endif
|
||
|
|
||
|
/* from bench.c: */
|
||
|
extern unsigned the_flags;
|
||
|
extern int usewisdom;
|
||
|
extern int nthreads;
|
||
|
|
||
|
/* No-op stand-ins for the routines of the same name in hook.c. */
void install_hook(void)
{
}

void uninstall_hook(void)
{
}

/* Nonzero enables progress messages; bench_main sets it for -v. */
int verbose;
|
||
|
|
||
|
/* Run one problem through the benchmark helpers problem_alloc(), setup()
   and done() (all defined outside this file), announcing the problem
   string first when verbose output is enabled. */
static void do_problem(bench_problem *p)
{
    if (verbose) {
        printf("Planning transform: %s\n", p->pstring);
    }

    /* BENCH_ASSERT(can_do(p)); */
    problem_alloc(p);
    setup(p);
    done(p);
}
|
||
|
|
||
|
static void add_problem(const char *pstring,
|
||
|
bench_problem ***p, int *ip, int *np)
|
||
|
{
|
||
|
if (*ip >= *np) {
|
||
|
*np = *np * 2 + 1;
|
||
|
*p = (bench_problem **) realloc(*p, sizeof(bench_problem *) * *np);
|
||
|
}
|
||
|
(*p)[(*ip)++] = problem_parse(pstring);
|
||
|
}
|
||
|
|
||
|
static int sz(const bench_problem *p)
|
||
|
{
|
||
|
return tensor_sz(p->sz) * tensor_sz(p->vecsz);
|
||
|
}
|
||
|
|
||
|
static int prob_size_cmp(const void *p1_, const void *p2_)
|
||
|
{
|
||
|
const bench_problem * const *p1 = (const bench_problem * const *) p1_;
|
||
|
const bench_problem * const *p2 = (const bench_problem * const *) p2_;
|
||
|
return (sz(*p1) - sz(*p2));
|
||
|
}
|
||
|
|
||
|
static struct my_option options[] =
|
||
|
{
|
||
|
{"help", NOARG, 'h'},
|
||
|
{"version", NOARG, 'V'},
|
||
|
{"verbose", NOARG, 'v'},
|
||
|
|
||
|
{"canonical", NOARG, 'c'},
|
||
|
{"time-limit", REQARG, 't'},
|
||
|
|
||
|
{"output-file", REQARG, 'o'},
|
||
|
|
||
|
{"impatient", NOARG, 'i'},
|
||
|
{"measure", NOARG, 'm'},
|
||
|
{"estimate", NOARG, 'e'},
|
||
|
{"exhaustive", NOARG, 'x'},
|
||
|
|
||
|
{"no-system-wisdom", NOARG, 'n'},
|
||
|
{"wisdom-file", REQARG, 'w'},
|
||
|
|
||
|
#ifdef HAVE_SMP
|
||
|
{"threads", REQARG, 'T'},
|
||
|
#endif
|
||
|
|
||
|
/* options to restrict configuration to rdft-only, etcetera? */
|
||
|
|
||
|
{0, NOARG, 0}
|
||
|
};
|
||
|
|
||
|
static void help(FILE *f, const char *program_name)
|
||
|
{
|
||
|
fprintf(
|
||
|
f,
|
||
|
"Usage: %s [options] [sizes]\n"
|
||
|
" Create wisdom (pre-planned/optimized transforms) for specified sizes,\n"
|
||
|
" writing wisdom to stdout (or to a file, using -o).\n"
|
||
|
"\nOptions:\n"
|
||
|
" -h, --help: print this help\n"
|
||
|
" -V, --version: print version/copyright info\n"
|
||
|
" -v, --verbose: verbose output\n"
|
||
|
" -c, --canonical: plan/optimize canonical set of sizes\n"
|
||
|
" -t <h>, --time-limit=<h>: time limit in hours (default: 0, no limit)\n"
|
||
|
" -o FILE, --output-file=FILE: output to FILE instead of stdout\n"
|
||
|
" -m, --measure: plan in MEASURE mode (PATIENT is default)\n"
|
||
|
" -e, --estimate: plan in ESTIMATE mode (not recommended)\n"
|
||
|
" -x, --exhaustive: plan in EXHAUSTIVE mode (may be slow)\n"
|
||
|
" -n, --no-system-wisdom: don't read /etc/fftw/ system wisdom file\n"
|
||
|
" -w FILE, --wisdom-file=FILE: read wisdom from FILE (stdin if -)\n"
|
||
|
#ifdef HAVE_SMP
|
||
|
" -T N, --threads=N: plan with N threads\n"
|
||
|
#endif
|
||
|
"\nSize syntax: <type><inplace><direction><geometry>\n"
|
||
|
" <type> = c/r/k for complex/real(r2c,c2r)/r2r\n"
|
||
|
" <inplace> = i/o for in/out-of place\n"
|
||
|
" <direction> = f/b for forward/backward, omitted for k transforms\n"
|
||
|
" <geometry> = <n1>[x<n2>[x...]], e.g. 10x12x14\n"
|
||
|
" -- for k transforms, after each dimension is a <kind>:\n"
|
||
|
" <kind> = f/b/h/e00/e01/e10/e11/o00/o01/o10/o11\n"
|
||
|
" for R2HC/HC2R/DHT/REDFT00/.../RODFT11\n"
|
||
|
, program_name);
|
||
|
}
|
||
|
|
||
|
/* Geometries planned by the -c (canonical) option: powers of two and ten
   up to 2^20, for now, in one, two and three dimensions. */
static char canonical_sizes[][32] = {
    /* 1d, powers of two */
    "1", "2", "4", "8",
    "16", "32", "64", "128",
    "256", "512", "1024", "2048",
    "4096", "8192", "16384", "32768",
    "65536", "131072", "262144", "524288",
    "1048576",

    /* 1d, powers of ten */
    "10", "100", "1000", "10000", "100000", "1000000",

    /* 2d */
    "2x2", "4x4", "8x8", "10x10",
    "16x16", "32x32", "64x64", "100x100",
    "128x128", "256x256", "512x512", "1000x1000",
    "1024x1024",

    /* 3d */
    "2x2x2", "4x4x4", "8x8x8", "10x10x10",
    "16x16x16", "32x32x32", "64x64x64", "100x100x100"
};

/* Number of elements in a true array (not valid for pointers). */
#define NELEM(array)(sizeof(array) / sizeof((array)[0]))
|
||
|
|
||
|
int bench_main(int argc, char *argv[])
|
||
|
{
|
||
|
int c;
|
||
|
unsigned i;
|
||
|
int impatient = 0;
|
||
|
int system_wisdom = 1;
|
||
|
int canonical = 0;
|
||
|
double hours = 0;
|
||
|
FILE *output_file;
|
||
|
char *output_fname = 0;
|
||
|
bench_problem **problems = 0;
|
||
|
int nproblems = 0, iproblem = 0;
|
||
|
time_t begin;
|
||
|
|
||
|
verbose = 0;
|
||
|
usewisdom = 0;
|
||
|
|
||
|
bench_srand(1);
|
||
|
#ifdef HAVE_SMP
|
||
|
/* do not configure FFTW with threads, unless the
|
||
|
user requests -T */
|
||
|
threads_ok = 0;
|
||
|
#endif
|
||
|
|
||
|
while ((c = my_getopt(argc, argv, options)) != -1) {
|
||
|
switch (c) {
|
||
|
case 'h':
|
||
|
help(stdout, argv[0]);
|
||
|
exit(EXIT_SUCCESS);
|
||
|
break;
|
||
|
|
||
|
case 'V':
|
||
|
printf("fftw-wisdom tool for FFTW version " VERSION ".\n");
|
||
|
printf(
|
||
|
"\n"
|
||
|
"Copyright (c) 2003, 2007-14 Matteo Frigo\n"
|
||
|
"Copyright (c) 2003, 2007-14 Massachusetts Institute of Technology\n"
|
||
|
"\n"
|
||
|
"This program is free software; you can redistribute it and/or modify\n"
|
||
|
"it under the terms of the GNU General Public License as published by\n"
|
||
|
"the Free Software Foundation; either version 2 of the License, or\n"
|
||
|
"(at your option) any later version.\n"
|
||
|
"\n"
|
||
|
"This program is distributed in the hope that it will be useful,\n"
|
||
|
"but WITHOUT ANY WARRANTY; without even the implied warranty of\n"
|
||
|
"MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the\n"
|
||
|
"GNU General Public License for more details.\n"
|
||
|
"\n"
|
||
|
"You should have received a copy of the GNU General Public License\n"
|
||
|
"along with this program; if not, write to the Free Software\n"
|
||
|
"Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA\n"
|
||
|
);
|
||
|
exit(EXIT_SUCCESS);
|
||
|
break;
|
||
|
|
||
|
case 'v':
|
||
|
verbose = 1;
|
||
|
break;
|
||
|
|
||
|
case 'c':
|
||
|
canonical = 1;
|
||
|
break;
|
||
|
|
||
|
case 't':
|
||
|
hours = atof(my_optarg);
|
||
|
break;
|
||
|
|
||
|
case 'o':
|
||
|
if (output_fname)
|
||
|
bench_free(output_fname);
|
||
|
|
||
|
if (!strcmp(my_optarg, "-"))
|
||
|
output_fname = 0;
|
||
|
else {
|
||
|
output_fname = (char *) bench_malloc(sizeof(char) *
|
||
|
(strlen(my_optarg) + 1));
|
||
|
strcpy(output_fname, my_optarg);
|
||
|
}
|
||
|
break;
|
||
|
|
||
|
case 'm':
|
||
|
case 'i':
|
||
|
impatient = 1;
|
||
|
break;
|
||
|
|
||
|
case 'e':
|
||
|
the_flags |= FFTW_ESTIMATE;
|
||
|
break;
|
||
|
|
||
|
case 'x':
|
||
|
the_flags |= FFTW_EXHAUSTIVE;
|
||
|
break;
|
||
|
|
||
|
case 'n':
|
||
|
system_wisdom = 0;
|
||
|
break;
|
||
|
|
||
|
case 'w': {
|
||
|
FILE *w = stdin;
|
||
|
if (strcmp(my_optarg, "-") && !(w = fopen(my_optarg, "r"))) {
|
||
|
fprintf(stderr,
|
||
|
"fftw-wisdom: error opening \"%s\": ", my_optarg);
|
||
|
perror("");
|
||
|
exit(EXIT_FAILURE);
|
||
|
}
|
||
|
if (!FFTW(import_wisdom_from_file)(w)) {
|
||
|
fprintf(stderr, "fftw_wisdom: error reading wisdom "
|
||
|
"from \"%s\"\n", my_optarg);
|
||
|
exit(EXIT_FAILURE);
|
||
|
}
|
||
|
if (w != stdin)
|
||
|
fclose(w);
|
||
|
break;
|
||
|
}
|
||
|
|
||
|
#ifdef HAVE_SMP
|
||
|
case 'T':
|
||
|
nthreads = atoi(my_optarg);
|
||
|
if (nthreads < 1) nthreads = 1;
|
||
|
threads_ok = 1;
|
||
|
BENCH_ASSERT(FFTW(init_threads)());
|
||
|
break;
|
||
|
#endif
|
||
|
|
||
|
case '?':
|
||
|
/* `my_getopt' already printed an error message. */
|
||
|
cleanup();
|
||
|
return EXIT_FAILURE;
|
||
|
|
||
|
default:
|
||
|
abort ();
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if (!impatient)
|
||
|
the_flags |= FFTW_PATIENT;
|
||
|
|
||
|
if (system_wisdom)
|
||
|
if (!FFTW(import_system_wisdom)() && verbose)
|
||
|
fprintf(stderr, "fftw-wisdom: system-wisdom import failed\n");
|
||
|
|
||
|
if (canonical) {
|
||
|
for (i = 0; i < NELEM(canonical_sizes); ++i) {
|
||
|
unsigned j;
|
||
|
char types[][8] = {
|
||
|
"cof", "cob", "cif", "cib", "rof", "rob", "rif", "rib"
|
||
|
};
|
||
|
|
||
|
for (j = 0; j < NELEM(types); ++j) {
|
||
|
char ps[64];
|
||
|
if (!strchr(canonical_sizes[i],'x')
|
||
|
|| !strchr(types[j],'o')) {
|
||
|
#ifdef HAVE_SNPRINTF
|
||
|
snprintf(ps, sizeof(ps), "%s%s", types[j], canonical_sizes[i]);
|
||
|
#else
|
||
|
sprintf(ps, "%s%s", types[j], canonical_sizes[i]);
|
||
|
#endif
|
||
|
add_problem(ps, &problems, &iproblem, &nproblems);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
while (my_optind < argc) {
|
||
|
if (!strcmp(argv[my_optind], "-")) {
|
||
|
char s[1025];
|
||
|
while (1 == fscanf(stdin, "%1024s", s))
|
||
|
add_problem(s, &problems, &iproblem, &nproblems);
|
||
|
}
|
||
|
else
|
||
|
add_problem(argv[my_optind], &problems, &iproblem, &nproblems);
|
||
|
++my_optind;
|
||
|
}
|
||
|
|
||
|
nproblems = iproblem;
|
||
|
qsort(problems, nproblems, sizeof(bench_problem *), prob_size_cmp);
|
||
|
|
||
|
if (!output_fname)
|
||
|
output_file = stdout;
|
||
|
else
|
||
|
if (!(output_file = fopen(output_fname, "w"))) {
|
||
|
fprintf(stderr,
|
||
|
"fftw-wisdom: error creating \"%s\"", output_fname);
|
||
|
perror("");
|
||
|
exit(EXIT_FAILURE);
|
||
|
}
|
||
|
|
||
|
begin = time((time_t*)0);
|
||
|
for (iproblem = 0; iproblem < nproblems; ++iproblem) {
|
||
|
if (hours <= 0
|
||
|
|| hours > (time((time_t*)0) - begin) / 3600.0)
|
||
|
do_problem(problems[iproblem]);
|
||
|
problem_destroy(problems[iproblem]);
|
||
|
|
||
|
}
|
||
|
free(problems);
|
||
|
|
||
|
if (verbose && hours > 0
|
||
|
&& hours < (time((time_t*)0) - begin) / 3600.0)
|
||
|
fprintf(stderr, "EXCEEDED TIME LIMIT OF %g HOURS.\n", hours);
|
||
|
|
||
|
FFTW(export_wisdom_to_file)(output_file);
|
||
|
if (output_file != stdout)
|
||
|
fclose(output_file);
|
||
|
if (output_fname)
|
||
|
bench_free(output_fname);
|
||
|
|
||
|
cleanup();
|
||
|
|
||
|
return EXIT_SUCCESS;
|
||
|
}
|