On a target with a 16-bit mask (for example), we would choose the type of an integer literal "1024" to be an int16. Previously, we used an int32, which is a worse fit and leads to less efficient code than an int16 on a 16-bit mask target. (However, we'd still give an integer literal 1000000 the type int32, even in a 16-bit target.) Updated the tests to still pass with 8 and 16-bit targets, given this change.
521 lines
19 KiB
Python
Executable File
521 lines
19 KiB
Python
Executable File
#!/usr/bin/python
|
|
|
|
# test-running driver for ispc
|
|
|
|
from optparse import OptionParser
|
|
import multiprocessing
|
|
from ctypes import c_int
|
|
import os
|
|
import sys
|
|
import glob
|
|
import re
|
|
import signal
|
|
import random
|
|
import string
|
|
import subprocess
|
|
import shlex
|
|
import platform
|
|
import tempfile
|
|
import os.path
|
|
import time
|
|
|
|
# disable fancy error/warning printing with ANSI colors, so grepping for error
|
|
# messages doesn't get confused
|
|
os.environ["TERM"] = "dumb"
|
|
|
|
# This script is affected by http://bugs.python.org/issue5261 on OSX 10.5 Leopard
|
|
# git history has a workaround for that issue.
|
|
|
|
is_windows = (platform.system() == 'Windows' or
|
|
'CYGWIN_NT' in platform.system())
|
|
|
|
parser = OptionParser()
|
|
parser.add_option("-r", "--random-shuffle", dest="random", help="Randomly order tests",
|
|
default=False, action="store_true")
|
|
parser.add_option("-g", "--generics-include", dest="include_file", help="Filename for header implementing functions for generics",
|
|
default=None)
|
|
parser.add_option("-f", "--ispc-flags", dest="ispc_flags", help="Additional flags for ispc (-g, -O1, ...)",
|
|
default="")
|
|
parser.add_option('-t', '--target', dest='target',
|
|
help='Set compilation target (neon, sse2, sse2-x2, sse4, sse4-x2, sse4-8, avx, avx-x2, generic-4, generic-8, generic-16, generic-32)',
|
|
default="sse4")
|
|
parser.add_option('-a', '--arch', dest='arch',
|
|
help='Set architecture (arm, x86, x86-64)',
|
|
default="x86-64")
|
|
parser.add_option("-c", "--compiler", dest="compiler_exe", help="Compiler binary to use to run tests",
|
|
default=None)
|
|
parser.add_option('-o', '--no-opt', dest='no_opt', help='Disable optimization',
|
|
default=False, action="store_true")
|
|
parser.add_option('-j', '--jobs', dest='num_jobs', help='Maximum number of jobs to run in parallel',
|
|
default="1024", type="int")
|
|
parser.add_option('-v', '--verbose', dest='verbose', help='Enable verbose output',
|
|
default=False, action="store_true")
|
|
parser.add_option('--wrap-exe', dest='wrapexe',
|
|
help='Executable to wrap test runs with (e.g. "valgrind")',
|
|
default="")
|
|
parser.add_option('--time', dest='time', help='Enable time output',
|
|
default=False, action="store_true")
|
|
|
|
(options, args) = parser.parse_args()
|
|
|
|
if options.target == 'neon':
|
|
options.arch = 'arm'
|
|
|
|
# use relative path to not depend on host directory, which may possibly
|
|
# have white spaces and unicode characters.
|
|
if not is_windows:
|
|
ispc_exe = "./ispc"
|
|
else:
|
|
ispc_exe = ".\\Release\\ispc.exe"
|
|
|
|
# checks the required ispc compiler otherwise prints an error message
|
|
if not os.path.exists(ispc_exe):
|
|
sys.stderr.write("Fatal error: missing ispc compiler: %s\n" % ispc_exe)
|
|
sys.exit()
|
|
|
|
ispc_exe += " " + options.ispc_flags
|
|
|
|
if __name__ == '__main__':
|
|
sys.stdout.write("ispc compiler: %s\n" % ispc_exe)
|
|
|
|
is_generic_target = (options.target.find("generic-") != -1 and
|
|
options.target != "generic-1")
|
|
if is_generic_target and options.include_file == None:
|
|
if options.target == "generic-4":
|
|
sys.stderr.write("No generics #include specified; using examples/intrinsics/sse4.h\n")
|
|
options.include_file = "examples/intrinsics/sse4.h"
|
|
elif options.target == "generic-8":
|
|
sys.stderr.write("No generics #include specified and no default available for \"generic-8\" target.\n")
|
|
sys.exit(1)
|
|
elif options.target == "generic-16":
|
|
sys.stderr.write("No generics #include specified; using examples/intrinsics/generic-16.h\n")
|
|
options.include_file = "examples/intrinsics/generic-16.h"
|
|
elif options.target == "generic-32":
|
|
sys.stderr.write("No generics #include specified; using examples/intrinsics/generic-32.h\n")
|
|
options.include_file = "examples/intrinsics/generic-32.h"
|
|
elif options.target == "generic-64":
|
|
sys.stderr.write("No generics #include specified; using examples/intrinsics/generic-64.h\n")
|
|
options.include_file = "examples/intrinsics/generic-64.h"
|
|
|
|
if options.compiler_exe == None:
|
|
if is_windows:
|
|
options.compiler_exe = "cl.exe"
|
|
else:
|
|
options.compiler_exe = "g++"
|
|
|
|
# checks the required compiler otherwise prints an error message
|
|
PATH_dir = string.split(os.getenv("PATH"), os.pathsep)
|
|
compiler_exists = False
|
|
|
|
for counter in PATH_dir:
|
|
if os.path.exists(counter + os.sep + options.compiler_exe):
|
|
compiler_exists = True
|
|
break
|
|
|
|
if not compiler_exists:
|
|
sys.stderr.write("Fatal error: missing the required compiler: %s \n" %
|
|
options.compiler_exe)
|
|
sys.exit()
|
|
|
|
ispc_root = "."
|
|
|
|
# if no specific test files are specified, run all of the tests in tests/,
|
|
# failing_tests/, and tests_errors/
|
|
if len(args) == 0:
|
|
files = glob.glob(ispc_root + os.sep + "tests" + os.sep + "*ispc") + \
|
|
glob.glob(ispc_root + os.sep + "failing_tests" + os.sep + "*ispc") + \
|
|
glob.glob(ispc_root + os.sep + "tests_errors" + os.sep + "*ispc")
|
|
else:
|
|
if is_windows:
|
|
argfiles = [ ]
|
|
for f in args:
|
|
# we have to glob ourselves if this is being run under a DOS
|
|
# shell, as it passes wildcard as is.
|
|
argfiles += glob.glob(f)
|
|
else:
|
|
argfiles = args
|
|
|
|
files = [ ]
|
|
for f in argfiles:
|
|
if os.path.splitext(string.lower(f))[1] != ".ispc":
|
|
sys.stdout.write("Ignoring file %s, which doesn't have an .ispc extension.\n" % f)
|
|
else:
|
|
files += [ f ]
|
|
|
|
# max_test_length is used to issue exact number of whitespace characters when
|
|
# updating status. Otherwise update causes new lines standard 80 char terminal
|
|
# on both Linux and Windows.
|
|
max_test_length = 0
|
|
for f in files:
|
|
max_test_length = max(max_test_length, len(f))
|
|
|
|
# randomly shuffle the tests if asked to do so
|
|
if (options.random):
|
|
random.seed()
|
|
random.shuffle(files)
|
|
|
|
# counter
|
|
total_tests = 0
|
|
|
|
|
|
# utility routine to print an update on the number of tests that have been
|
|
# finished. Should be called with the lock held..
|
|
def update_progress(fn, total_tests_arg, counter, max_test_length_arg):
|
|
counter.value += 1
|
|
progress_str = " Done %d / %d [%s]" % (counter.value, total_tests_arg, fn)
|
|
# spaces to clear out detrius from previous printing...
|
|
spaces_needed = max_test_length_arg - len(fn)
|
|
for x in range(spaces_needed):
|
|
progress_str += ' '
|
|
progress_str += '\r'
|
|
sys.stdout.write(progress_str)
|
|
sys.stdout.flush()
|
|
|
|
def run_command(cmd):
|
|
if options.verbose:
|
|
sys.stdout.write("Running: %s\n" % cmd)
|
|
|
|
# Here's a bit tricky part. To pass a command for execution we should
|
|
# break down the line in to arguments. shlex class is designed exactly
|
|
# for this purpose, but by default it interprets escape sequences.
|
|
# On Windows backslaches are all over the place and they are treates as
|
|
# ESC-sequences, so we have to set manually to not interpret them.
|
|
lexer = shlex.shlex(cmd, posix=True)
|
|
lexer.whitespace_split = True
|
|
lexer.escape = ''
|
|
arg_list = list(lexer)
|
|
|
|
sp = subprocess.Popen(arg_list, stdin=None,
|
|
stdout=subprocess.PIPE,
|
|
stderr=subprocess.PIPE)
|
|
out = sp.communicate()
|
|
output = ""
|
|
output += out[0].decode("utf-8")
|
|
output += out[1].decode("utf-8")
|
|
|
|
return (sp.returncode, output)
|
|
|
|
# run the commands in cmd_list
|
|
def run_cmds(compile_cmds, run_cmd, filename, expect_failure):
|
|
for cmd in compile_cmds:
|
|
(return_code, output) = run_command(cmd)
|
|
compile_failed = (return_code != 0)
|
|
if compile_failed:
|
|
sys.stdout.write("Compilation of test %s failed \n" % filename)
|
|
if output != "":
|
|
sys.stdout.write("%s" % output.encode("utf-8"))
|
|
return (1, 0)
|
|
|
|
(return_code, output) = run_command(run_cmd)
|
|
run_failed = (return_code != 0)
|
|
|
|
surprise = ((expect_failure and not run_failed) or
|
|
(not expect_failure and run_failed))
|
|
if surprise == True:
|
|
sys.stderr.write("Test %s %s (return code %d) \n" % \
|
|
(filename, "unexpectedly passed" if expect_failure else "failed",
|
|
return_code))
|
|
if output != "":
|
|
sys.stdout.write("%s\n" % output.encode("utf-8"))
|
|
if surprise == True:
|
|
return (0, 1)
|
|
else:
|
|
return (0, 0)
|
|
|
|
|
|
def add_prefix(path):
|
|
global is_windows
|
|
if is_windows:
|
|
# On Windows we run tests in tmp dir, so the root is one level up.
|
|
input_prefix = "..\\"
|
|
else:
|
|
input_prefix = ""
|
|
path = input_prefix + path
|
|
path = os.path.normpath(path)
|
|
return path
|
|
|
|
|
|
def check_test(filename):
|
|
prev_arch = False
|
|
prev_os = False
|
|
done_arch = True
|
|
done_os = True
|
|
done = True
|
|
global is_windows
|
|
if is_windows:
|
|
oss = "windows"
|
|
else:
|
|
oss = "linux"
|
|
b = buffer(file(add_prefix(filename)).read());
|
|
for run in re.finditer('// *rule: run on .*', b):
|
|
arch = re.match('.* arch=.*', run.group())
|
|
if arch != None:
|
|
if re.search(' arch='+options.arch+'$', arch.group()) != None:
|
|
prev_arch = True
|
|
if re.search(' arch='+options.arch+' ', arch.group()) != None:
|
|
prev_arch = True
|
|
done_arch = prev_arch
|
|
OS = re.match('.* OS=.*', run.group())
|
|
if OS != None:
|
|
if re.search(' OS='+oss, OS.group()) != None:
|
|
prev_os = True
|
|
done_os = prev_os
|
|
done = done_arch and done_os
|
|
for skip in re.finditer('// *rule: skip on .*', b):
|
|
if re.search(' arch=' + options.arch + '$', skip.group())!=None:
|
|
done = False
|
|
if re.search(' arch=' + options.arch + ' ', skip.group())!=None:
|
|
done = False
|
|
if re.search(' OS=' + oss, skip.group())!=None:
|
|
done = False
|
|
return done
|
|
|
|
|
|
def run_test(testname):
|
|
# testname is a path to the test from the root of ispc dir
|
|
# filename is a path to the test from the current dir
|
|
# ispc_exe_rel is a relative path to ispc
|
|
filename = add_prefix(testname)
|
|
ispc_exe_rel = add_prefix(ispc_exe)
|
|
|
|
# is this a test to make sure an error is issued?
|
|
want_error = (filename.find("tests_errors") != -1)
|
|
if want_error == True:
|
|
ispc_cmd = ispc_exe_rel + " --werror --nowrap %s --arch=%s --target=%s" % \
|
|
(filename, options.arch, options.target)
|
|
(return_code, output) = run_command(ispc_cmd)
|
|
got_error = (return_code != 0)
|
|
|
|
# figure out the error message we're expecting
|
|
file = open(filename, 'r')
|
|
firstline = file.readline()
|
|
firstline = firstline.replace("//", "")
|
|
firstline = firstline.lstrip()
|
|
firstline = firstline.rstrip()
|
|
file.close()
|
|
|
|
if re.search(firstline, output) == None:
|
|
sys.stderr.write("Didn't see expected error message %s from test %s.\nActual output:\n%s\n" % \
|
|
(firstline, testname, output))
|
|
return (1, 0)
|
|
elif got_error == False:
|
|
sys.stderr.write("Unexpectedly no errors issued from test %s\n" % testname)
|
|
return (1, 0)
|
|
else:
|
|
return (0, 0)
|
|
else:
|
|
# do we expect this test to fail?
|
|
should_fail = (testname.find("failing_") != -1)
|
|
|
|
# We need to figure out the signature of the test
|
|
# function that this test has.
|
|
sig2def = { "f_v(" : 0, "f_f(" : 1, "f_fu(" : 2, "f_fi(" : 3,
|
|
"f_du(" : 4, "f_duf(" : 5, "f_di(" : 6 }
|
|
file = open(filename, 'r')
|
|
match = -1
|
|
for line in file:
|
|
# look for lines with 'export'...
|
|
if line.find("export") == -1:
|
|
continue
|
|
# one of them should have a function with one of the
|
|
# declarations in sig2def
|
|
for pattern, ident in list(sig2def.items()):
|
|
if line.find(pattern) != -1:
|
|
match = ident
|
|
break
|
|
file.close()
|
|
if match == -1:
|
|
sys.stderr.write("Fatal error: unable to find function signature " + \
|
|
"in test %s\n" % testname)
|
|
return (1, 0)
|
|
else:
|
|
global is_generic_target
|
|
if is_windows:
|
|
if is_generic_target:
|
|
obj_name = "%s.cpp" % os.path.basename(filename)
|
|
else:
|
|
obj_name = "%s.obj" % os.path.basename(filename)
|
|
exe_name = "%s.exe" % os.path.basename(filename)
|
|
|
|
cc_cmd = "%s /I. /I../winstuff /Zi /nologo /DTEST_SIG=%d %s %s /Fe%s" % \
|
|
(options.compiler_exe, match, add_prefix("test_static.cpp"), obj_name, exe_name)
|
|
if should_fail:
|
|
cc_cmd += " /DEXPECT_FAILURE"
|
|
else:
|
|
if is_generic_target:
|
|
obj_name = "%s.cpp" % testname
|
|
else:
|
|
obj_name = "%s.o" % testname
|
|
exe_name = "%s.run" % testname
|
|
|
|
if options.arch == 'arm':
|
|
gcc_arch = '--with-fpu=hardfp -marm -mfpu=neon -mfloat-abi=hard'
|
|
else:
|
|
if options.arch == 'x86':
|
|
gcc_arch = '-m32'
|
|
else:
|
|
gcc_arch = '-m64'
|
|
|
|
gcc_isa=""
|
|
if options.target == 'generic-4':
|
|
gcc_isa = '-msse4.2'
|
|
if options.target == 'generic-8':
|
|
gcc_isa = '-mavx'
|
|
if (options.target == 'generic-16' or options.target == 'generic-32' or options.target == 'generic-64') \
|
|
and (options.include_file.find("knc.h")!=-1 or options.include_file.find("knc2x.h")!=-1):
|
|
gcc_isa = '-mmic'
|
|
|
|
cc_cmd = "%s -O2 -I. %s %s test_static.cpp -DTEST_SIG=%d %s -o %s" % \
|
|
(options.compiler_exe, gcc_arch, gcc_isa, match, obj_name, exe_name)
|
|
if platform.system() == 'Darwin':
|
|
cc_cmd += ' -Wl,-no_pie'
|
|
if should_fail:
|
|
cc_cmd += " -DEXPECT_FAILURE"
|
|
|
|
ispc_cmd = ispc_exe_rel + " --woff %s -o %s --arch=%s --target=%s" % \
|
|
(filename, obj_name, options.arch, options.target)
|
|
if options.no_opt:
|
|
ispc_cmd += " -O0"
|
|
if is_generic_target:
|
|
ispc_cmd += " --emit-c++ --c++-include-file=%s" % add_prefix(options.include_file)
|
|
|
|
# compile the ispc code, make the executable, and run it...
|
|
(compile_error, run_error) = run_cmds([ispc_cmd, cc_cmd],
|
|
options.wrapexe + " " + exe_name, \
|
|
testname, should_fail)
|
|
|
|
# clean up after running the test
|
|
try:
|
|
if not run_error:
|
|
os.unlink(exe_name)
|
|
if is_windows:
|
|
basename = os.path.basename(filename)
|
|
os.unlink("%s.pdb" % basename)
|
|
os.unlink("%s.ilk" % basename)
|
|
os.unlink(obj_name)
|
|
except:
|
|
None
|
|
|
|
return (compile_error, run_error)
|
|
|
|
# pull tests to run from the given queue and run them. Multiple copies of
|
|
# this function will be running in parallel across all of the CPU cores of
|
|
# the system.
|
|
def run_tasks_from_queue(queue, queue_ret, queue_skip, total_tests_arg, max_test_length_arg, counter, mutex):
|
|
if is_windows:
|
|
tmpdir = "tmp%d" % os.getpid()
|
|
os.mkdir(tmpdir)
|
|
os.chdir(tmpdir)
|
|
else:
|
|
olddir = ""
|
|
|
|
compile_error_files = [ ]
|
|
run_error_files = [ ]
|
|
skip_files = [ ]
|
|
while True:
|
|
filename = queue.get()
|
|
if (filename == 'STOP'):
|
|
queue_ret.put((compile_error_files, run_error_files, skip_files))
|
|
if is_windows:
|
|
try:
|
|
os.remove("test_static.obj")
|
|
# vc*.pdb trick is in anticipaton of new versions of VS.
|
|
vcpdb = glob.glob("vc*.pdb")[0]
|
|
os.remove(vcpdb)
|
|
os.chdir("..")
|
|
# This will fail if there were failing tests or
|
|
# Windows is in bad mood.
|
|
os.rmdir(tmpdir)
|
|
except:
|
|
None
|
|
|
|
sys.exit(0)
|
|
|
|
if check_test(filename):
|
|
(compile_error, run_error) = run_test(filename)
|
|
if compile_error != 0:
|
|
compile_error_files += [ filename ]
|
|
if run_error != 0:
|
|
run_error_files += [ filename ]
|
|
|
|
with mutex:
|
|
update_progress(filename, total_tests_arg, counter, max_test_length_arg)
|
|
else:
|
|
skip_files += [ filename ]
|
|
|
|
|
|
task_threads = []
|
|
|
|
def sigint(signum, frame):
|
|
for t in task_threads:
|
|
t.terminate()
|
|
sys.exit(1)
|
|
|
|
if __name__ == '__main__':
|
|
total_tests = len(files)
|
|
|
|
compile_error_files = [ ]
|
|
run_error_files = [ ]
|
|
skip_files = [ ]
|
|
|
|
nthreads = min(multiprocessing.cpu_count(), options.num_jobs)
|
|
nthreads = min(nthreads, len(files))
|
|
sys.stdout.write("Running %d jobs in parallel. Running %d tests.\n" % (nthreads, total_tests))
|
|
|
|
# put each of the test filenames into a queue
|
|
q = multiprocessing.Queue()
|
|
for fn in files:
|
|
q.put(fn)
|
|
for x in range(nthreads):
|
|
q.put('STOP')
|
|
qret = multiprocessing.Queue()
|
|
qskip = multiprocessing.Queue()
|
|
|
|
# need to catch sigint so that we can terminate all of the tasks if
|
|
# we're interrupted
|
|
signal.signal(signal.SIGINT, sigint)
|
|
|
|
finished_tests_counter = multiprocessing.Value(c_int)
|
|
finished_tests_counter_lock = multiprocessing.Lock()
|
|
|
|
start_time = time.time()
|
|
# launch jobs to run tests
|
|
for x in range(nthreads):
|
|
t = multiprocessing.Process(target=run_tasks_from_queue, args=(q, qret, qskip, total_tests, max_test_length, finished_tests_counter, finished_tests_counter_lock))
|
|
task_threads.append(t)
|
|
t.start()
|
|
|
|
# wait for them to all finish and then return the number that failed
|
|
# (i.e. return 0 if all is ok)
|
|
for t in task_threads:
|
|
t.join()
|
|
sys.stdout.write("\n")
|
|
|
|
elapsed_time = time.time() - start_time
|
|
if options.time:
|
|
sys.stdout.write("Elapsed time: %d s\n" % elapsed_time)
|
|
|
|
while not qret.empty():
|
|
(c, r, s) = qret.get()
|
|
compile_error_files += c
|
|
run_error_files += r
|
|
skip_files += s
|
|
|
|
if len(skip_files) > 0:
|
|
skip_files.sort()
|
|
sys.stdout.write("%d / %d tests SKIPPED:\n" % (len(skip_files), total_tests))
|
|
for f in skip_files:
|
|
sys.stdout.write("\t%s\n" % f)
|
|
if len(compile_error_files) > 0:
|
|
compile_error_files.sort()
|
|
sys.stdout.write("%d / %d tests FAILED compilation:\n" % (len(compile_error_files), total_tests))
|
|
for f in compile_error_files:
|
|
sys.stdout.write("\t%s\n" % f)
|
|
if len(run_error_files) > 0:
|
|
run_error_files.sort()
|
|
sys.stdout.write("%d / %d tests FAILED execution:\n" % (len(run_error_files), total_tests))
|
|
for f in run_error_files:
|
|
sys.stdout.write("\t%s\n" % f)
|
|
|
|
sys.exit(len(compile_error_files) + len(run_error_files))
|