diff --git a/alloy.py b/alloy.py index 7ae972b4..3f05f4fd 100755 --- a/alloy.py +++ b/alloy.py @@ -200,7 +200,7 @@ def check_targets(): answer = answer + ["sse4-i32x4", "sse4-i32x8", "sse4-i16x8", "sse4-i8x16"] if AVX == False and "avx" in f_lines[i]: AVX = True; - answer = answer + ["avx1-i32x8", "avx1-i32x16"] + answer = answer + ["avx1-i32x8", "avx1-i32x16", "avx1-i64x4"] if AVX11 == False and "rdrand" in f_lines[i]: AVX11 = True; answer = answer + ["avx1.1-i32x8", "avx1.1-i32x16"] @@ -217,7 +217,7 @@ def check_targets(): answer = answer + ["sse4-i32x4", "sse4-i32x8", "sse4-i16x8", "sse4-i8x16"] if "AVX1.0" in f_lines: AVX = True; - answer = answer + ["avx1-i32x8", "avx1-i32x16"] + answer = answer + ["avx1-i32x8", "avx1-i32x16", "avx1-i64x4"] if "RDRAND" in f_lines: AVX11 = True; answer = answer + ["avx1.1-i32x8", "avx1.1-i32x16"] @@ -246,7 +246,7 @@ def check_targets(): if SSE4 == False and "wsm" in f_lines[i]: answer_sde = answer_sde + [["-wsm", "sse4-i32x4"], ["-wsm", "sse4-i32x8"], ["-wsm", "sse4-i16x8"], ["-wsm", "sse4-i8x16"]] if AVX == False and "snb" in f_lines[i]: - answer_sde = answer_sde + [["-snb", "avx1-i32x8"], ["-snb", "avx1-i32x16"]] + answer_sde = answer_sde + [["-snb", "avx1-i32x8"], ["-snb", "avx1-i32x16"], ["-snb", "avx1-i64x4"]] if AVX11 == False and "ivb" in f_lines[i]: answer_sde = answer_sde + [["-ivb", "avx1.1-i32x8"], ["-ivb", "avx1.1-i32x16"]] if AVX2 == False and "hsw" in f_lines[i]: diff --git a/ispc.cpp b/ispc.cpp index bec7baf7..56b0a25f 100644 --- a/ispc.cpp +++ b/ispc.cpp @@ -714,11 +714,11 @@ Target::SupportedTargets() { #endif "sse2-i32x4, sse2-i32x8, " "sse4-i32x4, sse4-i32x8, sse4-i16x8, sse4-i8x16, " - "avx1-i32x8, avx1-i32x16, " + "avx1-i32x8, avx1-i32x16, avx1-i64x4, " "avx1.1-i32x8, avx1.1-i32x16, " "avx2-i32x8, avx2-i32x16, " "generic-x1, generic-x4, generic-x8, generic-x16, " - "generic-x32, generic-x64"; + "generic-x32, generic-x64"; } diff --git a/run_tests.py b/run_tests.py index 64d3462a..4146576c 100755 --- a/run_tests.py +++ b/run_tests.py @@ -449,7 +449,7 @@ def verify(): check = [["g++", "clang", "cl"],["-O0", "-O2"],["x86","x86-64"], ["Linux","Windows","Mac"],["LLVM 3.1","LLVM 3.2","LLVM 3.3","LLVM head"], ["sse2-i32x4", "sse2-i32x8", "sse4-i32x4", "sse4-i32x8", "sse4-i16x8", - "sse4-i8x16", "avx1-i32x8", "avx1-i32x16", "avx1.1-i32x8", "avx1.1-i32x16", + "sse4-i8x16", "avx1-i32x8", "avx1-i32x16", "avx1-i64x4", "avx1.1-i32x8", "avx1.1-i32x16", "avx2-i32x8", "avx2-i32x16", "generic-1", "generic-4", "generic-8", "generic-16", "generic-32", "generic-64"]] for i in range (0,len(f_lines)):