Add SSE4 target optimized for computation with 8-bit datatypes.

This change adds a new 'sse4-8' target, where programCount is 16 and
the mask element size is 8 bits (i.e., the most appropriate sizing of
the mask for SIMD computation with 8-bit datatypes).
This commit is contained in:
Matt Pharr
2013-07-23 17:30:32 -07:00
parent 15a3ef370a
commit 53414f12e6
7 changed files with 578 additions and 7 deletions

View File

@@ -868,6 +868,15 @@ DefineStdlib(SymbolTable *symbolTable, llvm::LLVMContext *ctx, llvm::Module *mod
EXPORT_MODULE(builtins_bitcode_sse4_x2_64bit);
}
break;
case 16:
Assert(g->target->getMaskBitCount() == 8);
if (runtime32) {
EXPORT_MODULE(builtins_bitcode_sse4_8_32bit);
}
else {
EXPORT_MODULE(builtins_bitcode_sse4_8_64bit);
}
break;
default:
FATAL("logic error in DefineStdlib");
}