Various AVX fixes (found by inspection).

Emit calls to masked_store, not masked_store_blend, when handling masked stores emitted by the frontend. Fix bug in binary8to16 macro in builtins.m4 Fix bug in 16-wide version of __reduce_add_float Remove blend function implementations for masked_store_blend for AVX; just forward those on to the corresponding real masked store functions.
2011-08-26 12:58:02 -07:00
parent 34301e09f5
commit 4ab982bc16
4 changed files with 30 additions and 200 deletions
--- a/opt.cpp
+++ b/opt.cpp
@@ -1422,7 +1422,8 @@ LowerMaskedStorePass::runOnBasicBlock(llvm::BasicBlock &bb) {
        // __masked_store_blend_* should be the same as __masked_store_*,
        // so this doesn't matter.  On SSE, blending is generally more
        // efficient and is always safe to do on stack-allocated values.(?)
-        bool doBlend = lIsStackVariablePointer(lvalue);
+        bool doBlend = (g->target.isa != Target::AVX &&
+                        lIsStackVariablePointer(lvalue));
        if (g->target.isa == Target::SSE4 || g->target.isa == Target::SSE2)
            doBlend |= !g->opt.disableBlendedMaskedStores;