avx1-i32x4 implementation as sse4-i32x4 with avx target-feature flag

2013-11-10 23:48:49 +04:00
parent fbab9874f6
commit ffc9a33933
3 changed files with 58 additions and 13 deletions
--- a/ispc.h
+++ b/ispc.h
@@ -253,6 +253,8 @@ public:

    int getNativeVectorWidth() const {return m_nativeVectorWidth;}

+    int getDataTypeWidth() const {return m_dataTypeWidth;}
+
    int getVectorWidth() const {return m_vectorWidth;}

    bool getGeneratePIC() const {return m_generatePIC;}
@@ -319,10 +321,14 @@ private:
 #endif

    /** Native vector width of the vector instruction set.  Note that this
-        value is directly derived from the ISA Being used (e.g. it's 4 for
+        value is directly derived from the ISA being used (e.g. it's 4 for
        SSE, 8 for AVX, etc.) */
    int m_nativeVectorWidth;

+    /** Data type width in bits. Typically it's 32, but could be 8, 16 or 64.
+        For generic it's -1, which means undefined. */
+    int m_dataTypeWidth;
+
    /** Actual vector width currently being compiled to.  This may be an
        integer multiple of the native vector width, for example if we're
        "doubling up" and compiling 8-wide on a 4-wide SSE system. */