Merge pull request #4621 from alexanderkyte/strdup_env
[mono.git] / mcs / class / Mono.Simd / Mono.Simd / Vector8s.cs
index 0f664ab2af0517c9748db27f7b28c10868aa4259..1008c20920b7b478d1f316f0dc69ea86923c1a98 100644 (file)
 // OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
 // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 //
-using System;\r
-using System.Runtime.InteropServices;\r
-\r
-namespace Mono.Simd\r
-{\r
-       [StructLayout(LayoutKind.Sequential, Pack = 0, Size = 16)]
-       public struct Vector8s\r
-       {\r
-               private short v0, v1, v2, v3, v4, v5, v6, v7;\r\r
-               public Vector8s (short v0, short v1, short v2, short v3, short v4, short v5, short v6, short v7)\r
-               {\r
-                       this.v0 = v0;\r
-                       this.v1 = v1;\r
-                       this.v2 = v2;\r
-                       this.v3 = v3;\r
-                       this.v4 = v4;\r
-                       this.v5 = v5;\r
-                       this.v6 = v6;\r
-                       this.v7 = v7;\r
-               }\r
+using System;
+using System.Runtime.InteropServices;
+
+namespace Mono.Simd
+{
+       [Obsolete ("Use the types in the System.Numerics.Vectors namespace")]
+       [StructLayout(LayoutKind.Explicit, Pack = 0, Size = 16)]
+       public struct Vector8s
+       {
+               // Eight 16-bit lanes at consecutive 2-byte offsets (0..14); together they
+               // fill the 16 bytes declared by the StructLayout attribute on the struct.
+               // The indexer and the unsafe operators step a pointer from v0 across
+               // these fields, so the offsets must stay contiguous and in this order.
+               [FieldOffset (0)]  internal short v0;
+               [FieldOffset (2)]  internal short v1;
+               [FieldOffset (4)]  internal short v2;
+               [FieldOffset (6)]  internal short v3;
+               [FieldOffset (8)]  internal short v4;
+               [FieldOffset (10)] internal short v5;
+               [FieldOffset (12)] internal short v6;
+               [FieldOffset (14)] internal short v7;
+
+               /// <summary>
+               /// Builds a vector from eight explicit component values; argument vN is
+               /// stored in component N.
+               /// </summary>
+               public Vector8s (short v0, short v1, short v2, short v3, short v4, short v5, short v6, short v7)
+               {
+                       // Low half (components 0-3).
+                       this.v0 = v0; this.v1 = v1; this.v2 = v2; this.v3 = v3;
+                       // High half (components 4-7).
+                       this.v4 = v4; this.v5 = v5; this.v6 = v6; this.v7 = v7;
+               }
+               
+               /// <summary>
+               /// Builds a vector whose eight components all hold the same value.
+               /// </summary>
+               /// <param name="s">Value copied into every component.</param>
+               public Vector8s (short s)
+               {
+                       // A single chained assignment still assigns every field, which a
+                       // struct constructor is required to do.
+                       v0 = v1 = v2 = v3 = v4 = v5 = v6 = v7 = s;
+               }
 
                public short V0 { get { return v0; } set { v0 = value; } }
                public short V1 { get { return v1; } set { v1 = value; } }
@@ -53,345 +82,309 @@ namespace Mono.Simd
                public short V5 { get { return v5; } set { v5 = value; } }
                public short V6 { get { return v6; } set { v6 = value; } }
                public short V7 { get { return v7; } set { v7 = value; } }
-\r
+
+               /// <summary>A vector with every component set to 1.</summary>
+               public static Vector8s Identity
+               {
+                       get {
+                               Vector8s ones = new Vector8s (1);
+                               return ones;
+                       }
+               }
+
+               /// <summary>A vector with every component set to 0.</summary>
+               public static Vector8s Zero
+               {
+                       get {
+                               Vector8s zeros = new Vector8s (0);
+                               return zeros;
+                       }
+               }
+
+               /// <summary>A vector with every component set to -1.</summary>
+               public static Vector8s MinusOne
+               {
+                       get {
+                               Vector8s minusOnes = new Vector8s (-1);
+                               return minusOnes;
+                       }
+               }
+
+               /// <summary>
+               /// Reads or writes a single component by position.
+               /// </summary>
+               /// <param name="index">Component position, 0 through 7.</param>
+               /// <exception cref="ArgumentOutOfRangeException">
+               /// <paramref name="index"/> is negative or greater than 7.
+               /// </exception>
+               [System.Runtime.CompilerServices.IndexerName ("Component")]
+               public unsafe short this [int index]
+               {
+                       get {
+                               if (index < 0 || index > 7)
+                                       throw new ArgumentOutOfRangeException ("index");
+                               // The fields are laid out back to back, so the address of v0
+                               // can be treated as the start of an eight-element array.
+                               fixed (short *lanes = &v0) {
+                                       return lanes [index];
+                               }
+                       }
+                       set {
+                               if (index < 0 || index > 7)
+                                       throw new ArgumentOutOfRangeException ("index");
+                               fixed (short *lanes = &v0) {
+                                       lanes [index] = value;
+                               }
+                       }
+               }
+
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator + (Vector8s va, Vector8s vb)\r
-               {\r
+               public static unsafe Vector8s operator + (Vector8s va, Vector8s vb)
+               {
                        Vector8s res = new Vector8s ();
                        short *a = &va.v0;
                        short *b = &vb.v0;
                        short *c = &res.v0;
                        for (int i = 0; i < 8; ++i)
                                *c++ = (short)(*a++ + *b++);
-                       return res;\r
-               }\r
+                       return res;
+               }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator - (Vector8s va, Vector8s vb)\r
-               {\r
+               public static unsafe Vector8s operator - (Vector8s va, Vector8s vb)
+               {
                        Vector8s res = new Vector8s ();
                        short *a = &va.v0;
                        short *b = &vb.v0;
                        short *c = &res.v0;
                        for (int i = 0; i < 8; ++i)
                                *c++ = (short)(*a++ - *b++);
-                       return res;\r
+                       return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator * (Vector8s va, Vector8s vb)\r
-               {\r
+               public static unsafe Vector8s operator * (Vector8s va, Vector8s vb)
+               {
                        Vector8s res = new Vector8s ();
                        short *a = &va.v0;
                        short *b = &vb.v0;
                        short *c = &res.v0;
                        for (int i = 0; i < 8; ++i)
                                *c++ = (short)(*a++ * (*b++));
-                       return res;\r
+                       return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator >> (Vector8s va, int amount)\r
-               {\r
+               public static unsafe Vector8s operator >> (Vector8s va, int amount)
+               {
                        Vector8s res = new Vector8s ();
                        short *a = &va.v0;
                        short *b = &res.v0;
                        for (int i = 0; i < 8; ++i)
                                *b++ = (short)(*a++ >> amount);
-                       return res;\r
+                       return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator << (Vector8s va, int amount)\r
-               {\r
+               public static unsafe Vector8s operator << (Vector8s va, int amount)
+               {
                        Vector8s res = new Vector8s ();
                        short *a = &va.v0;
                        short *b = &res.v0;
                        for (int i = 0; i < 8; ++i)
                                *b++ = (short)(*a++ << amount);
-                       return res;\r
-               }
-
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator & (Vector8s va, Vector8s vb)\r
-               {\r
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short)(*a++ & *b++);
-                       return res;\r
-               }
-
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator | (Vector8s va, Vector8s vb)\r
-               {\r
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short)(*a++ | *b++);
-                       return res;\r
-               }
-
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s operator ^ (Vector8s va, Vector8s vb)\r
-               {\r
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short)(*a++ ^ *b++);
-                       return res;\r
-               }
-
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s UnpackLow (Vector8s va, Vector8s vb)
-               {
-                       return new Vector8s (va.v0, vb.v0, va.v1, vb.v1, va.v2, vb.v2, va.v3, vb.v3);
+                       return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s UnpackHigh (Vector8s va, Vector8s vb)
+               public static unsafe Vector8s operator & (Vector8s va, Vector8s vb)
                {
-                       return new Vector8s (va.v4, vb.v4, va.v5, vb.v5, va.v6, vb.v6, va.v7, vb.v7);
-               }
-
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s ShiftRightLogic (Vector8s va, int amount)\r
-               {\r
                        Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *b++ = (short)((ushort)(*a++) >> amount);
-                       return res;\r
+                       uint *a = (uint*) &va.v0;
+                       uint *b = (uint*) &vb.v0;
+                       uint *c = (uint*) &res.v0;
+                       *c++ = *a++ & *b++;
+                       *c++ = *a++ & *b++;
+                       *c++ = *a++ & *b++;
+                       *c = *a & *b;
+                       return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s AddWithSaturation (Vector8s va, Vector8s vb) {
+               public static unsafe Vector8s operator | (Vector8s va, Vector8s vb)
+               {
                        Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short) System.Math.Max (System.Math.Min (*a++ + *b++, short.MaxValue), short.MinValue); 
+                       uint *a = (uint*) &va.v0;
+                       uint *b = (uint*) &vb.v0;
+                       uint *c = (uint*) &res.v0;
+                       *c++ = *a++ | *b++;
+                       *c++ = *a++ | *b++;
+                       *c++ = *a++ | *b++;
+                       *c = *a | *b;
                        return res;
-               }\r
+               }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s SubWithSaturation (Vector8s va, Vector8s vb) {
+               public static unsafe Vector8s operator ^ (Vector8s va, Vector8s vb)
+               {
                        Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short) System.Math.Max (System.Math.Min (*a++ - *b++, short.MaxValue), short.MinValue); ;
+                       uint *a = (uint*) &va.v0;
+                       uint *b = (uint*) &vb.v0;
+                       uint *c = (uint*) &res.v0;
+                       *c++ = *a++ ^ *b++;
+                       *c++ = *a++ ^ *b++;
+                       *c++ = *a++ ^ *b++;
+                       *c = *a ^ *b;
                        return res;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s Max (Vector8s va, Vector8s vb) {
-                       Vector8s res = new Vector8s ();
+               public unsafe static bool operator ==(Vector8s va, Vector8s vb)
+               {
                        short *a = &va.v0;
                        short *b = &vb.v0;
-                       short *c = &res.v0;
                        for (int i = 0; i < 8; ++i)
-                               *c++ = (short) System.Math.Max (*a++, *b++);
-                       return res;
+                               if (*a++ != *b++)
+                                       return false;
+                       return true;
                }
 
                [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s Min (Vector8s va, Vector8s vb) {
-                       Vector8s res = new Vector8s ();
+               public unsafe static bool operator !=(Vector8s va, Vector8s vb)
+               {
                        short *a = &va.v0;
                        short *b = &vb.v0;
-                       short *c = &res.v0;
                        for (int i = 0; i < 8; ++i)
-                               *c++ = (short) System.Math.Min (*a++, *b++);
-                       return res;
+                               if (*a++ != *b++)
+                                       return true;
+                       return false;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe int ExtractByteMask (Vector8s va) {
-                       int res = 0;
-                       byte *a = (byte*)&va;
-                       for (int i = 0; i < 16; ++i)
-                               res |= (*a++ & 0x80) >> 7 << i;
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               public static unsafe explicit operator Vector2d (Vector8s v)
+               {
+                       Vector2d* p = (Vector2d*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s ShuffleHigh (Vector8s va, ShuffleSel sel)\r
+               [Acceleration (AccelMode.SSE1)]
+               public static unsafe explicit operator Vector4f (Vector8s v)
                {
-                       short *ptr = ((short*)&va) + 4;
-                       int idx = (int)sel;\r
-                       return new Vector8s (va.v0, va.v1, va.v2, va.v3, *(ptr + ((idx >> 0) & 0x3)), *(ptr + ((idx >> 2) & 0x3)), *(ptr + ((idx >> 4) & 0x3)), *(ptr + ((idx >> 6) & 0x3)));\r
+                       Vector4f* p = (Vector4f*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s ShuffleLow (Vector8s va, ShuffleSel sel)\r
+               [Acceleration (AccelMode.SSE1)]
+               public static unsafe explicit operator Vector2l (Vector8s v)
                {
-                       short *ptr = ((short*)&va);
-                       int idx = (int)sel;\r
-                       return new Vector8s (*(ptr + ((idx >> 0) & 0x3)), *(ptr + ((idx >> 2) & 0x3)), *(ptr + ((idx >> 4) & 0x3)), *(ptr + ((idx >> 6) & 0x3)), va.v4, va.v5, va.v6, va.v7);\r
+                       Vector2l* p = (Vector2l*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s CompareEqual (Vector8s va, Vector8s vb) {
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short) (*a++ == *b++ ? -1 : 0);
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               [CLSCompliant(false)]
+               public static unsafe explicit operator Vector2ul (Vector8s v)
+               {
+                       Vector2ul* p = (Vector2ul*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s CompareGreaterThan (Vector8s va, Vector8s vb) {
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short) (*a++ > *b++ ? -1 : 0);
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               public static unsafe explicit operator Vector4i (Vector8s v)
+               {
+                       Vector4i* p = (Vector4i*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector8s MultiplyStoreHigh (Vector8s va, Vector8s vb) {
-                       Vector8s res = new Vector8s ();
-                       short *a = &va.v0;
-                       short *b = &vb.v0;
-                       short *c = &res.v0;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (short)((int)*a++ * (int)*b++ >> 16);
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               [CLSCompliant(false)]
+               public static unsafe explicit operator Vector4ui (Vector8s v)
+               {
+                       Vector4ui* p = (Vector4ui*)&v;
+                       return *p;
                }
 
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector16b PackWithUnsignedSaturation (Vector8s va, Vector8s vb) {
-                       Vector16b res = new Vector16b ();
-                       short *a = (short*)&va;
-                       short *b = (short*)&vb;
-                       byte *c = (byte*)&res;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (byte)System.Math.Max (0, System.Math.Min ((int)*a++, byte.MaxValue));
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (byte)System.Math.Max (0, System.Math.Min ((int)*b++, byte.MaxValue));
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               [CLSCompliant(false)]
+               public static unsafe explicit operator Vector8us (Vector8s v)
+               {
+                       Vector8us* p = (Vector8us*)&v;
+                       return *p;
                }
 
-               [CLSCompliant(false)]\r
-               [Acceleration (AccelMode.SSE2)]
-               public static unsafe Vector16sb PackWithSignedSaturation (Vector8s va, Vector8s vb) {
-                       Vector16sb res = new Vector16sb ();
-                       short *a = (short*)&va;
-                       short *b = (short*)&vb;
-                       sbyte *c = (sbyte*)&res;
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (sbyte)System.Math.Max (System.Math.Min ((int)*a++, sbyte.MaxValue), sbyte.MinValue);
-                       for (int i = 0; i < 8; ++i)
-                               *c++ = (sbyte)System.Math.Max (System.Math.Min ((int)*b++, sbyte.MaxValue), sbyte.MinValue);
-                       return res;
+               [Acceleration (AccelMode.SSE1)]
+               [CLSCompliant(false)]
+               public static unsafe explicit operator Vector16sb (Vector8s v)
+               {
+                       Vector16sb* p = (Vector16sb*)&v;
+                       return *p;
                }
 
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe explicit operator Vector2d (Vector8s v)\r
-               {\r
-                       Vector2d* p = (Vector2d*)&v;\r
-                       return *p;\r
+               public static unsafe explicit operator Vector16b (Vector8s v)
+               {
+                       Vector16b* p = (Vector16b*)&v;
+                       return *p;
                }
 
+
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe explicit operator Vector4f (Vector8s v)\r
-               {\r
-                       Vector4f* p = (Vector4f*)&v;\r
-                       return *p;\r
+               public static Vector8s LoadAligned (ref Vector8s v)
+               {
+                       return v;
                }
 
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe explicit operator Vector2l (Vector8s v)\r
-               {\r
-                       Vector2l* p = (Vector2l*)&v;\r
-                       return *p;\r
+               public static void StoreAligned (ref Vector8s res, Vector8s val)
+               {
+                       res = val;
                }
-\r
+
+               [CLSCompliant(false)]
                [Acceleration (AccelMode.SSE1)]
-               [CLSCompliant(false)]\r
-               public static unsafe explicit operator Vector2ul (Vector8s v)\r
-               {\r
-                       Vector2ul* p = (Vector2ul*)&v;\r
-                       return *p;\r
+               public static unsafe Vector8s LoadAligned (Vector8s *v)
+               {
+                       return *v;
                }
 
+               [CLSCompliant(false)]
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe explicit operator Vector4i (Vector8s v)\r
-               {\r
-                       Vector4i* p = (Vector4i*)&v;\r
-                       return *p;\r
+               public static unsafe void StoreAligned (Vector8s *res, Vector8s val)
+               {
+                       *res = val;
                }
-\r
+
                [Acceleration (AccelMode.SSE1)]
-               [CLSCompliant(false)]\r
-               public static unsafe explicit operator Vector4ui (Vector8s v)\r
-               {\r
-                       Vector4ui* p = (Vector4ui*)&v;\r
-                       return *p;\r
+               [CLSCompliant(false)]
+               public static void PrefetchTemporalAllCacheLevels (ref Vector8s res)
+               {
                }
-\r
+
                [Acceleration (AccelMode.SSE1)]
-               [CLSCompliant(false)]\r
-               public static unsafe explicit operator Vector8us (Vector8s v)\r
-               {\r
-                       Vector8us* p = (Vector8us*)&v;\r
-                       return *p;\r
+               [CLSCompliant(false)]
+               public static void PrefetchTemporal1stLevelCache (ref Vector8s res)
+               {
                }
 
                [Acceleration (AccelMode.SSE1)]
-               [CLSCompliant(false)]\r
-               public static unsafe explicit operator Vector16sb (Vector8s v)\r
-               {\r
-                       Vector16sb* p = (Vector16sb*)&v;\r
-                       return *p;\r
+               [CLSCompliant(false)]
+               public static void PrefetchTemporal2ndLevelCache (ref Vector8s res)
+               {
                }
 
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe explicit operator Vector16b (Vector8s v)\r
-               {\r
-                       Vector16b* p = (Vector16b*)&v;\r
-                       return *p;\r
+               [CLSCompliant(false)]
+               public static void PrefetchNonTemporal (ref Vector8s res)
+               {
                }
-\r
 
                [Acceleration (AccelMode.SSE1)]
-               public static Vector8s LoadAligned (ref Vector8s v)\r
-               {\r
-                       return v;\r
-               }\r
-\r
+               [CLSCompliant(false)]
+               public static unsafe void PrefetchTemporalAllCacheLevels (Vector8s *res)
+               {
+               }
+
                [Acceleration (AccelMode.SSE1)]
-               public static void StoreAligned (ref Vector8s res, Vector8s val)\r
-               {\r
-                       res = val;\r
+               [CLSCompliant(false)]
+               public static unsafe void PrefetchTemporal1stLevelCache (Vector8s *res)
+               {
                }
 
-               [CLSCompliant(false)]\r
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe Vector8s LoadAligned (Vector8s *v)\r
-               {\r
-                       return *v;\r
-               }\r
-\r
-               [CLSCompliant(false)]\r
+               [CLSCompliant(false)]
+               public static unsafe void PrefetchTemporal2ndLevelCache (Vector8s *res)
+               {
+               }
+
                [Acceleration (AccelMode.SSE1)]
-               public static unsafe void StoreAligned (Vector8s *res, Vector8s val)\r
-               {\r
-                       *res = val;\r
+               [CLSCompliant(false)]
+               public static unsafe void PrefetchNonTemporal (Vector8s *res)
+               {
+               }
+               
+               /// <summary>
+               /// Formats the vector as "&lt;v0, v1, v2, v3, v4, v5, v6, v7&gt;".
+               /// </summary>
+               public override string ToString()
+               {
+                       // Built in two halves purely for readability; the pieces and their
+                       // order are the same as a single concatenation.
+                       string low = "<" + v0 + ", " + v1 + ", " + v2 + ", " + v3 + ", ";
+                       string high = v4 + ", " + v5 + ", " + v6 + ", " + v7 + ">";
+                       return low + high;
                 }
-       }\r
-}\r
+       }
+}