4 // Rodrigo Kumpera (rkumpera@novell.com)
6 // (C) 2008 Novell, Inc. (http://www.novell.com)
8 // Permission is hereby granted, free of charge, to any person obtaining
9 // a copy of this software and associated documentation files (the
10 // "Software"), to deal in the Software without restriction, including
11 // without limitation the rights to use, copy, modify, merge, publish,
12 // distribute, sublicense, and/or sell copies of the Software, and to
13 // permit persons to whom the Software is furnished to do so, subject to
14 // the following conditions:
16 // The above copyright notice and this permission notice shall be
17 // included in all copies or substantial portions of the Software.
19 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
20 // EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
21 // MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
22 // NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
23 // LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
24 // OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
25 // WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
28 using System.Runtime.InteropServices;
32 [StructLayout(LayoutKind.Sequential, Pack = 0, Size = 16)]
34 public struct Vector16sb
36 private sbyte v0, v1, v2, v3, v4, v5, v6, v7, v8, v9, v10, v11, v12, v13, v14, v15;
37 public Vector16sb (sbyte v0, sbyte v1, sbyte v2, sbyte v3, sbyte v4, sbyte v5, sbyte v6, sbyte v7, sbyte v8, sbyte v9, sbyte v10, sbyte v11, sbyte v12, sbyte v13, sbyte v14, sbyte v15)
56 public sbyte V0 { get { return v0; } set { v0 = value; } }
57 public sbyte V1 { get { return v1; } set { v1 = value; } }
58 public sbyte V2 { get { return v2; } set { v2 = value; } }
59 public sbyte V3 { get { return v3; } set { v3 = value; } }
60 public sbyte V4 { get { return v4; } set { v4 = value; } }
61 public sbyte V5 { get { return v5; } set { v5 = value; } }
62 public sbyte V6 { get { return v6; } set { v6 = value; } }
63 public sbyte V7 { get { return v7; } set { v7 = value; } }
64 public sbyte V8 { get { return v8; } set { v8 = value; } }
65 public sbyte V9 { get { return v9; } set { v9 = value; } }
66 public sbyte V10 { get { return v10; } set { v10 = value; } }
67 public sbyte V11 { get { return v11; } set { v11 = value; } }
68 public sbyte V12 { get { return v12; } set { v12 = value; } }
69 public sbyte V13 { get { return v13; } set { v13 = value; } }
70 public sbyte V14 { get { return v14; } set { v14 = value; } }
71 public sbyte V15 { get { return v15; } set { v15 = value; } }
73 [System.Runtime.CompilerServices.IndexerName ("Component")]
74 public unsafe sbyte this [int index]
77 if ((index | 0xF) != 0xF) //index < 0 || index > 15
78 throw new ArgumentOutOfRangeException ("index");
79 fixed (sbyte *v = &v0) {
84 if ( (index | 0xF) != 0xF) //index < 0 || index > 15
85 throw new ArgumentOutOfRangeException ("index");
86 fixed (sbyte *v = &v0) {
92 [Acceleration (AccelMode.SSE2)]
93 public static unsafe Vector16sb operator + (Vector16sb va, Vector16sb vb)
95 Vector16sb res = new Vector16sb ();
99 for (int i = 0; i < 16; ++i)
100 *c++ = (sbyte)(*a++ + *b++);
104 [Acceleration (AccelMode.SSE2)]
105 public static unsafe Vector16sb operator - (Vector16sb va, Vector16sb vb)
107 Vector16sb res = new Vector16sb ();
111 for (int i = 0; i < 16; ++i)
112 *c++ = (sbyte)(*a++ - *b++);
116 [Acceleration (AccelMode.SSE2)]
117 public static unsafe Vector16sb operator & (Vector16sb va, Vector16sb vb)
119 Vector16sb res = new Vector16sb ();
120 uint *a = (uint*) &va.v0;
121 uint *b = (uint*) &vb.v0;
122 uint *c = (uint*) &res.v0;
130 [Acceleration (AccelMode.SSE2)]
131 public static unsafe Vector16sb operator | (Vector16sb va, Vector16sb vb)
133 Vector16sb res = new Vector16sb ();
134 uint *a = (uint*) &va.v0;
135 uint *b = (uint*) &vb.v0;
136 uint *c = (uint*) &res.v0;
144 [Acceleration (AccelMode.SSE2)]
145 public static unsafe Vector16sb operator ^ (Vector16sb va, Vector16sb vb)
147 Vector16sb res = new Vector16sb ();
148 uint *a = (uint*) &va.v0;
149 uint *b = (uint*) &vb.v0;
150 uint *c = (uint*) &res.v0;
158 [Acceleration (AccelMode.SSE2)]
159 public unsafe static bool operator ==(Vector16sb va, Vector16sb vb)
163 for (int i = 0; i < 16; ++i)
169 [Acceleration (AccelMode.SSE2)]
170 public unsafe static bool operator !=(Vector16sb va, Vector16sb vb)
174 for (int i = 0; i < 16; ++i)
180 [Acceleration (AccelMode.SSE2)]
181 public static unsafe Vector16sb UnpackLow (Vector16sb va, Vector16sb vb)
183 return new Vector16sb (va.v0, vb.v0, va.v1, vb.v1, va.v2, vb.v2, va.v3, vb.v3, va.v4, vb.v4, va.v5, vb.v5, va.v6, vb.v6, va.v7, vb.v7);
186 [Acceleration (AccelMode.SSE2)]
187 public static unsafe Vector16sb UnpackHigh (Vector16sb va, Vector16sb vb)
189 return new Vector16sb (va.v8, vb.v8, va.v9, vb.v9, va.v10, vb.v10, va.v11, vb.v11, va.v12, vb.v12, va.v13, vb.v13, va.v14, vb.v14, va.v15, vb.v15);
192 [Acceleration (AccelMode.SSE2)]
193 public static unsafe Vector16sb AddWithSaturation (Vector16sb va, Vector16sb vb) {
194 Vector16sb res = new Vector16sb ();
198 for (int i = 0; i < 16; ++i)
199 *c++ = (sbyte) System.Math.Max (System.Math.Min (*a++ + *b++, sbyte.MaxValue), sbyte.MinValue);
203 [Acceleration (AccelMode.SSE2)]
204 public static unsafe Vector16sb SubtractWithSaturation (Vector16sb va, Vector16sb vb) {
205 Vector16sb res = new Vector16sb ();
209 for (int i = 0; i < 16; ++i)
210 *c++ = (sbyte) System.Math.Max (System.Math.Min (*a++ - *b++, sbyte.MaxValue), sbyte.MinValue);
214 [Acceleration (AccelMode.SSE41)]
215 public static unsafe Vector16sb Max (Vector16sb va, Vector16sb vb) {
216 Vector16sb res = new Vector16sb ();
220 for (int i = 0; i < 16; ++i)
221 *c++ = (sbyte) System.Math.Max (*a++, *b++);
225 [Acceleration (AccelMode.SSE41)]
226 public static unsafe Vector16sb Min (Vector16sb va, Vector16sb vb) {
227 Vector16sb res = new Vector16sb ();
231 for (int i = 0; i < 16; ++i)
232 *c++ = (sbyte) System.Math.Min(*a++, *b++);
236 [Acceleration (AccelMode.SSE2)]
237 public static unsafe int ExtractByteMask (Vector16sb va) {
239 sbyte *a = (sbyte*)&va;
240 for (int i = 0; i < 16; ++i)
241 res |= (*a++ & 0x80) >> 7 << i;
245 [Acceleration (AccelMode.SSE2)]
246 public static unsafe Vector16sb CompareEqual (Vector16sb va, Vector16sb vb) {
247 Vector16sb res = new Vector16sb ();
251 for (int i = 0; i < 16; ++i)
252 *c++ = (sbyte) (*a++ == *b++ ? -1 : 0);
256 [Acceleration (AccelMode.SSE2)]
257 public static unsafe Vector16sb CompareGreaterThan (Vector16sb va, Vector16sb vb) {
258 Vector16sb res = new Vector16sb ();
262 for (int i = 0; i < 16; ++i)
263 *c++ = (sbyte) (*a++ > *b++ ? -1 : 0);
267 [Acceleration (AccelMode.SSE1)]
268 public static unsafe explicit operator Vector2d (Vector16sb v)
270 Vector2d* p = (Vector2d*)&v;
274 [Acceleration (AccelMode.SSE1)]
275 public static unsafe explicit operator Vector4f (Vector16sb v)
277 Vector4f* p = (Vector4f*)&v;
281 [Acceleration (AccelMode.SSE1)]
282 public static unsafe explicit operator Vector2l (Vector16sb v)
284 Vector2l* p = (Vector2l*)&v;
288 [Acceleration (AccelMode.SSE1)]
289 public static unsafe explicit operator Vector2ul (Vector16sb v)
291 Vector2ul* p = (Vector2ul*)&v;
295 [Acceleration (AccelMode.SSE1)]
296 public static unsafe explicit operator Vector4i (Vector16sb v)
298 Vector4i* p = (Vector4i*)&v;
302 [Acceleration (AccelMode.SSE1)]
303 public static unsafe explicit operator Vector4ui (Vector16sb v)
305 Vector4ui* p = (Vector4ui*)&v;
309 [Acceleration (AccelMode.SSE1)]
310 public static unsafe explicit operator Vector8s (Vector16sb v)
312 Vector8s* p = (Vector8s*)&v;
316 [Acceleration (AccelMode.SSE1)]
317 public static unsafe explicit operator Vector8us (Vector16sb v)
319 Vector8us* p = (Vector8us*)&v;
323 [Acceleration (AccelMode.SSE1)]
324 public static unsafe explicit operator Vector16b (Vector16sb v)
326 Vector16b* p = (Vector16b*)&v;
330 [Acceleration (AccelMode.SSE1)]
331 public static Vector16sb LoadAligned (ref Vector16sb v)
336 [Acceleration (AccelMode.SSE1)]
337 public static void StoreAligned (ref Vector16sb res, Vector16sb val)
342 [Acceleration (AccelMode.SSE1)]
343 public static unsafe Vector16sb LoadAligned (Vector16sb *v)
348 [Acceleration (AccelMode.SSE1)]
349 public static unsafe void StoreAligned (Vector16sb *res, Vector16sb val)
354 [Acceleration (AccelMode.SSE1)]
355 [CLSCompliant(false)]
356 public static void PrefetchTemporalAllCacheLevels (ref Vector16sb res)
360 [Acceleration (AccelMode.SSE1)]
361 [CLSCompliant(false)]
362 public static void PrefetchTemporal1stLevelCache (ref Vector16sb res)
366 [Acceleration (AccelMode.SSE1)]
367 [CLSCompliant(false)]
368 public static void PrefetchTemporal2ndLevelCache (ref Vector16sb res)
372 [Acceleration (AccelMode.SSE1)]
373 [CLSCompliant(false)]
374 public static void PrefetchNonTemporal (ref Vector16sb res)
378 [Acceleration (AccelMode.SSE1)]
379 [CLSCompliant(false)]
380 public static unsafe void PrefetchTemporalAllCacheLevels (Vector16sb *res)
384 [Acceleration (AccelMode.SSE1)]
385 [CLSCompliant(false)]
386 public static unsafe void PrefetchTemporal1stLevelCache (Vector16sb *res)
390 [Acceleration (AccelMode.SSE1)]
391 [CLSCompliant(false)]
392 public static unsafe void PrefetchTemporal2ndLevelCache (Vector16sb *res)
396 [Acceleration (AccelMode.SSE1)]
397 [CLSCompliant(false)]
398 public static unsafe void PrefetchNonTemporal (Vector16sb *res)