SimdInt16x8OperationX86X64.cpp 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259
  1. //-------------------------------------------------------------------------------------------------------
  2. // Copyright (C) Microsoft Corporation and contributors. All rights reserved.
  3. // Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
  4. //-------------------------------------------------------------------------------------------------------
  5. #include "RuntimeLanguagePch.h"
  6. #if _M_IX86 || _M_AMD64
  7. namespace Js
  8. {
  9. // SIMD.Int16x8 operation wrappers that cover instrinsics for x86/x64 system
  10. SIMDValue SIMDInt16x8Operation::OpInt16x8(int16 values[])
  11. {
  12. X86SIMDValue x86Result;
  13. // Sets the 8 signed 16-bit integer values, note in revised order: starts with x7
  14. x86Result.m128i_value = _mm_set_epi16(values[7], values[6], values[5], values[4], values[3], values[2], values[1], values[0]);
  15. return X86SIMDValue::ToSIMDValue(x86Result);
  16. }
  17. SIMDValue SIMDInt16x8Operation::OpSplat(int16 x)
  18. {
  19. X86SIMDValue x86Result;
  20. // set 8 signed 16-bit integers values to input value x
  21. x86Result.m128i_value = _mm_set1_epi16(x);
  22. return X86SIMDValue::ToSIMDValue(x86Result);
  23. }
  24. // Unary Ops
  25. SIMDValue SIMDInt16x8Operation::OpNeg(const SIMDValue& value)
  26. {
  27. X86SIMDValue x86Result;
  28. X86SIMDValue SIGNMASK, temp;
  29. X86SIMDValue negativeOnes = { { -1, -1, -1, -1} };
  30. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  31. temp.m128i_value = _mm_andnot_si128(v.m128i_value, negativeOnes.m128i_value); // (~value) & (negative ones)
  32. SIGNMASK.m128i_value = _mm_set1_epi16(0x0001); // set SIGNMASK to 1
  33. x86Result.m128i_value = _mm_add_epi16(SIGNMASK.m128i_value, temp.m128i_value);// add 4 integers respectively
  34. return X86SIMDValue::ToSIMDValue(x86Result);
  35. }
  36. SIMDValue SIMDInt16x8Operation::OpNot(const SIMDValue& value)
  37. {
  38. X86SIMDValue x86Result;
  39. X86SIMDValue negativeOnes = { { -1, -1, -1, -1} };
  40. X86SIMDValue temp = X86SIMDValue::ToX86SIMDValue(value);
  41. x86Result.m128i_value = _mm_andnot_si128(temp.m128i_value, negativeOnes.m128i_value);
  42. return X86SIMDValue::ToSIMDValue(x86Result);
  43. }
  44. SIMDValue SIMDInt16x8Operation::OpAdd(const SIMDValue& aValue, const SIMDValue& bValue)
  45. {
  46. X86SIMDValue x86Result;
  47. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  48. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  49. x86Result.m128i_value = _mm_add_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a + b
  50. return X86SIMDValue::ToSIMDValue(x86Result);
  51. }
  52. SIMDValue SIMDInt16x8Operation::OpSub(const SIMDValue& aValue, const SIMDValue& bValue)
  53. {
  54. X86SIMDValue x86Result;
  55. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  56. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  57. x86Result.m128i_value = _mm_sub_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a - b
  58. return X86SIMDValue::ToSIMDValue(x86Result);;
  59. }
  60. SIMDValue SIMDInt16x8Operation::OpMul(const SIMDValue& aValue, const SIMDValue& bValue)
  61. {
  62. SIMDValue result;
  63. X86SIMDValue x86Result;
  64. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  65. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  66. x86Result.m128i_value = _mm_mullo_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value);
  67. result = X86SIMDValue::ToSIMDValue(x86Result);
  68. return result;
  69. }
  70. SIMDValue SIMDInt16x8Operation::OpAnd(const SIMDValue& aValue, const SIMDValue& bValue)
  71. {
  72. X86SIMDValue x86Result;
  73. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  74. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  75. x86Result.m128i_value = _mm_and_si128(tmpaValue.m128i_value, tmpbValue.m128i_value); // a & b
  76. return X86SIMDValue::ToSIMDValue(x86Result);
  77. }
  78. SIMDValue SIMDInt16x8Operation::OpOr(const SIMDValue& aValue, const SIMDValue& bValue)
  79. {
  80. X86SIMDValue x86Result;
  81. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  82. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  83. x86Result.m128i_value = _mm_or_si128(tmpaValue.m128i_value, tmpbValue.m128i_value); // a | b
  84. return X86SIMDValue::ToSIMDValue(x86Result);
  85. }
  86. SIMDValue SIMDInt16x8Operation::OpXor(const SIMDValue& aValue, const SIMDValue& bValue)
  87. {
  88. X86SIMDValue x86Result;
  89. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  90. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  91. x86Result.m128i_value = _mm_xor_si128(tmpaValue.m128i_value, tmpbValue.m128i_value); // a ^ b
  92. return X86SIMDValue::ToSIMDValue(x86Result);
  93. }
  94. SIMDValue SIMDInt16x8Operation::OpAddSaturate(const SIMDValue& aValue, const SIMDValue& bValue)
  95. {
  96. X86SIMDValue x86Result;
  97. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  98. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  99. x86Result.m128i_value = _mm_adds_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a + b saturates
  100. return X86SIMDValue::ToSIMDValue(x86Result);
  101. }
  102. SIMDValue SIMDInt16x8Operation::OpSubSaturate(const SIMDValue& aValue, const SIMDValue& bValue)
  103. {
  104. X86SIMDValue x86Result;
  105. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  106. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  107. x86Result.m128i_value = _mm_subs_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a - b saturates
  108. return X86SIMDValue::ToSIMDValue(x86Result);
  109. }
  110. SIMDValue SIMDInt16x8Operation::OpMin(const SIMDValue& aValue, const SIMDValue& bValue)
  111. {
  112. X86SIMDValue x86Result;
  113. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  114. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  115. x86Result.m128i_value = _mm_min_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // min a b
  116. return X86SIMDValue::ToSIMDValue(x86Result);
  117. }
  118. SIMDValue SIMDInt16x8Operation::OpMax(const SIMDValue& aValue, const SIMDValue& bValue)
  119. {
  120. X86SIMDValue x86Result;
  121. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  122. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  123. x86Result.m128i_value = _mm_max_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // min a b
  124. return X86SIMDValue::ToSIMDValue(x86Result);
  125. }
  126. SIMDValue SIMDInt16x8Operation::OpLessThan(const SIMDValue& aValue, const SIMDValue& bValue)
  127. {
  128. X86SIMDValue x86Result;
  129. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  130. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  131. x86Result.m128i_value = _mm_cmplt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a < b?
  132. return X86SIMDValue::ToSIMDValue(x86Result);
  133. }
  134. SIMDValue SIMDInt16x8Operation::OpLessThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  135. {
  136. X86SIMDValue x86Result, x86Result1, x86Result2;
  137. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  138. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  139. x86Result1.m128i_value = _mm_cmplt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a < b?
  140. x86Result2.m128i_value = _mm_cmpeq_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a == b?
  141. x86Result.m128i_value = _mm_or_si128(x86Result1.m128i_value, x86Result2.m128i_value);
  142. return X86SIMDValue::ToSIMDValue(x86Result);
  143. }
  144. SIMDValue SIMDInt16x8Operation::OpEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  145. {
  146. X86SIMDValue x86Result;
  147. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  148. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  149. x86Result.m128i_value = _mm_cmpeq_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a == b?
  150. return X86SIMDValue::ToSIMDValue(x86Result);
  151. }
  152. SIMDValue SIMDInt16x8Operation::OpNotEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  153. {
  154. X86SIMDValue x86Result, tmpResult;
  155. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  156. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  157. tmpResult.m128i_value = _mm_cmpeq_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a == b?
  158. X86SIMDValue negativeOnes = { { -1, -1, -1, -1} };
  159. x86Result.m128i_value = _mm_andnot_si128(tmpResult.m128i_value, negativeOnes.m128i_value);
  160. return X86SIMDValue::ToSIMDValue(x86Result);
  161. }
  162. SIMDValue SIMDInt16x8Operation::OpGreaterThan(const SIMDValue& aValue, const SIMDValue& bValue)
  163. {
  164. X86SIMDValue x86Result;
  165. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  166. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  167. x86Result.m128i_value = _mm_cmpgt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a > b?
  168. return X86SIMDValue::ToSIMDValue(x86Result);
  169. }
  170. SIMDValue SIMDInt16x8Operation::OpGreaterThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  171. {
  172. X86SIMDValue x86Result, x86Result1, x86Result2;
  173. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  174. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  175. x86Result1.m128i_value = _mm_cmpgt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a > b?
  176. x86Result2.m128i_value = _mm_cmpeq_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a == b?
  177. x86Result.m128i_value = _mm_or_si128(x86Result1.m128i_value, x86Result2.m128i_value);
  178. return X86SIMDValue::ToSIMDValue(x86Result);
  179. }
  180. // ShiftOps
  181. SIMDValue SIMDInt16x8Operation::OpShiftLeftByScalar(const SIMDValue& value, int count)
  182. {
  183. X86SIMDValue x86Result;
  184. X86SIMDValue tmpValue = X86SIMDValue::ToX86SIMDValue(value);
  185. // Shifts the 8 signed 16-bit integers in a left by count bits while shifting in zeros
  186. x86Result.m128i_value = _mm_slli_epi16(tmpValue.m128i_value, count & SIMDUtils::SIMDGetShiftAmountMask(2));
  187. return X86SIMDValue::ToSIMDValue(x86Result);
  188. }
  189. SIMDValue SIMDInt16x8Operation::OpShiftRightByScalar(const SIMDValue& value, int count)
  190. {
  191. X86SIMDValue x86Result;
  192. X86SIMDValue tmpValue = X86SIMDValue::ToX86SIMDValue(value);
  193. // Shifts the 8 signed 16-bit integers right by count bits while shifting in the sign bit
  194. x86Result.m128i_value = _mm_srai_epi16(tmpValue.m128i_value, count & SIMDUtils::SIMDGetShiftAmountMask(2));
  195. return X86SIMDValue::ToSIMDValue(x86Result);
  196. }
  197. }
  198. #endif