SimdFloat64x2OperationX86X64.cpp 12 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323
  1. //-------------------------------------------------------------------------------------------------------
  2. // Copyright (C) Microsoft Corporation and contributors. All rights reserved.
  3. // Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
  4. //-------------------------------------------------------------------------------------------------------
  5. #include "RuntimeLanguagePch.h"
  6. #if _M_IX86 || _M_AMD64
  7. namespace Js
  8. {
  9. SIMDValue SIMDFloat64x2Operation::OpFloat64x2(double x, double y)
  10. {
  11. X86SIMDValue x86Result;
  12. // Sets the lower double-precision, floating-point value to x
  13. // and sets the upper double-precision, floating-point value to y.
  14. x86Result.m128d_value = _mm_set_pd(y, x);
  15. return X86SIMDValue::ToSIMDValue(x86Result);
  16. }
  17. SIMDValue SIMDFloat64x2Operation::OpSplat(double x)
  18. {
  19. X86SIMDValue x86Result;
  20. // Sets the 2 double-precision, floating-point values to x
  21. x86Result.m128d_value = _mm_set1_pd(x);
  22. return X86SIMDValue::ToSIMDValue(x86Result);
  23. }
  24. // Conversions
  25. SIMDValue SIMDFloat64x2Operation::OpFromFloat32x4(const SIMDValue& value)
  26. {
  27. X86SIMDValue x86Result;
  28. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  29. // Converts the lower 2 single-precision, floating-point values
  30. // to two double-precision, floating-point values
  31. x86Result.m128d_value = _mm_cvtps_pd(v.m128_value);
  32. return X86SIMDValue::ToSIMDValue(x86Result);
  33. }
  34. SIMDValue SIMDFloat64x2Operation::OpFromInt32x4(const SIMDValue& value)
  35. {
  36. X86SIMDValue x86Result;
  37. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  38. // Converts the lower 2 signed 32-bit integer values of
  39. // to double-precision, floating-point values
  40. x86Result.m128d_value = _mm_cvtepi32_pd(v.m128i_value);
  41. return X86SIMDValue::ToSIMDValue(x86Result);
  42. }
  43. // Unary Ops
  44. SIMDValue SIMDFloat64x2Operation::OpAbs(const SIMDValue& value)
  45. {
  46. X86SIMDValue x86Result, SIGNMASK;
  47. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  48. SIGNMASK.m128d_value = _mm_castsi128_pd(_mm_set_epi32(0x7fffffff, 0xffffffff, 0x7fffffff, 0xffffffff));
  49. x86Result.m128d_value = _mm_and_pd(v.m128d_value, SIGNMASK.m128d_value); // v & SIGNMASK
  50. return X86SIMDValue::ToSIMDValue(x86Result);
  51. }
  52. SIMDValue SIMDFloat64x2Operation::OpNeg(const SIMDValue& value)
  53. {
  54. X86SIMDValue x86Result;
  55. X86SIMDValue SIGNMASK;
  56. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  57. SIGNMASK.m128d_value = _mm_castsi128_pd(_mm_set_epi32(0x80000000, 0x0, 0x80000000, 0x0));
  58. x86Result.m128d_value = _mm_xor_pd(v.m128d_value, SIGNMASK.m128d_value); // v ^ mask
  59. return X86SIMDValue::ToSIMDValue(x86Result);
  60. }
  61. SIMDValue SIMDFloat64x2Operation::OpNot(const SIMDValue& value)
  62. {
  63. X86SIMDValue x86Result;
  64. X86SIMDValue negativeOnes = { { -1, -1, -1, -1 } };
  65. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  66. x86Result.m128d_value = _mm_xor_pd(v.m128d_value, negativeOnes.m128d_value); // v ^ -1
  67. return X86SIMDValue::ToSIMDValue(x86Result);
  68. }
  69. SIMDValue SIMDFloat64x2Operation::OpReciprocal(const SIMDValue& value)
  70. {
  71. X86SIMDValue x86Result;
  72. X86SIMDValue doubleOnes;
  73. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  74. doubleOnes.m128d_value = _mm_set_pd(1.0, 1.0);
  75. x86Result.m128d_value = _mm_div_pd(doubleOnes.m128d_value, v.m128d_value); // result = 1.0/value
  76. return X86SIMDValue::ToSIMDValue(x86Result);
  77. }
  78. SIMDValue SIMDFloat64x2Operation::OpReciprocalSqrt(const SIMDValue& value)
  79. {
  80. X86SIMDValue x86Result;
  81. X86SIMDValue doubleOnes, temp;
  82. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  83. doubleOnes.m128d_value = _mm_set_pd(1.0, 1.0);
  84. temp.m128d_value = _mm_div_pd(doubleOnes.m128d_value, v.m128d_value); // temp = 1.0/value
  85. x86Result.m128d_value = _mm_sqrt_pd(temp.m128d_value); // result = sqrt(1.0/value)
  86. return X86SIMDValue::ToSIMDValue(x86Result);
  87. }
  88. SIMDValue SIMDFloat64x2Operation::OpSqrt(const SIMDValue& value)
  89. {
  90. X86SIMDValue x86Result;
  91. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(value);
  92. x86Result.m128d_value = _mm_sqrt_pd(v.m128d_value); // result = sqrt(value)
  93. return X86SIMDValue::ToSIMDValue(x86Result);
  94. }
  95. // Binary Ops
  96. SIMDValue SIMDFloat64x2Operation::OpAdd(const SIMDValue& aValue, const SIMDValue& bValue)
  97. {
  98. X86SIMDValue x86Result;
  99. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  100. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  101. x86Result.m128d_value = _mm_add_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a + b
  102. return X86SIMDValue::ToSIMDValue(x86Result);
  103. }
  104. SIMDValue SIMDFloat64x2Operation::OpSub(const SIMDValue& aValue, const SIMDValue& bValue)
  105. {
  106. X86SIMDValue x86Result;
  107. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  108. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  109. x86Result.m128d_value = _mm_sub_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a - b
  110. return X86SIMDValue::ToSIMDValue(x86Result);
  111. }
  112. SIMDValue SIMDFloat64x2Operation::OpMul(const SIMDValue& aValue, const SIMDValue& bValue)
  113. {
  114. X86SIMDValue x86Result;
  115. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  116. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  117. x86Result.m128d_value = _mm_mul_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a * b
  118. return X86SIMDValue::ToSIMDValue(x86Result);
  119. }
  120. SIMDValue SIMDFloat64x2Operation::OpDiv(const SIMDValue& aValue, const SIMDValue& bValue)
  121. {
  122. X86SIMDValue x86Result;
  123. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  124. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  125. x86Result.m128d_value = _mm_div_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a / b
  126. return X86SIMDValue::ToSIMDValue(x86Result);
  127. }
  128. SIMDValue SIMDFloat64x2Operation::OpAnd(const SIMDValue& aValue, const SIMDValue& bValue)
  129. {
  130. X86SIMDValue x86Result;
  131. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  132. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  133. x86Result.m128d_value = _mm_and_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a & b
  134. return X86SIMDValue::ToSIMDValue(x86Result);
  135. }
  136. SIMDValue SIMDFloat64x2Operation::OpOr(const SIMDValue& aValue, const SIMDValue& bValue)
  137. {
  138. X86SIMDValue x86Result;
  139. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  140. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  141. x86Result.m128d_value = _mm_or_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a | b
  142. return X86SIMDValue::ToSIMDValue(x86Result);
  143. }
  144. SIMDValue SIMDFloat64x2Operation::OpXor(const SIMDValue& aValue, const SIMDValue& bValue)
  145. {
  146. X86SIMDValue x86Result;
  147. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  148. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  149. x86Result.m128d_value = _mm_xor_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a ^ b
  150. return X86SIMDValue::ToSIMDValue(x86Result);
  151. }
  152. SIMDValue SIMDFloat64x2Operation::OpMin(const SIMDValue& aValue, const SIMDValue& bValue)
  153. {
  154. X86SIMDValue x86Result;
  155. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  156. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  157. // choose the smaller value of the two parameters a and b
  158. x86Result.m128d_value = _mm_min_pd(tmpaValue.m128d_value, tmpbValue.m128d_value);
  159. return X86SIMDValue::ToSIMDValue(x86Result);
  160. }
  161. SIMDValue SIMDFloat64x2Operation::OpMax(const SIMDValue& aValue, const SIMDValue& bValue)
  162. {
  163. X86SIMDValue x86Result;
  164. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  165. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  166. // choose the larger value of the two parameters a and b
  167. x86Result.m128d_value = _mm_max_pd(tmpaValue.m128d_value, tmpbValue.m128d_value);
  168. return X86SIMDValue::ToSIMDValue(x86Result);
  169. }
  170. SIMDValue SIMDFloat64x2Operation::OpScale(const SIMDValue& Value, double scaleValue)
  171. {
  172. X86SIMDValue x86Result;
  173. X86SIMDValue v = X86SIMDValue::ToX86SIMDValue(Value);
  174. X86SIMDValue scaleVector;
  175. scaleVector.m128d_value = _mm_set1_pd(scaleValue);
  176. x86Result.m128d_value = _mm_mul_pd(v.m128d_value, scaleVector.m128d_value); // v * scale
  177. return X86SIMDValue::ToSIMDValue(x86Result);
  178. }
  179. SIMDValue SIMDFloat64x2Operation::OpLessThan(const SIMDValue& aValue, const SIMDValue& bValue)
  180. {
  181. X86SIMDValue x86Result;
  182. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  183. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  184. x86Result.m128d_value = _mm_cmplt_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a < b?
  185. return X86SIMDValue::ToSIMDValue(x86Result);
  186. }
  187. SIMDValue SIMDFloat64x2Operation::OpLessThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  188. {
  189. X86SIMDValue x86Result;
  190. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  191. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  192. x86Result.m128d_value = _mm_cmple_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a <= b?
  193. return X86SIMDValue::ToSIMDValue(x86Result);
  194. }
  195. SIMDValue SIMDFloat64x2Operation::OpEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  196. {
  197. X86SIMDValue x86Result;
  198. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  199. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  200. x86Result.m128d_value = _mm_cmpeq_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a == b?
  201. return X86SIMDValue::ToSIMDValue(x86Result);
  202. }
  203. SIMDValue SIMDFloat64x2Operation::OpNotEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  204. {
  205. X86SIMDValue x86Result;
  206. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  207. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  208. x86Result.m128d_value = _mm_cmpneq_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a != b?
  209. return X86SIMDValue::ToSIMDValue(x86Result);
  210. }
  211. SIMDValue SIMDFloat64x2Operation::OpGreaterThan(const SIMDValue& aValue, const SIMDValue& bValue)
  212. {
  213. X86SIMDValue x86Result;
  214. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  215. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  216. x86Result.m128d_value = _mm_cmpgt_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a > b?
  217. return X86SIMDValue::ToSIMDValue(x86Result);
  218. }
  219. SIMDValue SIMDFloat64x2Operation::OpGreaterThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  220. {
  221. X86SIMDValue x86Result;
  222. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  223. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  224. x86Result.m128d_value = _mm_cmpge_pd(tmpaValue.m128d_value, tmpbValue.m128d_value); // a >= b?
  225. return X86SIMDValue::ToSIMDValue(x86Result);
  226. }
  227. SIMDValue SIMDFloat64x2Operation::OpSelect(const SIMDValue& mV, const SIMDValue& tV, const SIMDValue& fV)
  228. {
  229. X86SIMDValue x86Result;
  230. X86SIMDValue maskValue = X86SIMDValue::ToX86SIMDValue(mV);
  231. X86SIMDValue trueValue = X86SIMDValue::ToX86SIMDValue(tV);
  232. X86SIMDValue falseValue = X86SIMDValue::ToX86SIMDValue(fV);
  233. X86SIMDValue tempTrue, tempFalse;
  234. tempTrue.m128d_value = _mm_and_pd(maskValue.m128d_value, trueValue.m128d_value); // mask & True
  235. tempFalse.m128d_value = _mm_andnot_pd(maskValue.m128d_value, falseValue.m128d_value); // !mask & False
  236. x86Result.m128d_value = _mm_or_pd(tempTrue.m128d_value, tempFalse.m128d_value); // tempTrue | tempFalse
  237. return X86SIMDValue::ToSIMDValue(x86Result);
  238. }
  239. }
  240. #endif