SimdUint16x8OperationX86X64.cpp 6.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139
  1. //-------------------------------------------------------------------------------------------------------
  2. // Copyright (C) Microsoft Corporation and contributors. All rights reserved.
  3. // Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
  4. //-------------------------------------------------------------------------------------------------------
  5. #include "RuntimeLanguagePch.h"
  6. #if _M_IX86 || _M_AMD64
  7. namespace Js
  8. {
  9. // SIMD.Uint16x8 operation wrappers that cover instrinsics for x86/x64 system
  10. SIMDValue SIMDUint16x8Operation::OpUint16x8(uint16 values[])
  11. {
  12. X86SIMDValue x86Result;
  13. // Sets the 8 signed 16-bit integer values, note in revised order: starts with x7 below
  14. x86Result.m128i_value = _mm_set_epi16((int16)values[7], (int16)values[6], (int16)values[5], (int16)values[4],
  15. (int16)values[3], (int16)values[2], (int16)values[1], (int16)values[0]);
  16. return X86SIMDValue::ToSIMDValue(x86Result);
  17. }
  18. SIMDValue SIMDUint16x8Operation::OpMin(const SIMDValue& aValue, const SIMDValue& bValue)
  19. {
  20. X86SIMDValue x86Result;
  21. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  22. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  23. // _mm_min_epu16 is SSE4.1
  24. //x86Result.m128i_value = _mm_min_epu16(tmpaValue.m128i_value, tmpbValue.m128i_value);
  25. // XOR the sign bits so the comparison comes out correct for unsigned
  26. tmpaValue.m128i_value = _mm_xor_si128(tmpaValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  27. tmpbValue.m128i_value = _mm_xor_si128(tmpbValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  28. x86Result.m128i_value = _mm_min_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value);
  29. x86Result.m128i_value = _mm_xor_si128(x86Result.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  30. return X86SIMDValue::ToSIMDValue(x86Result);
  31. }
  32. SIMDValue SIMDUint16x8Operation::OpMax(const SIMDValue& aValue, const SIMDValue& bValue)
  33. {
  34. X86SIMDValue x86Result;
  35. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  36. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  37. // _mm_max_epu16 is SSE4.1
  38. //x86Result.m128i_value = _mm_max_epu16(tmpaValue.m128i_value, tmpbValue.m128i_value);
  39. // XOR the sign bits so the comparison comes out correct for unsigned
  40. tmpaValue.m128i_value = _mm_xor_si128(tmpaValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  41. tmpbValue.m128i_value = _mm_xor_si128(tmpbValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  42. x86Result.m128i_value = _mm_max_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value);
  43. x86Result.m128i_value = _mm_xor_si128(x86Result.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  44. return X86SIMDValue::ToSIMDValue(x86Result);
  45. }
  46. SIMDValue SIMDUint16x8Operation::OpLessThan(const SIMDValue& aValue, const SIMDValue& bValue)
  47. {
  48. X86SIMDValue x86Result;
  49. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  50. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  51. // Signed comparison of unsigned ints can be done if the ints have the "sign" bit xored with 1
  52. tmpaValue.m128i_value = _mm_xor_si128(tmpaValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  53. tmpbValue.m128i_value = _mm_xor_si128(tmpbValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  54. x86Result.m128i_value = _mm_cmplt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a < b?
  55. return X86SIMDValue::ToSIMDValue(x86Result);
  56. }
  57. SIMDValue SIMDUint16x8Operation::OpLessThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  58. {
  59. X86SIMDValue x86Result;
  60. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  61. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  62. // Signed comparison of unsigned ints can be done if the ints have the "sign" bit xored with 1
  63. tmpaValue.m128i_value = _mm_xor_si128(tmpaValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  64. tmpbValue.m128i_value = _mm_xor_si128(tmpbValue.m128i_value, X86_WORD_SIGNBITS.m128i_value);
  65. x86Result.m128i_value = _mm_cmplt_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a < b?
  66. tmpaValue.m128i_value = _mm_cmpeq_epi16(tmpaValue.m128i_value, tmpbValue.m128i_value); // compare a == b?
  67. x86Result.m128i_value = _mm_or_si128(x86Result.m128i_value, tmpaValue.m128i_value); // result = (a<b)|(a==b)
  68. return X86SIMDValue::ToSIMDValue(x86Result);
  69. }
  70. SIMDValue SIMDUint16x8Operation::OpGreaterThanOrEqual(const SIMDValue& aValue, const SIMDValue& bValue)
  71. {
  72. SIMDValue result;
  73. result = SIMDUint16x8Operation::OpLessThan(aValue, bValue);
  74. result = SIMDInt32x4Operation::OpNot(result);
  75. return result;
  76. }
  77. SIMDValue SIMDUint16x8Operation::OpGreaterThan(const SIMDValue& aValue, const SIMDValue& bValue)
  78. {
  79. SIMDValue result;
  80. result = SIMDUint16x8Operation::OpLessThanOrEqual(aValue, bValue);
  81. result = SIMDInt32x4Operation::OpNot(result);
  82. return result;
  83. }
  84. SIMDValue SIMDUint16x8Operation::OpShiftRightByScalar(const SIMDValue& value, int count)
  85. {
  86. X86SIMDValue x86Result = { { 0, 0, 0, 0 } };
  87. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(value);
  88. x86Result.m128i_value = _mm_srli_epi16(tmpaValue.m128i_value, count & SIMDUtils::SIMDGetShiftAmountMask(2));
  89. return X86SIMDValue::ToSIMDValue(x86Result);
  90. }
  91. SIMDValue SIMDUint16x8Operation::OpAddSaturate(const SIMDValue& aValue, const SIMDValue& bValue)
  92. {
  93. X86SIMDValue x86Result;
  94. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  95. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  96. x86Result.m128i_value = _mm_adds_epu16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a + b saturated
  97. return X86SIMDValue::ToSIMDValue(x86Result);
  98. }
  99. SIMDValue SIMDUint16x8Operation::OpSubSaturate(const SIMDValue& aValue, const SIMDValue& bValue)
  100. {
  101. X86SIMDValue x86Result;
  102. X86SIMDValue tmpaValue = X86SIMDValue::ToX86SIMDValue(aValue);
  103. X86SIMDValue tmpbValue = X86SIMDValue::ToX86SIMDValue(bValue);
  104. x86Result.m128i_value = _mm_subs_epu16(tmpaValue.m128i_value, tmpbValue.m128i_value); // a - b saturated
  105. return X86SIMDValue::ToSIMDValue(x86Result);
  106. }
  107. }
  108. #endif