// testReverseHeap.js (10 KB)
//-------------------------------------------------------------------------------------------------------
// Copyright (C) Microsoft Corporation and contributors. All rights reserved.
// Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
//-------------------------------------------------------------------------------------------------------
  5. this.WScript.LoadScriptFile("..\\UnitTestFramework\\SimdJsHelpers.js");
  6. function asmModule(stdlib, imports, buffer) {
  7. "use asm";
  8. var i4 = stdlib.SIMD.Int32x4;
  9. var i4check = i4.check;
  10. var i4splat = i4.splat;
  11. var i4fromFloat32x4 = i4.fromFloat32x4;
  12. var i4fromFloat32x4Bits = i4.fromFloat32x4Bits;
  13. //var i4abs = i4.abs;
  14. var i4neg = i4.neg;
  15. var i4add = i4.add;
  16. var i4sub = i4.sub;
  17. var i4mul = i4.mul;
  18. var i4swizzle = i4.swizzle;
  19. var i4shuffle = i4.shuffle;
  20. var i4lessThan = i4.lessThan;
  21. var i4equal = i4.equal;
  22. var i4greaterThan = i4.greaterThan;
  23. var i4select = i4.select;
  24. var i4and = i4.and;
  25. var i4or = i4.or;
  26. var i4xor = i4.xor;
  27. var i4not = i4.not;
  28. var i4load = i4.load;
  29. var i4load1 = i4.load1;
  30. var i4load2 = i4.load2;
  31. var i4load3 = i4.load3;
  32. var i4store = i4.store
  33. var i4store1 = i4.store1;
  34. var i4store2 = i4.store2;
  35. var i4store3 = i4.store3;
  36. //var i4shiftLeftByScalar = i4.shiftLeftByScalar;
  37. //var i4shiftRightByScalar = i4.shiftRightByScalar;
  38. //var i4shiftRightArithmeticByScalar = i4.shiftRightArithmeticByScalar;
  39. var f4 = stdlib.SIMD.Float32x4;
  40. var f4check = f4.check;
  41. var f4splat = f4.splat;
  42. var f4fromInt32x4 = f4.fromInt32x4;
  43. var f4fromInt32x4Bits = f4.fromInt32x4Bits;
  44. var f4abs = f4.abs;
  45. var f4neg = f4.neg;
  46. var f4add = f4.add;
  47. var f4sub = f4.sub;
  48. var f4mul = f4.mul;
  49. var f4div = f4.div;
  50. var f4min = f4.min;
  51. var f4max = f4.max;
  52. var f4sqrt = f4.sqrt;
  53. var f4swizzle = f4.swizzle;
  54. var f4shuffle = f4.shuffle;
  55. var f4lessThan = f4.lessThan;
  56. var f4lessThanOrEqual = f4.lessThanOrEqual;
  57. var f4equal = f4.equal;
  58. var f4notEqual = f4.notEqual;
  59. var f4greaterThan = f4.greaterThan;
  60. var f4greaterThanOrEqual = f4.greaterThanOrEqual;
  61. var f4select = f4.select;
  62. var f4load = f4.load;
  63. var f4load1 = f4.load1;
  64. var f4load2 = f4.load2;
  65. var f4load3 = f4.load3;
  66. var f4store = f4.store;
  67. var f4store1 = f4.store1;
  68. var f4store2 = f4.store2;
  69. var f4store3 = f4.store3;
  70. var fround = stdlib.Math.fround;
  71. var globImportF4 = f4check(imports.g1); // global var import
  72. var globImportI4 = i4check(imports.g2); // global var import
  73. var g1 = f4(-5033.2,-3401.0,665.34,32234.1); // global var initialized
  74. var g2 = i4(1065353216, -1073741824, -1077936128, 1082130432); // global var initialized
  75. var gval = 1234;
  76. var gval2 = 1234.0;
  77. var OFFSET_1 = 10;
  78. var OFFSET_2 = 15;
  79. var loopCOUNT = 10;
  80. var Int8Heap = new stdlib.Int8Array (buffer);
  81. var Uint8Heap = new stdlib.Uint8Array (buffer);
  82. var Int16Heap = new stdlib.Int16Array(buffer);
  83. var Uint16Heap = new stdlib.Uint16Array(buffer);
  84. var Int32Heap = new stdlib.Int32Array(buffer);
  85. var Uint32Heap = new stdlib.Uint32Array(buffer);
  86. var Float32Heap = new stdlib.Float32Array(buffer);
  87. var Float64Heap = new stdlib.Float64Array(buffer);
  88. //Reverses heap values at start index and end index
  89. function reverseI4(start, end)
  90. {
  91. start = start | 0;
  92. end = end | 0;
  93. var BLOCK_SIZE = 4;
  94. var ret1 = i4(0, 0, 0, 0), ret2 = i4(0, 0, 0, 0);
  95. var i = 0, temp = 0;
  96. while(((BLOCK_SIZE * 2)|0) <= (((end - start) - ((i * 2)|0))|0))
  97. {
  98. ret1 = i4swizzle(i4load(Int32Heap, (start + i) << 2 >> 2), 3, 2, 1, 0);
  99. ret2 = i4swizzle(i4load(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2), 3, 2, 1, 0);
  100. i4store(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2, ret1);
  101. i4store(Int32Heap, (start + i) << 2 >> 2, ret2);
  102. i = (i + BLOCK_SIZE)|0;
  103. }
  104. while(1 < ((((end - start) + 0) - ((i * 2)|0))|0))
  105. {
  106. temp = Int32Heap[start + i << 2 >> 2] | 0;
  107. Int32Heap[start + i << 2 >> 2] = Int32Heap[(end - i - 1) << 2 >> 2];
  108. Int32Heap[(end - i - 1) << 2 >> 2] = temp;
  109. i = (i + 1)|0;
  110. }
  111. }
  112. //Reverses heap values at start index and end index
  113. function reverseF4(start, end)
  114. {
  115. start = start | 0;
  116. end = end | 0;
  117. var BLOCK_SIZE = 4;
  118. var ret1 = f4(0.0, 0.0, 0.0, 0.0), ret2 = f4(0.0, 0.0, 0.0, 0.0);
  119. var i = 0, temp = 0;
  120. while(((BLOCK_SIZE * 2)|0) <= (((end - start) - ((i * 2)|0))|0))
  121. {
  122. ret1 = f4swizzle(f4load(Int32Heap, (start + i) << 2 >> 2), 3, 2, 1, 0);
  123. ret2 = f4swizzle(f4load(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2), 3, 2, 1, 0);
  124. f4store(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2, ret1);
  125. f4store(Int32Heap, (start + i) << 2 >> 2, ret2);
  126. i = (i + BLOCK_SIZE)|0;
  127. }
  128. while(1 < ((((end - start) + 0) - ((i * 2)|0))|0))
  129. {
  130. temp = Int32Heap[start + i << 2 >> 2] | 0;
  131. Int32Heap[start + i << 2 >> 2] = Int32Heap[(end - i - 1) << 2 >> 2];
  132. Int32Heap[(end - i - 1) << 2 >> 2] = temp;
  133. i = (i + 1)|0;
  134. }
  135. }
  136. /*
  137. //Reverses heap values at start index and end index
  138. function reverseD2(start, end)
  139. {
  140. start = start | 0;
  141. end = end | 0;
  142. var BLOCK_SIZE = 4;
  143. var ret1 = d2(0.0, 0.0), ret2 = d2(0.0, 0.0);
  144. var start32 = 0, end32 = 0;
  145. var i = 0, i64 = 0, temp = 0.0;
  146. start32 = (start * 2)|0;
  147. end32 = (end * 2)|0;
  148. while(((BLOCK_SIZE * 2)|0) <= (((end32 - start32) - ((i * 2)|0))|0))
  149. {
  150. ret1 = d2swizzle(d2load(Float32Heap, (start32 + i) << 2 >> 2), 1, 0);
  151. ret2 = d2swizzle(d2load(Float32Heap, (end32 - i - BLOCK_SIZE) << 2 >> 2), 1, 0);
  152. d2store(Float32Heap, (end32 - i - BLOCK_SIZE) << 2 >> 2, ret1);
  153. d2store(Float32Heap, (start32 + i) << 2 >> 2, ret2);
  154. i = (i + BLOCK_SIZE)|0;
  155. i64 = (i64 + 2)|0;
  156. }
  157. while(1 < ((((end - start) + 0) - ((i64 * 2)|0))|0))
  158. {
  159. temp = +Float64Heap[start + i64 << 3 >> 3];
  160. Float64Heap[start + i64 << 3 >> 3] = Float64Heap[(end - i64 - 1) << 3 >> 3];
  161. Float64Heap[(end - i64 - 1) << 3 >> 3] = temp;
  162. i64 = (i64 + 1)|0;
  163. }
  164. }
  165. */
  166. return {reverseI4:reverseI4, reverseF4:reverseF4/*, reverseD2:reverseD2*/};
  167. }
  168. var buffer = new ArrayBuffer(0x10000); //16mb min 2^12
  169. //Reset or flush the buffer
  170. function initI4(buffer) {
  171. var values = new Int32Array( buffer );
  172. for( var i=0; i < values.length ; ++i ) {
  173. values[i] = i * 10;
  174. }
  175. return values.length;
  176. }
  177. //Reset or flush the buffer
  178. function initF4(buffer) {
  179. var values = new Float32Array( buffer );
  180. for( var i=0; i < values.length ; ++i ) {
  181. values[i] = i * 10;
  182. }
  183. return values.length;
  184. }
  185. //Reset or flush the buffer
  186. function initD2(buffer) {
  187. var values = new Float64Array( buffer );
  188. for( var i=0; i < values.length ; ++i ) {
  189. values[i] = i * 10;
  190. }
  191. return values.length;
  192. }
  193. function GEN_BASELINE(loadfn, buffer, count)
  194. {
  195. var i4;
  196. print("[");
  197. for (var i = 0; i < count/* * 16*/; i += 4)
  198. {
  199. i4 = loadfn(buffer, i);
  200. print(i4.toString()+",");
  201. }
  202. print("]");
  203. }
  204. function verify_results(type, results_ex, buffer, count)
  205. {
  206. var i4;
  207. for (var i = 0, idx = 0; i < count/* * 16*/; i += 4)
  208. {
  209. i4 = type.load(buffer, i);
  210. equalSimd(results_ex[idx++], i4, type, "Reverse Heap" );
  211. }
  212. }
  213. //Module initialization
  214. var m = asmModule(this, {g0:initI4(buffer),g1:SIMD.Float32x4(9,9,9,9), g2:SIMD.Int32x4(1, 2, 3, 4)}, buffer);
  215. var values = new Float32Array(buffer);
  216. //Resetting the buffer.
  217. initI4(buffer);
  218. // print("Reversing - Start");
  219. // GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
  220. var exp_results = [
  221. SIMD.Int32x4(0, 10, 20, 30),
  222. SIMD.Int32x4(40, 50, 60, 70),
  223. SIMD.Int32x4(80, 90, 100, 110),
  224. SIMD.Int32x4(120, 130, 140, 150),
  225. SIMD.Int32x4(160, 170, 180, 190),
  226. SIMD.Int32x4(200, 210, 220, 230),
  227. SIMD.Int32x4(240, 250, 260, 270),
  228. SIMD.Int32x4(280, 290, 300, 310),
  229. ];
  230. verify_results(SIMD.Int32x4, exp_results, values, 8*4);
  231. m.reverseI4(3, 31);
  232. // print("Reversing - Start");
  233. // GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
  234. var exp_results = [
  235. SIMD.Int32x4(0, 10, 20, 300),
  236. SIMD.Int32x4(290, 280, 270, 260),
  237. SIMD.Int32x4(250, 240, 230, 220),
  238. SIMD.Int32x4(210, 200, 190, 180),
  239. SIMD.Int32x4(170, 160, 150, 140),
  240. SIMD.Int32x4(130, 120, 110, 100),
  241. SIMD.Int32x4(90, 80, 70, 60),
  242. SIMD.Int32x4(50, 40, 30, 310),
  243. ];
  244. verify_results(SIMD.Int32x4, exp_results, values, 8*4);
  245. //Resetting the buffer.
  246. initF4(buffer);
  247. // print("Reversing - Start");
  248. // GEN_BASELINE(SIMD.Float32x4.load, values, 8*4);
  249. var exp_results = [
  250. SIMD.Float32x4(0, 10, 20, 30),
  251. SIMD.Float32x4(40, 50, 60, 70),
  252. SIMD.Float32x4(80, 90, 100, 110),
  253. SIMD.Float32x4(120, 130, 140, 150),
  254. SIMD.Float32x4(160, 170, 180, 190),
  255. SIMD.Float32x4(200, 210, 220, 230),
  256. SIMD.Float32x4(240, 250, 260, 270),
  257. SIMD.Float32x4(280, 290, 300, 310),
  258. ];
  259. verify_results(SIMD.Float32x4, exp_results, values, 8*4);
  260. m.reverseF4(3, 31);
  261. // print("Reversing - Start");
  262. // GEN_BASELINE(SIMD.Float32x4.load, values, 8*4);
  263. var exp_results = [
  264. SIMD.Float32x4(0, 10, 20, 300),
  265. SIMD.Float32x4(290, 280, 270, 260),
  266. SIMD.Float32x4(250, 240, 230, 220),
  267. SIMD.Float32x4(210, 200, 190, 180),
  268. SIMD.Float32x4(170, 160, 150, 140),
  269. SIMD.Float32x4(130, 120, 110, 100),
  270. SIMD.Float32x4(90, 80, 70, 60),
  271. SIMD.Float32x4(50, 40, 30, 310),
  272. ];
  273. verify_results(SIMD.Float32x4, exp_results, values, 8*4);
  274. //Resetting the buffer.
  275. // initD2(buffer);
  276. // print("Reversing - Start");
  277. // GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
  278. // m.reverseD2(3, 8);
  279. // print("Reversing - Start");
  280. // GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
  281. print("PASS");