| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153 |
- //-------------------------------------------------------------------------------------------------------
- // Copyright (C) Microsoft. All rights reserved.
- // Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
- //-------------------------------------------------------------------------------------------------------
// asm.js-style module with Int32 matrix helpers that operate on a shared heap.
//
// Matrix layout, for a matrix stored at Int32 index s:
//   heap[s]      = dim1 (number of rows)
//   heap[s + 1]  = dim2 (number of columns, i.e. the row stride)
//   heap[s + 2…] = dim1 * dim2 elements in row-major order
//
// stdlib  - object supplying Math, SIMD, Float32Array and Int32Array
// imports - foreign imports (not used by this module)
// buffer  - ArrayBuffer backing the heap views
//
// Returns an object exposing new2DMatrix and matrixMultiplication.
function asmModule(stdlib, imports, buffer) {
    "use asm";

    // Several of the imports below are not referenced by the functions in
    // this module; they are kept so the module's import surface is unchanged.
    var log = stdlib.Math.log;
    var toF = stdlib.Math.fround;
    var imul = stdlib.Math.imul;

    var i4 = stdlib.SIMD.Int32x4;
    var i4store = i4.store;
    var i4load = i4.load;
    var i4swizzle = i4.swizzle;
    var i4check = i4.check;
    var i4add = i4.add;
    var i4sub = i4.sub;
    var i4lessThan = i4.lessThan;
    var i4splat = i4.splat;

    var f4 = stdlib.SIMD.Float32x4;
    var f4equal = f4.equal;
    var f4lessThan = f4.lessThan;
    var f4splat = f4.splat;
    var f4store = f4.store;
    var f4load = f4.load;
    var f4check = f4.check;
    var f4abs = f4.abs;
    var f4add = f4.add;
    var f4sub = f4.sub;

    var Float32Heap = new stdlib.Float32Array(buffer);
    var Int32Heap = new stdlib.Int32Array(buffer);

    // Number of Int32 lanes processed per SIMD step.
    var BLOCK_SIZE = 4;

    // Multiplies the matrix at aIndex by the matrix at bIndex and writes the
    // product (header plus elements) at cIndex.
    //
    // Returns 0 on success, or -1 when A's column count differs from B's row
    // count (nothing is written in that case).
    //
    // The result is produced and stored in whole 4-lane blocks, so when
    // dim1 * dim2 is not a multiple of BLOCK_SIZE the final store writes up
    // to three Int32 slots past the end of C.
    function matrixMultiplication(aIndex, bIndex, cIndex) {
        aIndex = aIndex|0;
        bIndex = bIndex|0;
        cIndex = cIndex|0;
        var i = 0, j = 0, dim1 = 0, dim2 = 0, intersectionNum = 0, matrixSize = 0;
        var newPiece = i4(0, 0, 0, 0), cPiece = i4(0, 0, 0, 0);

        // Array dimensions don't match: columns of A must equal rows of B.
        if ((Int32Heap[aIndex + 1 << 2 >> 2]|0) != (Int32Heap[bIndex << 2 >> 2]|0)) {
            return -1;
        }

        dim1 = Int32Heap[aIndex << 2 >> 2]|0;            // rows of C
        dim2 = Int32Heap[bIndex + 1 << 2 >> 2]|0;        // columns of C
        intersectionNum = Int32Heap[bIndex << 2 >> 2]|0; // shared dimension
        matrixSize = imul(dim1, dim2);

        // Header of the result matrix.
        Int32Heap[cIndex << 2 >> 2] = dim1;
        Int32Heap[cIndex + 1 << 2 >> 2] = dim2;

        // i is the linear (row-major) index of the first lane of the block.
        while ((i|0) < (matrixSize|0)) {
            cPiece = i4(0, 0, 0, 0);
            j = 0;
            // Accumulate the j-th term of the dot product for all four lanes.
            while ((j|0) < (intersectionNum|0)) {
                newPiece = i4((getIntersectionPiece(aIndex, bIndex, dim2, i, 0, j)|0),
                              (getIntersectionPiece(aIndex, bIndex, dim2, i, 1, j)|0),
                              (getIntersectionPiece(aIndex, bIndex, dim2, i, 2, j)|0),
                              (getIntersectionPiece(aIndex, bIndex, dim2, i, 3, j)|0));
                cPiece = i4add(cPiece, newPiece);
                j = (j + 1)|0;
            }
            i4store(Int32Heap, cIndex + 2 + i << 2 >> 2, cPiece);
            i = (i + BLOCK_SIZE)|0;
        }
        return 0;
    }

    // Returns A[row][k] * B[k][col] for one lane of a result block, where
    // k = intersectionNum and (row, col) is the position of linear result
    // index resultBlock + resultIndex in a matrix with dim2 columns.
    function getIntersectionPiece(aIndex, bIndex, dim2, resultBlock, resultIndex, intersectionNum) {
        aIndex = aIndex|0;
        bIndex = bIndex|0;
        dim2 = dim2|0;
        resultBlock = resultBlock|0;
        resultIndex = resultIndex|0;
        intersectionNum = intersectionNum|0;
        var aElem = 0, bElem = 0, linear = 0, row = 0, col = 0;

        // Split the linear index into row and column. The column must be
        // reduced modulo dim2; passing the raw linear index would select a
        // later row of B for every result row after the first.
        linear = (resultBlock + resultIndex)|0;
        row = ((linear|0) / (dim2|0))|0;
        col = ((linear|0) % (dim2|0))|0;

        aElem = getElement(aIndex, row, intersectionNum)|0;
        bElem = getElement(bIndex, intersectionNum, col)|0;

        // imul gives an exact 32-bit wrapping product; `*` on ints is not
        // valid asm.js and loses low bits for large operands.
        return imul(aElem, bElem)|0;
    }

    // Reads element (row, column) of the matrix whose header is at start.
    function getElement(start, row, column) {
        start = start|0;
        row = row|0;
        column = column|0;
        var rowStride = 0;

        // The second header slot holds the column count, which is the
        // distance between consecutive rows.
        rowStride = Int32Heap[start + 1 << 2 >> 2]|0;
        return (Int32Heap[(start + 2 + imul(row, rowStride) + column) << 2 >> 2])|0;
    }

    // Writes a dim1 x dim2 matrix at startIndex whose elements are
    // 1, 2, 3, ... in row-major order.
    // Returns the heap index just past the last element written.
    function new2DMatrix(startIndex, dim1, dim2) {
        startIndex = startIndex|0;
        dim1 = dim1|0;
        dim2 = dim2|0;
        var i = 0, matrixSize = 0;

        matrixSize = imul(dim1, dim2);
        Int32Heap[startIndex << 2 >> 2] = dim1;
        Int32Heap[startIndex + 1 << 2 >> 2] = dim2;

        // Fill four elements at a time while a full block still fits.
        for (i = 0; (i|0) < ((matrixSize - BLOCK_SIZE)|0); i = (i + BLOCK_SIZE)|0) {
            i4store(Int32Heap, startIndex + 2 + i << 2 >> 2, i4((i+1), (i+2), (i+3), (i+4)));
        }
        // Scalar tail for the remaining elements.
        for (; (i|0) < (matrixSize|0); i = (i + 1)|0) {
            Int32Heap[(startIndex + 2 + i) << 2 >> 2] = (i+1)|0;
        }
        return (startIndex + 2 + i)|0;
    }

    return {new2DMatrix: new2DMatrix,
            matrixMultiplication: matrixMultiplication};
}
// Prints the matrix whose header starts at Int32 index `start` of `buffer`.
//
// The first two Int32 slots hold the dimensions; the elements follow and are
// printed four at a time as SIMD.Int32x4 values. When dim1 * dim2 is not a
// multiple of four, the last printed vector includes slots past the matrix.
//
// buffer - ArrayBuffer containing the matrix
// start  - Int32 index of the matrix header
function print2DMatrix(buffer, start) {
    var IntHeap32 = new Int32Array(buffer);
    var i4; // declared locally so the loop does not create an implicit global
    var dim1 = IntHeap32[start];
    var dim2 = IntHeap32[start + 1];
    var elementCount = Math.imul(dim1, dim2);

    print(dim1 + " by " + dim2 + " matrix");
    for (var i = 0; i < elementCount; i += 4) {
        i4 = SIMD.Int32x4.load(IntHeap32, i + start + 2);
        print(i4.toString());
    }
}
// Driver: allocate a 16 MiB heap, instantiate the module, build four operand
// matrices, multiply them pairwise and print both products.
var buffer = new ArrayBuffer(16 * 1024 * 1024);
var m = asmModule(this, null, buffer);

print("2D Matrix Multiplication");

// Operand matrices as [heap index, dim1, dim2].
[[0, 4, 8], [200, 8, 12], [400, 4, 4], [600, 4, 4]].forEach(function (spec) {
    m.new2DMatrix(spec[0], spec[1], spec[2]);
});

// Products as [A index, B index, C index].
[[0, 200, 800], [400, 600, 1000]].forEach(function (op) {
    m.matrixMultiplication(op[0], op[1], op[2]);
});

// Print both results after all multiplications have run.
[800, 1000].forEach(function (resultIndex) {
    print2DMatrix(buffer, resultIndex);
});
|