// (source-viewer residue, not part of the test) blob: a563f208d3a19dae7d3d915d8a08cdaee2f34679 [file] [log] [blame]
//-------------------------------------------------------------------------------------------------------
// Copyright (C) Microsoft Corporation and contributors. All rights reserved.
// Licensed under the MIT license. See LICENSE.txt file in the project root for full license information.
//-------------------------------------------------------------------------------------------------------
this.WScript.LoadScriptFile("..\\UnitTestFramework\\SimdJsHelpers.js");
// asm.js-style module that reverses ranges of 32-bit heap elements in place
// using SIMD 4-lane loads/stores plus a scalar tail loop.
//
// Parameters:
//   stdlib  - object providing SIMD.Int32x4, SIMD.Float32x4, Math.fround and the
//             typed-array constructors read below.
//   imports - object whose g1 (Float32x4) and g2 (Int32x4) properties are read;
//             no other property of it is accessed in this module.
//   buffer  - ArrayBuffer used as the heap; every heap view below aliases it.
//
// Returns an object exposing reverseI4 and reverseF4.
//
// Most of the SIMD operation bindings and module-level variables declared below
// are not referenced by the two exported functions; only i4/f4, the check,
// swizzle, load and store bindings, and Int32Heap are actually used.
function asmModule(stdlib, imports, buffer) {
"use asm";
// Int32x4 constructor and operations.
var i4 = stdlib.SIMD.Int32x4;
var i4check = i4.check;
var i4splat = i4.splat;
var i4fromFloat32x4 = i4.fromFloat32x4;
var i4fromFloat32x4Bits = i4.fromFloat32x4Bits;
//var i4abs = i4.abs;
var i4neg = i4.neg;
var i4add = i4.add;
var i4sub = i4.sub;
var i4mul = i4.mul;
var i4swizzle = i4.swizzle;
var i4shuffle = i4.shuffle;
var i4lessThan = i4.lessThan;
var i4equal = i4.equal;
var i4greaterThan = i4.greaterThan;
var i4select = i4.select;
var i4and = i4.and;
var i4or = i4.or;
var i4xor = i4.xor;
var i4not = i4.not;
var i4load = i4.load;
var i4load1 = i4.load1;
var i4load2 = i4.load2;
var i4load3 = i4.load3;
var i4store = i4.store
var i4store1 = i4.store1;
var i4store2 = i4.store2;
var i4store3 = i4.store3;
//var i4shiftLeftByScalar = i4.shiftLeftByScalar;
//var i4shiftRightByScalar = i4.shiftRightByScalar;
//var i4shiftRightArithmeticByScalar = i4.shiftRightArithmeticByScalar;
// Float32x4 constructor and operations.
var f4 = stdlib.SIMD.Float32x4;
var f4check = f4.check;
var f4splat = f4.splat;
var f4fromInt32x4 = f4.fromInt32x4;
var f4fromInt32x4Bits = f4.fromInt32x4Bits;
var f4abs = f4.abs;
var f4neg = f4.neg;
var f4add = f4.add;
var f4sub = f4.sub;
var f4mul = f4.mul;
var f4div = f4.div;
var f4min = f4.min;
var f4max = f4.max;
var f4sqrt = f4.sqrt;
var f4swizzle = f4.swizzle;
var f4shuffle = f4.shuffle;
var f4lessThan = f4.lessThan;
var f4lessThanOrEqual = f4.lessThanOrEqual;
var f4equal = f4.equal;
var f4notEqual = f4.notEqual;
var f4greaterThan = f4.greaterThan;
var f4greaterThanOrEqual = f4.greaterThanOrEqual;
var f4select = f4.select;
var f4load = f4.load;
var f4load1 = f4.load1;
var f4load2 = f4.load2;
var f4load3 = f4.load3;
var f4store = f4.store;
var f4store1 = f4.store1;
var f4store2 = f4.store2;
var f4store3 = f4.store3;
var fround = stdlib.Math.fround;
// Module-level globals (imported and literal-initialized); none of them is read
// by reverseI4 or reverseF4.
var globImportF4 = f4check(imports.g1); // global var import
var globImportI4 = i4check(imports.g2); // global var import
var g1 = f4(-5033.2,-3401.0,665.34,32234.1); // global var initialized
var g2 = i4(1065353216, -1073741824, -1077936128, 1082130432); // global var initialized
var gval = 1234;
var gval2 = 1234.0;
var OFFSET_1 = 10;
var OFFSET_2 = 15;
var loopCOUNT = 10;
// Typed-array views over the same heap buffer; only Int32Heap is used below.
var Int8Heap = new stdlib.Int8Array (buffer);
var Uint8Heap = new stdlib.Uint8Array (buffer);
var Int16Heap = new stdlib.Int16Array(buffer);
var Uint16Heap = new stdlib.Uint16Array(buffer);
var Int32Heap = new stdlib.Int32Array(buffer);
var Uint32Heap = new stdlib.Uint32Array(buffer);
var Float32Heap = new stdlib.Float32Array(buffer);
var Float64Heap = new stdlib.Float64Array(buffer);
// Reverses, in place, the Int32Heap elements in the half-open range [start, end):
// element start swaps with element end - 1, start + 1 with end - 2, and so on.
// start and end are element indices (not byte offsets) and are coerced to int.
function reverseI4(start, end)
{
start = start | 0;
end = end | 0;
// Number of lanes moved per SIMD load/store.
var BLOCK_SIZE = 4;
var ret1 = i4(0, 0, 0, 0), ret2 = i4(0, 0, 0, 0);
// i counts the elements already handled at EACH end of the range.
var i = 0, temp = 0;
// Vector phase: (end - start) - 2 * i is the count of elements not yet swapped.
// While at least two full blocks remain, swap a block from the front with a
// block from the back.
while(((BLOCK_SIZE * 2)|0) <= (((end - start) - ((i * 2)|0))|0))
{
// Load both blocks before storing either; the 3, 2, 1, 0 swizzle reverses
// the lane order inside each block.
ret1 = i4swizzle(i4load(Int32Heap, (start + i) << 2 >> 2), 3, 2, 1, 0);
ret2 = i4swizzle(i4load(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2), 3, 2, 1, 0);
i4store(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2, ret1);
i4store(Int32Heap, (start + i) << 2 >> 2, ret2);
i = (i + BLOCK_SIZE)|0;
}
// Scalar tail: swap the remaining elements one pair at a time until at most
// one (the middle element) is left.
while(1 < ((((end - start) + 0) - ((i * 2)|0))|0))
{
// `start + i << 2 >> 2` parses as ((start + i) << 2) >> 2.
temp = Int32Heap[start + i << 2 >> 2] | 0;
Int32Heap[start + i << 2 >> 2] = Int32Heap[(end - i - 1) << 2 >> 2];
Int32Heap[(end - i - 1) << 2 >> 2] = temp;
i = (i + 1)|0;
}
}
// Float32x4 counterpart of reverseI4: reverses, in place, the 32-bit heap
// elements in the half-open range [start, end).
// Note that the Float32x4 loads/stores are passed Int32Heap (not Float32Heap),
// and the scalar tail swaps elements through Int32Heap with an int temporary,
// i.e. the tail moves the 32-bit values as integers without converting them.
function reverseF4(start, end)
{
start = start | 0;
end = end | 0;
// Number of lanes moved per SIMD load/store.
var BLOCK_SIZE = 4;
var ret1 = f4(0.0, 0.0, 0.0, 0.0), ret2 = f4(0.0, 0.0, 0.0, 0.0);
// i counts the elements already handled at EACH end of the range.
var i = 0, temp = 0;
// Vector phase: runs while at least two full blocks remain unswapped.
while(((BLOCK_SIZE * 2)|0) <= (((end - start) - ((i * 2)|0))|0))
{
// Load both blocks before storing either; the 3, 2, 1, 0 swizzle reverses
// the lane order inside each block.
ret1 = f4swizzle(f4load(Int32Heap, (start + i) << 2 >> 2), 3, 2, 1, 0);
ret2 = f4swizzle(f4load(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2), 3, 2, 1, 0);
f4store(Int32Heap, (end - i - BLOCK_SIZE) << 2 >> 2, ret1);
f4store(Int32Heap, (start + i) << 2 >> 2, ret2);
i = (i + BLOCK_SIZE)|0;
}
// Scalar tail: swap the remaining elements pairwise until at most one is left.
while(1 < ((((end - start) + 0) - ((i * 2)|0))|0))
{
temp = Int32Heap[start + i << 2 >> 2] | 0;
Int32Heap[start + i << 2 >> 2] = Int32Heap[(end - i - 1) << 2 >> 2];
Int32Heap[(end - i - 1) << 2 >> 2] = temp;
i = (i + 1)|0;
}
}
// Disabled Float64x2 variant. It refers to d2, d2swizzle, d2load and d2store,
// none of which are bound in this module, so it cannot be enabled as written.
/*
//Reverses heap values at start index and end index
function reverseD2(start, end)
{
start = start | 0;
end = end | 0;
var BLOCK_SIZE = 4;
var ret1 = d2(0.0, 0.0), ret2 = d2(0.0, 0.0);
var start32 = 0, end32 = 0;
var i = 0, i64 = 0, temp = 0.0;
start32 = (start * 2)|0;
end32 = (end * 2)|0;
while(((BLOCK_SIZE * 2)|0) <= (((end32 - start32) - ((i * 2)|0))|0))
{
ret1 = d2swizzle(d2load(Float32Heap, (start32 + i) << 2 >> 2), 1, 0);
ret2 = d2swizzle(d2load(Float32Heap, (end32 - i - BLOCK_SIZE) << 2 >> 2), 1, 0);
d2store(Float32Heap, (end32 - i - BLOCK_SIZE) << 2 >> 2, ret1);
d2store(Float32Heap, (start32 + i) << 2 >> 2, ret2);
i = (i + BLOCK_SIZE)|0;
i64 = (i64 + 2)|0;
}
while(1 < ((((end - start) + 0) - ((i64 * 2)|0))|0))
{
temp = +Float64Heap[start + i64 << 3 >> 3];
Float64Heap[start + i64 << 3 >> 3] = Float64Heap[(end - i64 - 1) << 3 >> 3];
Float64Heap[(end - i64 - 1) << 3 >> 3] = temp;
i64 = (i64 + 1)|0;
}
}
*/
return {reverseI4:reverseI4, reverseF4:reverseF4/*, reverseD2:reverseD2*/};
}
var buffer = new ArrayBuffer(0x10000); //64 KiB (0x10000 = 65536 bytes); "min 2^12" presumably refers to the asm.js minimum heap size - TODO confirm
//Refills the whole buffer, viewed as 32-bit integers, so that element k holds k * 10.
//Returns the number of Int32 elements in the buffer.
function initI4(buffer) {
    var view = new Int32Array(buffer);
    var total = view.length;
    var k = 0;
    while (k < total) {
        view[k] = k * 10;
        k += 1;
    }
    return total;
}
//Refills the whole buffer, viewed as 32-bit floats, so that element k holds k * 10.
//Returns the number of Float32 elements in the buffer.
function initF4(buffer) {
    var floats = new Float32Array(buffer);
    var size = floats.length;
    for (var pos = 0; pos !== size; pos += 1) {
        floats[pos] = pos * 10;
    }
    return size;
}
//Refills the whole buffer, viewed as 64-bit floats, so that element k holds k * 10.
//Returns the number of Float64 elements in the buffer.
function initD2(buffer) {
    var doubles = new Float64Array(buffer);
    var n = doubles.length;
    var slot = 0;
    while (slot < n) {
        doubles[slot] = slot * 10;
        ++slot;
    }
    return n;
}
//Debug helper for producing expected-result tables: prints "[", then one line
//per 4-element step containing loadfn(buffer, index).toString() followed by a
//comma, for index = 0, 4, 8, ... while index < count, and finally "]".
function GEN_BASELINE(loadfn, buffer, count)
{
    var offset = 0;
    var vec;
    print("[");
    while (offset < count)
    {
        vec = loadfn(buffer, offset);
        print(vec.toString()+",");
        offset += 4;
    }
    print("]");
}
//Compares the contents of buffer against a table of expected vectors.
//For index = 0, 4, 8, ... while index < count, loads a vector with
//type.load(buffer, index) and passes it, together with the next entry of
//results_ex, to equalSimd under the label "Reverse Heap".
function verify_results(type, results_ex, buffer, count)
{
    var offset = 0;
    var row = 0;
    var actual;
    while (offset < count)
    {
        actual = type.load(buffer, offset);
        equalSimd(results_ex[row], actual, type, "Reverse Heap" );
        row += 1;
        offset += 4;
    }
}
//Module initialization
// Instantiates the module with `this` as stdlib and `buffer` as the heap.
// The g0 import is the return value of initI4(buffer) (which also fills the
// buffer as a side effect); asmModule itself only reads imports.g1 and imports.g2.
var m = asmModule(this, {g0:initI4(buffer),g1:SIMD.Float32x4(9,9,9,9), g2:SIMD.Int32x4(1, 2, 3, 4)}, buffer);
// Float32Array view over the heap; it is the array handed to both
// SIMD.Int32x4.load and SIMD.Float32x4.load through verify_results below.
var values = new Float32Array(buffer);
//Resetting the buffer.
// Int32 pattern: element k = k * 10.
initI4(buffer);
// Uncomment the two lines below to dump the current heap contents when
// regenerating the expected table.
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
// Baseline before reversing: the first 32 elements are 0, 10, ..., 310.
var exp_results = [
SIMD.Int32x4(0, 10, 20, 30),
SIMD.Int32x4(40, 50, 60, 70),
SIMD.Int32x4(80, 90, 100, 110),
SIMD.Int32x4(120, 130, 140, 150),
SIMD.Int32x4(160, 170, 180, 190),
SIMD.Int32x4(200, 210, 220, 230),
SIMD.Int32x4(240, 250, 260, 270),
SIMD.Int32x4(280, 290, 300, 310),
];
verify_results(SIMD.Int32x4, exp_results, values, 8*4);
// Reverse elements 3..30 (end index 31 is exclusive).
m.reverseI4(3, 31);
// Uncomment to dump the heap contents after the reversal.
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
// Expected after reversing: elements 0-2 and 31 keep their values, while
// elements 3..30 appear in reverse order (300 down to 30).
var exp_results = [
SIMD.Int32x4(0, 10, 20, 300),
SIMD.Int32x4(290, 280, 270, 260),
SIMD.Int32x4(250, 240, 230, 220),
SIMD.Int32x4(210, 200, 190, 180),
SIMD.Int32x4(170, 160, 150, 140),
SIMD.Int32x4(130, 120, 110, 100),
SIMD.Int32x4(90, 80, 70, 60),
SIMD.Int32x4(50, 40, 30, 310),
];
verify_results(SIMD.Int32x4, exp_results, values, 8*4);
//Resetting the buffer.
// Float32 pattern: element k = k * 10.
initF4(buffer);
// Uncomment to dump the heap contents before the float reversal.
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Float32x4.load, values, 8*4);
// Baseline before reversing: the first 32 elements are 0, 10, ..., 310.
var exp_results = [
SIMD.Float32x4(0, 10, 20, 30),
SIMD.Float32x4(40, 50, 60, 70),
SIMD.Float32x4(80, 90, 100, 110),
SIMD.Float32x4(120, 130, 140, 150),
SIMD.Float32x4(160, 170, 180, 190),
SIMD.Float32x4(200, 210, 220, 230),
SIMD.Float32x4(240, 250, 260, 270),
SIMD.Float32x4(280, 290, 300, 310),
];
verify_results(SIMD.Float32x4, exp_results, values, 8*4);
// Reverse elements 3..30 (end index 31 is exclusive).
m.reverseF4(3, 31);
// Uncomment to dump the heap contents after the float reversal.
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Float32x4.load, values, 8*4);
// Expected after reversing: same layout as the Int32x4 case above.
var exp_results = [
SIMD.Float32x4(0, 10, 20, 300),
SIMD.Float32x4(290, 280, 270, 260),
SIMD.Float32x4(250, 240, 230, 220),
SIMD.Float32x4(210, 200, 190, 180),
SIMD.Float32x4(170, 160, 150, 140),
SIMD.Float32x4(130, 120, 110, 100),
SIMD.Float32x4(90, 80, 70, 60),
SIMD.Float32x4(50, 40, 30, 310),
];
verify_results(SIMD.Float32x4, exp_results, values, 8*4);
// Float64x2 scenario, disabled together with reverseD2 in asmModule.
//Resetting the buffer.
// initD2(buffer);
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
// m.reverseD2(3, 8);
// print("Reversing - Start");
// GEN_BASELINE(SIMD.Int32x4.load, values, 8*4);
// Printed unconditionally once the script reaches this point; how a mismatch is
// reported depends on equalSimd, which is defined outside this file.
print("PASS");