sdk/sources/android-23/com/example/android/rs/blasbenchmark/BNNMTest.java - android_tools - Git at Google

 /*
  * Copyright (C) 2015 The Android Open Source Project
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
  * You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 package com.example.android.rs.blasbenchmark;

 import android.renderscript.*;
 import android.util.Log;
 import java.util.Random;
 import java.lang.Math;

 /**
  * Benchmark case for the 8-bit quantized matrix multiply,
  * {@code ScriptIntrinsicBLAS.BNNM}.
  *
  * createTest() builds the input and output allocations for the test size chosen
  * at construction (1 = small, 2 = medium, 3 = large) and performs one verified
  * sample run; runTest() then repeats the same multiplication.
  */
 public class BNNMTest extends TestBase {

     // Log tag used for the detailed mismatch diagnostics.
     private static final String BNNM_LOG_TAG = "BNNM";
     // Upper bound on individually logged mismatches, so the log is not flooded.
     private static final int MAX_LOGGED_MISMATCHES = 50;
     // Percentage of the output values used to derive the off-by-one budget.
     private static final int PERCENT_THRESHOLD = 2;
     // Largest value representable by an unsigned 8-bit element.
     private static final int UNSIGNED_BYTE_MAX = 255;

     static {
         System.loadLibrary("gemmdata");
     }

     // Native data source for the large test. setTestLarge() passes three freshly
     // allocated arrays and afterwards uses them as the A input, the B input and
     // the expected C output, so the native side is expected to fill all three.
     // NOTE(review): presumably implemented by the "gemmdata" library loaded above.
     native void getData(byte[] a, byte[] b, byte[] c);

     ScriptIntrinsicBLAS mBLAS;
     private Allocation matA;
     private Allocation matB;
     private Allocation matC;

     // Matrix dimensions: A is allocated as k x m, B as k x n and C as n x m (X x Y).
     private int m;
     private int n;
     private int k;

     // Quantization parameters handed to BNNM unchanged.
     private int a_offset;
     private int b_offset;
     private int c_offset;
     private int c_mult_int;

     private int mTestSize;

     /**
      * @param testSize selects the data set: 1 = small, 2 = medium, 3 = large.
      */
     BNNMTest(int testSize) {
         mTestSize = testSize;
     }

     /** Creates the BLAS intrinsic and prepares the data for the selected test size. */
     public void createTest() {
         mBLAS = ScriptIntrinsicBLAS.create(mRS);
         setTest();
     }

     /** Dispatches to the setup routine matching mTestSize. */
     private void setTest() {
         switch (mTestSize) {
             case 1:
                 setTestSmall();
                 break;
             case 2:
                 setTestMedium();
                 break;
             case 3:
                 setTestLarge();
                 break;
             default:
                 // Nothing is set up for other values, so the allocations stay null.
                 // Say so here instead of leaving a later failure unexplained.
                 Log.e(TAG, "Unknown test size " + mTestSize + "; no test data was set up.");
                 break;
         }
     }

     /**
      * Converts unsigned 8-bit values, held in ints, to Java bytes with the same
      * bit pattern.
      *
      * In Java the eight-bit 'byte' type is signed, but the API for the 8-bit
      * matrix multiplication deals with unsigned bytes. For example, the bit
      * pattern 0xff is 255 as an unsigned value but -1 as a Java signed byte, so
      * passing int[] {255} returns byte[] {-1}.
      *
      * @param input values to convert; only the low eight bits of each are kept
      * @return a new array of the same length holding the narrowed values
      */
     private byte[] unsignedToSignedByte(int[] input) {
         byte[] output = new byte[input.length];
         for (int i = 0; i < input.length; ++i) {
             output[i] = (byte)(input[i]);
         }
         return output;
     }

     /**
      * Randomly perturbs unsigned 8-bit data in place. Not called by the tests in
      * this class; it is only referenced by the commented-out suggestion in
      * testWithTolerance().
      *
      * @param data      unsigned bytes to perturb (modified in place)
      * @param count     number of leading elements to consider; capped at data.length
      * @param frequency probability, in [0, 1], that an element is changed
      * @param maxDelta  largest absolute change applied to an element
      */
     private void addByteNoise(byte[] data, int count, float frequency, int maxDelta) {
         final Random rand = new Random();
         final int limit = Math.min(count, data.length);
         for (int i = 0; i < limit; ++i) {
             if (rand.nextFloat() < frequency) {
                 // Work on the unsigned value; the raw Java byte is sign-extended.
                 final int originalValue = data[i] & 0xff;
                 final float direction = rand.nextFloat();
                 int delta = (int)(Math.ceil(rand.nextFloat() * maxDelta));
                 if (direction < 0.5f) {
                     delta = -delta;
                 }
                 // Saturate to the unsigned range so the noise never wraps around.
                 final int newValue =
                         Math.max(0, Math.min(UNSIGNED_BYTE_MAX, originalValue + delta));
                 data[i] = (byte)(newValue);
             }
         }
     }

     /**
      * Compares actual output against expected output, both interpreted as
      * unsigned bytes, allowing a small number of off-by-one differences.
      *
      * @param c_byte        expected values
      * @param c_byte_output values produced by the multiplication
      * @return true when the arrays have the same length, no element differs by
      *         more than one, and the number of differing elements is below the
      *         threshold derived from PERCENT_THRESHOLD
      */
     private boolean testWithTolerance(byte[] c_byte, byte[] c_byte_output) {

         // The testing procedure here is a bit complex, but the aim is to mimic the
         // requirements we've empirically found running deep neural networks in real
         // applications. We want to open the door to vendors using approximations that
         // produce slightly different results for optimization's sake, but keep the
         // precision loss within small enough bounds that we don't lose accuracy in
         // the final result.
         // After experimentation, we've found that we can tolerate around 5% of the
         // output bytes being different by 1. Any larger differences are not tolerable
         // and we can't get good results if the frequency of small differences is
         // higher than 5%. This test tries to measure those properties on an example
         // set of parameters that were captured from a real application.
         // NOTE(review): the text above says 5% but the check below enforces
         // PERCENT_THRESHOLD (2%) - confirm which figure is intended.
         // For example, if you uncommented this call that adds random noise to the
         // results at a 3% specified frequency, the test should fail:
         // addByteNoise(c_byte_output, c_byte_output.length, 0.03f, 1);

         final boolean areSizesDifferent = (c_byte.length != c_byte_output.length);
         if (areSizesDifferent) {
             Log.e(BNNM_LOG_TAG, "Size mismatch: expected " + c_byte.length +
                   " values, got " + c_byte_output.length);
         }
         final int c_count = Math.min(c_byte.length, c_byte_output.length);

         int howManyDifferent = 0;
         boolean areAnyTooDifferent = false;
         for (int i = 0; i < c_count; i++) {
             // Compare in the unsigned domain. Subtracting the raw signed bytes would
             // report 127 vs 128 as a difference of 255 and 0 vs 255 as only 1.
             final int expectedValue = c_byte[i] & 0xff;
             final int actualValue = c_byte_output[i] & 0xff;
             final int delta = expectedValue - actualValue;
             // First make sure that the difference is no more than one.
             if ((delta < -1) || (delta > 1)) {
                 areAnyTooDifferent = true;
             }
             // If there is a difference, increment the counter to track it.
             if (delta != 0) {
                 // Don't spam the logs if too many are different.
                 if (howManyDifferent < MAX_LOGGED_MISMATCHES) {
                     Log.e(BNNM_LOG_TAG, "Mismatch at " + i +
                           ": expected " + expectedValue +
                           ", got " + actualValue);
                 }
                 ++howManyDifferent;
             }
         }
         // We want no more than 2% of the values to show any differences, so work out
         // what that means in absolute numbers. The threshold is at least 1, so for
         // small outputs a single differing value already fails the check.
         final int differenceThreshold = Math.max((PERCENT_THRESHOLD * c_count) / 100, 1);
         final boolean areTooManyDifferent = (howManyDifferent >= differenceThreshold);

         if (areAnyTooDifferent) {
             Log.e(BNNM_LOG_TAG, "Some outputs were too different.");
         }

         if (areTooManyDifferent) {
             Log.e(BNNM_LOG_TAG, "There were too many small differences." +
                   " We can tolerate " + PERCENT_THRESHOLD + "% (" +
                   differenceThreshold + "), but there were " + howManyDifferent);
         }

         return !(areSizesDifferent || areAnyTooDifferent || areTooManyDifferent);
     }

     /**
      * Creates the U8 allocations for A (k x m), B (k x n) and C (n x m) from the
      * current m, n and k fields and uploads the two input matrices.
      *
      * @param a_byte contents of matrix A
      * @param b_byte contents of matrix B
      */
     private void createAllocations(byte[] a_byte, byte[] b_byte) {
         Type.Builder builder = new Type.Builder(mRS, Element.U8(mRS));
         Type a_type = builder.setX(k).setY(m).create();
         Type b_type = builder.setX(k).setY(n).create();
         Type c_type = builder.setX(n).setY(m).create();

         matA = Allocation.createTyped(mRS, a_type);
         matB = Allocation.createTyped(mRS, b_type);
         matC = Allocation.createTyped(mRS, c_type);

         matA.copyFrom(a_byte);
         matB.copyFrom(b_byte);
     }

     /**
      * Runs the multiplication once during setup and checks the result.
      *
      * @param expected expected contents of matrix C
      * @throws AssertionError if the output is not within tolerance of expected
      */
     private void verifySampleRun(byte[] expected) {
         mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
         byte[] c_byte_output = new byte[m * n];
         matC.copyTo(c_byte_output);
         if (!testWithTolerance(expected, c_byte_output)) {
             Log.e(TAG, "Result is not correct!");
             throw new AssertionError("Result is not correct.");
         }
     }

     /**
      * Sets up a multiplication of a couple of small 8-bit matrices and compares
      * the results with hand-calculated expectations.
      */
     public void setTestSmall() {
         // The A matrix is:
         // |   1 |   4 |
         // |   2 |   5 |
         // |   3 |   6 |
         byte[] a_byte = unsignedToSignedByte(new int[] {
                 1, 2, 3,
                 4, 5, 6,
             });
         final int a_rows = 3;
         final int a_cols = 2;
         a_offset = 0;
         // The B matrix is:
         // |  -1 |  -2 |  -3 |  -4 |
         // |  -5 |  -6 |  -7 |  -8 |
         // |  -9 | -10 | -11 | -12 |
         byte[] b_byte = unsignedToSignedByte(new int[] {
                 11, 7, 3,
                 10, 6, 2,
                 9, 5, 1,
                 8, 4, 0,
             });
         final int b_cols = 4;
         b_offset = 12;
         // EightBitGemm implements C = B.transposed() * A,
         // so we expect to get these results:
         // 1*-1 + 2*-5 + 3*-9 + 128 = 90
         // 1*-2 + 2*-6 + 3*-10 + 128 = 84
         // 1*-3 + 2*-7 + 3*-11 + 128 = 78
         // 1*-4 + 2*-8 + 3*-12 + 128 = 72
         // 4*-1 + 5*-5 + 6*-9 + 128 = 45
         // 4*-2 + 5*-6 + 6*-10 + 128 = 30
         // 4*-3 + 5*-7 + 6*-11 + 128 = 15
         // 4*-4 + 5*-8 + 6*-12 + 128 = 0
         // | 90 | 45 |
         // | 84 | 30 |
         // | 78 | 15 |
         // | 72 |  0 |
         c_offset = 128;
         final int c_shift = 21;
         c_mult_int = (1 << c_shift);
         byte[] expected_data = unsignedToSignedByte(new int[] {
                 90, 84, 78, 72,
                 45, 30, 15, 0,
             });

         m = a_cols;
         n = b_cols;
         k = a_rows;

         createAllocations(a_byte, b_byte);

         // During setup, do a sample run to see if the result is correct.
         verifySampleRun(expected_data);
     }

     /**
      * Sets up a multiplication of two medium 8-bit matrices and compares the
      * results with the expected values. The data here is arbitrary.
      */
     public void setTestMedium() {
         byte[] a_byte = unsignedToSignedByte(new int[] {
                 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23,
                 23, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1,
                 1, 23, 2, 22, 3, 21, 4, 20, 5, 19, 6, 18, 7, 17, 8, 16, 9, 15, 10, 14, 11, 13, 12,
                 23, 1, 22, 2, 21, 3, 20, 4, 19, 5, 18, 6, 17, 7, 16, 8, 15, 9, 14, 10, 13, 11, 12,
                 1, 1, 1, 1, 1, 1, 1, 1, 1, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12,
                 3, 1, 4, 1, 5, 8, 2, 3, 1, 14, 11, 15, 18, 12, 13, 11, 14, 11, 15, 18, 12, 13, 11,
                 8, 0, 5, 8, 1, 3, 7, 5, 7, 13, 10, 23, 13, 11, 17, 23, 12, 19, 17, 13, 14, 10, 19,
             });
         final int a_rows = 23;
         final int a_cols = 7;
         a_offset = 13;
         byte[] b_byte = unsignedToSignedByte(new int[] {
                 0, 2, 4, 6, 8, 10, 1, 3, 5, 7, 9, 11, 0, 2, 4, 6, 8, 10, 1, 3, 5, 7, 9,
                 0, 20, 40, 60, 80, 10, 11, 13, 15, 17, 19, 21, 10, 12, 14, 6, 8, 10, 1, 3, 5, 7, 9,
                 1, 21, 41, 61, 81, 11, 12, 14, 16, 18, 20, 22, 11, 13, 15, 7, 9, 11, 2, 4, 6, 8, 9,
                 0, 19, 39, 59, 79, 9, 10, 12, 14, 16, 18, 20, 9, 11, 13, 5, 7, 9, 0, 2, 4, 6, 8,
                 2, 22, 42, 62, 82, 12, 13, 15, 17, 19, 21, 23, 12, 14, 16, 8, 9, 12, 3, 5, 7, 9, 9,
                 0, 18, 38, 58, 78, 8, 9, 11, 13, 15, 17, 19, 8, 10, 12, 4, 6, 8, 0, 1, 3, 5, 7,
                 3, 23, 43, 63, 83, 13, 14, 16, 18, 20, 22, 24, 13, 15, 17, 9, 9, 13, 4, 6, 8, 9, 9,
                 0, 17, 37, 57, 77, 7, 8, 10, 12, 14, 16, 18, 7, 9, 11, 3, 5, 7, 0, 0, 2, 4, 6,
                 10, 20, 30, 40, 50, 1, 2, 3, 4, 5, 11, 12, 13, 14, 15, 21, 22, 23, 24, 25, 1, 2, 3,
             });
         final int b_cols = 9;
         b_offset = 23;
         c_offset = 2121;
         c_mult_int = 132359;
         byte[] expected_data = unsignedToSignedByte(new int[] {
                 167, 53, 51, 54, 49, 55, 46,
                 56, 116, 153, 232, 232, 234, 231,
                 236, 232, 237, 174, 168, 131, 130,
                 132, 129, 133, 128, 133, 134, 151,
                 154, 152, 156, 151, 158, 150, 160,
                 156, 255, 113, 106, 120, 98, 127,
                 91, 134, 178, 231, 102, 97, 107,
                 92, 111, 87, 116, 164, 187, 76,
                 73, 78, 70, 81, 67, 83, 139,
             });

         m = a_cols;
         n = b_cols;
         k = a_rows;

         createAllocations(a_byte, b_byte);

         // During setup, do a sample run to see if the result is correct.
         verifySampleRun(expected_data);
     }

     /**
      * Sets up the large test. It takes a large set of real data captured from a
      * convolutional neural network solving a computer vision problem, and runs
      * it through the eight-bit matrix multiply. We test the results to make sure
      * they're close enough to be usable.
      */
     public void setTestLarge() {

         m = 256;
         n = 192;
         k = 1152;
         a_offset = 0;
         b_offset = 84;
         c_mult_int = 3401;
         c_offset = 74980;

         int a_count = (m * k);
         int b_count = (n * k);
         int c_count = (m * n);

         byte[] a_byte = new byte[a_count];
         byte[] b_byte = new byte[b_count];
         byte[] c_byte = new byte[c_count];

         // The captured inputs and the expected output come from native code.
         getData(a_byte, b_byte, c_byte);

         createAllocations(a_byte, b_byte);

         // During setup, do a sample run to see if the result is correct.
         verifySampleRun(c_byte);
     }

     /** Executes one multiplication using the allocations prepared by createTest(). */
     public void runTest() {
         mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
     }

     /** @return a one-line description of this test, including the matrix dimensions. */
     public String getTestInfo() {
         return "8Bit GEMM Test: m=" + m + ", n=" + n + ", k=" + k;
     }
 }
	/*
	* Copyright (C) 2015 The Android Open Source Project
	*
	* Licensed under the Apache License, Version 2.0 (the "License");
	* you may not use this file except in compliance with the License.
	* You may obtain a copy of the License at
	*
	* http://www.apache.org/licenses/LICENSE-2.0
	*
	* Unless required by applicable law or agreed to in writing, software
	* distributed under the License is distributed on an "AS IS" BASIS,
	* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
	* See the License for the specific language governing permissions and
	* limitations under the License.
	*/

	package com.example.android.rs.blasbenchmark;

	import android.renderscript.*;
	import android.util.Log;
	import java.util.Random;
	import java.lang.Math;

	public class BNNMTest extends TestBase {

	static {
	System.loadLibrary("gemmdata");
	}

	native void getData(byte[] a, byte[] b, byte[] c);

	ScriptIntrinsicBLAS mBLAS;
	private Allocation matA;
	private Allocation matB;
	private Allocation matC;

	private int m;
	private int n;
	private int k;

	private int a_offset;
	private int b_offset;
	private int c_offset;
	private int c_mult_int;

	private int mTestSize;

	BNNMTest(int testSize) {
	mTestSize = testSize;
	}

	public void createTest() {
	mBLAS = ScriptIntrinsicBLAS.create(mRS);
	setTest();
	}

	private void setTest() {
	switch (mTestSize) {
	case 1:
	setTestSmall();
	break;
	case 2:
	setTestMedium();
	break;
	case 3:
	setTestLarge();
	break;
	default:
	break;
	}
	}

	// In Java, the eight-bit 'byte' type is signed, but the API for the 8-bit
	// matrix multiplication deals with unsigned bytes. This is a convenience
	// function that converts arrays of unsigned ints to their equivalent
	// representations as signed bytes. For example, the bit pattern 0xff is 255
	// as an unsigned value, but -127 as a Java signed byte. So if you pass in an
	// array of int[] {255} into this function, you'll get back byte[] {-127}.
	private byte[] unsignedToSignedByte(int[] input) {
	byte[] output = new byte[input.length];
	for (int i = 0; i < input.length; ++i) {
	output[i] = (byte)(input[i]);
	}
	return output;
	}


	private void addByteNoise(byte[] data, int count, float frequency, int maxDelta) {
	Random rand = new Random();
	for (int n = 0; n < count; ++n) {
	if (rand.nextFloat() < frequency) {
	final int originalValue = data[n];
	final float direction = rand.nextFloat();
	int delta = (int)(Math.ceil(rand.nextFloat() * maxDelta));
	if (direction < 0.5f) {
	delta = -delta;
	}
	int newValue = (originalValue + delta);
	if (newValue < -127) {
	newValue = -127;
	}
	if (newValue > 127) {
	newValue = 127;
	}
	data[n] = (byte)(newValue);
	}
	}
	}

	private boolean testWithTolerance(byte[] c_byte, byte[] c_byte_output) {

	// The testing procedure here is a bit complex, but the aim is to mimic the
	// requirements we've empirically found running deep neural networks in real
	// applications. We want to open the door to vendors using approximations that
	// produce slightly different results for optimization's sake, but keep the
	// precision loss within small enough bounds that we don't lose accuracy in
	// the final result.
	// After experimentation, we've found that we can tolerate around 5% of the
	// output bytes being different by 1. Any larger differences are not tolerable
	// and we can't get good results if the frequency of small differences is
	// higher than 5%. This test tries to measure those properties on an example
	// set of parameters that were captured from a real application.
	// For example, if you uncommented this function that adds random noise to the
	// results at a 3% specified frequency, the test should fail:
	// AddByteNoise(c_byte_output, c_count, 0.03f, 1);

	final boolean areSizesDifferent = (c_byte.length != c_byte_output.length);
	final int c_count = Math.min(c_byte.length, c_byte_output.length);

	int howManyDifferent = 0;
	boolean areAnyTooDifferent = false;
	for (int i = 0; i < c_count; i++) {
	byte expectedValue = c_byte[i];
	byte actualValue = c_byte_output[i];
	int delta = (expectedValue - actualValue);
	// First make sure that the difference is no more than one.
	if ((delta < -1) \|\| (delta > 1)) {
	areAnyTooDifferent = true;
	}
	// If there is a difference, increment the counter to track it.
	if (delta != 0) {
	// Don't spam the logs if too many are different.
	if (howManyDifferent < 50) {
	android.util.Log.e("BNNM", "Mismatch at " + i +
	": expected " + (expectedValue & 0xff) +
	", got " + (actualValue & 0xff));
	}
	++howManyDifferent;
	}
	}
	// We want no more than 2% of the values to show any differences, so work out
	// what that means in absolute numbers.
	final int percentThreshold = 2;
	final int differenceThreshold = Math.max((percentThreshold * c_count) / 100, 1);
	final boolean areTooManyDifferent = (howManyDifferent >= differenceThreshold);

	if (areAnyTooDifferent) {
	android.util.Log.e("BNNM", "Some outputs were too different.");
	}

	if (areTooManyDifferent) {
	android.util.Log.e("BNNM", "There were too many small differences." +
	" We can tolerate " + percentThreshold + "% (" +
	differenceThreshold + "), but there were " + howManyDifferent);
	}

	return !(areAnyTooDifferent \|\| areTooManyDifferent);
	}

	// This test multiplies a couple of small 8-bit matrices, and compares the
	// results with hand-calculated expectations.
	public void setTestSmall() {
	// The A matrix is:
	// \| 1 \| 4 \|
	// \| 2 \| 5 \|
	// \| 3 \| 6 \|
	byte[] a_byte = unsignedToSignedByte(new int[] {
	1, 2, 3,
	4, 5, 6,
	});
	final int a_rows = 3;
	final int a_cols = 2;
	a_offset = 0;
	// The B matrix is:
	// \| -1 \| -2 \| -3 \| -4 \|
	// \| -5 \| -6 \| -7 \| -8 \|
	// \| -9 \| -10 \| -11 \| -12 \|
	byte[] b_byte = unsignedToSignedByte(new int[] {
	11, 7, 3,
	10, 6, 2,
	9, 5, 1,
	8, 4, 0,
	});
	final int b_cols = 4;
	b_offset = 12;
	// EightBitGemm implements C = B.transposed() * A,
	// so we expect to get these results:
	// 1-1 + 2-5 + 3*-9 + 128 = 90
	// 1-2 + 2-6 + 3*-10 + 128 = 84
	// 1-3 + 2-7 + 3*-11 + 128 = 78
	// 1-4 + 2-8 + 3*-12 + 128 = 72
	// 4-1 + 5-5 + 6*-9 + 128 = 45
	// 4-2 + 5-6 + 6*-10 + 128 = 30
	// 4-3 + 5-7 + 6*-11 + 128 = 15
	// 4-4 + 5-8 + 6*-12 + 128 = 0
	// \| 90 \| 45 \|
	// \| 84 \| 30 \|
	// \| 78 \| 15 \|
	// \| 72 \| 0 \|
	c_offset = 128;
	final int c_shift = 21;
	c_mult_int = (1 << c_shift);
	byte[] expected_data = unsignedToSignedByte(new int[] {
	90, 84, 78, 72,
	45, 30, 15, 0,
	});

	m = a_cols;
	n = b_cols;
	k = a_rows;

	Type.Builder builder = new Type.Builder(mRS, Element.U8(mRS));
	Type a_type = builder.setX(k).setY(m).create();
	Type b_type = builder.setX(k).setY(n).create();
	Type c_type = builder.setX(n).setY(m).create();

	matA = Allocation.createTyped(mRS, a_type);
	matB = Allocation.createTyped(mRS, b_type);
	matC = Allocation.createTyped(mRS, c_type);
	matA.copyFrom(a_byte);
	matB.copyFrom(b_byte);

	//During setup, do a sample run to see if the result is correct.
	mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
	int c_count = (m * n);
	byte[] c_byte_output = new byte[c_count];
	matC.copyTo(c_byte_output);
	if (!testWithTolerance(expected_data, c_byte_output)) {
	Log.e(TAG, "Result is not correct!");
	throw new AssertionError("Result is not correct.");
	}
	}


	// This test multiplies another two medium 8-bit matrices, and compares the
	// results with the expected values. The data here is arbitrary.
	public void setTestMedium() {
	byte[] a_byte = unsignedToSignedByte(new int[] {
	1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23,
	23, 22, 21, 20, 19, 18, 17, 16, 15, 14, 13, 12, 11, 10, 9, 8, 7, 6, 5, 4, 3, 2, 1,
	1, 23, 2, 22, 3, 21, 4, 20, 5, 19, 6, 18, 7, 17, 8, 16, 9, 15, 10, 14, 11, 13, 12,
	23, 1, 22, 2, 21, 3, 20, 4, 19, 5, 18, 6, 17, 7, 16, 8, 15, 9, 14, 10, 13, 11, 12,
	1, 1, 1, 1, 1, 1, 1, 1, 1, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12, 12,
	3, 1, 4, 1, 5, 8, 2, 3, 1, 14, 11, 15, 18, 12, 13, 11, 14, 11, 15, 18, 12, 13, 11,
	8, 0, 5, 8, 1, 3, 7, 5, 7, 13, 10, 23, 13, 11, 17, 23, 12, 19, 17, 13, 14, 10, 19,
	});
	final int a_rows = 23;
	final int a_cols = 7;
	a_offset = 13;
	byte[] b_byte = unsignedToSignedByte(new int[] {
	0, 2, 4, 6, 8, 10, 1, 3, 5, 7, 9, 11, 0, 2, 4, 6, 8, 10, 1, 3, 5, 7, 9,
	0, 20, 40, 60, 80, 10, 11, 13, 15, 17, 19, 21, 10, 12, 14, 6, 8, 10, 1, 3, 5, 7, 9,
	1, 21, 41, 61, 81, 11, 12, 14, 16, 18, 20, 22, 11, 13, 15, 7, 9, 11, 2, 4, 6, 8, 9,
	0, 19, 39, 59, 79, 9, 10, 12, 14, 16, 18, 20, 9, 11, 13, 5, 7, 9, 0, 2, 4, 6, 8,
	2, 22, 42, 62, 82, 12, 13, 15, 17, 19, 21, 23, 12, 14, 16, 8, 9, 12, 3, 5, 7, 9, 9,
	0, 18, 38, 58, 78, 8, 9, 11, 13, 15, 17, 19, 8, 10, 12, 4, 6, 8, 0, 1, 3, 5, 7,
	3, 23, 43, 63, 83, 13, 14, 16, 18, 20, 22, 24, 13, 15, 17, 9, 9, 13, 4, 6, 8, 9, 9,
	0, 17, 37, 57, 77, 7, 8, 10, 12, 14, 16, 18, 7, 9, 11, 3, 5, 7, 0, 0, 2, 4, 6,
	10, 20, 30, 40, 50, 1, 2, 3, 4, 5, 11, 12, 13, 14, 15, 21, 22, 23, 24, 25, 1, 2, 3,
	});
	final int b_cols = 9;
	b_offset = 23;
	c_offset = 2121;
	final int c_shift = 21;
	c_mult_int = 132359;
	byte[] expected_data = unsignedToSignedByte(new int[] {
	167, 53, 51, 54, 49, 55, 46,
	56, 116, 153, 232, 232, 234, 231,
	236, 232, 237, 174, 168, 131, 130,
	132, 129, 133, 128, 133, 134, 151,
	154, 152, 156, 151, 158, 150, 160,
	156, 255, 113, 106, 120, 98, 127,
	91, 134, 178, 231, 102, 97, 107,
	92, 111, 87, 116, 164, 187, 76,
	73, 78, 70, 81, 67, 83, 139,
	});

	m = a_cols;
	n = b_cols;
	k = a_rows;

	Type.Builder builder = new Type.Builder(mRS, Element.U8(mRS));
	Type a_type = builder.setX(k).setY(m).create();
	Type b_type = builder.setX(k).setY(n).create();
	Type c_type = builder.setX(n).setY(m).create();

	matA = Allocation.createTyped(mRS, a_type);
	matB = Allocation.createTyped(mRS, b_type);
	matC = Allocation.createTyped(mRS, c_type);

	matA.copyFrom(a_byte);
	matB.copyFrom(b_byte);

	//During setup, do a sample run to see if the result is correct.
	mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
	int c_count = (m * n);
	byte[] c_byte_output = new byte[c_count];
	matC.copyTo(c_byte_output);
	if (!testWithTolerance(expected_data, c_byte_output)) {
	Log.e(TAG, "Result is not correct!");
	throw new AssertionError("Result is not correct.");
	}
	}



	// This test takes a large set of real data captured from a convolutional
	// neural network solving a computer vision problem, and runs it through the
	// eight-bit matrix multiply. We test the results to make sure they're close
	// enough to be usable.
	public void setTestLarge() {

	m = 256;
	n = 192;
	k = 1152;
	a_offset = 0;
	b_offset = 84;
	c_mult_int = 3401;
	c_offset = 74980;

	int a_count = (m * k);
	int b_count = (n * k);
	int c_count = (m * n);

	byte[] a_byte = new byte[a_count];
	byte[] b_byte = new byte[b_count];
	byte[] c_byte = new byte[c_count];

	getData(a_byte, b_byte, c_byte);

	Type.Builder builder = new Type.Builder(mRS, Element.U8(mRS));
	Type a_type = builder.setX(k).setY(m).create();
	Type b_type = builder.setX(k).setY(n).create();
	Type c_type = builder.setX(n).setY(m).create();

	matA = Allocation.createTyped(mRS, a_type);
	matB = Allocation.createTyped(mRS, b_type);
	matC = Allocation.createTyped(mRS, c_type);

	matA.copyFrom(a_byte);
	matB.copyFrom(b_byte);

	//During setup, do a sample run to see if the result is correct.
	mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
	byte[] c_byte_output = new byte[c_count];
	matC.copyTo(c_byte_output);
	if (!testWithTolerance(c_byte, c_byte_output)) {
	Log.e(TAG, "Result is not correct!");
	throw new AssertionError("Result is not correct.");
	}
	}

	public void runTest() {
	mBLAS.BNNM(matA, a_offset, matB, b_offset, matC, c_offset, c_mult_int);
	}

	public String getTestInfo() {
	return "8Bit GEMM Test: m=" + m + ", n=" + n + ", k=" + k;
	}
	}