@@ -84,7 +84,7 @@ public class Main {
8484 * @param size
8585 */
8686 @ Reflect
87- public static void matrixMultiplyKernel2D (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
87+ public static void matrixMultiplyKernel2D (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
8888 if (kc .gix < kc .gsx ) {
8989 if (kc .giy < kc .gsy ) {
9090 float acc = 0.0f ;
@@ -106,7 +106,7 @@ public static void matrixMultiplyKernel2D(@RO KernelContext kc, @RO F32Array mat
106106 * @param size
107107 */
108108 @ Reflect
109- public static void matrixMultiplyKernel2DLI (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
109+ public static void matrixMultiplyKernel2DLI (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
110110 if (kc .gix < kc .gsx ) {
111111 if (kc .giy < kc .gsy ) {
112112 float acc = 0.0f ;
@@ -141,7 +141,7 @@ static MyLocalArrayFixedSize createLocal() {
141141 }
142142
143143 @ Reflect
144- public static void matrixMultiplyKernel2DTiling (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
144+ public static void matrixMultiplyKernel2DTiling (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
145145
146146 final int tileSize = 16 ;
147147 MyLocalArrayFixedSize tileA = MyLocalArrayFixedSize .createLocal ();
@@ -254,7 +254,7 @@ static FlatPrivate createPrivate() {
254254 * @param size
255255 */
256256 @ Reflect
257- public static void matrixMultiplyKernel2DRegisterTiling (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
257+ public static void matrixMultiplyKernel2DRegisterTiling (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
258258
259259 // Configuration for the kernel: Keep in mind that if you change the following parameters,
260260 // also change the scheduling (global and local work sizes).
@@ -376,7 +376,7 @@ public static void matrixMultiplyKernel2DRegisterTiling(@RO KernelContext kc, @R
376376 * @param size
377377 */
378378 @ Reflect
379- public static void matrixMultiplyKernel2DRegisterTilingVectorized (@ RO KernelContext kc , @ RO F32ArrayPadded matrixA , @ RO F32ArrayPadded matrixB , @ WO F32ArrayPadded matrixC , int size ) {
379+ public static void matrixMultiplyKernel2DRegisterTilingVectorized (KernelContext kc , F32ArrayPadded matrixA , F32ArrayPadded matrixB , F32ArrayPadded matrixC , int size ) {
380380
381381 // Configuration for the kernel: Keep in mind that if you change the following parameters,
382382 // also change the scheduling (global and local work sizes).
@@ -524,7 +524,7 @@ static FlatPrivateHalf createPrivate() {
524524 }
525525
526526 @ Reflect
527- public static void matrixMultiplyKernel2DRegisterTilingHalf (@ RO KernelContext kc , @ RO F16Array matrixA , @ RO F16Array matrixB , @ WO F16Array matrixC , int size ) {
527+ public static void matrixMultiplyKernel2DRegisterTilingHalf (KernelContext kc , F16Array matrixA , F16Array matrixB , F16Array matrixC , int size ) {
528528
529529 // Configuration for the kernel: Keep in mind that if you change the following parameters,
530530 // also change the scheduling (global and local work sizes).
@@ -648,7 +648,7 @@ public static float compute(@RO KernelContext kc, @RO F32Array matrixA, @RO F32A
648648 * @param size
649649 */
650650 @ Reflect
651- public static void matrixMultiplyKernel1D (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
651+ public static void matrixMultiplyKernel1D (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
652652 if (kc .gix < kc .gsx ) {
653653 for (int j = 0 ; j < size ; j ++) {
654654 float acc = 0.0f ;
@@ -664,7 +664,7 @@ public static void matrixMultiplyKernel1D(@RO KernelContext kc, @RO F32Array mat
664664 * 1D Matrix Multiply with function calls passing the kernel context ID. This is just for testing purposes.
665665 */
666666 @ Reflect
667- public static void matrixMultiplyKernel1DWithFunctionCalls (@ RO KernelContext kc , @ RO F32Array matrixA , @ RO F32Array matrixB , @ WO F32Array matrixC , int size ) {
667+ public static void matrixMultiplyKernel1DWithFunctionCalls (KernelContext kc , F32Array matrixA , F32Array matrixB , F32Array matrixC , int size ) {
668668 if (kc .gix < kc .gsx ) {
669669 for (int j = 0 ; j < size ; j ++) {
670670 float acc = compute (kc , matrixA , matrixB , size , j );
0 commit comments