diff --git a/matrix_opencl.cpp b/matrix_opencl.cpp index 03a00eeebb121ac8c31a207a7424c1079257cfd0..47c6e778ef169b7a36473a8fa3eb7287cc76c7bc 100644 --- a/matrix_opencl.cpp +++ b/matrix_opencl.cpp @@ -76,7 +76,7 @@ const std::string kernel_source_transpose = R"( B[output_idx] = A[input_idx]; } )"; -const std::string kernel_source_matrix_mul = R"( +/*const std::string kernel_source_matrix_mul = R"( __kernel void matrix_mul(__global const float* A, __global const float* B, __global float* C, int A_rows, int A_cols, int B_cols) { int row = get_global_id(0); int col = get_global_id(1); @@ -84,8 +84,8 @@ const std::string kernel_source_matrix_mul = R"( C[row * B_cols + col] += A[row * A_cols + k] * B[k * B_cols + col]; } } -)"; -/*const std::string kernel_source_matrix_mul = R"( +)";*/ +const std::string kernel_source_matrix_mul = R"( __kernel void matrix_mul(__global const float* A,__global const float* B, __global float* C, int M, int K, int N) { int i = get_global_id(0); float Awrk[1024]; @@ -101,7 +101,7 @@ const std::string kernel_source_matrix_mul = R"( C[i * N + j] = tmp; } } -)";*/ +)"; const std::string kernel_source_sigmoid = R"( __kernel void sigmoid(__global const float* input, __global float* output, int rows, int cols) { int idx = get_global_id(0);