diff --git a/matrix_opencl.cpp b/matrix_opencl.cpp
index 03a00eeebb121ac8c31a207a7424c1079257cfd0..47c6e778ef169b7a36473a8fa3eb7287cc76c7bc 100644
--- a/matrix_opencl.cpp
+++ b/matrix_opencl.cpp
@@ -76,7 +76,7 @@ const std::string kernel_source_transpose = R"(
         B[output_idx] = A[input_idx];
     }
 )";
-const std::string kernel_source_matrix_mul = R"(
+/*const std::string kernel_source_matrix_mul = R"(
     __kernel void matrix_mul(__global const float* A, __global const float* B, __global float* C, int A_rows, int A_cols, int B_cols) {
         int row = get_global_id(0);
         int col = get_global_id(1);
@@ -84,8 +84,8 @@ const std::string kernel_source_matrix_mul = R"(
             C[row * B_cols + col] += A[row * A_cols + k] * B[k * B_cols + col];
         }
     }
-)";
-/*const std::string kernel_source_matrix_mul = R"(
+)";*/
+const std::string kernel_source_matrix_mul = R"(
     __kernel void matrix_mul(__global const float* A,__global const float* B, __global float* C, int M, int K, int N) {
         int i = get_global_id(0);
         float Awrk[1024];
@@ -101,7 +101,7 @@ const std::string kernel_source_matrix_mul = R"(
             C[i * N + j] = tmp;
         }
     }
-)";*/
+)";
 const std::string kernel_source_sigmoid = R"(
     __kernel void sigmoid(__global const float* input, __global float* output, int rows, int cols) {
         int idx = get_global_id(0);