diff --git a/matrix_opencl.cpp b/matrix_opencl.cpp
index 8c108ef2862eb898645431ee8f5f9e96a8267771..c367b4539fb36ede1797719e7229fb6b2ae6fd8d 100644
--- a/matrix_opencl.cpp
+++ b/matrix_opencl.cpp
@@ -192,7 +192,7 @@ void KernelCache::compileKernels(cl::Context context, const std::vector<cl::Devi
         kernel_matrix_mul = cl::Kernel(prog_matrix_mul, "matrix_mul");
 
         cl::Program prog_matrix_mul_V2 = loadAndBuildProgram(context, devices, kernel_source_matrix_mul_V2, "matrix_mul_V2");
-        kernel_matrix_mul_V2 = cl::Kernel(prog_matrix_mul_V2, "matrix_mul_V2");
+        kernel_matrix_mul_v2 = cl::Kernel(prog_matrix_mul_V2, "matrix_mul_V2");
 
         cl::Program prog_sigmoid = loadAndBuildProgram(context, devices, kernel_source_sigmoid, "sigmoid");
         kernel_sigmoid = cl::Kernel(prog_sigmoid, "sigmoid");
@@ -380,7 +380,7 @@ MatrixCL MatrixCL::operator*(const MatrixCL& other) const {
 MatrixCL MatrixCL::matrix_mul_V2(const MatrixCL& other) const {
     MatrixCL result(rows_, other.numCols(), context_, queue_);
 
-    cl::Kernel kernel = kernels_->kernel_matrix_mul_V2; 
+    cl::Kernel kernel = kernels_->kernel_matrix_mul_v2; 
     kernel.setArg(0, buffer_);
     kernel.setArg(1, other.getBuffer());
     kernel.setArg(2, result.getBuffer());