diff --git a/matrix_opencl.cpp b/matrix_opencl.cpp index 6786c1c829d8c36002fa23d8a597fb59c53d56b2..bd052dc75ac7a1ff3d7837e80c5879db12d49416 100644 --- a/matrix_opencl.cpp +++ b/matrix_opencl.cpp @@ -77,7 +77,7 @@ const std::string kernel_source_transpose = R"( } )"; // NAIVE -/*const std::string kernel_source_matrix_mul = R"( +const std::string kernel_source_matrix_mul = R"( __kernel void matrix_mul(__global const float* A, __global const float* B, __global float* C, int A_rows, int A_cols, int B_cols) { int row = get_global_id(0); int col = get_global_id(1); @@ -85,10 +85,10 @@ const std::string kernel_source_transpose = R"( C[row * B_cols + col] += A[row * A_cols + k] * B[k * B_cols + col]; } } -)";*/ +)"; // FASTER -const std::string kernel_source_matrix_mul = R"( +/*const std::string kernel_source_matrix_mul = R"( __kernel void matrix_mul(__global const float* A, __global const float* B, __global float* C, @@ -120,7 +120,7 @@ const std::string kernel_source_matrix_mul = R"( barrier(CLK_LOCAL_MEM_FENCE); } -})"; +})";*/ const std::string kernel_source_sigmoid = R"( __kernel void sigmoid(__global const float* input, __global float* output, int rows, int cols) { int idx = get_global_id(0); @@ -348,7 +348,7 @@ MatrixCL MatrixCL::operator+(const MatrixCL& other) const { } // NAIVE VERSION -/*MatrixCL MatrixCL::operator*(const MatrixCL& other) const { +MatrixCL MatrixCL::operator*(const MatrixCL& other) const { if (cols_ != other.rows_) throw std::runtime_error("Matrix dimension error."); @@ -368,10 +368,10 @@ MatrixCL MatrixCL::operator+(const MatrixCL& other) const { } return result; -}*/ +} // FASTER VERSION -MatrixCL MatrixCL::operator*(const MatrixCL& other) const { +/*MatrixCL MatrixCL::operator*(const MatrixCL& other) const { if (cols_ != other.rows_) throw std::runtime_error("Matrix dimension error."); @@ -404,7 +404,7 @@ MatrixCL MatrixCL::operator*(const MatrixCL& other) const { } return result; -} +}*/ MatrixCL MatrixCL::transpose() const {