/dports/math/clblast/CLBlast-1.1.0/test/ |
H A D | wrapper_cuda.hpp | 116 void CUDAToHost(const Arguments<U> &args, BuffersCUDA<T> &buffers, BuffersHost<T> &buffers_host, in CUDAToHost() argument 119 … (name == kBufVecX) { buffers_host.x_vec = std::vector<T>(args.x_size, static_cast<T>(0)); CUDAToH… in CUDAToHost() 120 … (name == kBufVecY) { buffers_host.y_vec = std::vector<T>(args.y_size, static_cast<T>(0)); CUDAToH… in CUDAToHost() 121 … (name == kBufMatA) { buffers_host.a_mat = std::vector<T>(args.a_size, static_cast<T>(0)); CUDAToH… in CUDAToHost() 122 … (name == kBufMatB) { buffers_host.b_mat = std::vector<T>(args.b_size, static_cast<T>(0)); CUDAToH… in CUDAToHost() 123 … (name == kBufMatC) { buffers_host.c_mat = std::vector<T>(args.c_size, static_cast<T>(0)); CUDAToH… in CUDAToHost() 124 …name == kBufMatAP) { buffers_host.ap_mat = std::vector<T>(args.ap_size, static_cast<T>(0)); CUDATo… in CUDAToHost() 125 …e == kBufScalar) { buffers_host.scalar = std::vector<T>(args.scalar_size, static_cast<T>(0)); CUDA… in CUDAToHost() 134 if (name == kBufVecX) { HostToCUDA(&buffers.x_vec, buffers_host.x_vec, args.x_size); } in HostToCUDA() 135 else if (name == kBufVecY) { HostToCUDA(&buffers.y_vec, buffers_host.y_vec, args.y_size); } in HostToCUDA() [all …]
|
H A D | test_utilities.cpp | 33 void DeviceToHost(const Arguments<U> &args, Buffers<T> &buffers, BuffersHost<T> &buffers_host, in DeviceToHost() argument 36 …e == kBufVecX) {buffers_host.x_vec = std::vector<T>(args.x_size, static_cast<T>(0)); buffers.x_vec… in DeviceToHost() 37 … == kBufVecY) { buffers_host.y_vec = std::vector<T>(args.y_size, static_cast<T>(0)); buffers.y_vec… in DeviceToHost() 38 … == kBufMatA) { buffers_host.a_mat = std::vector<T>(args.a_size, static_cast<T>(0)); buffers.a_mat… in DeviceToHost() 39 … == kBufMatB) { buffers_host.b_mat = std::vector<T>(args.b_size, static_cast<T>(0)); buffers.b_mat… in DeviceToHost() 40 … == kBufMatC) { buffers_host.c_mat = std::vector<T>(args.c_size, static_cast<T>(0)); buffers.c_mat… in DeviceToHost() 41 … kBufMatAP) { buffers_host.ap_mat = std::vector<T>(args.ap_size, static_cast<T>(0)); buffers.ap_ma… in DeviceToHost() 42 …Scalar) { buffers_host.scalar = std::vector<T>(args.scalar_size, static_cast<T>(0)); buffers.scala… in DeviceToHost() 48 void HostToDevice(const Arguments<U> &args, Buffers<T> &buffers, BuffersHost<T> &buffers_host, in HostToDevice() argument 51 if (name == kBufVecX) { buffers.x_vec.Write(queue, args.x_size, buffers_host.x_vec); } in HostToDevice() [all …]
|
/dports/math/clblast/CLBlast-1.1.0/test/routines/levelx/ |
H A D | xinvert.hpp | 57 buffers_host.b_mat[i * b_ld + i + b_offset] = a_value; in RunReference() 68 a_value = buffers_host.a_mat[k * a_ld + i + a_offset]; in RunReference() 72 … buffers_host.b_mat[j * b_ld + i + b_offset] = - sum * buffers_host.b_mat[i * b_ld + i + b_offset]; in RunReference() 89 … buffers_host.b_mat[j * b_ld + i + b_offset] = - sum * buffers_host.b_mat[i * b_ld + i + b_offset]; in RunReference() 100 auto a_buffer2 = HalfToFloatBuffer(buffers_host.a_mat); in RunReference() 101 auto b_buffer2 = HalfToFloatBuffer(buffers_host.b_mat); in RunReference() 110 FloatToHalfBuffer(buffers_host.b_mat, b_buffer2); in RunReference() 182 auto buffers_host = BuffersHost<T>(); in RunReference1() local 183 DeviceToHost(args, buffers, buffers_host, queue, BuffersIn()); in RunReference1() 184 const auto status = RunReference(args, buffers_host); in RunReference1() [all …]
|
H A D | xomatcopy.hpp | 25 StatusCode RunReference(const Arguments<T> &args, BuffersHost<T> &buffers_host) { in RunReference() argument 48 buffers_host.b_mat[b_index] = args.alpha * buffers_host.a_mat[a_index]; in RunReference() 56 StatusCode RunReference<half>(const Arguments<half> &args, BuffersHost<half> &buffers_host) { in RunReference() argument 57 auto a_buffer2 = HalfToFloatBuffer(buffers_host.a_mat); in RunReference() 58 auto b_buffer2 = HalfToFloatBuffer(buffers_host.b_mat); in RunReference() 68 FloatToHalfBuffer(buffers_host.b_mat, b_buffer2); in RunReference() 143 auto buffers_host = BuffersHost<T>(); in RunReference1() local 144 DeviceToHost(args, buffers, buffers_host, queue, BuffersIn()); in RunReference1() 145 const auto status = RunReference(args, buffers_host); in RunReference1() 146 HostToDevice(args, buffers, buffers_host, queue, BuffersOut()); in RunReference1() [all …]
|
H A D | xim2col.hpp | 104 auto buffers_host = BuffersHost<T>(); in RunReference1() local 105 DeviceToHost(args, buffers, buffers_host, queue, BuffersIn()); in RunReference1() 106 const auto status = RunReference(args, buffers_host); in RunReference1() 107 HostToDevice(args, buffers, buffers_host, queue, BuffersOut()); in RunReference1() 111 static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue&) { in RunReference2() argument 112 return RunReference(args, buffers_host); in RunReference2() 146 StatusCode RunReference(const Arguments<T> &args, BuffersHost<T> &buffers_host) { in RunReference() argument 162 val = buffers_host.a_mat[input_index + args.a_offset]; in RunReference() 170 buffers_host.b_mat[output_index + args.b_offset] = val; in RunReference()
|
/dports/math/clblast/CLBlast-1.1.0/test/routines/level1/ |
H A D | xdot.hpp | 104 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 106 buffers_host.scalar, args.dot_offset, in RunReference2() 107 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 108 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xdotc.hpp | 104 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 106 buffers_host.scalar, args.dot_offset, in RunReference2() 107 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 108 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xdotu.hpp | 104 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 106 buffers_host.scalar, args.dot_offset, in RunReference2() 107 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 108 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xasum.hpp | 98 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 100 buffers_host.scalar, args.asum_offset, in RunReference2() 101 buffers_host.x_vec, args.x_offset, args.x_inc); in RunReference2()
|
H A D | xamax.hpp | 98 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 100 buffers_host.scalar, args.imax_offset, in RunReference2() 101 buffers_host.x_vec, args.x_offset, args.x_inc); in RunReference2()
|
H A D | xnrm2.hpp | 98 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 100 buffers_host.scalar, args.nrm2_offset, in RunReference2() 101 buffers_host.x_vec, args.x_offset, args.x_inc); in RunReference2()
|
/dports/math/clblast/CLBlast-1.1.0/test/routines/level2/ |
H A D | xhpmv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.ap_mat, args.ap_offset, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xspmv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.ap_mat, args.ap_offset, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xsyr2.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.a_mat, args.a_offset, args.a_ld); in RunReference2()
|
H A D | xher2.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.a_mat, args.a_offset, args.a_ld); in RunReference2()
|
H A D | xhpr2.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.ap_mat, args.ap_offset); in RunReference2()
|
H A D | xspr2.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.ap_mat, args.ap_offset); in RunReference2()
|
H A D | xgeru.hpp | 110 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.a_mat, args.a_offset, args.a_ld); in RunReference2()
|
H A D | xsbmv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.a_mat, args.a_offset, args.a_ld, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xger.hpp | 110 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.a_mat, args.a_offset, args.a_ld); in RunReference2()
|
H A D | xgerc.hpp | 110 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.x_vec, args.x_offset, args.x_inc, in RunReference2() 114 buffers_host.y_vec, args.y_offset, args.y_inc, in RunReference2() 115 buffers_host.a_mat, args.a_offset, args.a_ld); in RunReference2()
|
H A D | xhbmv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.a_mat, args.a_offset, args.a_ld, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xhemv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.a_mat, args.a_offset, args.a_ld, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xsymv.hpp | 109 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 113 buffers_host.a_mat, args.a_offset, args.a_ld, in RunReference2() 114 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 115 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|
H A D | xgemv.hpp | 115 … static StatusCode RunReference2(const Arguments<T> &args, BuffersHost<T> &buffers_host, Queue &) { in RunReference2() argument 119 buffers_host.a_mat, args.a_offset, args.a_ld, in RunReference2() 120 buffers_host.x_vec, args.x_offset, args.x_inc, args.beta, in RunReference2() 121 buffers_host.y_vec, args.y_offset, args.y_inc); in RunReference2()
|