28 #ifndef SPLA_CL_FORMAT_CSR_HPP
29 #define SPLA_CL_FORMAT_CSR_HPP
47 auto& ctx = get_acc_cl()->get_context();
48 const auto flags = CL_MEM_READ_WRITE | CL_MEM_HOST_NO_ACCESS | CL_MEM_COPY_HOST_PTR;
50 cl::Buffer cl_Ap(ctx, flags, (n_rows + 1) *
sizeof(
uint), (
void*) Ap);
51 cl::Buffer cl_Aj(ctx, flags, n_values *
sizeof(
uint), (
void*) Aj);
52 cl::Buffer cl_Ax(ctx, flags, n_values *
sizeof(T), (
void*) Ax);
54 storage.
Ap = std::move(cl_Ap);
55 storage.
Aj = std::move(cl_Aj);
56 storage.
Ax = std::move(cl_Ax);
65 auto& ctx = get_acc_cl()->get_context();
66 const auto flags = CL_MEM_READ_WRITE | CL_MEM_HOST_NO_ACCESS;
68 cl::Buffer cl_Ap(ctx, flags, (n_rows + 1) *
sizeof(
uint));
69 cl::Buffer cl_Aj(ctx, flags, n_values *
sizeof(
uint));
70 cl::Buffer cl_Ax(ctx, flags, n_values *
sizeof(T));
72 storage.
Ap = std::move(cl_Ap);
73 storage.
Aj = std::move(cl_Aj);
74 storage.
Ax = std::move(cl_Ax);
86 cl::CommandQueue& queue,
87 cl_mem_flags staging_flags = CL_MEM_READ_ONLY | CL_MEM_HOST_READ_ONLY | CL_MEM_ALLOC_HOST_PTR,
88 bool blocking =
true) {
89 const std::size_t buffer_size_Ap = (n_rows + 1) *
sizeof(
uint);
90 const std::size_t buffer_size_Aj = n_values *
sizeof(
uint);
91 const std::size_t buffer_size_Ax = n_values *
sizeof(T);
93 cl::Buffer staging_Ap(get_acc_cl()->get_context(), staging_flags, buffer_size_Ap);
94 cl::Buffer staging_Aj(get_acc_cl()->get_context(), staging_flags, buffer_size_Aj);
95 cl::Buffer staging_Ax(get_acc_cl()->get_context(), staging_flags, buffer_size_Ax);
97 queue.enqueueCopyBuffer(storage.
Ap, staging_Ap, 0, 0, buffer_size_Ap);
98 queue.enqueueCopyBuffer(storage.
Aj, staging_Aj, 0, 0, buffer_size_Aj);
99 queue.enqueueCopyBuffer(storage.
Ax, staging_Ax, 0, 0, buffer_size_Ax);
101 queue.enqueueReadBuffer(staging_Ap,
false, 0, buffer_size_Ap, Ap);
102 queue.enqueueReadBuffer(staging_Aj,
false, 0, buffer_size_Aj, Aj);
103 queue.enqueueReadBuffer(staging_Ax, blocking, 0, buffer_size_Ax, Ax);
OpenCL compressed sparse row matrix representation.
Definition: cl_formats.hpp:94
cl::Buffer Ax
Definition: cl_formats.hpp:102
cl::Buffer Ap
Definition: cl_formats.hpp:100
cl::Buffer Aj
Definition: cl_formats.hpp:101
uint values
Definition: tdecoration.hpp:58
void cl_csr_init(std::size_t n_rows, std::size_t n_values, const uint *Ap, const uint *Aj, const T *Ax, CLCsr< T > &storage)
Definition: cl_format_csr.hpp:41
void cl_csr_resize(std::size_t n_rows, std::size_t n_values, CLCsr< T > &storage)
Definition: cl_format_csr.hpp:62
void cl_csr_read(std::size_t n_rows, std::size_t n_values, uint *Ap, uint *Aj, T *Ax, CLCsr< T > &storage, cl::CommandQueue &queue, cl_mem_flags staging_flags=CL_MEM_READ_ONLY|CL_MEM_HOST_READ_ONLY|CL_MEM_ALLOC_HOST_PTR, bool blocking=true)
Definition: cl_format_csr.hpp:80
std::uint32_t uint
Library index and size type.
Definition: config.hpp:56
Definition: algorithm.hpp:37