1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
|
#include <rocsparse/rocsparse.h>
#include <hip/hip_runtime.h>
#include <iostream>
#include <vector>
#include <random>
#include <algorithm>
int main()
{
using rint = rocsparse_int;
rint n = 1024;
std::random_device rd;
std::mt19937 gen(rd());
std::uniform_real_distribution<float> dist(-1.0, 1.0);
auto myrand = [&]() -> float {return dist(gen);};
std::vector<float> xin(n);
std::generate(xin.begin(), xin.end(), myrand);
rocsparse_handle handle;
rocsparse_create_handle(&handle);
std::vector<rint> row_ptr(n + 1);
std::vector<rint> col(3 * n);
std::vector<float> data(3 * n);
//Second order finite differences matrix in 1D
row_ptr[0] = 0;
for(size_t i = 0; i < n; i++){
rint off = row_ptr[i];
if(i > 0){
col[off] = i - 1;
data[off++] = -1.0f;
}
col[off] = i;
data[off++] = 2.0f;
if(i < n - 1){
col[off] = i + 1;
data[off++] = -1.0f;
}
row_ptr[i + 1] = off;
}
rint *rp;
rint *c;
float *d;
float *x;
float *y;
hipMalloc((void **)&rp, sizeof *rp * (n + 1));
hipMalloc((void **)&c, sizeof *c * 3 * n);
hipMalloc((void **)&d, sizeof *d * 3 * n);
hipMalloc((void **)&x, sizeof *x * n);
hipMalloc((void **)&y, sizeof *y * n);
hipMemcpy(rp, row_ptr.data(), sizeof *rp * (n + 1), hipMemcpyHostToDevice);
hipMemcpy(c, col.data(), sizeof *c * 3 * n, hipMemcpyHostToDevice);
hipMemcpy(d, data.data(), sizeof *d * 3 * n, hipMemcpyHostToDevice);
hipMemcpy(x, xin.data(), sizeof *x * n, hipMemcpyHostToDevice);
float alpha = 14.124f;
float beta = 0.0f;
rocsparse_mat_descr descr;
rocsparse_create_mat_descr(&descr);
rocsparse_scsrmv(handle, rocsparse_operation_none,
n, n, 3 * n - 2, &alpha, descr, d, rp, c, nullptr,
x, &beta, y);
std::vector<float> yout(n);
hipMemcpy(yout.data(), y, sizeof *y * n, hipMemcpyDeviceToHost);
float tol = 0.0001f;
for(rint i = 0; i < n; i++){
for(rint jj = row_ptr[i]; jj < row_ptr[i + 1]; jj++){
rint j = col[jj];
yout[i] -= alpha * data[jj] * xin[j];
}
if(std::abs(yout[i]) > tol){
std::cout << "Entry " << i << " is not computed correctly.\n";
std::cout << "Expected 0 but got " << yout[i] << std::endl;
return 1;
}
}
std::cout << "TESTS PASSED!" << std::endl;
rocsparse_destroy_handle(handle);
rocsparse_destroy_mat_descr(descr);
hipFree(rp);
hipFree(c);
hipFree(d);
hipFree(x);
hipFree(y);
}
|