summarylogtreecommitdiffstats
path: root/test.cpp
blob: d7bba2070259a43c809b037dc923c7652e49081f (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
#include <rocsparse/rocsparse.h>
#include <hip/hip_runtime.h>
#include <iostream>
#include <vector>
#include <random>
#include <algorithm>

int main()
{
    using rint = rocsparse_int;
    rint n = 1024;

    std::random_device rd;
    std::mt19937 gen(rd());
    std::uniform_real_distribution<float> dist(-1.0, 1.0);

    auto myrand = [&]() -> float {return dist(gen);};

    std::vector<float> xin(n);
    std::generate(xin.begin(), xin.end(), myrand);

    rocsparse_handle handle;
    rocsparse_create_handle(&handle); 

    std::vector<rint> row_ptr(n + 1);
    std::vector<rint> col(3 * n);
    std::vector<float> data(3 * n);
    
    //Second order finite differences matrix in 1D
    row_ptr[0] = 0;
    for(size_t i = 0; i < n; i++){
        rint off = row_ptr[i];
        if(i > 0){
            col[off] = i - 1;
            data[off++] = -1.0f;
        }
        col[off] = i;
        data[off++] = 2.0f;
        if(i < n - 1){
            col[off] = i + 1;
            data[off++] = -1.0f;
        }
        row_ptr[i + 1] = off;
    }

    rint *rp;
    rint *c;
    float *d;

    float *x;
    float *y;
    hipMalloc((void **)&rp, sizeof *rp * (n + 1));
    hipMalloc((void **)&c, sizeof *c * 3 * n);
    hipMalloc((void **)&d, sizeof *d * 3 * n);

    hipMalloc((void **)&x, sizeof *x * n);
    hipMalloc((void **)&y, sizeof *y * n);

    hipMemcpy(rp, row_ptr.data(), sizeof *rp * (n + 1), hipMemcpyHostToDevice);
    hipMemcpy(c, col.data(), sizeof *c * 3 * n, hipMemcpyHostToDevice);
    hipMemcpy(d, data.data(), sizeof *d * 3 * n, hipMemcpyHostToDevice);

    hipMemcpy(x, xin.data(), sizeof *x * n, hipMemcpyHostToDevice);

    float alpha = 14.124f;
    float beta = 0.0f;

    rocsparse_mat_descr descr;
    rocsparse_create_mat_descr(&descr);

    rocsparse_scsrmv(handle, rocsparse_operation_none,
        n, n, 3 * n - 2, &alpha, descr, d, rp, c, nullptr,
        x, &beta, y);

    std::vector<float> yout(n);
    hipMemcpy(yout.data(), y, sizeof *y * n, hipMemcpyDeviceToHost);

    float tol = 0.0001f;
    for(rint i = 0; i < n; i++){
        for(rint jj = row_ptr[i]; jj < row_ptr[i + 1]; jj++){
            rint j = col[jj];
            yout[i] -= alpha * data[jj] * xin[j];
        }
        if(std::abs(yout[i]) > tol){
            std::cout << "Entry " << i << " is not computed correctly.\n";
            std::cout << "Expected 0 but got " <<  yout[i] << std::endl;
            return 1;
        }
    }

    std::cout << "TESTS PASSED!" << std::endl;

    rocsparse_destroy_handle(handle);
    rocsparse_destroy_mat_descr(descr);
    hipFree(rp);
    hipFree(c);
    hipFree(d);
    hipFree(x);
    hipFree(y);
}