@@ -10,6 +10,7 @@ cpu_mat = rand(rng, Float32, m, n)
10
10
# Input arrays shared by the benchmarks below. `rng`, `m`, `n`, `m_long`,
# `n_long` and `cpu_mat` are defined outside this view.

# Float32 CuArray built from the host matrix `cpu_mat`.
gpu_mat = CuArray{Float32}(cpu_mat)
# Float32 CuArray of random values with size (m_long, n_long).
gpu_mat_long = CuArray{Float32}(rand(rng, Float32, m_long, n_long))
# 1-D reshapes holding the same number of elements as their source matrix.
gpu_vec = reshape(gpu_mat, length(gpu_mat))
gpu_vec_long = reshape(gpu_mat_long, length(gpu_mat_long))
# 3-D / 4-D reshapes of `gpu_mat`; both trailing shapes multiply to 1000, so
# this presumably relies on n == 1000 -- TODO confirm against the definition of `n`.
gpu_arr_3d = reshape(gpu_mat, (m, 40, 25))
gpu_arr_4d = reshape(gpu_mat, (m, 10, 10, 10))
# CuArray of random integers drawn from -10:10 with size (m, n).
gpu_mat_ints = CuArray(rand(rng, -10:10, m, n))
52
53
53
54
# Benchmarks for `reverse` / `reverse!` on the short and long ("L") arrays.
# The `let` rebinds `group` locally to the subgroup returned by `addgroup!`,
# so the entries below are registered on that subgroup rather than the outer one.
# NOTE(review): every key (and the group name) starts with a space; this looks
# like an extraction artefact, but the strings are kept as-is -- confirm.
let group = addgroup!(group, " reverse")
    # Out-of-place variants. `$` interpolates the array into the benchmark
    # expression (`@async_benchmarkable` is defined elsewhere in the project).
    group[" 1d"] = @async_benchmarkable reverse($gpu_vec)
    group[" 1dL"] = @async_benchmarkable reverse($gpu_vec_long)
    group[" 2d"] = @async_benchmarkable reverse($gpu_mat; dims=1)
    group[" 2dL"] = @async_benchmarkable reverse($gpu_mat_long; dims=1)

    # In-place variants.
    group[" 1d_inplace"] = @async_benchmarkable reverse!($gpu_vec)
    group[" 1dL_inplace"] = @async_benchmarkable reverse!($gpu_vec_long)
    group[" 2d_inplace"] = @async_benchmarkable reverse!($gpu_mat; dims=1)
    # NOTE(review): this case reverses along dims=2 while the other 2-D cases
    # use dims=1 -- confirm this is intentional.
    group[" 2dL_inplace"] = @async_benchmarkable reverse!($gpu_mat_long; dims=2)
end
59
64
60
65
# Benchmark an in-place broadcast assignment of the Float32 zero `0f0` to
# every element of `gpu_mat`. Registered on the `group` in scope after the
# preceding `let` block has ended.
# NOTE(review): the key's leading space looks like an extraction artefact -- confirm.
group[" broadcast"] = @async_benchmarkable $gpu_mat .= 0f0
0 commit comments