@@ -10,6 +10,7 @@ cpu_mat = rand(rng, Float32, m, n)
# Device-side benchmark inputs. `cpu_mat`, `rng`, `m`, `n`, `m_long` and
# `n_long` are defined earlier in the file.

# Float32 device copy of the host matrix `cpu_mat`.
gpu_mat = CuArray{Float32}(cpu_mat)
# Second Float32 device matrix of size (m_long, n_long), filled from `rng`.
gpu_mat_long = CuArray{Float32}(rand(rng, Float32, m_long, n_long))
# 1-D reshapes of the two matrices, each with the same number of elements.
gpu_vec = reshape(gpu_mat, length(gpu_mat))
gpu_vec_long = reshape(gpu_mat_long, length(gpu_mat_long))
# Higher-rank reshapes of `gpu_mat`.
# NOTE(review): both shapes require length(gpu_mat) == m * 1000, i.e. they
# assume n == 1000 -- confirm against the definition of `n`.
gpu_arr_3d = reshape(gpu_mat, (m, 40, 25))
gpu_arr_4d = reshape(gpu_mat, (m, 10, 10, 10))
# Device matrix of size (m, n) holding integers sampled from -10:10.
gpu_mat_ints = CuArray(rand(rng, -10:10, m, n))
5253
# Benchmarks for `reverse` / `reverse!`, registered under the "reverse"
# sub-group. The `let` rebinds `group` to that sub-group only inside this
# block; `$` interpolates the pre-built arrays into each benchmark expression.
# Keys ending in "L" use the `*_long` inputs.
let group = addgroup!(group, "reverse")
    # Out-of-place variants.
    group["1d"] = @async_benchmarkable reverse($gpu_vec)
    group["1dL"] = @async_benchmarkable reverse($gpu_vec_long)
    group["2d"] = @async_benchmarkable reverse($gpu_mat; dims=1)
    group["2dL"] = @async_benchmarkable reverse($gpu_mat_long; dims=1)

    # In-place variants (these mutate the interpolated arrays).
    group["1d_inplace"] = @async_benchmarkable reverse!($gpu_vec)
    group["1dL_inplace"] = @async_benchmarkable reverse!($gpu_vec_long)
    group["2d_inplace"] = @async_benchmarkable reverse!($gpu_mat; dims=1)
    # NOTE(review): this is the only entry that reverses along dims=2; every
    # other 2-D entry (including "2dL") uses dims=1 -- confirm this is intended.
    group["2dL_inplace"] = @async_benchmarkable reverse!($gpu_mat_long; dims=2)
end
5964
# Benchmark an in-place broadcast assignment that fills `gpu_mat` with 0f0.
group["broadcast"] = @async_benchmarkable $gpu_mat .= 0f0
0 commit comments