Skip to content

Commit 483d045

Browse files
committed
merge
2 parents c4087ea + 22e8c51 commit 483d045

File tree

1 file changed

+19
-0
lines changed

1 file changed

+19
-0
lines changed

src/cuda.jl

Lines changed: 19 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -24,3 +24,22 @@ for TT in [:(Tropical{<:NativeTypes}), :TropicalTypes]
2424
end
2525
end
2626

27+
using .CUDA: @cartesianidx, AbstractGPUArray, gpu_call

# Generated helper that emits the single assignment
#
#     dest[I[perm[1]], I[perm[2]], ..., I[perm[N]]] = src[I]
#
# with the N destination subscripts unrolled when the method is generated
# (N is taken from the length of the `perm` tuple type).
# Only the `I[perm[i]]` lookups are wrapped in `@inbounds`; the reads from `src`
# and the write to `dest` are not.
@inline @generated function map_index(dest, src, I, perm::NTuple{N,T}) where {N,T}
    subscripts = [:(@inbounds I[perm[$i]]) for i in 1:N]
    return Expr(:(=), Expr(:ref, :dest, subscripts...), Expr(:ref, :src, :I))
end

# In-place dimension permutation for GPU arrays: writes `src`, with its
# dimensions reordered according to `perm`, into `dest` and returns `dest`.
#
# Arguments
# - `dest`: GPU array receiving the permuted data.
# - `src`:  GPU array being read.
# - `perm`: tuple giving, for every dimension of `dest`, the dimension of `src`
#           it is taken from.
#
# `Base.checkdims_perm` validates `dest`, `src` and `perm` against each other
# before any kernel is launched.
function LinearAlgebra.permutedims!(dest::AbstractGPUArray, src::AbstractGPUArray,
                                    perm::NTuple)
    Base.checkdims_perm(dest, src, perm)

    # The kernel captures nothing: everything it needs arrives as an argument.
    # NOTE(review): presumably `@cartesianidx src` yields the Cartesian index of
    # `src` handled by the current thread, and `gpu_call` launches the kernel with
    # `(dest, src, perm)` — confirm against the GPUArrays version in use.
    function permutedims_kernel(ctx, dest, src, perm)
        I = @cartesianidx src
        map_index(dest, src, I, perm)
        return
    end

    gpu_call(permutedims_kernel, dest, src, perm)
    return dest
end

0 commit comments

Comments
 (0)