Skip to content

Commit a406d0c

Browse files
committed
Fixing norm for AMD
1 parent 5cd5dcd commit a406d0c

7 files changed

+38
-14
lines changed

Project.toml

+1-1
Original file line numberDiff line numberDiff line change
@@ -18,7 +18,7 @@ SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
1818
Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
1919

2020
[compat]
21-
AMDGPU = "=0.4.2"
21+
AMDGPU = "0.4"
2222
CUDA = "3.4"
2323
ExaTron = "2"
2424
FileIO = "1.14"

src/interface/solve_acopf.jl

+4-6
Original file line numberDiff line numberDiff line change
@@ -17,14 +17,12 @@ function solve_acopf(case::String;
1717
elseif use_gpu && isa(ka_device, Nothing)
1818
CUDA.device!(gpu_no)
1919
TD = CuArray{Float64,1}; TI = CuArray{Int,1}; TM = CuArray{Float64,2}
20-
elseif use_gpu && isa(ka_device, KA.Device)
21-
if has_cuda_gpu()
20+
elseif has_cuda_gpu()
2221
TD = CuArray{Float64,1}; TI = CuArray{Int,1}; TM = CuArray{Float64,2}
23-
elseif has_rocm_gpu()
24-
TD = ROCArray{Float64,1}; TI = ROCArray{Int,1}; TM = ROCArray{Float64,2}
25-
end
22+
elseif has_rocm_gpu()
23+
TD = ROCArray{Float64,1}; TI = ROCArray{Int,1}; TM = ROCArray{Float64,2}
2624
else
27-
error("Inconsistent device selection use_gpu=$use_gpu and ka_device=$(typepof(ka_device))")
25+
error("Inconsistent device selection use_gpu=$use_gpu and ka_device=$(typeof(ka_device))")
2826
end
2927

3028
env = AdmmEnv{T,TD,TI,TM}(case, rho_pq, rho_va; case_format=case_format,

src/models/acopf/acopf_admm_prepoststep_ka.jl

+1-1
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@ function admm_outer_prestep(
44
device
55
)
66
sol, info = mod.solution, mod.info
7-
info.norm_z_prev = norm(sol.z_curr)
7+
info.norm_z_prev = norm(sol.z_curr, device)
88
return
99
end
1010

src/models/acopf/acopf_admm_update_residual_ka.jl

+4-4
Original file line numberDiff line numberDiff line change
@@ -33,10 +33,10 @@ function admm_update_residual(
3333
)
3434
wait(ev)
3535

36-
info.primres = norm(sol.rp)
37-
info.dualres = norm(sol.rd)
38-
info.norm_z_curr = norm(sol.z_curr)
39-
info.mismatch = norm(sol.Ax_plus_By)
36+
info.primres = norm(sol.rp, device)
37+
info.dualres = norm(sol.rd, device)
38+
info.norm_z_curr = norm(sol.z_curr, device)
39+
info.mismatch = norm(sol.Ax_plus_By, device)
4040

4141
return
4242
end

src/utils/utilities_ka.jl

+24
Original file line numberDiff line numberDiff line change
@@ -17,3 +17,27 @@ end
1717
c[tx] = a[tx] - b[tx]
1818
end
1919
end
20+
@kernel function norm_kernel(::Val{n}, x,
21+
y
22+
) where {n}
23+
tx = @index(Local, Linear)
24+
bx = @index(Group, Linear)
25+
26+
_x = @localmem Float64 (n,)
27+
_x[tx] = x[tx]
28+
@synchronize
29+
30+
v = ExaTron.dnrm2(n, _x, 1, tx)
31+
if bx == 1 && tx == 1
32+
y[1] = v
33+
end
34+
@synchronize
35+
36+
end
37+
function LinearAlgebra.norm(x, device)
38+
y = KAArray{Float64}(1, device)
39+
n = length(x)
40+
wait(norm_kernel(device,n)(Val{n}(), x, y,ndrange=(n,),dependencies=Event(device)))
41+
ret = y |> Array
42+
return ret[1]
43+
end

test/algorithms/acopf_update_cpu.jl

+1-1
Original file line numberDiff line numberDiff line change
@@ -176,5 +176,5 @@
176176
@test mod.info.status == :Solved
177177
@test mod.info.outer == 20
178178
@test mod.info.cumul == 1232
179-
@test isapprox(mod.info.objval, 129645.676; atol=1e-3)
179+
@test isapprox(mod.info.objval, 129645.676; rtol=1e-6)
180180
end

test/algorithms/acopf_update_ka.jl

+3-1
Original file line numberDiff line numberDiff line change
@@ -13,6 +13,8 @@ if CUDA.has_cuda_gpu() || AMDGPU.has_rocm_gpu()
1313
end
1414
if AMDGPU.has_rocm_gpu()
1515
using ROCKernels
16+
# Set for crusher login node to avoid other users
17+
AMDGPU.default_device!(AMDGPU.devices()[2])
1618
function ExaAdmm.KAArray{T}(n::Int, device::ROCDevice) where {T}
1719
return ROCArray{T}(undef, n)
1820
end
@@ -31,7 +33,7 @@ end
3133
if isa(device, KA.CPU)
3234
TD = Array{Float64,1}; TI = Array{Int,1}; TM = Array{Float64,2}
3335
env = ExaAdmm.AdmmEnv{T,TD,TI,TM}(case, rho_pq, rho_va; use_gpu=false, ka_device=device, verbose=verbose)
34-
else isa(device, ROCDevice)
36+
else
3537
if CUDA.has_cuda_gpu()
3638
TD = CuArray{Float64,1}; TI = CuArray{Int,1}; TM = CuArray{Float64,2}
3739
elseif AMDGPU.has_rocm_gpu()

0 commit comments

Comments
 (0)