Add Diagonal svd implementation and tests

lkdvos · lkdvos · commit 77ef1e6532c7 · 2025-09-02T16:08:16.000-04:00
diff --git a/src/implementations/svd.jl b/src/implementations/svd.jl
@@ -7,6 +7,8 @@ copy_input(::typeof(svd_compact), A) = copy_input(svd_full, A)
 copy_input(::typeof(svd_vals), A) = copy_input(svd_full, A)
 copy_input(::typeof(svd_trunc), A) = copy_input(svd_compact, A)
 
+copy_input(::typeof(svd_full), A::Diagonal) = copy(A)  # plain copy; presumably avoids densifying A
+
 # TODO: many of these checks are happening again in the LAPACK routines
 function check_input(::typeof(svd_full!), A::AbstractMatrix, USVᴴ, ::AbstractAlgorithm)
     m, n = size(A)
@@ -42,6 +44,32 @@ function check_input(::typeof(svd_vals!), A::AbstractMatrix, S, ::AbstractAlgori
     return nothing
 end
 
+function check_input(::typeof(svd_full!), A::AbstractMatrix, USVᴴ, ::DiagonalAlgorithm)
+    m, n = size(A)  # validates A and the (U, S, Vᴴ) outputs for the diagonal SVD
+    @assert m == n && isdiag(A)  # DiagonalAlgorithm requires a square, diagonal input
+    U, S, Vᴴ = USVᴴ
+    @assert U isa AbstractMatrix && S isa Diagonal && Vᴴ isa AbstractMatrix
+    @check_size(U, (m, m))
+    @check_scalar(U, A)  # presumably: eltype(U) must match eltype(A) — confirm macro
+    @check_size(S, (m, n))
+    @check_scalar(S, A, real)  # presumably: eltype(S) must be real(eltype(A)) — confirm
+    @check_size(Vᴴ, (n, n))
+    @check_scalar(Vᴴ, A)
+    return nothing
+end
+function check_input(::typeof(svd_compact!), A::AbstractMatrix, USVᴴ,
+                     alg::DiagonalAlgorithm)
+    return check_input(svd_full!, A, USVᴴ, alg)  # same requirements as svd_full!
+end
+function check_input(::typeof(svd_vals!), A::AbstractMatrix, S, ::DiagonalAlgorithm)
+    m, n = size(A)  # validates A and the output vector S for the diagonal svd_vals!
+    @assert m == n && isdiag(A)  # input must be square and diagonal
+    @assert S isa AbstractVector  # values go into a vector here, not a Diagonal
+    @check_size(S, (m,))
+    @check_scalar(S, A, real)  # presumably enforces a real eltype for S — confirm macro
+    return nothing
+end
+
 # Outputs
 # -------
 function initialize_output(::typeof(svd_full!), A::AbstractMatrix, ::AbstractAlgorithm)
@@ -66,6 +94,18 @@ function initialize_output(::typeof(svd_trunc!), A::AbstractMatrix, alg::Truncat
     return initialize_output(svd_compact!, A, alg.alg)
 end
 
+function initialize_output(::typeof(svd_full!), A::Diagonal, ::DiagonalAlgorithm)
+    Tsign = Base.promote_op(sign_safe, eltype(A))  # eltype used for U and Vᴴ
+    U, Vᴴ = similar(A, Tsign, size(A)), similar(A, Tsign, size(A))
+    return U, similar(A, real(eltype(A))), Vᴴ  # S: same structure as A, real eltype
+end
+function initialize_output(::typeof(svd_compact!), A::Diagonal, alg::DiagonalAlgorithm)
+    return initialize_output(svd_full!, A, alg)  # same outputs as the full SVD
+end
+function initialize_output(::typeof(svd_vals!), A::Diagonal, ::DiagonalAlgorithm)
+    return eltype(A) <: Real ? diagview(A) : similar(A, real(eltype(A)), size(A, 1))
+end  # NOTE: for real eltypes the output is `diagview(A)` itself; nothing is allocated
+
 function gaugefix!(::typeof(svd_full!), U, S, Vᴴ, m::Int, n::Int)
     for j in 1:max(m, n)
         if j <= min(m, n)
@@ -111,7 +151,6 @@ function gaugefix!(::typeof(svd_trunc!), U, S, Vᴴ, m::Int, n::Int)
     return (U, S, Vᴴ)
 end
 
-
 # Implementation
 # --------------
 function svd_full!(A::AbstractMatrix, USVᴴ, alg::LAPACK_SVDAlgorithm)
@@ -203,7 +242,39 @@ function svd_trunc!(A::AbstractMatrix, USVᴴ, alg::TruncatedAlgorithm)
     return truncate!(svd_trunc!, USVᴴ′, alg.trunc)
 end
 
-### GPU logic
+# Diagonal logic
+# --------------
+# Diagonal A: S gets |diag(A)| sorted descending, U the `sign_safe` values, Vᴴ the ones.
+function svd_full!(A::AbstractMatrix, USVᴴ, alg::DiagonalAlgorithm)
+    check_input(svd_full!, A, USVᴴ, alg)
+    U, S, Vᴴ = USVᴴ
+    a, σ = diagview(A), diagview(S)
+    σ .= abs.(a)
+    perm = sortperm(σ; rev=true)
+    permute!(σ, perm)
+    zero!(U)
+    zero!(Vᴴ)
+    unit = one(eltype(Vᴴ))
+    # column `col` of U and row `col` of Vᴴ pick out the original diagonal index `row`
+    @inbounds for (col, row) in enumerate(perm)
+        U[row, col] = sign_safe(a[row])
+        Vᴴ[col, row] = unit
+    end
+    return U, S, Vᴴ
+end
+function svd_compact!(A::AbstractMatrix, USVᴴ, alg::DiagonalAlgorithm)
+    return svd_full!(A, USVᴴ, alg)  # check_input enforces m == n, so shapes coincide
+end
+# Singular values of a diagonal `A`: the absolute values of its diagonal,
+# written into `S` and sorted in descending order.
+function svd_vals!(A::AbstractMatrix, S, alg::DiagonalAlgorithm)
+    check_input(svd_vals!, A, S, alg)
+    S .= abs.(diagview(A))
+    return sort!(S; rev=true)
+end
+
+# GPU logic
+# ---------
 # placed here to avoid code duplication since much of the logic is replicable across
 # CUDA and AMDGPU
 ###
@@ -213,12 +284,13 @@ const CUSOLVER_SVDAlgorithm = Union{CUSOLVER_QRIteration,
                                     CUSOLVER_Randomized}
 const ROCSOLVER_SVDAlgorithm = Union{ROCSOLVER_QRIteration,
                                      ROCSOLVER_Jacobi}
-const GPU_SVDAlgorithm = Union{CUSOLVER_SVDAlgorithm, ROCSOLVER_SVDAlgorithm}
+const GPU_SVDAlgorithm = Union{CUSOLVER_SVDAlgorithm,ROCSOLVER_SVDAlgorithm}
 
 const GPU_SVDPolar = Union{CUSOLVER_SVDPolar}
 const GPU_Randomized = Union{CUSOLVER_Randomized}
 
-function check_input(::typeof(svd_trunc!), A::AbstractMatrix, USVᴴ, alg::CUSOLVER_Randomized)
+function check_input(::typeof(svd_trunc!), A::AbstractMatrix, USVᴴ,
+                     alg::CUSOLVER_Randomized)
     m, n = size(A)
     minmn = min(m, n)
     U, S, Vᴴ = USVᴴ
@@ -232,7 +304,8 @@ function check_input(::typeof(svd_trunc!), A::AbstractMatrix, USVᴴ, alg::CUSOL
     return nothing
 end
 
-function initialize_output(::typeof(svd_trunc!), A::AbstractMatrix, alg::TruncatedAlgorithm{<:CUSOLVER_Randomized})
+function initialize_output(::typeof(svd_trunc!), A::AbstractMatrix,
+                           alg::TruncatedAlgorithm{<:CUSOLVER_Randomized})
     m, n = size(A)
     minmn = min(m, n)
     U = similar(A, (m, m))
@@ -241,10 +314,22 @@ function initialize_output(::typeof(svd_trunc!), A::AbstractMatrix, alg::Truncat
     return (U, S, Vᴴ)
 end
 
-_gpu_gesvd!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix, Vᴴ::AbstractMatrix) = throw(MethodError(_gpu_gesvd!, (A, S, U, Vᴴ)))
-_gpu_Xgesvdp!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix, Vᴴ::AbstractMatrix; kwargs...) = throw(MethodError(_gpu_Xgesvdp!, (A, S, U, Vᴴ)))
-_gpu_Xgesvdr!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix, Vᴴ::AbstractMatrix; kwargs...) = throw(MethodError(_gpu_Xgesvdr!, (A, S, U, Vᴴ)))
-_gpu_gesvdj!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix, Vᴴ::AbstractMatrix; kwargs...) = throw(MethodError(_gpu_gesvdj!, (A, S, U, Vᴴ)))
+function _gpu_gesvd!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix,
+                     Vᴴ::AbstractMatrix)
+    throw(MethodError(_gpu_gesvd!, (A, S, U, Vᴴ)))  # generic fallback: always errors
+end
+function _gpu_Xgesvdp!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix,
+                       Vᴴ::AbstractMatrix; kwargs...)
+    throw(MethodError(_gpu_Xgesvdp!, (A, S, U, Vᴴ)))  # fallback; kwargs are not reported
+end
+function _gpu_Xgesvdr!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix,
+                       Vᴴ::AbstractMatrix; kwargs...)
+    throw(MethodError(_gpu_Xgesvdr!, (A, S, U, Vᴴ)))  # fallback; kwargs are not reported
+end
+function _gpu_gesvdj!(A::AbstractMatrix, S::AbstractVector, U::AbstractMatrix,
+                      Vᴴ::AbstractMatrix; kwargs...)
+    throw(MethodError(_gpu_gesvdj!, (A, S, U, Vᴴ)))  # fallback; kwargs are not reported
+end
 # GPU SVD implementation
 function MatrixAlgebraKit.svd_full!(A::AbstractMatrix, USVᴴ, alg::GPU_SVDAlgorithm)
     check_input(svd_full!, A, USVᴴ, alg)
@@ -298,7 +383,7 @@ function MatrixAlgebraKit.svd_compact!(A::AbstractMatrix, USVᴴ, alg::GPU_SVDAl
         throw(ArgumentError("Unsupported SVD algorithm"))
     end
     # TODO: make this controllable using a `gaugefix` keyword argument
-    gaugefix!(svd_compact!, U, S, Vᴴ, size(A)...) 
+    gaugefix!(svd_compact!, U, S, Vᴴ, size(A)...)
     return USVᴴ
 end
 _argmaxabs(x) = reduce(_largest, x; init=zero(eltype(x)))
diff --git a/src/interface/svd.jl b/src/interface/svd.jl
@@ -97,6 +97,9 @@ end
 function default_svd_algorithm(::Type{T}; kwargs...) where {T<:YALAPACK.BlasMat}
     return LAPACK_DivideAndConquer(; kwargs...)
 end
+function default_svd_algorithm(::Type{T}; kwargs...) where {T<:Diagonal}
+    return DiagonalAlgorithm(; kwargs...)  # default for Diagonal inputs; kwargs forwarded
+end
 
 for f in (:svd_full!, :svd_compact!, :svd_vals!)
     @eval function default_algorithm(::typeof($f), ::Type{A}; kwargs...) where {A}
diff --git a/test/svd.jl b/test/svd.jl
@@ -5,7 +5,9 @@ using StableRNGs
 using LinearAlgebra: LinearAlgebra, Diagonal, I, isposdef
 using MatrixAlgebraKit: TruncatedAlgorithm, TruncationKeepAbove, diagview, isisometry
 
-@testset "svd_compact! for T = $T" for T in (Float32, Float64, ComplexF32, ComplexF64)
+const BLASFloats = (Float32, Float64, ComplexF32, ComplexF64)  # eltypes looped over by the testsets
+
+@testset "svd_compact! for T = $T" for T in BLASFloats
     rng = StableRNG(123)
     m = 54
     @testset "size ($m, $n)" for n in (37, m, 63, 0)
@@ -54,7 +56,7 @@ using MatrixAlgebraKit: TruncatedAlgorithm, TruncationKeepAbove, diagview, isiso
     end
 end
 
-@testset "svd_full! for T = $T" for T in (Float32, Float64, ComplexF32, ComplexF64)
+@testset "svd_full! for T = $T" for T in BLASFloats
     rng = StableRNG(123)
     m = 54
     @testset "size ($m, $n)" for n in (37, m, 63, 0)
@@ -88,7 +90,7 @@ end
     end
 end
 
-@testset "svd_trunc! for T = $T" for T in (Float32, Float64, ComplexF32, ComplexF64)
+@testset "svd_trunc! for T = $T" for T in BLASFloats
     rng = StableRNG(123)
     m = 54
     if LinearAlgebra.LAPACK.version() < v"3.12.0"
@@ -122,9 +124,7 @@ end
     end
 end
 
-@testset "svd_trunc! mix maxrank and tol for T = $T" for T in
-                                                         (Float32, Float64, ComplexF32,
-                                                          ComplexF64)
+@testset "svd_trunc! mix maxrank and tol for T = $T" for T in BLASFloats
     rng = StableRNG(123)
     if LinearAlgebra.LAPACK.version() < v"3.12.0"
         algs = (LAPACK_DivideAndConquer(), LAPACK_QRIteration(), LAPACK_Bisection())
@@ -152,9 +152,7 @@ end
     end
 end
 
-@testset "svd_trunc! specify truncation algorithm T = $T" for T in
-                                                              (Float32, Float64, ComplexF32,
-                                                               ComplexF64)
+@testset "svd_trunc! specify truncation algorithm T = $T" for T in BLASFloats
     rng = StableRNG(123)
     m = 4
     U = qr_compact(randn(rng, T, m, m))[1]
@@ -166,3 +164,37 @@ end
     @test diagview(S2) ≈ diagview(S)[1:2] rtol = sqrt(eps(real(T)))
     @test_throws ArgumentError svd_trunc(A; alg, trunc=(; maxrank=2))
 end
+
+@testset "svd for Diagonal{$T}" for T in BLASFloats
+    rng = StableRNG(123)
+    for m in (54, 0)  # a regular size and the empty matrix
+        Ad = randn(rng, T, m)  # draw from the seeded rng so the data is reproducible
+        A = Diagonal(Ad)
+
+        U, S, Vᴴ = @constinferred svd_compact(A)
+        @test U isa AbstractMatrix{T} && size(U) == size(A)
+        @test Vᴴ isa AbstractMatrix{T} && size(Vᴴ) == size(A)
+        @test S isa Diagonal{real(T)} && size(S) == size(A)
+        @test isunitary(U)
+        @test isunitary(Vᴴ)
+        @test all(≥(0), diagview(S))
+        @test A ≈ U * S * Vᴴ
+
+        U, S, Vᴴ = @constinferred svd_full(A)  # same checks as for svd_compact above
+        @test U isa AbstractMatrix{T} && size(U) == size(A)
+        @test Vᴴ isa AbstractMatrix{T} && size(Vᴴ) == size(A)
+        @test S isa Diagonal{real(T)} && size(S) == size(A)
+        @test isunitary(U)
+        @test isunitary(Vᴴ)
+        @test all(≥(0), diagview(S))
+        @test A ≈ U * S * Vᴴ
+
+        S2 = @constinferred svd_vals(A)
+        @test S2 isa AbstractVector{real(T)} && length(S2) == m
+        @test S2 ≈ diagview(S)  # values must agree with the diagonal of S from svd_full
+
+        alg = TruncatedAlgorithm(DiagonalAlgorithm(), truncrank(2))
+        U3, S3, Vᴴ3 = @constinferred svd_trunc(A; alg)
+        @test diagview(S3) ≈ S2[1:min(m, 2)]  # min(m, 2) covers the empty case m == 0
+    end
+end