Propagate NaNs and update tests (#260)
* Fix promotion of F64, add compat bounds for stdlibs

* Test == 0, not > 0 to propagate NaNs

* Fix indexing of data in tests to ensure inputs match

* Fix and extend DimensionMismatch tests and check for new NaNs

* Floating point rounding error fix

* gkl_divergence() needs the same types as kl_divergence() and renyi_divergence()

* Remove unnecessary update

* Update workflow versions

* Another floating point rounding error

* Update zero() to iszero()

* Add in testing of different input types

* Add in additional testing

* Update compats and fix using

* Fix for new stdlib dependency requirements

* Fix promote_type to promote_rule

* Fixing stdlib deps for julia 1.0 and 1.9 together

* Remove Requires dependency

* Revert workflow changes

---------

Co-authored-by: Daniel Karrasch <[email protected]>
richardreeve and dkarrasch authored Nov 30, 2023
1 parent 6d0110d commit 886ad02
Showing 6 changed files with 46 additions and 37 deletions.
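The behavioral heart of the commit is easiest to see in isolation: every comparison with NaN evaluates to false, so a guard like ai > 0 silently routes a NaN input to the zero branch, while iszero(ai) lets NaN reach the arithmetic and propagate. A minimal Julia sketch of the two guards (kl_term_old and kl_term_new are illustrative names, not the package code):

kl_term_old(ai, bi) = ai > 0 ? ai * log(ai / bi) : 0.0      # NaN > 0 is false
kl_term_new(ai, bi) = iszero(ai) ? 0.0 : ai * log(ai / bi)  # iszero(NaN) is also false

kl_term_old(NaN, 0.5)  # 0.0 -- the NaN is silently swallowed
kl_term_new(NaN, 0.5)  # NaN -- propagated, as the new tests require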
4 changes: 2 additions & 2 deletions .github/workflows/CI.yml
@@ -26,7 +26,7 @@ jobs:
arch:
- x64
steps:
- uses: actions/checkout@v2
- uses: actions/checkout@v4
- uses: julia-actions/setup-julia@v1
with:
version: ${{ matrix.version }}
@@ -37,7 +37,7 @@
coverage: ${{ matrix.version != '1' }}
- uses: julia-actions/julia-processcoverage@v1
if: matrix.version != '1'
- uses: codecov/codecov-action@v1
- uses: codecov/codecov-action@v3
if: matrix.version != '1'
with:
file: lcov.info
5 changes: 4 additions & 1 deletion Project.toml
@@ -1,6 +1,6 @@
name = "Distances"
uuid = "b4f34e82-e78d-54a5-968a-f98e89d6e8f7"
version = "0.10.10"
version = "0.10.11"

[deps]
LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
@@ -18,6 +18,9 @@ DistancesSparseArraysExt = "SparseArrays"

[compat]
ChainRulesCore = "1"
LinearAlgebra = "<0.0.1, 1"
SparseArrays = "<0.0.1, 1"
Statistics = "<0.0.1, 1"
StatsAPI = "1"
julia = "1"

1 change: 0 additions & 1 deletion ext/DistancesSparseArraysExt.jl
@@ -4,7 +4,6 @@ using Distances
import Distances: _evaluate
using Distances: UnionMetrics, result_type, eval_start, eval_op, eval_reduce, eval_end
using SparseArrays: SparseVectorUnion, nonzeroinds, nonzeros, nnz
using SparseArrays: SparseVectorUnion

eval_op_a(d, ai, b) = eval_op(d, ai, zero(eltype(b)))
eval_op_b(d, bi, a) = eval_op(d, zero(eltype(a)), bi)
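For context, this extension evaluates metrics over only the stored entries of sparse vectors; at indices where just one argument has a stored value, the other side is a structural zero, which is what eval_op_a and eval_op_b supply. A usage sketch (the vectors here are made up for illustration):

using Distances, SparseArrays

a = sparsevec([1, 3], [1.0, 2.0], 4)  # [1.0, 0.0, 2.0, 0.0]
b = sparsevec([3, 4], [5.0, 7.0], 4)  # [0.0, 0.0, 5.0, 7.0]
sqeuclidean(a, b)                     # 1^2 + (2 - 5)^2 + 7^2 = 59.0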
24 changes: 12 additions & 12 deletions src/metrics.jl
@@ -423,12 +423,12 @@ const chisq_dist = ChiSqDist()

# KLDivergence
@inline eval_op(dist::KLDivergence, ai, bi) =
ai > 0 ? ai * log(ai / bi) : zero(eval_op(dist, oneunit(ai), bi))
iszero(ai) ? zero(eval_op(dist, oneunit(ai), bi)) : ai * log(ai / bi)
const kl_divergence = KLDivergence()

# GenKLDivergence
@inline eval_op(dist::GenKLDivergence, ai, bi) =
ai > 0 ? ai * log(ai / bi) - ai + bi : oftype(eval_op(dist, oneunit(ai), bi), bi)
iszero(ai) ? oftype(eval_op(dist, oneunit(ai), bi), bi) : ai * log(ai / bi) - ai + bi
const gkl_divergence = GenKLDivergence()

# RenyiDivergence
@@ -437,8 +437,8 @@ Base.@propagate_inbounds function eval_start(::RenyiDivergence, a, b)
zero(T), zero(T), T(sum(a)), T(sum(b))
end

@inline function eval_op(dist::RenyiDivergence, ai::T, bi::T) where {T <: Real}
if ai == zero(T)
@inline function eval_op(dist::RenyiDivergence, ai::T, bi::T) where T
if iszero(ai)
return zero(T), zero(T), zero(T), zero(T)
elseif dist.is_normal
return ai, ai * ((ai / bi)^dist.p), zero(T), zero(T)
@@ -452,12 +452,12 @@ end
end

@inline function eval_reduce(dist::RenyiDivergence,
s1::Tuple{T,T,T,T},
s2::Tuple{T,T,T,T}) where {T <: Real}
s1::Tuple{T,T,T,T},
s2::Tuple{T,T,T,T}) where T
if dist.is_inf
if s1[1] == zero(T)
if iszero(s1[1])
return (s2[1], s2[2], s1[3], s1[4])
elseif s2[1] == zero(T)
elseif iszero(s2[1])
return s1
else
return s1[2] > s2[2] ? s1 : (s2[1], s2[2], s1[3], s1[4])
@@ -487,11 +487,11 @@ end

# JSDivergence

@inline function eval_op(::JSDivergence, ai::T, bi::T) where {T}
@inline function eval_op(::JSDivergence, ai::T, bi::T) where T
u = (ai + bi) / 2
ta = ai > 0 ? ai * log(ai) / 2 : zero(log(one(T)))
tb = bi > 0 ? bi * log(bi) / 2 : zero(log(one(T)))
tu = u > 0 ? u * log(u) : zero(log(one(T)))
ta = iszero(ai) ? zero(log(one(T))) : ai * log(ai) / 2
tb = iszero(bi) ? zero(log(one(T))) : bi * log(bi) / 2
tu = iszero(u) ? zero(log(one(T))) : u * log(u)
ta + tb - tu
end
const js_divergence = JSDivergence()
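Dropping the T <: Real bounds above is what lets the duck-typed F64 wrapper from the test suite (next file) flow through eval_op and eval_reduce: any element type that supports iszero, zero, and the arithmetic in the body now works. A self-contained sketch, where Wrap and term are hypothetical stand-ins for the test type and eval_op:

struct Wrap
    x::Float64
end
Base.iszero(a::Wrap) = iszero(a.x)
Base.zero(::Type{Wrap}) = Wrap(0.0)

term(ai::T, bi::T) where T = iszero(ai) ? zero(T) : ai  # shape of the relaxed guard

term(Wrap(0.0), Wrap(1.0))  # Wrap(0.0) -- no Real subtyping required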
4 changes: 2 additions & 2 deletions test/F64.jl
@@ -37,8 +37,8 @@ Base.:<=(a::F64, b::F64) = a.x <= b.x
Base.eps(::Type{F64}) = eps(Float64)

# promotion
Base.promote_type(::Type{Float32}, ::Type{F64}) = Float64 # for eig
Base.promote_type(::Type{Float64}, ::Type{F64}) = Float64 # for vecnorm
Base.promote_rule(::Type{Float32}, ::Type{F64}) = Float64 # for eig
Base.promote_rule(::Type{Float64}, ::Type{F64}) = Float64 # for vecnorm
Base.promote(a::F64, b::T) where {T <: Number} = a, F64(float(b))
Base.promote(a::T, b::F64) where {T <: Number} = F64(float(a)), b

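The promote_type to promote_rule switch follows Julia's promotion contract: user code extends Base.promote_rule, and Base derives promote_type (and promote) from those rules, so methods added directly to promote_type can be bypassed. A minimal sketch with a hypothetical wrapper type MyNum:

struct MyNum <: Real
    x::Float64
end
Base.promote_rule(::Type{Float64}, ::Type{MyNum}) = Float64

promote_type(Float64, MyNum)  # Float64, derived from the rule above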
45 changes: 26 additions & 19 deletions test/test_dists.jl
@@ -222,7 +222,7 @@ end
for (x, y) in ((x, y), (sparsevec(x), sparsevec(y)),
(convert(Array{Union{Missing, T}}, x), convert(Array{Union{Missing, T}}, y)),
((Iterators.take(x, 4), Iterators.take(y, 4))), # iterator
(((x[i] for i in 1:length(x)), (y[i] for i in 1:length(y)))), # generator
(((x[i] for i in eachindex(x)), (y[i] for i in eachindex(y)))), # generator
)
xc, yc = collect(x), collect(y)
@test sqeuclidean(x, y) == 57.0
@@ -241,14 +241,14 @@ end
x_int, y_int = Int64.(x), Int64.(y)
@test cosine_dist(x_int, y_int) == (1.0 - 112.0 / sqrt(19530.0))
@test corr_dist(x, y) ≈ cosine_dist(x .- mean(x), vec(yc) .- mean(y))
@test corr_dist(OffsetVector(xc, -1:length(xc)-2), yc) == corr_dist(x, y)
@test corr_dist(OffsetVector(xc, eachindex(xc).-2), yc) == corr_dist(x, y)
@test chisq_dist(x, y) == sum((xc - vec(yc)).^2 ./ (xc + vec(yc)))
@test spannorm_dist(x, y) == maximum(xc - vec(yc)) - minimum(xc - vec(yc))

@test gkl_divergence(x, y) ≈ sum(i -> xc[i] * log(xc[i] / yc[i]) - xc[i] + yc[i], 1:length(x))

@test meanad(x, y) ≈ mean(Float64[abs(xc[i] - yc[i]) for i in 1:length(x)])
@test msd(x, y) ≈ mean(Float64[abs2(xc[i] - yc[i]) for i in 1:length(x)])
@test kl_divergence(x, y) ≈ sum(xc[i] * log(xc[i] / yc[i]) for i in eachindex(xc, yc))
@test gkl_divergence(x, y) ≈ sum(xc[i] * log(xc[i] / yc[i]) - xc[i] + yc[i] for i in eachindex(xc, yc))
@test bhattacharyya(x, y) == bhattacharyya(xc, yc)
@test meanad(x, y) ≈ mean(Float64[abs(xc[i] - yc[i]) for i in eachindex(xc, yc)])
@test msd(x, y) ≈ mean(Float64[abs2(xc[i] - yc[i]) for i in eachindex(xc, yc)])
@test rmsd(x, y) ≈ sqrt(msd(x, y))
@test nrmsd(x, y) ≈ sqrt(msd(x, y)) / (maximum(x) - minimum(x))

@@ -257,7 +257,7 @@

w = rand(Float64, length(x))
@test wsqeuclidean(x, y, w) ≈ dot((xc - vec(yc)).^2, w)
@test weuclidean(x, y, w) == sqrt(wsqeuclidean(x, y, w))
@test weuclidean(x, y, w) ≈ sqrt(wsqeuclidean(x, y, w))
@test wcityblock(x, y, w) ≈ dot(abs.(xc - vec(yc)), w)
@test wminkowski(x, y, w, 2) ≈ weuclidean(x, y, w)
end
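The weuclidean test just above now uses isapprox rather than exact equality, matching the "floating point rounding error" items in the commit message: mathematically equal expressions need not be bitwise equal once evaluation order differs. The classic illustration:

(0.1 + 0.2) + 0.3 == 0.1 + (0.2 + 0.3)  # false: Float64 addition is not associative
(0.1 + 0.2) + 0.3 ≈ 0.1 + (0.2 + 0.3)   # true: isapprox absorbs the last-ulp gap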
@@ -272,7 +272,7 @@ end
w = rand(T, size(a))

@test whamming(a, a, w) === T(0.0)
@test whamming(a, b, w) === sum((a .!= b) .* w)
@test whamming(a, b, w) ≈ (a .≠ b) ⋅ w

# Minimal test of Jaccard - test return type stability.
@inferred Jaccard()(rand(T, 3), rand(T, 3))
@@ -295,7 +295,7 @@ end
q /= sum(q)

klv = 0.0
for i = 1:length(p)
for i in eachindex(p, q)
if p[i] > 0
klv += p[i] * log(p[i] / q[i])
end
@@ -304,7 +304,7 @@ end
pm = (p + q) / 2
for (r, p, pm) in ((r, p, pm),
(Iterators.take(r, length(r)), Iterators.take(p, length(p)), Iterators.take(pm, length(pm))),
((r[i] for i in 1:length(r)), (p[i] for i in 1:length(p)), (pm[i] for i in 1:length(pm))),
((r[i] for i in eachindex(r)), (p[i] for i in eachindex(p)), (pm[i] for i in eachindex(pm))),
)
@test kl_divergence(p, q) ≈ klv
@test typeof(kl_divergence(p, q)) == T
@@ -330,6 +330,9 @@ end # testset
a = [NaN, 0]; b = [0, 1]
@test isnan(chebyshev(a, b)) == isnan(maximum(a - b))
@test isnan(renyi_divergence([0.5, 0.0, 0.5], [0.5, 0.5, NaN], 2))
@test isnan(kl_divergence([0.5, 0.0, 0.5], [0.5, 0.5, NaN]))
@test isnan(gkl_divergence([0.5, 0.0, 0.5], [0.5, 0.5, NaN]))
@test isnan(js_divergence([0.5, 0.0, 0.5], [0.5, 0.5, NaN]))
end #testset

@testset "empty vector" begin
@@ -364,6 +367,12 @@ end #testset
end # testset

@testset "DimensionMismatch throwing" begin
a = 1.0:2; b = 1:3.0
@test_throws DimensionMismatch cosine_dist(a, b)
@test_throws DimensionMismatch kl_divergence(a, b)
@test_throws DimensionMismatch gkl_divergence(a, b)
@test_throws DimensionMismatch js_divergence(a, b)
@test_throws DimensionMismatch renyi_divergence(a, b, 1.0)
a = [1, 0]; b = [2]
@test_throws DimensionMismatch sqeuclidean(a, b)
a = (1, 0); b = (2,)
@@ -414,23 +423,21 @@ end # testset
@test (@inferred peuclidean(x, y, fill(10, 4))) == sqrt(37)
@test (@inferred peuclidean(x - vec(y), zero(y), fill(10, 4))) == peuclidean(x, y, fill(10, 4))
@test (@inferred peuclidean(x, y, [10.0, 10.0, 10.0, Inf])) == sqrt(57)
@test_throws DimensionMismatch cosine_dist(1.0:2, 1.0:3)
@test (@inferred cosine_dist(x, y)) ≈ (1 - 112 / sqrt(19530))
@test (@inferred corr_dist(x, y)) ≈ cosine_dist(x .- mean(x), vec(y) .- mean(y))
@test (@inferred chisq_dist(x, y)) == sum((x - vec(y)).^2 ./ (x + vec(y)))
@test (@inferred spannorm_dist(x, y)) == maximum(x - vec(y)) - minimum(x - vec(y))

@test (@inferred gkl_divergence(x, y)) ≈ sum(i -> x[i] * log(x[i] / y[i]) - x[i] + y[i], 1:length(x))

@test (@inferred meanad(x, y)) ≈ mean(Float64[abs(x[i] - y[i]) for i in 1:length(x)])
@test (@inferred msd(x, y)) ≈ mean(Float64[abs2(x[i] - y[i]) for i in 1:length(x)])
@test (@inferred kl_divergence(x, y)) ≈ sum(x[i] * log(x[i] / y[i]) for i in eachindex(x, y))
@test (@inferred gkl_divergence(x, y)) ≈ sum(x[i] * log(x[i] / y[i]) - x[i] + y[i] for i in eachindex(x, y))
@test (@inferred meanad(x, y)) ≈ mean(Float64[abs(x[i] - y[i]) for i in eachindex(x, y)])
@test (@inferred msd(x, y)) ≈ mean(Float64[abs2(x[i] - y[i]) for i in eachindex(x, y)])
@test (@inferred rmsd(x, y)) ≈ sqrt(msd(x, y))
@test (@inferred nrmsd(x, y)) ≈ sqrt(msd(x, y)) / (maximum(x) - minimum(x))

w = ones(Int, 4)
@test sqeuclidean(x, y) ≈ wsqeuclidean(x, y, w)

w = rand(1:length(x), size(x))
w = rand(eachindex(x), size(x))
@test (@inferred wsqeuclidean(x, y, w)) ≈ dot((x - vec(y)).^2, w)
@test (@inferred weuclidean(x, y, w)) == sqrt(wsqeuclidean(x, y, w))
@test (@inferred wcityblock(x, y, w)) ≈ dot(abs.(x - vec(y)), w)
@@ -972,7 +979,7 @@ end
G(p) = -1 * sum(log.(p))
∇G(p) = map(x -> -1 * x^(-1), p)
function ISdist(p::AbstractVector, q::AbstractVector)
return sum([p[i]/q[i] - log(p[i]/q[i]) - 1 for i in 1:length(p)])
return sum([p[i]/q[i] - log(p[i]/q[i]) - 1 for i in eachindex(p, q)])
end
@test bregman(G, ∇G, p, q) ≈ ISdist(p, q)
end
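A note on the recurring 1:length(x) to eachindex(x) / eachindex(xc, yc) edits above: besides supporting offset axes (exercised by the OffsetVector test), the multi-argument form checks that all arguments share axes and throws DimensionMismatch otherwise, the same contract the new @test_throws cases pin down. A sketch with made-up sizes:

p, q = rand(3), rand(4)
eachindex(p, q)  # throws DimensionMismatch: p and q have different axes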

2 comments on commit 886ad02

@devmotion

@JuliaRegistrator

Registration pull request created: JuliaRegistries/General/96235

Tip: Release Notes

Did you know you can add release notes too? Just add markdown-formatted text underneath the comment after the text
"Release notes:" and it will be added to the registry PR, and, if TagBot is installed, it will also be added to the
release that TagBot creates. For example:

@JuliaRegistrator register

Release notes:

## Breaking changes

- blah

To add them here just re-invoke and the PR will be updated.

Tagging

After the above pull request is merged, it is recommended that a tag is created on this repository for the registered package version.

This will be done automatically if the Julia TagBot GitHub Action is installed, or can be done manually through the GitHub interface, or via:

git tag -a v0.10.11 -m "<description of version>" 886ad020bcc6b208069f31c07224baf62151b139
git push origin v0.10.11
