FluxML · nomadbl · May 24, 2023 · May 24, 2023 · May 24, 2023 · May 25, 2023
diff --git a/src/onehot.jl b/src/onehot.jl
@@ -48,7 +48,7 @@ end
 _findval(val, labels::Tuple{}, i::Integer) = nothing
 
 """
-    onehotbatch(xs, labels, [default])
+    onehotbatch(xs, labels, [default]; dims::Val{D}=Val{1})
-    onehotbatch(xs, labels, [default]; dims::Val{D}=Val{1})
+    onehotbatch(xs, labels, [default]; dims = Val(1))
-    onehotbatch(xs, labels, [default]; dims::Val{D}=Val{1})
+    onehotbatch(xs, labels, [default]; dims = Val(1))
 
 Returns a [`OneHotMatrix`](@ref) where `k`th column of the matrix is [`onehot(xs[k], labels)`](@ref onehot).
 This is a sparse matrix, which stores just a `Vector{UInt32}` containing the indices of the
@@ -64,6 +64,8 @@ i.e. `result[:, k...] == onehot(xs[k...], labels)`.
 Note that `xs` can be any iterable, such as a string. And that using a tuple
 for `labels` will often speed up construction, certainly for less than 32 classes.
 
+If dims keyword is given, the onehot vectors lie on the [dims] dimension rather than the first one.
-If dims keyword is given, the onehot vectors lie on the [dims] dimension rather than the first one.
+If the `dims` keyword is given, the one-hot vectors lie along dimension `dims` rather than the first one. `dims` should be provided as a `Val` to guarantee type stability (a plain integer is accepted as well).
-If dims keyword is given, the onehot vectors lie on the [dims] dimension rather than the first one.
+If the `dims` keyword is given, the one-hot vectors lie along dimension `dims` rather than the first one. `dims` should be provided as a `Val` to guarantee type stability (a plain integer is accepted as well).
+
 # Examples
 ```jldoctest
 julia> oh = onehotbatch("abracadabra", 'a':'e', 'e')
@@ -74,30 +76,40 @@ julia> oh = onehotbatch("abracadabra", 'a':'e', 'e')
  ⋅  ⋅  ⋅  ⋅  ⋅  ⋅  1  ⋅  ⋅  ⋅  ⋅
  ⋅  ⋅  1  ⋅  ⋅  ⋅  ⋅  ⋅  ⋅  1  ⋅
 
+julia> onehotbatch("abracadabra", 'a':'e', 'e'; dims=2)
+11×5 OneHotMatrix(::Vector{UInt32}) with eltype Bool:
+ 1  ⋅  ⋅  ⋅  ⋅
+ ⋅  1  ⋅  ⋅  ⋅
+ ⋅  ⋅  ⋅  ⋅  1
+ 1  ⋅  ⋅  ⋅  ⋅
+ ⋅  ⋅  1  ⋅  ⋅
+ 1  ⋅  ⋅  ⋅  ⋅
+ ⋅  ⋅  ⋅  1  ⋅
+ 1  ⋅  ⋅  ⋅  ⋅
+ ⋅  1  ⋅  ⋅  ⋅
+ ⋅  ⋅  ⋅  ⋅  1
+ 1  ⋅  ⋅  ⋅  ⋅
+
 julia> reshape(1:15, 3, 5) * oh  # this matrix multiplication is done efficiently
 3×11 Matrix{Int64}:
  1  4  13  1  7  1  10  1  4  13  1
  2  5  14  2  8  2  11  2  5  14  2
  3  6  15  3  9  3  12  3  6  15  3
 ```
 """
-onehotbatch(data, labels, default...) = _onehotbatch(data, length(labels) < 32 ? Tuple(labels) : labels, default...)
 
-function _onehotbatch(data, labels)
-  indices = UInt32[something(_findval(i, labels), 0) for i in data]
-  if 0 in indices
-    for x in data
-      isnothing(_findval(x, labels)) && error("Value $x not found in labels")
-    end
+onehotbatch(data, labels, default...; dims = Val(1)) =
+  onehotbatch(collect(data), labels, default...; dims = dims)
+# The method above accepts any iterable (a `String`, a generator, a tuple, ...) and
+# materialises it with `collect`, so the array method below always sees an array.
+# Ranges are materialised the same way.
+onehotbatch(data::AbstractRange, labels, default...; dims = Val(1)) =
+  onehotbatch(collect(data), labels, default...; dims = dims)
+
+# Build the one-hot array (one-hot vectors along the first dimension) and, if requested,
+# lazily move that dimension to position `dims`.
+# `dims` may be a `Val` (type stable) or a plain integer (convenient, not type stable).
+function onehotbatch(data::AbstractArray, labels, default...; dims = Val(1))
+  out = _onehotbatch(data, length(labels) < 32 ? Tuple(labels) : labels, default...)
+  return _onehot_along(out, dims)
+end
+
+# Lifting a run-time integer into the type domain costs one dynamic dispatch.
+_onehot_along(out::AbstractArray, dims::Integer) = _onehot_along(out, Val(Int(dims)))
+
+# Return `out` with its first (one-hot) dimension moved to position `D`; the remaining
+# (batch) dimensions keep their relative order. No data is copied.
+# Throws an `ArgumentError` when `D` is not an integer in `1:ndims(out)`.
+function _onehot_along(out::AbstractArray{T,M}, ::Val{D}) where {T,M,D}
+  if D == 1
+    return out
+  else
+    D isa Integer && 1 <= D <= M ||
+      throw(ArgumentError("dims must be an integer between 1 and $M, got $D"))
+    # dimension d of the result is read from dimension perm[d] of `out`
+    perm = ntuple(d -> d < D ? d + 1 : (d == D ? 1 : d), Val(M))
+    iperm = invperm(perm)
+    # the fully parameterised constructor keeps the permutation in the type domain
+    return PermutedDimsArray{T,M,perm,iperm,typeof(out)}(out)
   end
-  return OneHotArray(indices, length(labels))
-end
-
-function _onehotbatch(data, labels, default)
-  default_index = _findval(default, labels)
-  isnothing(default_index) && error("Default value $default is not in labels")
-  indices = UInt32[something(_findval(i, labels), default_index) for i in data]
-  return OneHotArray(indices, length(labels))
 end
 
 function onehotbatch(data::AbstractArray{<:Integer}, labels::AbstractUnitRange{<:Integer})
@@ -108,6 +120,8 @@ function onehotbatch(data::AbstractArray{<:Integer}, labels::AbstractUnitRange{<
   indices = UInt32.(data .+ offset)
   return OneHotArray(indices, length(labels))
 end
+# An integer range paired with integer unit-range labels matches both the `AbstractRange`
+# method and the `AbstractArray{<:Integer}` method, neither of which is more specific.
+# This method settles the choice: collect the range and take the integer fast path.
+function onehotbatch(data::AbstractRange{<:Integer}, labels::AbstractUnitRange{<:Integer})
+  return onehotbatch(collect(data), labels)
+end
+
 # That bounds check with extrema synchronises on GPU, much slower than rest of the function,
 # hence add a special method, with a less helpful error message:
 function onehotbatch(data::AbstractGPUArray{<:Integer}, labels::AbstractUnitRange{<:Integer})
@@ -120,6 +134,24 @@ function onehotbatch(data::AbstractGPUArray{<:Integer}, labels::AbstractUnitRang
   return OneHotArray(indices, length(labels))
 end
 
+
+# Map every element of `data` to its position in `labels` and wrap the positions in a
+# `OneHotArray`. Errors if any element is missing from `labels`.
+function _onehotbatch(data, labels)
+  # 0 is never a valid position, so it serves as the "not found" marker
+  indices = UInt32[something(_findval(x, labels), 0) for x in data]
+  if any(iszero, indices)
+    # rescan only on failure, so the message can name the first offending value
+    for x in data
+      _findval(x, labels) === nothing && error("Value $x not found in labels")
+    end
+  end
+  return OneHotArray(indices, length(labels))
+end
+
+# As the two-argument method, except that elements missing from `labels` are encoded as
+# `default`. Errors if `default` itself is not one of the labels.
+function _onehotbatch(data, labels, default)
+  fallback = _findval(default, labels)
+  fallback === nothing && error("Default value $default is not in labels")
+  indices = UInt32[something(_findval(x, labels), fallback) for x in data]
+  return OneHotArray(indices, length(labels))
+end
+
 """
     onecold(y::AbstractArray, labels = 1:size(y,1))
 

diff --git a/test/onehot.jl b/test/onehot.jl
@@ -69,3 +69,17 @@ end
   @test y[:,1] isa OneHotVector
   @test y[:,:] isa OneHotMatrix
 end
+
+@testset "onehotbatch dims" begin
+  swapped = Bool[0 1 0; 1 0 0]
+
+  # one-hot vectors laid out along the second dimension, without and with a default
+  @test onehotbatch([20, 10], 10:10:30; dims=Val(2)) == swapped
+  @test onehotbatch([10, 20], [30, 40, 50], 30; dims=Val(2)) == Bool[1 0 0; 1 0 0]
+
+  # matrix input: the label axis becomes dimension 2, with exactly one hit per element
+  grid = reshape(collect(1:12), 3, 4)
+  @test size(onehotbatch(grid, 1:12; dims=Val(2))) == (3, 12, 4)
+  @test vec(sum(onehotbatch(grid, 1:12; dims=Val(2)); dims=2)) == ones(12)
+
+  # string input
+  @test onehotbatch("ba", 'a':'c'; dims=Val(2)) == swapped
+
+  # the `Val` form must be inferrable
+  @test @inferred(onehotbatch([20, 10], 10:10:30; dims=Val(2))) == swapped
+  @test @inferred(onehotbatch([40, 10], (10,20,30), 20; dims=Val(2))) == swapped
+end