diff --git a/.buildkite/pipeline.yml b/.buildkite/pipeline.yml
new file mode 100644
index 00000000..379da306
--- /dev/null
+++ b/.buildkite/pipeline.yml
@@ -0,0 +1,37 @@
+steps:
+  - label: "Nvidia GPUs -- RegularizedLeastSquares.jl"
+    plugins:
+      - JuliaCI/julia#v1:
+          version: "1.10"
+    agents:
+      queue: "juliagpu"
+      cuda: "*"
+    command: |
+      julia --color=yes --project -e '
+        using Pkg
+        Pkg.add("TestEnv")
+        using TestEnv
+        TestEnv.activate();
+        Pkg.add("CUDA")
+        Pkg.instantiate()
+        include("test/gpu/cuda.jl")'
+    timeout_in_minutes: 30
+
+  - label: "AMD GPUs -- RegularizedLeastSquares.jl"
+    plugins:
+      - JuliaCI/julia#v1:
+          version: "1.10"
+    agents:
+      queue: "juliagpu"
+      rocm: "*"
+      rocmgpu: "*"
+    command: |
+      julia --color=yes --project -e '
+        using Pkg
+        Pkg.add("TestEnv")
+        using TestEnv
+        TestEnv.activate();
+        Pkg.add("AMDGPU")
+        Pkg.instantiate()
+        include("test/gpu/rocm.jl")'
+    timeout_in_minutes: 30
\ No newline at end of file
diff --git a/Project.toml b/Project.toml
index 40450a36..44c689fc 100644
--- a/Project.toml
+++ b/Project.toml
@@ -16,10 +16,14 @@ SparseArrays = "2f01184e-e22b-5df5-ae63-d93ebab69eaf"
 VectorizationBase = "3d5dd08c-fd9d-11e8-17fa-ed2836048c2f"
 InteractiveUtils = "b77e0a4c-d291-57a0-90e8-8db25a27a240"
 
+[weakdeps]
+GPUArrays = "0c68f7d7-f131-5f86-a1c3-88cf8149b2d7"
+
 [extras]
 Test = "8dfed614-e22c-5e08-85e1-65c5234f0b40"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 FFTW = "7a1cc6ca-52ef-59f5-83cd-3a7055c09341"
+JLArrays = "27aeb0d3-9eb9-45fb-866b-73c2ecf80fcb"
 
 [compat]
 IterativeSolvers = "0.9"
@@ -27,9 +31,14 @@ julia = "1.9"
 StatsBase = "0.33, 0.34"
 VectorizationBase = "0.19, 0.21"
 FFTW = "1.0"
-LinearOperatorCollection = "1.2"
-LinearOperators = "2.3.3"
 FLoops = "0.2"
+GPUArrays = "8, 9, 10"
+JLArrays = "0.1.2"
+LinearOperatorCollection = "2"
+LinearOperators = "2.3.3"
 
 [targets]
-test = ["Test", "Random", "FFTW"]
+test = ["Test", "Random", "FFTW", "JLArrays"]
+
+[extensions]
+RegularizedLeastSquaresGPUArraysExt = "GPUArrays"
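With the new `[weakdeps]`/`[extensions]` setup, the GPU code is loaded automatically as soon as a GPUArrays-based backend package is present. A minimal usage sketch (assuming CUDA.jl is installed; solver choice and problem sizes are illustrative):

```julia
using RegularizedLeastSquares
using CUDA  # loading a GPUArrays backend activates RegularizedLeastSquaresGPUArraysExt

A = CuArray(randn(Float32, 64, 32))
b = CuArray(randn(Float32, 64))

solver = createLinearSolver(CGNR, A; iterations = 32)
x = solve!(solver, b)  # solver state is re-allocated on the GPU via similar(b, ...)
```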
diff --git a/ext/RegularizedLeastSquaresGPUArraysExt/Kaczmarz.jl b/ext/RegularizedLeastSquaresGPUArraysExt/Kaczmarz.jl
new file mode 100644
index 00000000..279828ba
--- /dev/null
+++ b/ext/RegularizedLeastSquaresGPUArraysExt/Kaczmarz.jl
@@ -0,0 +1,15 @@
+function RegularizedLeastSquares.iterate_row_index(solver::Kaczmarz, state::RegularizedLeastSquares.KaczmarzState{T, vecT}, A, row, index) where {T, vecT <: AbstractGPUArray}
+  state.τl = RegularizedLeastSquares.dot_with_matrix_row(A, state.x, row)
+  @allowscalar state.αl = solver.denom[index] * (state.u[row] - state.τl - state.ɛw * state.vl[row])
+  RegularizedLeastSquares.kaczmarz_update!(A, state.x, row, state.αl)
+  @allowscalar state.vl[row] += state.αl * state.ɛw
+end
+
+function RegularizedLeastSquares.kaczmarz_update!(A, x::vecT, row, beta) where {T, vecT <: AbstractGPUVector{T}}
+  x[:] .= x .+ beta * conj.(view(A, row, :))
+end
+
+function RegularizedLeastSquares.kaczmarz_update!(B::Transpose{T, S}, x::vecT, row, beta) where {T, S <: AbstractGPUArray{T}, vecT <: AbstractGPUVector{T}}
+  A = B.parent
+  x[:] .= x .+ beta * conj.(view(A, :, row))
+end
diff --git a/ext/RegularizedLeastSquaresGPUArraysExt/ProxL21.jl b/ext/RegularizedLeastSquaresGPUArraysExt/ProxL21.jl
new file mode 100644
index 00000000..da70c268
--- /dev/null
+++ b/ext/RegularizedLeastSquaresGPUArraysExt/ProxL21.jl
@@ -0,0 +1,11 @@
+function RegularizedLeastSquares.proxL21!(x::vecT, λ::T, slices::Int64) where {T, vecT <: Union{AbstractGPUVector{T}, AbstractGPUVector{Complex{T}}}}
+  sliceLength = div(length(x), slices)
+  groupNorm = copyto!(similar(x, T, sliceLength), [T(norm(x[i:sliceLength:end])) for i = 1:sliceLength])
+
+  gpu_call(x, λ, groupNorm, sliceLength) do ctx, x_, λ_, groupNorm_, sliceLength_
+    i = @linearidx(x_)
+    @inbounds x_[i] = x_[i] * max((groupNorm_[mod1(i, sliceLength_)] - λ_) / groupNorm_[mod1(i, sliceLength_)], 0)
+    return nothing
+  end
+  return x
+end
\ No newline at end of file
diff --git a/ext/RegularizedLeastSquaresGPUArraysExt/ProxTV.jl b/ext/RegularizedLeastSquaresGPUArraysExt/ProxTV.jl
new file mode 100644
index 00000000..a09f7797
--- /dev/null
+++ b/ext/RegularizedLeastSquaresGPUArraysExt/ProxTV.jl
@@ -0,0 +1,15 @@
+function RegularizedLeastSquares.tv_restrictMagnitude!(x::vecT) where {T, vecT <: AbstractGPUVector{T}}
+  gpu_call(x) do ctx, x_
+    i = @linearidx(x_)
+    @inbounds x_[i] /= max(1, abs(x_[i]))
+    return nothing
+  end
+end
+
+function RegularizedLeastSquares.tv_linearcomb!(rs::vecT, t3, pq::vecT, t2, pqOld::vecT) where {T, vecT <: AbstractGPUVector{T}}
+  gpu_call(rs, t3, pq, t2, pqOld) do ctx, rs_, t3_, pq_, t2_, pqOld_
+    i = @linearidx(rs_)
+    @inbounds rs_[i] = t3_ * pq_[i] - t2_ * pqOld_[i]
+    return nothing
+  end
+end
\ No newline at end of file
diff --git a/ext/RegularizedLeastSquaresGPUArraysExt/RegularizedLeastSquaresGPUArraysExt.jl b/ext/RegularizedLeastSquaresGPUArraysExt/RegularizedLeastSquaresGPUArraysExt.jl
new file mode 100644
index 00000000..1109f789
--- /dev/null
+++ b/ext/RegularizedLeastSquaresGPUArraysExt/RegularizedLeastSquaresGPUArraysExt.jl
@@ -0,0 +1,10 @@
+module RegularizedLeastSquaresGPUArraysExt
+
+using RegularizedLeastSquares, RegularizedLeastSquares.LinearAlgebra, GPUArrays
+
+include("Utils.jl")
+include("ProxTV.jl")
+include("ProxL21.jl")
+include("Kaczmarz.jl")
+
+end
\ No newline at end of file
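All kernels in the extension follow the same pattern: `gpu_call` launches one thread per element and `@linearidx` yields the index that thread is responsible for. A minimal sketch of the idiom with a hypothetical soft-threshold kernel (not part of this PR):

```julia
using GPUArrays

# Hypothetical example of the gpu_call/@linearidx idiom used above.
function softthreshold!(x::AbstractGPUVector{T}, λ::T) where {T <: Real}
  gpu_call(x, λ) do ctx, x_, λ_
    i = @linearidx(x_)  # linear index of the element handled by this thread
    @inbounds x_[i] = sign(x_[i]) * max(abs(x_[i]) - λ_, 0)
    return nothing
  end
  return x
end
```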
+""" +function RegularizedLeastSquares.enfPos!(x::arrT) where {T<:Real, arrT <: AbstractGPUArray{T}} + #Return x as complex vector with negative parts projected onto 0 + gpu_call(x) do ctx, x_ + i = @linearidx(x_) + @inbounds (x_[i] < 0) && (x_[i] = zero(T)) + return nothing + end +end + +RegularizedLeastSquares.rownorm²(A::AbstractGPUMatrix,row::Int64) = sum(map(abs2, @view A[row, :])) +RegularizedLeastSquares.rownorm²(B::Transpose{T,S},row::Int64) where {T,S<:AbstractGPUArray} = sum(map(abs2, @view B.parent[:, row])) + + +RegularizedLeastSquares.dot_with_matrix_row(A::AbstractGPUMatrix{T}, x::AbstractGPUVector{T}, k::Int64) where {T} = reduce(+, x .* view(A, k, :)) +RegularizedLeastSquares.dot_with_matrix_row(B::Transpose{T,S}, x::AbstractGPUVector{T}, k::Int64) where {T,S<:AbstractGPUArray} = reduce(+, x .* view(B.parent, :, k)) \ No newline at end of file diff --git a/src/ADMM.jl b/src/ADMM.jl index b6d19379..48f5d355 100644 --- a/src/ADMM.jl +++ b/src/ADMM.jl @@ -1,13 +1,22 @@ export ADMM -mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDualSolver where {vecT <: AbstractVector{Union{rT, Complex{rT}}}, rvecT <: AbstractVector{rT}} - # operators and regularization +mutable struct ADMM{matT,opT,R,ropT,P,preconT} <: AbstractPrimalDualSolver A::matT reg::Vector{R} regTrafo::Vector{ropT} proj::Vector{P} - # fields and operators for x update AHA::opT + precon::preconT + normalizeReg::AbstractRegularizationNormalization + vary_ρ::Symbol + verbose::Bool + iterations::Int64 + iterationsCG::Int64 + state::AbstractSolverState{<:ADMM} +end + +mutable struct ADMMState{rT <: Real, rvecT <: AbstractVector{rT}, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{ADMM} + # fields and operators for x update β::vecT β_y::vecT # fields for primal & dual variables @@ -16,12 +25,10 @@ mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDu z::Vector{vecT} zᵒˡᵈ::Vector{vecT} u::Vector{vecT} - uᵒˡᵈ::Vector{vecT} - # other parameters - precon::preconT + uᵒˡᵈ::Vector{vecT} + # other paremters ρ::rvecT - iterations::Int64 - iterationsCG::Int64 + iteration::Int64 # state variables for CG cgStateVars::CGStateVariables # convergence parameters @@ -34,9 +41,6 @@ mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDu absTol::rT relTol::rT tolInner::rT - normalizeReg::AbstractRegularizationNormalization - vary_ρ::Symbol - verbose::Bool end """ @@ -75,7 +79,7 @@ function ADMM(A ; AHA = A'*A , precon = Identity() , reg = L1Regularization(zero(real(eltype(AHA)))) - , regTrafo = opEye(eltype(AHA), size(AHA,1)) + , regTrafo = opEye(eltype(AHA), size(AHA,1), S = LinearOperators.storage_type(AHA)) , normalizeReg::AbstractRegularizationNormalization = NoNormalization() , rho = 1e-1 , vary_rho::Symbol = :none @@ -131,7 +135,29 @@ function ADMM(A # normalization parameters reg = normalize(ADMM, normalizeReg, reg, A, nothing) - return ADMM(A, reg, regTrafo, proj, AHA, β, β_y, x, xᵒˡᵈ, z, zᵒˡᵈ, u, uᵒˡᵈ, precon, rho, iterations, iterationsCG, cgStateVars, rᵏ, sᵏ, ɛᵖʳⁱ, ɛᵈᵘᵃ, rT(0), Δ, rT(absTol), rT(relTol), rT(tolInner), normalizeReg, vary_rho, verbose) + state = ADMMState(β, β_y, x, xᵒˡᵈ, z, zᵒˡᵈ, u, uᵒˡᵈ, rho, 0, cgStateVars, rᵏ, sᵏ, ɛᵖʳⁱ, ɛᵈᵘᵃ, rT(0), Δ, rT(absTol), rT(relTol), rT(tolInner)) + + return ADMM(A, reg, regTrafo, proj, AHA, precon, normalizeReg, vary_rho, verbose, iterations, iterationsCG, state) +end + +function init!(solver::ADMM, state::ADMMState{rT, rvecT, vecT}, b::otherT; kwargs...) 
diff --git a/src/ADMM.jl b/src/ADMM.jl
index b6d19379..48f5d355 100644
--- a/src/ADMM.jl
+++ b/src/ADMM.jl
@@ -1,13 +1,22 @@
 export ADMM
 
-mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDualSolver where {vecT <: AbstractVector{Union{rT, Complex{rT}}}, rvecT <: AbstractVector{rT}}
-  # operators and regularization
+mutable struct ADMM{matT,opT,R,ropT,P,preconT} <: AbstractPrimalDualSolver
   A::matT
   reg::Vector{R}
   regTrafo::Vector{ropT}
   proj::Vector{P}
-  # fields and operators for x update
   AHA::opT
+  precon::preconT
+  normalizeReg::AbstractRegularizationNormalization
+  vary_ρ::Symbol
+  verbose::Bool
+  iterations::Int64
+  iterationsCG::Int64
+  state::AbstractSolverState{<:ADMM}
+end
+
+mutable struct ADMMState{rT <: Real, rvecT <: AbstractVector{rT}, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{ADMM}
+  # fields and operators for x update
   β::vecT
   β_y::vecT
   # fields for primal & dual variables
@@ -16,12 +25,10 @@ mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDu
   z::Vector{vecT}
   zᵒˡᵈ::Vector{vecT}
   u::Vector{vecT}
-  uᵒˡᵈ::Vector{vecT}
-  # other parameters
-  precon::preconT
+  uᵒˡᵈ::Vector{vecT}
+  # other parameters
   ρ::rvecT
-  iterations::Int64
-  iterationsCG::Int64
+  iteration::Int64
   # state variables for CG
   cgStateVars::CGStateVariables
   # convergence parameters
@@ -34,9 +41,6 @@ mutable struct ADMM{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDu
   absTol::rT
   relTol::rT
   tolInner::rT
-  normalizeReg::AbstractRegularizationNormalization
-  vary_ρ::Symbol
-  verbose::Bool
 end
 
 """
 function ADMM(A
   ; AHA = A'*A
   , precon = Identity()
   , reg = L1Regularization(zero(real(eltype(AHA))))
-  , regTrafo = opEye(eltype(AHA), size(AHA,1))
+  , regTrafo = opEye(eltype(AHA), size(AHA,1), S = LinearOperators.storage_type(AHA))
   , normalizeReg::AbstractRegularizationNormalization = NoNormalization()
   , rho = 1e-1
   , vary_rho::Symbol = :none
@@ -131,7 +135,29 @@ function ADMM(A
   # normalization parameters
   reg = normalize(ADMM, normalizeReg, reg, A, nothing)
 
-  return ADMM(A, reg, regTrafo, proj, AHA, β, β_y, x, xᵒˡᵈ, z, zᵒˡᵈ, u, uᵒˡᵈ, precon, rho, iterations, iterationsCG, cgStateVars, rᵏ, sᵏ, ɛᵖʳⁱ, ɛᵈᵘᵃ, rT(0), Δ, rT(absTol), rT(relTol), rT(tolInner), normalizeReg, vary_rho, verbose)
+  state = ADMMState(β, β_y, x, xᵒˡᵈ, z, zᵒˡᵈ, u, uᵒˡᵈ, rho, 0, cgStateVars, rᵏ, sᵏ, ɛᵖʳⁱ, ɛᵈᵘᵃ, rT(0), Δ, rT(absTol), rT(relTol), rT(tolInner))
+
+  return ADMM(A, reg, regTrafo, proj, AHA, precon, normalizeReg, vary_rho, verbose, iterations, iterationsCG, state)
+end
+
+function init!(solver::ADMM, state::ADMMState{rT, rvecT, vecT}, b::otherT; kwargs...) where {rT, rvecT, vecT, otherT}
+  x    = similar(b, size(state.x)...)
+  xᵒˡᵈ = similar(b, size(state.xᵒˡᵈ)...)
+  β    = similar(b, size(state.β)...)
+  β_y  = similar(b, size(state.β_y)...)
+
+  z    = [similar(b, size(state.z[i])...)    for i ∈ eachindex(solver.reg)]
+  zᵒˡᵈ = [similar(b, size(state.zᵒˡᵈ[i])...) for i ∈ eachindex(solver.reg)]
+  u    = [similar(b, size(state.u[i])...)    for i ∈ eachindex(solver.reg)]
+  uᵒˡᵈ = [similar(b, size(state.uᵒˡᵈ[i])...) for i ∈ eachindex(solver.reg)]
+
+  cgStateVars = CGStateVariables(zero(x), similar(x), similar(x))
+
+  state = ADMMState(β, β_y, x, xᵒˡᵈ, z, zᵒˡᵈ, u, uᵒˡᵈ, state.ρ, state.iteration, cgStateVars,
+    state.rᵏ, state.sᵏ, state.ɛᵖʳⁱ, state.ɛᵈᵘᵃ, state.σᵃᵇˢ, state.Δ, state.absTol, state.relTol, state.tolInner)
+
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
     init!(...)
 
 (re-) initializes the ADMM iterator
 """
-function init!(solver::ADMM, b; x0=0)
-  solver.x .= x0
+function init!(solver::ADMM, state::ADMMState{rT, rvecT, vecT}, b::vecT; x0 = 0) where {rT, rvecT, vecT}
+  state.x .= x0
 
   # right hand side for the x-update
   if solver.A === nothing
-    solver.β_y .= b
+    state.β_y .= b
   else
-    mul!(solver.β_y, adjoint(solver.A), b)
+    mul!(state.β_y, adjoint(solver.A), b)
   end
 
   # primal and dual variables
   for i ∈ eachindex(solver.reg)
-    solver.z[i] .= solver.regTrafo[i] * solver.x
-    solver.u[i] .= 0
+    state.z[i] .= solver.regTrafo[i] * state.x
+    state.u[i] .= 0
   end
 
   # convergence parameter
-  solver.rᵏ .= Inf
-  solver.sᵏ .= Inf
-  solver.ɛᵖʳⁱ .= 0
-  solver.ɛᵈᵘᵃ .= 0
-  solver.σᵃᵇˢ = sqrt(length(b)) * solver.absTol
-  solver.Δ .= Inf
-
+  state.rᵏ .= Inf
+  state.sᵏ .= Inf
+  state.ɛᵖʳⁱ .= 0
+  state.ɛᵈᵘᵃ .= 0
+  state.σᵃᵇˢ = sqrt(length(b)) * state.absTol
+  state.Δ .= Inf
+
+  state.iteration = 0
   # normalization of regularization parameters
   solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, b)
 end
 
-solverconvergence(solver::ADMM) = (; :primal => solver.rᵏ, :dual => solver.sᵏ)
+solverconvergence(state::ADMMState) = (; :primal => state.rᵏ, :dual => state.sᵏ)
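The two-method `init!` pattern above (mirrored in all other solvers in this PR) is what makes the solvers array-type generic: if `b`'s type differs from the stored state vectors, the state is rebuilt with `similar(b, ...)` so it inherits `b`'s storage (CPU `Vector`, `CuArray`, ...), and initialization is then retried on the type-matched method. A generic sketch of the dispatch idea, with hypothetical names:

```julia
# Hypothetical illustration of the dispatch pattern; not part of the PR.
demo_init!(x::vecT, b::vecT) where {vecT} = (x .= 0; x)     # types match: fill in place
demo_init!(x, b) = demo_init!(similar(b, size(x)...), b)    # mismatch: rebuild state, then retry

demo_init!(zeros(Float64, 4), zeros(Float32, 4))  # returns a freshly allocated Float32 vector
```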
 
 
 """
@@ -175,65 +202,65 @@
 
 performs one ADMM iteration.
 """
-function iterate(solver::ADMM, iteration=1)
-  done(solver, iteration) && return nothing
-  solver.verbose && println("Outer ADMM Iteration #$iteration")
+function iterate(solver::ADMM, state::S = solver.state) where S <: AbstractSolverState{<:ADMM}
+  done(solver, state) && return nothing
+  solver.verbose && println("Outer ADMM Iteration #$(state.iteration)")
 
   # 1. solve arg min_x 1/2|| Ax-b ||² + ρ/2 Σ_i||Φi*x+ui-zi||²
   # <=> (A'A+ρ Σ_i Φi'Φi)*x = A'b+ρΣ_i Φi'(zi-ui)
-  solver.β .= solver.β_y
+  state.β .= state.β_y
   AHA = solver.AHA
   for i ∈ eachindex(solver.reg)
-    mul!(solver.β, adjoint(solver.regTrafo[i]), solver.z[i],  solver.ρ[i], 1)
-    mul!(solver.β, adjoint(solver.regTrafo[i]), solver.u[i], -solver.ρ[i], 1)
-    AHA += solver.ρ[i] * adjoint(solver.regTrafo[i]) * solver.regTrafo[i]
+    mul!(state.β, adjoint(solver.regTrafo[i]), state.z[i],  state.ρ[i], 1)
+    mul!(state.β, adjoint(solver.regTrafo[i]), state.u[i], -state.ρ[i], 1)
+    AHA += state.ρ[i] * adjoint(solver.regTrafo[i]) * solver.regTrafo[i]
   end
   solver.verbose && println("conjugated gradients: ")
-  solver.xᵒˡᵈ .= solver.x
-  cg!(solver.x, AHA, solver.β, Pl=solver.precon, maxiter=solver.iterationsCG, reltol=solver.tolInner, statevars=solver.cgStateVars, verbose=solver.verbose)
+  state.xᵒˡᵈ .= state.x
+  cg!(state.x, AHA, state.β, Pl=solver.precon, maxiter=solver.iterationsCG, reltol=state.tolInner, statevars=state.cgStateVars, verbose=solver.verbose)
 
   for proj in solver.proj
-    prox!(proj, solver.x)
+    prox!(proj, state.x)
   end
 
   # proximal map for regularization terms
   for i ∈ eachindex(solver.reg)
     # swap z and zᵒˡᵈ w/o copying data
-    tmp = solver.zᵒˡᵈ[i]
-    solver.zᵒˡᵈ[i] = solver.z[i]
-    solver.z[i] = tmp
+    tmp = state.zᵒˡᵈ[i]
+    state.zᵒˡᵈ[i] = state.z[i]
+    state.z[i] = tmp
 
     # 2. update z using the proximal map of 1/ρ*g(x)
-    mul!(solver.z[i], solver.regTrafo[i], solver.x)
-    solver.z[i] .+= solver.u[i]
-    if solver.ρ[i] != 0
-      prox!(solver.reg[i], solver.z[i], λ(solver.reg[i])/2solver.ρ[i]) # λ is divided by 2 to match the ISTA-type algorithms
+    mul!(state.z[i], solver.regTrafo[i], state.x)
+    state.z[i] .+= state.u[i]
+    if state.ρ[i] != 0
+      prox!(solver.reg[i], state.z[i], λ(solver.reg[i])/2state.ρ[i]) # λ is divided by 2 to match the ISTA-type algorithms
     end
 
     # 3. update u
-    solver.uᵒˡᵈ[i] .= solver.u[i]
-    mul!(solver.u[i], solver.regTrafo[i], solver.x, 1, 1)
-    solver.u[i] .-= solver.z[i]
+    state.uᵒˡᵈ[i] .= state.u[i]
+    mul!(state.u[i], solver.regTrafo[i], state.x, 1, 1)
+    state.u[i] .-= state.z[i]
 
     # update convergence criteria (one for each constraint)
-    solver.rᵏ[i] = norm(solver.regTrafo[i] * solver.x - solver.z[i])  # primal residual (x-z)
-    solver.sᵏ[i] = norm(solver.ρ[i] * adjoint(solver.regTrafo[i]) * (solver.z[i] .- solver.zᵒˡᵈ[i])) # dual residual (concerning f(x))
-
-    solver.ɛᵖʳⁱ[i] = max(norm(solver.regTrafo[i] * solver.x), norm(solver.z[i]))
-    solver.ɛᵈᵘᵃ[i] = norm(solver.ρ[i] * adjoint(solver.regTrafo[i]) * solver.u[i])
-
-    Δᵒˡᵈ = solver.Δ[i]
-    solver.Δ[i] = norm(solver.x    .- solver.xᵒˡᵈ   ) +
-                  norm(solver.z[i] .- solver.zᵒˡᵈ[i]) +
-                  norm(solver.u[i] .- solver.uᵒˡᵈ[i])
-
-    if (solver.vary_ρ == :balance && solver.rᵏ[i]/solver.ɛᵖʳⁱ[i] > 10solver.sᵏ[i]/solver.ɛᵈᵘᵃ[i]) || # adapt ρ according to Boyd et al.
-       (solver.vary_ρ == :PnP     && solver.Δ[i]/Δᵒˡᵈ > 0.9)                                         # adapt ρ according to Chang et al.
-      solver.ρ[i] *= 2
-      solver.u[i] ./= 2
-    elseif solver.vary_ρ == :balance && solver.sᵏ[i]/solver.ɛᵈᵘᵃ[i] > 10solver.rᵏ[i]/solver.ɛᵖʳⁱ[i]
-      solver.ρ[i] /= 2
-      solver.u[i] .*= 2
+    state.rᵏ[i] = norm(solver.regTrafo[i] * state.x - state.z[i])  # primal residual (x-z)
+    state.sᵏ[i] = norm(state.ρ[i] * adjoint(solver.regTrafo[i]) * (state.z[i] .- state.zᵒˡᵈ[i])) # dual residual (concerning f(x))
+
+    state.ɛᵖʳⁱ[i] = max(norm(solver.regTrafo[i] * state.x), norm(state.z[i]))
+    state.ɛᵈᵘᵃ[i] = norm(state.ρ[i] * adjoint(solver.regTrafo[i]) * state.u[i])
+
+    Δᵒˡᵈ = state.Δ[i]
+    state.Δ[i] = norm(state.x    .- state.xᵒˡᵈ   ) +
+                 norm(state.z[i] .- state.zᵒˡᵈ[i]) +
+                 norm(state.u[i] .- state.uᵒˡᵈ[i])
+
+    if (solver.vary_ρ == :balance && state.rᵏ[i]/state.ɛᵖʳⁱ[i] > 10state.sᵏ[i]/state.ɛᵈᵘᵃ[i]) || # adapt ρ according to Boyd et al.
+       (solver.vary_ρ == :PnP     && state.Δ[i]/Δᵒˡᵈ > 0.9)                                      # adapt ρ according to Chang et al.
+      state.ρ[i] *= 2
+      state.u[i] ./= 2
+    elseif solver.vary_ρ == :balance && state.sᵏ[i]/state.ɛᵈᵘᵃ[i] > 10state.rᵏ[i]/state.ɛᵖʳⁱ[i]
+      state.ρ[i] /= 2
+      state.u[i] .*= 2
     end
 
     if solver.verbose
@@ -245,15 +272,16 @@
     end
   end
 
-  return solver.rᵏ, iteration+1
+  state.iteration += 1
+  return state.x, state
 end
 
-function converged(solver::ADMM)
+function converged(solver::ADMM, state::ADMMState)
   for i ∈ eachindex(solver.reg)
-    (solver.rᵏ[i] >= solver.σᵃᵇˢ + solver.relTol * solver.ɛᵖʳⁱ[i]) && return false
-    (solver.sᵏ[i] >= solver.σᵃᵇˢ + solver.relTol * solver.ɛᵈᵘᵃ[i]) && return false
+    (state.rᵏ[i] >= state.σᵃᵇˢ + state.relTol * state.ɛᵖʳⁱ[i]) && return false
+    (state.sᵏ[i] >= state.σᵃᵇˢ + state.relTol * state.ɛᵈᵘᵃ[i]) && return false
   end
   return true
 end
 
-@inline done(solver::ADMM,iteration::Int) = converged(solver) || iteration >= solver.iterations
+@inline done(solver::ADMM, state::ADMMState) = converged(solver, state) || state.iteration >= solver.iterations
\ No newline at end of file
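`iterate` now returns `(state.x, state)`, so every solver supports Julia's iteration protocol and intermediate iterates can be observed in a plain loop. A sketch with an illustrative problem:

```julia
using RegularizedLeastSquares, LinearAlgebra

A = randn(Float32, 32, 16)
b = randn(Float32, 32)
solver = createLinearSolver(ADMM, A; iterations = 5)
init!(solver, b)
for x in solver            # each step yields the current iterate
  println("‖x‖ = ", norm(x))
end
```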
diff --git a/src/CGNR.jl b/src/CGNR.jl
index d91753b2..762e8194 100644
--- a/src/CGNR.jl
+++ b/src/CGNR.jl
@@ -1,21 +1,26 @@
 export cgnr, CGNR
 
-mutable struct CGNR{matT,opT,vecT,T,R,PR} <: AbstractKrylovSolver
+mutable struct CGNR{matT,opT, R,PR} <: AbstractKrylovSolver
   A::matT
   AHA::opT
   L2::R
   constr::PR
-  x::vecT
-  x₀::vecT
-  pl::vecT
-  vl::vecT
-  αl::T
-  βl::T
-  ζl::T
-  iterations::Int64
-  relTol::Float64
-  z0::Float64
   normalizeReg::AbstractRegularizationNormalization
+  iterations::Int64
+  state::AbstractSolverState{<:CGNR}
+end
+
+mutable struct CGNRState{T, Tc, vecTc} <: AbstractSolverState{CGNR} where {T, Tc <: Union{T, Complex{T}}, vecTc<:AbstractArray{Tc}}
+  x::vecTc
+  x₀::vecTc
+  pl::vecTc
+  vl::vecTc
+  αl::Tc
+  βl::Tc
+  ζl::Tc
+  iteration::Int64
+  relTol::T
+  z0::T
 end
 
 """
@@ -78,9 +83,20 @@ function CGNR(A
   end
   other = identity.(other)
 
+  state = CGNRState(x, x₀, pl, vl, αl, βl, ζl, 0, real(T)(relTol), zero(real(T)))
 
-  return CGNR(A, AHA,
-    L2, other, x, x₀, pl, vl, αl, βl, ζl, iterations, Float64(relTol), 0.0, normalizeReg)
+  return CGNR(A, AHA, L2, other, normalizeReg, iterations, state)
+end
+
+function init!(solver::CGNR, state::CGNRState{T, Tc, vecTc}, b::otherTc; kwargs...) where {T, Tc, vecTc, otherTc}
+  x  = similar(b, size(state.x)...)
+  x₀ = similar(b, size(state.x₀)...)
+  pl = similar(b, size(state.pl)...)
+  vl = similar(b, size(state.vl)...)
+
+  state = CGNRState(x, x₀, pl, vl, state.αl, state.βl, state.ζl, state.iteration, state.relTol, state.z0)
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
     init!(...)
 
 (re-) initializes the CGNR iterator
 """
-function init!(solver::CGNR, b; x0 = 0)
-  solver.pl .= 0     #temporary vector
-  solver.vl .= 0     #temporary vector
-  solver.αl = 0      #temporary scalar
-  solver.βl = 0      #temporary scalar
-  solver.ζl = 0      #temporary scalar
+function init!(solver::CGNR, state::CGNRState{T, Tc, vecTc}, b::vecTc; x0 = 0) where {T, Tc <: Union{T, Complex{T}}, vecTc<:AbstractArray{Tc}}
+  state.pl .= 0     #temporary vector
+  state.vl .= 0     #temporary vector
+  state.αl = 0      #temporary scalar
+  state.βl = 0      #temporary scalar
+  state.ζl = 0      #temporary scalar
+  state.iteration = 0
 
   if all(x0 .== 0)
-    solver.x .= 0
+    state.x .= 0
   else
     solver.A === nothing && error("providing x0 requires solver.A to be defined")
-    solver.x .= x0
-    mul!(b, solver.A, solver.x, -1, 1)
+    state.x .= x0
+    mul!(b, solver.A, state.x, -1, 1)
   end
 
   #x₀ = Aᶜ*rl, where ᶜ denotes complex conjugation
-  initCGNR(solver.x₀, solver.A, b)
+  initCGNR(state.x₀, solver.A, b)
 
-  solver.z0 = norm(solver.x₀)
-  copyto!(solver.pl, solver.x₀)
+  state.z0 = norm(state.x₀)
+  copyto!(state.pl, state.x₀)
 
   # normalization of regularization parameters
   solver.L2 = normalize(solver, solver.normalizeReg, solver.L2, solver.A, b)
@@ -116,51 +133,53 @@ initCGNR(x₀, A, b) = mul!(x₀, adjoint(A), b)
 initCGNR(x₀, prod::ProdOp{T, <:WeightingOp, matT}, b) where {T, matT} = mul!(x₀, adjoint(prod.B), b .* prod.A.weights)
 initCGNR(x₀, ::Nothing, b) = x₀ .= b
 
-solverconvergence(solver::CGNR) = (; :residual => norm(solver.x₀))
+solverconvergence(state::CGNRState) = (; :residual => norm(state.x₀))
 
 """
   iterate(solver::CGNR{vecT,T,Tsparse}, iteration::Int=0) where {vecT,T,Tsparse}
 
 performs one CGNR iteration.
 """
-function iterate(solver::CGNR, iteration::Int=0)
-  if done(solver, iteration)
+function iterate(solver::CGNR, state=solver.state)
+  if done(solver, state)
     for r in solver.constr
-      prox!(r, solver.x)
+      prox!(r, state.x)
     end
     return nothing
  end
 
-  mul!(solver.vl, solver.AHA, solver.pl)
+  mul!(state.vl, solver.AHA, state.pl)
 
-  solver.ζl = norm(solver.x₀)^2
-  normvl = dot(solver.pl, solver.vl)
+  state.ζl = norm(state.x₀)^2
+  normvl = dot(state.pl, state.vl)
 
   λ_ = λ(solver.L2)
   if λ_ > 0
-    solver.αl = solver.ζl / (normvl + λ_ * norm(solver.pl)^2)
+    state.αl = state.ζl / (normvl + λ_ * norm(state.pl)^2)
   else
-    solver.αl = solver.ζl / normvl
+    state.αl = state.ζl / normvl
  end
 
-  BLAS.axpy!(solver.αl, solver.pl, solver.x)
+  state.x .+= state.pl .* state.αl
 
-  BLAS.axpy!(-solver.αl, solver.vl, solver.x₀)
+  state.x₀ .+= state.vl .* -state.αl
 
  if λ_ > 0
-    BLAS.axpy!(-λ_ * solver.αl, solver.pl, solver.x₀)
+    state.x₀ .+= state.pl .* -λ_ * state.αl
  end
 
-  solver.βl = dot(solver.x₀, solver.x₀) / solver.ζl
+  state.βl = dot(state.x₀, state.x₀) / state.ζl
+
+  rmul!(state.pl, state.βl)
+  state.pl .+= state.x₀
 
-  rmul!(solver.pl, solver.βl)
-  BLAS.axpy!(one(eltype(solver.AHA)), solver.x₀, solver.pl)
-  return solver.x₀, iteration + 1
+  state.iteration += 1
+  return state.x, state
 end
 
-function converged(solver::CGNR)
-  return norm(solver.x₀) / solver.z0 <= solver.relTol
+function converged(::CGNR, state::CGNRState)
+  return norm(state.x₀) / state.z0 <= state.relTol
 end
 
-@inline done(solver::CGNR, iteration::Int) = converged(solver) || iteration >= min(solver.iterations, size(solver.AHA, 2))
+@inline done(solver::CGNR, state::CGNRState) = converged(solver, state) || state.iteration >= min(solver.iterations, size(solver.AHA, 2))
\ No newline at end of file
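The `BLAS.axpy!` calls were replaced by broadcasts: both update `y .+= α .* x` in place, but the broadcast works for any `AbstractArray` (and fuses into a single GPU kernel) instead of requiring a strided BLAS-compatible array. A quick equivalence check:

```julia
using LinearAlgebra

x, y = rand(4), rand(4)
y2 = copy(y)
BLAS.axpy!(0.5, x, y)  # BLAS path used by the old code
y2 .+= x .* 0.5        # broadcast path used by the new code
@assert y ≈ y2
```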
diff --git a/src/Callbacks.jl b/src/Callbacks.jl
index 7bd2eb4f..32dce909 100644
--- a/src/Callbacks.jl
+++ b/src/Callbacks.jl
@@ -41,7 +41,7 @@ end
 Callback that accumulates the solver's convergence metrics per iteration. Results are stored in the `convMeas` field.
 """
-StoreConvergenceCallback() = new(Dict{Symbol, Any}())
+StoreConvergenceCallback() = StoreConvergenceCallback(Dict{Symbol, Any}())
 function (cb::StoreConvergenceCallback)(solver::AbstractLinearSolver, _)
   meas = solverconvergence(solver)
   for key in keys(meas)
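With the constructor repaired (the old `new(...)` call is only valid inside a struct definition), the callback can actually be instantiated. A usage sketch, assuming `StoreConvergenceCallback` is exported (problem values illustrative):

```julia
using RegularizedLeastSquares

A = randn(Float32, 32, 16)
cb = StoreConvergenceCallback()
solver = createLinearSolver(CGNR, A; iterations = 10)
solve!(solver, randn(Float32, 32); callbacks = cb)
cb.convMeas[:residual]  # per-iteration residual norms
```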
diff --git a/src/Direct.jl b/src/Direct.jl
index 117dd6d5..e420a3ec 100644
--- a/src/Direct.jl
+++ b/src/Direct.jl
@@ -1,15 +1,17 @@
 export PseudoInverse, DirectSolver
 
-
 ### Direct Solver ###
 
-mutable struct DirectSolver{matT,vecT, R, PR} <: AbstractDirectSolver
+mutable struct DirectSolver{matT, R, PR} <: AbstractDirectSolver
   A::matT
-  x::vecT
-  b::vecT
   l2::R
   normalizeReg::AbstractRegularizationNormalization
   proj::Vector{PR}
+  state::AbstractSolverState{<:AbstractDirectSolver}
+end
+
+mutable struct DirectSolverState{vecT} <: AbstractSolverState{DirectSolver}
+  x::vecT
+  b::vecT
 end
 
 function DirectSolver(A; reg::Vector{<:AbstractRegularization} = [L2Regularization(zero(real(eltype(A))))], normalizeReg::AbstractRegularizationNormalization = NoNormalization())
@@ -36,24 +38,31 @@ function DirectSolver(A; reg::Vector{<:AbstractRegularization} = [L2Regularizati
   x = Vector{T}(undef,size(A, 2))
   b = zeros(T, size(A,1))
-  return DirectSolver(A, x, b, L2, normalizeReg, other)
+  return DirectSolver(A, L2, normalizeReg, other, DirectSolverState(x, b))
 end
 
-function init!(solver::DirectSolver, b; x0=0)
+function init!(solver::DirectSolver, state::DirectSolverState{vecT}, b::otherT; kwargs...) where {vecT, otherT}
+  x = similar(b, size(state.x)...)
+  bvecT = similar(b, size(state.b)...)
+  solver.state = DirectSolverState(x, bvecT)
+  init!(solver, solver.state, b; kwargs...)
+end
+
+function init!(solver::DirectSolver, state::DirectSolverState{vecT}, b::vecT; x0=0) where vecT
   solver.l2 = normalize(solver, solver.normalizeReg, solver.l2, solver.A, b)
-  solver.b .= b
+  state.b .= b
+  state.x .= x0
 end
 
-function iterate(solver::DirectSolver, iteration=0)
+function iterate(solver::DirectSolver, state = solver.state)
   A = solver.A
   λ_ = λ(solver.l2)
-  lufact = lu(Matrix(A'*A + λ_*opEye(size(A,2),size(A,2))))
-  x = \(lufact,A' * solver.b)
+  lufact = lu(A'*A + λ_ * I)
+  x = \(lufact,A' * state.b)
 
   for p in solver.proj
     prox!(p, x)
   end
-  solver.x .= x
+  state.x .= x
   return nothing
 end
@@ -89,13 +98,12 @@ end
 
 ### Pseudoinverse ###
 
-mutable struct PseudoInverse{R, vecT, PR} <: AbstractDirectSolver
+mutable struct PseudoInverse{R, PR} <: AbstractDirectSolver
   svd::SVD
-  x::vecT
-  b::vecT
   l2::R
   normalizeReg::AbstractRegularizationNormalization
   proj::Vector{PR}
+  state::AbstractSolverState{<:AbstractDirectSolver}
 end
 
 function PseudoInverse(A; reg::Vector{<:AbstractRegularization} = [L2Regularization(zero(real(eltype(A))))], normalizeReg::AbstractRegularizationNormalization = NoNormalization())
@@ -127,33 +135,35 @@ end
 function PseudoInverse(A::AbstractMatrix, x, b, l2, norm, proj)
   u, s, v = svd(A)
   temp = SVD(u, s, v)
-  return PseudoInverse(temp, x, b, l2, norm, proj)
+  return PseudoInverse(temp, l2, norm, proj, DirectSolverState(x, b))
 end
 
-function init!(solver::PseudoInverse, b; x0=0)
+function init!(solver::PseudoInverse, state::DirectSolverState{vecT}, b::otherT; kwargs...) where {vecT, otherT}
+  x = similar(b, size(state.x)...)
+  bvecT = similar(b, size(state.b)...)
+  solver.state = DirectSolverState(x, bvecT)
+  init!(solver, solver.state, b; kwargs...)
+end
+
+function init!(solver::PseudoInverse, state::DirectSolverState{vecT}, b::vecT; x0=0) where vecT
   solver.l2 = normalize(solver, solver.normalizeReg, solver.l2, solver.svd, b)
-  solver.b .= b
+  state.b .= b
 end
 
-function iterate(solver::PseudoInverse, iteration=0)
+function iterate(solver::PseudoInverse, state = solver.state)
   # Inversion by using the pseudoinverse of the SVD
   svd = solver.svd
 
   # Calculate singular values used for tikhonov regularization
-  D = [1/s for s in svd.S]
   λ_ = λ(solver.l2)
-  for i=1:length(D)
-    σi = svd.S[i]
-    D[i] = σi/(σi*σi+λ_*λ_)
-  end
+  D = svd.S ./ (svd.S.*svd.S .+ λ_ )
 
-  tmp = adjoint(svd.U)*solver.b
+  tmp = adjoint(svd.U)*state.b
   tmp .*= D
   x = svd.Vt * tmp
 
   for p in solver.proj
     prox!(p, x)
   end
-  solver.x = x
+  state.x = x
   return nothing
 end
\ No newline at end of file
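For reference, the rewritten `PseudoInverse` iterate applies the standard Tikhonov filter factors of the SVD in a single broadcast (with λ the L2 regularization parameter):

```latex
x = V \,\operatorname{diag}(d_1,\dots,d_n)\, U^{H} b,
\qquad
d_i = \frac{\sigma_i}{\sigma_i^{2} + \lambda}
```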
diff --git a/src/FISTA.jl b/src/FISTA.jl
index ce14fff1..c0835b19 100644
--- a/src/FISTA.jl
+++ b/src/FISTA.jl
@@ -1,10 +1,18 @@
 export FISTA
 
-mutable struct FISTA{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}, matA, matAHA, R, RN} <: AbstractProximalGradientSolver
+mutable struct FISTA{matA, matAHA, R, RN} <: AbstractProximalGradientSolver
   A::matA
   AHA::matAHA
   reg::R
   proj::Vector{RN}
+  normalizeReg::AbstractRegularizationNormalization
+  verbose::Bool
+  restart::Symbol
+  iterations::Int64
+  state::AbstractSolverState{<:FISTA}
+end
+
+mutable struct FISTAState{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{FISTA}
   x::vecT
   x₀::vecT
   xᵒˡᵈ::vecT
@@ -12,15 +20,13 @@ mutable struct FISTA{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVecto
   ρ::rT
   theta::rT
   thetaᵒˡᵈ::rT
-  iterations::Int64
+  iteration::Int64
   relTol::rT
-  normalizeReg::AbstractRegularizationNormalization
   norm_x₀::rT
   rel_res_norm::rT
-  verbose::Bool
-  restart::Symbol
 end
 
+
 """
     FISTA(A; AHA=A'*A, reg=L1Regularization(zero(real(eltype(AHA)))), normalizeReg=NoNormalization(), iterations=50, verbose = false, rho = 0.95 / power_iterations(AHA), theta=1, relTol=eps(real(eltype(AHA))), restart = :none)
     FISTA( ; AHA=,     reg=L1Regularization(zero(real(eltype(AHA)))), normalizeReg=NoNormalization(), iterations=50, verbose = false, rho = 0.95 / power_iterations(AHA), theta=1, relTol=eps(real(eltype(AHA))), restart = :none)
@@ -80,8 +86,20 @@ function FISTA(A
   other = identity.(other)
   reg = normalize(FISTA, normalizeReg, reg, A, nothing)
 
+  state = FISTAState(x, x₀, xᵒˡᵈ, res, rT(rho), rT(theta), rT(theta), 0, rT(relTol), one(rT), rT(Inf))
+
+  return FISTA(A, AHA, reg[1], other, normalizeReg, verbose, restart, iterations, state)
+end
+
+function init!(solver::FISTA, state::FISTAState{rT, vecT}, b::otherT; kwargs...) where {rT, vecT, otherT}
+  x    = similar(b, size(state.x)...)
+  x₀   = similar(b, size(state.x₀)...)
+  xᵒˡᵈ = similar(b, size(state.xᵒˡᵈ)...)
+  res  = similar(b, size(state.res)...)
 
-  return FISTA(A, AHA, reg[1], other, x, x₀, xᵒˡᵈ, res, rT(rho),rT(theta),rT(theta),iterations,rT(relTol),normalizeReg,one(rT),rT(Inf),verbose,restart)
+  state = FISTAState(x, x₀, xᵒˡᵈ, res, state.ρ, state.theta, state.theta, state.iteration, state.relTol, state.norm_x₀, state.rel_res_norm)
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
    init!(...)
 
 (re-) initializes the FISTA iterator
 """
-function init!(solver::FISTA, b; x0 = 0, theta=1)
+function init!(solver::FISTA, state::FISTAState{rT, vecT}, b::vecT; x0 = 0, theta=1) where {rT, vecT}
   if solver.A === nothing
-    solver.x₀ .= b
+    state.x₀ .= b
   else
-    mul!(solver.x₀, adjoint(solver.A), b)
+    mul!(state.x₀, adjoint(solver.A), b)
   end
+  state.iteration = 0
 
-  solver.norm_x₀ = norm(solver.x₀)
+  state.norm_x₀ = norm(state.x₀)
 
-  solver.x .= x0
-  solver.xᵒˡᵈ .= 0 # makes no difference in 1st iteration what this is set to
+  state.x .= x0
+  state.xᵒˡᵈ .= 0 # makes no difference in 1st iteration what this is set to
 
-  solver.theta = theta
-  solver.thetaᵒˡᵈ = theta
+  state.res[:] .= rT(Inf)
+  state.theta = theta
+  state.thetaᵒˡᵈ = theta
+  state.rel_res_norm = rT(Inf)
 
   # normalization of regularization parameters
-  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, solver.x₀)
+  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, state.x₀)
 end
 
-solverconvergence(solver::FISTA) = (; :residual => norm(solver.res))
+solverconvergence(state::FISTAState) = (; :residual => norm(state.res))
 
 
 """
   iterate(it::FISTA, iteration::Int=0)
 
 performs one fista iteration.
 """
-function iterate(solver::FISTA, iteration::Int=0)
-  if done(solver, iteration) return nothing end
+function iterate(solver::FISTA, state = solver.state)
+  if done(solver, state) return nothing end
 
   # momentum / Nesterov step
   # this implementation mimics BART, saving memory by first swapping x and xᵒˡᵈ before calculating x + α * (x - xᵒˡᵈ)
-  tmp = solver.xᵒˡᵈ
-  solver.xᵒˡᵈ = solver.x
-  solver.x = tmp # swap x and xᵒˡᵈ
-  solver.x .*= ((1 - solver.thetaᵒˡᵈ)/solver.theta) # here we calculate -α * xᵒˡᵈ, where xᵒˡᵈ is now stored in x
-  solver.x .+= ((solver.thetaᵒˡᵈ-1)/solver.theta + 1) .* (solver.xᵒˡᵈ) # add (α+1)*x, where x is now stored in xᵒˡᵈ
+  tmp = state.xᵒˡᵈ
+  state.xᵒˡᵈ = state.x
+  state.x = tmp # swap x and xᵒˡᵈ
+  state.x .*= ((1 - state.thetaᵒˡᵈ)/state.theta) # here we calculate -α * xᵒˡᵈ, where xᵒˡᵈ is now stored in x
+  state.x .+= ((state.thetaᵒˡᵈ-1)/state.theta + 1) .* (state.xᵒˡᵈ) # add (α+1)*x, where x is now stored in xᵒˡᵈ
 
   # calculate residuum and do gradient step
   # solver.x .-= solver.ρ .* (solver.AHA * solver.x .- solver.x₀)
-  mul!(solver.res, solver.AHA, solver.x)
-  solver.res .-= solver.x₀
-  solver.x .-= solver.ρ .* solver.res
+  mul!(state.res, solver.AHA, state.x)
+  state.res .-= state.x₀
+  state.x .-= state.ρ .* state.res
 
-  solver.rel_res_norm = norm(solver.res) / solver.norm_x₀
-  solver.verbose && println("Iteration $iteration; rel. residual = $(solver.rel_res_norm)")
+  state.rel_res_norm = norm(state.res) / state.norm_x₀
+  solver.verbose && println("Iteration $(state.iteration); rel. residual = $(state.rel_res_norm)")
 
   # the two lines below are equivalent to the ones above and non-allocating, but require the 5-argument mul! function to be implemented for AHA, i.e. if AHA is a LinearOperator, it requires LinearOperators.jl v2
   # mul!(solver.x, solver.AHA, solver.xᵒˡᵈ, -solver.ρ, 1)
   # solver.x .+= solver.ρ .* solver.x₀
 
   # proximal map
-  prox!(solver.reg, solver.x, solver.ρ * λ(solver.reg))
+  prox!(solver.reg, state.x, state.ρ * λ(solver.reg))
 
   for proj in solver.proj
-    prox!(proj, solver.x)
+    prox!(proj, state.x)
   end
 
   # gradient restart conditions
   if solver.restart == :gradient
-    if real(solver.res ⋅ (solver.x .- solver.xᵒˡᵈ) ) > 0 #if momentum is at an obtuse angle to the negative gradient
-      solver.verbose && println("Gradient restart at iter $iteration")
-      solver.theta = 1
+    if real(state.res ⋅ (state.x .- state.xᵒˡᵈ) ) > 0 #if momentum is at an obtuse angle to the negative gradient
+      solver.verbose && println("Gradient restart at iter $(state.iteration)")
+      state.theta = 1
     end
   end
 
   # predictor-corrector update
-  solver.thetaᵒˡᵈ = solver.theta
-  solver.theta = (1 + sqrt(1 + 4 * solver.thetaᵒˡᵈ^2)) / 2
+  state.thetaᵒˡᵈ = state.theta
+  state.theta = (1 + sqrt(1 + 4 * state.thetaᵒˡᵈ^2)) / 2
 
+  state.iteration += 1
-  # return the residual-norm as item and iteration number as state
-  return solver, iteration+1
+  # return the current iterate as item and the state as iteration state
+  return state.x, state
 end
 
-@inline converged(solver::FISTA) = (solver.rel_res_norm < solver.relTol)
+@inline converged(::FISTA, state::FISTAState) = (state.rel_res_norm < state.relTol)
 
-@inline done(solver::FISTA,iteration) = converged(solver) || iteration>=solver.iterations
+@inline done(solver::FISTA, state::FISTAState) = converged(solver, state) || state.iteration>=solver.iterations
\ No newline at end of file
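The swap-based momentum step at the top of `iterate` computes the usual Nesterov extrapolation without allocating; written out (with y_k the iterate after the k-th proximal-gradient step):

```latex
x_k = y_k + \frac{\theta_{k-1} - 1}{\theta_k}\,\bigl(y_k - y_{k-1}\bigr),
\qquad
\theta_{k+1} = \frac{1 + \sqrt{1 + 4\theta_k^{2}}}{2}
```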
diff --git a/src/Kaczmarz.jl b/src/Kaczmarz.jl
index 842d1674..614508c9 100644
--- a/src/Kaczmarz.jl
+++ b/src/Kaczmarz.jl
@@ -1,26 +1,31 @@
 export kaczmarz
 export Kaczmarz
 
-mutable struct Kaczmarz{matT,R,T,U,RN} <: AbstractRowActionSolver
+mutable struct Kaczmarz{matT,R,U,RN} <: AbstractRowActionSolver
   A::matT
-  u::Vector{T}
   L2::R
   reg::Vector{RN}
   denom::Vector{U}
   rowindex::Vector{Int64}
   rowIndexCycle::Vector{Int64}
-  x::Vector{T}
-  vl::Vector{T}
-  εw::T
-  τl::T
-  αl::T
   randomized::Bool
   subMatrixSize::Int64
   probabilities::Vector{U}
   shuffleRows::Bool
   seed::Int64
-  iterations::Int64
   normalizeReg::AbstractRegularizationNormalization
+  iterations::Int64
+  state::AbstractSolverState{<:Kaczmarz}
+end
+
+mutable struct KaczmarzState{T, vecT <: AbstractArray{T}} <: AbstractSolverState{Kaczmarz}
+  u::vecT
+  x::vecT
+  vl::vecT
+  εw::T
+  τl::T
+  αl::T
+  iteration::Int64
 end
 
 """
@@ -66,7 +71,7 @@ function Kaczmarz(A
   end
 
   # Tikhonov matrix is only valid with NoNormalization or SystemMatrixBasedNormalization
-  if λ(L2) isa Vector && !(normalizeReg isa NoNormalization || normalizeReg isa SystemMatrixBasedNormalization)
+  if λ(L2) isa AbstractVector && !(normalizeReg isa NoNormalization || normalizeReg isa SystemMatrixBasedNormalization)
     error("Tikhonov matrix for Kaczmarz is only valid with no or system matrix based normalization")
   end
 
@@ -98,10 +103,21 @@ function Kaczmarz(A
   τl = zero(eltype(A))
   αl = zero(eltype(A))
 
-  return Kaczmarz(A, u, L2, other, denom, rowindex, rowIndexCycle, x, vl, εw, τl, αl,
+  state = KaczmarzState(u, x, vl, εw, τl, αl, 0)
+
+  return Kaczmarz(A, L2, other, denom, rowindex, rowIndexCycle,
     randomized, subMatrixSize, probabilities, shuffleRows,
-    Int64(seed), iterations,
-    normalizeReg)
+    Int64(seed), normalizeReg, iterations, state)
+end
+
+function init!(solver::Kaczmarz, state::KaczmarzState{T, vecT}, b::otherT; kwargs...) where {T, vecT, otherT}
+  u  = similar(b, size(state.u)...)
+  x  = similar(b, size(state.x)...)
+  vl = similar(b, size(state.vl)...)
+
+  state = KaczmarzState(u, x, vl, state.εw, state.τl, state.αl, state.iteration)
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
    init!(...)
 
 (re-) initializes the Kaczmarz iterator
 """
@@ -109,7 +125,7 @@
-function init!(solver::Kaczmarz, b; x0 = 0)
+function init!(solver::Kaczmarz, state::KaczmarzState{T, vecT}, b::vecT; x0 = 0) where {T, vecT}
   λ_prev = λ(solver.L2)
   solver.L2  = normalize(solver, solver.normalizeReg, solver.L2,  solver.A, b)
   solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, b)
@@ -134,26 +150,27 @@ function init!(solver::Kaczmarz, b; x0 = 0)
   end
 
   # start vector
-  solver.x .= x0
-  solver.vl .= 0
+  state.x .= x0
+  state.vl .= 0
 
-  solver.u .= b
-  if λ_ isa Vector
-    solver.ɛw = 0
+  state.u .= b
+  if λ_ isa AbstractVector
+    state.ɛw = 0
   else
-    solver.ɛw = sqrt(λ_)
+    state.ɛw = sqrt(λ_)
   end
+  state.iteration = 0
 end
 
-function solversolution(solver::Kaczmarz{matT, RN}) where {matT, R<:L2Regularization{<:Vector}, RN <: Union{R, AbstractNestedRegularization{<:R}}}
-  return solver.x .* (1 ./ sqrt.(λ(solver.L2)))
+function solversolution(solver::Kaczmarz{matT, RN}) where {matT, R<:L2Regularization{<:AbstractVector}, RN <: Union{R, AbstractNestedRegularization{<:R}}}
+  return solver.state.x .* (1 ./ sqrt.(λ(solver.L2)))
 end
-solversolution(solver::Kaczmarz) = solver.x
-solverconvergence(solver::Kaczmarz) = (; :residual => norm(solver.vl))
+solversolution(solver::Kaczmarz) = solver.state.x
+solverconvergence(state::KaczmarzState) = (; :residual => norm(state.vl))
 
-function iterate(solver::Kaczmarz, iteration::Int=0)
-  if done(solver,iteration) return nothing end
+function iterate(solver::Kaczmarz, state = solver.state)
+  if done(solver,state) return nothing end
 
   if solver.randomized
     usedIndices = Int.(StatsBase.sample!(Random.GLOBAL_RNG, solver.rowIndexCycle, weights(solver.probabilities), zeros(solver.subMatrixSize), replace=false))
  else
    usedIndices = solver.rowIndexCycle
  end
 
  for i in usedIndices
    row = solver.rowindex[i]
-    iterate_row_index(solver, solver.A, row, i)
+    iterate_row_index(solver, state, solver.A, row, i)
  end
 
  for r in solver.reg
-    prox!(r, solver.x)
+    prox!(r, state.x)
  end
 
-  return solver.vl, iteration+1
+  state.iteration += 1
+  return state.x, state
 end
 
-iterate_row_index(solver::Kaczmarz, A::AbstractLinearSolver, row, index) = iterate_row_index(solver, Matrix(A[row, :]), row, index)
-function iterate_row_index(solver::Kaczmarz, A, row, index)
-  solver.τl = dot_with_matrix_row(A,solver.x,row)
-  solver.αl = solver.denom[index]*(solver.u[row]-solver.τl-solver.ɛw*solver.vl[row])
-  kaczmarz_update!(A,solver.x,row,solver.αl)
-  solver.vl[row] += solver.αl*solver.ɛw
+iterate_row_index(solver::Kaczmarz, state::KaczmarzState, A::AbstractLinearSolver, row, index) = iterate_row_index(solver, state, Matrix(A[row, :]), row, index)
+function iterate_row_index(solver::Kaczmarz, state::KaczmarzState, A, row, index)
+  state.τl = dot_with_matrix_row(A,state.x,row)
+  state.αl = solver.denom[index]*(state.u[row]-state.τl-state.ɛw*state.vl[row])
+  kaczmarz_update!(A,state.x,row,state.αl)
+  state.vl[row] += state.αl*state.ɛw
 end
 
-@inline done(solver::Kaczmarz,iteration::Int) = iteration>=solver.iterations
+@inline done(solver::Kaczmarz,state::KaczmarzState) = state.iteration>=solver.iterations
 
 
 """
@@ -221,14 +239,14 @@ function initkaczmarz(A,λ)
  end
  return A, denom, rowindex
end
-function initkaczmarz(A, λ::Vector)
+function initkaczmarz(A, λ::AbstractVector)
  λ = real(eltype(A)).(λ)
  A = initikhonov(A, λ)
  return initkaczmarz(A, 0)
end
 initikhonov(A, λ) = transpose((1 ./ sqrt.(λ)) .* transpose(A)) # optimize structure for row access
-initikhonov(prod::ProdOp{Tc, WeightingOp{T}, matT}, λ) where {T, Tc<:Union{T, Complex{T}}, matT} = ProdOp(prod.A, initikhonov(prod.B, λ))
+initikhonov(prod::ProdOp{Tc, <:WeightingOp, matT}, λ) where {T, Tc<:Union{T, Complex{T}}, matT} = ProdOp(prod.A, initikhonov(prod.B, λ))
 ### kaczmarz_update! ###
 
 """
@@ -256,7 +274,7 @@ function kaczmarz_update!(B::Transpose{T,S}, x::Vector,
   end
 end
 
-function kaczmarz_update!(prod::ProdOp{Tc, WeightingOp{T}, matT}, x::Vector, k, beta) where {T, Tc<:Union{T, Complex{T}}, matT}
+function kaczmarz_update!(prod::ProdOp{Tc, WeightingOp{T, vecT}}, x, k, beta) where {T, Tc<:Union{T, Complex{T}}, vecT}
   weight = prod.A.weights[k]
   kaczmarz_update!(prod.B, x, k, weight*beta) # only for real weights
 end
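For reference, one sweep of `iterate_row_index` performs the regularized Kaczmarz update per selected row r, with d_r = `solver.denom[index]` the precomputed row normalization and ε_w = `state.ɛw`:

```latex
\tau = \langle a_r, x\rangle,\qquad
\alpha = d_r\,\bigl(u_r - \tau - \varepsilon_w v_r\bigr),\qquad
x \leftarrow x + \alpha\,\overline{a_r},\qquad
v_r \leftarrow v_r + \alpha\,\varepsilon_w
```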
diff --git a/src/OptISTA.jl b/src/OptISTA.jl
index eaf41e7c..509fde2e 100644
--- a/src/OptISTA.jl
+++ b/src/OptISTA.jl
@@ -1,10 +1,17 @@
 export optista, OptISTA
 
-mutable struct OptISTA{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}, matA, matAHA, R, RN} <: AbstractProximalGradientSolver
+mutable struct OptISTA{matA, matAHA, R, RN} <: AbstractProximalGradientSolver
   A::matA
   AHA::matAHA
   reg::R
   proj::Vector{RN}
+  normalizeReg::AbstractRegularizationNormalization
+  verbose::Bool
+  iterations::Int64
+  state::AbstractSolverState{<:OptISTA}
+end
+
+mutable struct OptISTAState{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{OptISTA}
   x::vecT
   x₀::vecT
   y::vecT
@@ -18,12 +25,10 @@ mutable struct OptISTA{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVec
   α::rT
   β::rT
   γ::rT
-  iterations::Int64
+  iteration::Int64
   relTol::rT
-  normalizeReg::AbstractRegularizationNormalization
   norm_x₀::rT
   rel_res_norm::rT
-  verbose::Bool
 end
 
 """
@@ -93,8 +98,23 @@ function OptISTA(A
   other = identity.(other)
   reg = normalize(OptISTA, normalizeReg, reg, A, nothing)
 
-  return OptISTA(A, AHA, reg[1], other, x, x₀, y, z, zᵒˡᵈ, res, rT(rho),rT(theta),rT(theta),rT(θn),rT(0),rT(1),rT(1),
-    iterations,rT(relTol),normalizeReg,one(rT),rT(Inf),verbose)
+  state = OptISTAState(x, x₀, y, z, zᵒˡᵈ, res, rT(rho),rT(theta),rT(theta),rT(θn),rT(0),rT(1),rT(1),
+    0,rT(relTol), one(rT),rT(Inf))
+
+  return OptISTA(A, AHA, reg[1], other, normalizeReg, verbose, iterations, state)
+end
+
+function init!(solver::OptISTA, state::OptISTAState{rT, vecT}, b::otherT; kwargs...) where {rT, vecT, otherT}
+  x    = similar(b, size(state.x)...)
+  x₀   = similar(b, size(state.x₀)...)
+  y    = similar(b, size(state.y)...)
+  z    = similar(b, size(state.z)...)
+  zᵒˡᵈ = similar(b, size(state.zᵒˡᵈ)...)
+  res  = similar(b, size(state.res)...)
+
+  state = OptISTAState(x, x₀, y, z, zᵒˡᵈ, res, state.ρ, state.θ, state.θᵒˡᵈ, state.θn, state.α, state.β, state.γ, state.iteration, state.relTol, state.norm_x₀, state.rel_res_norm)
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
    init!(...)
@@ -105,80 +125,84 @@
 
 (re-) initializes the OptISTA iterator
 """
-function init!(solver::OptISTA, b; x0=0, θ=1)
+function init!(solver::OptISTA, state::OptISTAState{rT, vecT}, b::vecT; x0 = 0, θ=1) where {rT, vecT}
   if solver.A === nothing
-    solver.x₀ .= b
+    state.x₀ .= b
   else
-    mul!(solver.x₀, adjoint(solver.A), b)
+    mul!(state.x₀, adjoint(solver.A), b)
   end
 
-  solver.norm_x₀ = norm(solver.x₀)
+  state.norm_x₀ = norm(state.x₀)
 
-  solver.x .= x0
-  solver.y .= solver.x
-  solver.z .= solver.x
-  solver.zᵒˡᵈ .= solver.x
+  state.x .= x0
+  state.y .= state.x
+  state.z .= state.x
+  state.zᵒˡᵈ .= state.x
 
-  solver.θ = θ
-  solver.θᵒˡᵈ = θ
-  solver.θn = θ
+  state.res[:] .= rT(Inf)
+  state.θ = θ
+  state.θᵒˡᵈ = θ
+  state.θn = θ
   for _ = 1:(solver.iterations-1)
-    solver.θn = (1 + sqrt(1 + 4 * solver.θn^2)) / 2
+    state.θn = (1 + sqrt(1 + 4 * state.θn^2)) / 2
   end
-  solver.θn = (1 + sqrt(1 + 8 * solver.θn^2)) / 2
+  state.θn = (1 + sqrt(1 + 8 * state.θn^2)) / 2
+  state.rel_res_norm = rT(Inf)
+  state.iteration = 0
 
   # normalization of regularization parameters
-  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, solver.x₀)
+  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, state.x₀)
 end
 
-solverconvergence(solver::OptISTA) = (; :residual => norm(solver.res))
+solverconvergence(state::OptISTAState) = (; :residual => norm(state.res))
 
 """
   iterate(it::OptISTA, iteration::Int=0)
 
 performs one OptISTA iteration.
 """
-function iterate(solver::OptISTA, iteration::Int=0)
-  if done(solver, iteration) return nothing end
+function iterate(solver::OptISTA, state::OptISTAState = solver.state)
+  if done(solver, state) return nothing end
 
   # inertial parameters
-  solver.γ = 2solver.θ / solver.θn^2 * (solver.θn^2 - 2solver.θ^2 + solver.θ)
-  solver.θᵒˡᵈ = solver.θ
-  if iteration == solver.iterations - 1 #the convergence rate depends on choice of # iterations!
-    solver.θ = (1 + sqrt(1 + 8 * solver.θᵒˡᵈ^2)) / 2
+  state.γ = 2state.θ / state.θn^2 * (state.θn^2 - 2state.θ^2 + state.θ)
+  state.θᵒˡᵈ = state.θ
+  if state.iteration == solver.iterations - 1 #the convergence rate depends on choice of # iterations!
+    state.θ = (1 + sqrt(1 + 8 * state.θᵒˡᵈ^2)) / 2
   else
-    solver.θ = (1 + sqrt(1 + 4 * solver.θᵒˡᵈ^2)) / 2
+    state.θ = (1 + sqrt(1 + 4 * state.θᵒˡᵈ^2)) / 2
   end
-  solver.α = (solver.θᵒˡᵈ - 1) / solver.θ
-  solver.β = solver.θᵒˡᵈ / solver.θ
+  state.α = (state.θᵒˡᵈ - 1) / state.θ
+  state.β = state.θᵒˡᵈ / state.θ
 
   # calculate residuum and do gradient step
-  # solver.y .-= solver.ρ * solver.γ .* (solver.AHA * solver.x .- solver.x₀)
-  solver.zᵒˡᵈ .= solver.z #store this for inertia step
-  solver.z .= solver.y #save yᵒˡᵈ in the variable z
-  mul!(solver.res, solver.AHA, solver.x)
-  solver.res .-= solver.x₀
-  solver.y .-= solver.ρ * solver.γ .* solver.res
+  # state.y .-= state.ρ * state.γ .* (solver.AHA * state.x .- state.x₀)
+  state.zᵒˡᵈ .= state.z #store this for inertia step
+  state.z .= state.y #save yᵒˡᵈ in the variable z
+  mul!(state.res, solver.AHA, state.x)
+  state.res .-= state.x₀
+  state.y .-= state.ρ * state.γ .* state.res
 
-  solver.rel_res_norm = norm(solver.res) / solver.norm_x₀
-  solver.verbose && println("Iteration $iteration; rel. residual = $(solver.rel_res_norm)")
+  state.rel_res_norm = norm(state.res) / state.norm_x₀
+  solver.verbose && println("Iteration $(state.iteration); rel. residual = $(state.rel_res_norm)")
 
   # proximal map
-  prox!(solver.reg, solver.y, solver.ρ * solver.γ * λ(solver.reg))
+  prox!(solver.reg, state.y, state.ρ * state.γ * λ(solver.reg))
 
   # inertia steps
   # z = x + (y - yᵒˡᵈ) / γ
   # x = z + α * (z - zᵒˡᵈ) + β * (z - x)
-  solver.z ./= -solver.γ #yᵒˡᵈ is already stored in z
-  solver.z .+= solver.x .+ solver.y ./ solver.γ
-  solver.x .*= -solver.β
-  solver.x .+= (1 + solver.α + solver.β) .* solver.z
-  solver.x .-= solver.α .* solver.zᵒˡᵈ
+  state.z ./= -state.γ #yᵒˡᵈ is already stored in z
+  state.z .+= state.x .+ state.y ./ state.γ
+  state.x .*= -state.β
+  state.x .+= (1 + state.α + state.β) .* state.z
+  state.x .-= state.α .* state.zᵒˡᵈ
 
+  state.iteration += 1
-  # return the residual-norm as item and iteration number as state
-  return solver, iteration+1
+  # return the current iterate as item and the state as iteration state
+  return state.x, state
 end
 
-@inline converged(solver::OptISTA) = (solver.rel_res_norm < solver.relTol)
+@inline converged(solver::OptISTA, state::OptISTAState) = (state.rel_res_norm < state.relTol)
 
-@inline done(solver::OptISTA,iteration) = converged(solver) || iteration>=solver.iterations
+@inline done(solver::OptISTA, state::OptISTAState) = converged(solver, state) || state.iteration >= solver.iterations
\ No newline at end of file
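Because the final θ-step uses a different recurrence than the intermediate ones, OptISTA must know the iteration count up front, which is why `init!` precomputes θn with the loop above. The same schedule as a standalone helper (illustrative, not part of the PR):

```julia
# Reproduces the θ-schedule that init!/iterate implement together.
function optista_thetas(iterations, θ = 1.0)
  θs = [θ]
  for _ in 1:iterations-1
    push!(θs, (1 + sqrt(1 + 4 * θs[end]^2)) / 2)  # intermediate steps
  end
  push!(θs, (1 + sqrt(1 + 8 * θs[end]^2)) / 2)    # final step uses the 8-factor variant
  return θs
end
```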
diff --git a/src/POGM.jl b/src/POGM.jl
index e06f4e15..a99efb56 100644
--- a/src/POGM.jl
+++ b/src/POGM.jl
@@ -1,10 +1,18 @@
 export pogm, POGM
 
-mutable struct POGM{rT<:Real,vecT<:Union{AbstractVector{rT},AbstractVector{Complex{rT}}},matA,matAHA,R,RN} <: AbstractProximalGradientSolver
+mutable struct POGM{matA,matAHA,R,RN} <: AbstractProximalGradientSolver
   A::matA
   AHA::matAHA
   reg::R
   proj::Vector{RN}
+  normalizeReg::AbstractRegularizationNormalization
+  verbose::Bool
+  restart::Symbol
+  iterations::Int64
+  state::AbstractSolverState{<:POGM}
+end
+
+mutable struct POGMState{rT <: Real, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{POGM}
   x::vecT
   x₀::vecT
   xᵒˡᵈ::vecT
   y::vecT
   z::vecT
   w::vecT
   res::vecT
@@ -21,15 +29,11 @@ mutable struct POGM{rT<:Real,vecT<:Union{AbstractVector{rT},AbstractVector{Compl
   γᵒˡᵈ::rT
   σ::rT
   σ_fac::rT
-  iterations::Int64
+  iteration::Int64
   relTol::rT
-  normalizeReg::AbstractRegularizationNormalization
   norm_x₀::rT
   rel_res_norm::rT
-  verbose::Bool
-  restart::Symbol
 end
-
 """
     POGM(A; AHA = A'*A, reg = L1Regularization(zero(real(eltype(AHA)))), normalizeReg = NoNormalization(), iterations = 50, verbose = false, rho = 0.95 / power_iterations(AHA), theta = 1, sigma_fac = 1, relTol = eps(real(eltype(AHA))), restart = :none)
     POGM( ; AHA = ,    reg = L1Regularization(zero(real(eltype(AHA)))), normalizeReg = NoNormalization(), iterations = 50, verbose = false, rho = 0.95 / power_iterations(AHA), theta = 1, sigma_fac = 1, relTol = eps(real(eltype(AHA))), restart = :none)
@@ -103,8 +107,27 @@ function POGM(A
   other = identity.(other)
   reg = normalize(POGM, normalizeReg, reg, A, nothing)
 
-  return POGM(A, AHA, reg[1], other, x, x₀, xᵒˡᵈ, y, z, w, res, rT(rho), rT(theta), rT(theta), rT(0), rT(1), rT(1), rT(1), rT(1), rT(sigma_fac),
-    iterations, rT(relTol), normalizeReg, one(rT), rT(Inf), verbose, restart)
+  state = POGMState(x, x₀, xᵒˡᵈ, y, z, w, res, rT(rho), rT(theta), rT(theta), rT(0), rT(1), rT(1),
+    rT(1), rT(1), rT(sigma_fac), 0, rT(relTol), one(rT), rT(Inf))
+
+  return POGM(A, AHA, reg[1], other, normalizeReg, verbose, restart, iterations, state)
+end
+
+function init!(solver::POGM, state::POGMState{rT, vecT}, b::otherT; kwargs...) where {rT, vecT, otherT}
+  x    = similar(b, size(state.x)...)
+  x₀   = similar(b, size(state.x₀)...)
+  xᵒˡᵈ = similar(b, size(state.xᵒˡᵈ)...)
+  y    = similar(b, size(state.y)...)
+  z    = similar(b, size(state.z)...)
+  w    = similar(b, size(state.w)...)
+  res  = similar(b, size(state.res)...)
+
+  state = POGMState(x, x₀, xᵒˡᵈ, y, z, w, res, state.ρ, state.theta, state.theta,
+    state.α, state.β, state.γ, state.γᵒˡᵈ, state.σ, state.σ_fac,
+    state.iteration, state.relTol, state.norm_x₀, state.rel_res_norm)
+
+  solver.state = state
+  init!(solver, state, b; kwargs...)
 end
 
 """
    init!(...)
 
 (re-) initializes the POGM iterator
 """
-function init!(solver::POGM, b; x0=0, theta=1)
+function init!(solver::POGM, state::POGMState{rT, vecT}, b::vecT; x0 = 0, theta=1) where {rT, vecT}
   if solver.A === nothing
-    solver.x₀ .= b
+    state.x₀ .= b
   else
-    mul!(solver.x₀, adjoint(solver.A), b)
+    mul!(state.x₀, adjoint(solver.A), b)
   end
 
-  solver.norm_x₀ = norm(solver.x₀)
+  state.norm_x₀ = norm(state.x₀)
 
-  solver.x .= x0
-  solver.xᵒˡᵈ .= 0 # makes no difference in 1st iteration what this is set to
-  solver.y .= 0
-  solver.z .= 0
+  state.x .= x0
+  state.xᵒˡᵈ .= 0 # makes no difference in 1st iteration what this is set to
+  state.y .= 0
+  state.z .= 0
   if solver.restart != :none #save time if not using restart
-    solver.w .= 0
+    state.w .= 0
   end
 
-  solver.theta = theta
-  solver.thetaᵒˡᵈ = theta
-  solver.σ = 1
+  state.res[:] .= rT(Inf)
+  state.theta = theta
+  state.thetaᵒˡᵈ = theta
+  state.σ = 1
+  state.rel_res_norm = rT(Inf)
+
+  state.iteration = 0
 
   # normalization of regularization parameters
-  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, solver.x₀)
+  solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, state.x₀)
 end
 
-solverconvergence(solver::POGM) = (; :residual => norm(solver.res))
+solverconvergence(state::POGMState) = (; :residual => norm(state.res))
 
 """
  iterate(it::POGM, iteration::Int=0)
 
 performs one POGM iteration.
 """
-function iterate(solver::POGM, iteration::Int=0)
-  if done(solver, iteration)
+function iterate(solver::POGM, state = solver.state)
+  if done(solver, state)
     return nothing
   end
 
   # calculate residuum and do gradient step
   # solver.x .-= solver.ρ .* (solver.AHA * solver.x .- solver.x₀)
-  solver.xᵒˡᵈ .= solver.x #save this for inertia step later
-  mul!(solver.res, solver.AHA, solver.x)
-  solver.res .-= solver.x₀
-  solver.x .-= solver.ρ .* solver.res
+  state.xᵒˡᵈ .= state.x #save this for inertia step later
+  mul!(state.res, solver.AHA, state.x)
+  state.res .-= state.x₀
+  state.x .-= state.ρ .* state.res
 
-  solver.rel_res_norm = norm(solver.res) / solver.norm_x₀
-  solver.verbose && println("Iteration $iteration; rel. residual = $(solver.rel_res_norm)")
+  state.rel_res_norm = norm(state.res) / state.norm_x₀
+  solver.verbose && println("Iteration $(state.iteration); rel. residual = $(state.rel_res_norm)")
 
   # inertial parameters
-  solver.thetaᵒˡᵈ = solver.theta
-  if iteration == solver.iterations - 1 && solver.restart != :none #the convergence rate depends on choice of # iterations!
-    solver.theta = (1 + sqrt(1 + 8 * solver.thetaᵒˡᵈ^2)) / 2
+  state.thetaᵒˡᵈ = state.theta
+  if state.iteration == solver.iterations - 1 && solver.restart != :none #the convergence rate depends on choice of # iterations!
+    state.theta = (1 + sqrt(1 + 8 * state.thetaᵒˡᵈ^2)) / 2
   else
-    solver.theta = (1 + sqrt(1 + 4 * solver.thetaᵒˡᵈ^2)) / 2
+    state.theta = (1 + sqrt(1 + 4 * state.thetaᵒˡᵈ^2)) / 2
   end
-  solver.α = (solver.thetaᵒˡᵈ - 1) / solver.theta
-  solver.β = solver.σ * solver.thetaᵒˡᵈ / solver.theta
-  solver.γᵒˡᵈ = solver.γ
+  state.α = (state.thetaᵒˡᵈ - 1) / state.theta
+  state.β = state.σ * state.thetaᵒˡᵈ / state.theta
+  state.γᵒˡᵈ = state.γ
   if solver.restart == :gradient
-    solver.γ = solver.ρ * (1 + solver.α + solver.β)
+    state.γ = state.ρ * (1 + state.α + state.β)
   else
-    solver.γ = solver.ρ * (2solver.thetaᵒˡᵈ + solver.theta - 1) / solver.theta
+    state.γ = state.ρ * (2state.thetaᵒˡᵈ + state.theta - 1) / state.theta
   end
 
   # inertia steps
   # x + α * (x - y) + β * (x - xᵒˡᵈ) + ρα/γᵒˡᵈ * (z - xᵒˡᵈ)
-  tmp = solver.y
-  solver.y = solver.x
-  solver.x = tmp # swap x and y
-  solver.x .*= -solver.α # here we calculate -α * y, where y is now stored in x
-  solver.x .+= (1 + solver.α + solver.β) .* solver.y
-  solver.x .-= (solver.β + solver.ρ * solver.α / solver.γᵒˡᵈ) .* solver.xᵒˡᵈ
-  solver.x .+= solver.ρ * solver.α / solver.γᵒˡᵈ .* solver.z
-  solver.z .= solver.x #store this for next iteration and GR
+  tmp = state.y
+  state.y = state.x
+  state.x = tmp # swap x and y
+  state.x .*= -state.α # here we calculate -α * y, where y is now stored in x
+  state.x .+= (1 + state.α + state.β) .* state.y
+  state.x .-= (state.β + state.ρ * state.α / state.γᵒˡᵈ) .* state.xᵒˡᵈ
+  state.x .+= state.ρ * state.α / state.γᵒˡᵈ .* state.z
+  state.z .= state.x #store this for next iteration and GR
 
   # proximal map
-  prox!(solver.reg, solver.x, solver.γ * λ(solver.reg))
+  prox!(solver.reg, state.x, state.γ * λ(solver.reg))
   for proj in solver.proj
-    prox!(proj, solver.x)
+    prox!(proj, state.x)
   end
 
   # gradient restart conditions
   if solver.restart == :gradient
-    solver.w .+= solver.y .+ solver.ρ ./ solver.γ .* (solver.x .- solver.z)
-    if real((solver.w ⋅ solver.x - solver.w ⋅ solver.z) / solver.γ - solver.w ⋅ solver.res) < 0
-      solver.verbose && println("Gradient restart at iter $iteration")
-      solver.σ = 1
-      solver.theta = 1
+    state.w .+= state.y .+ state.ρ ./ state.γ .* (state.x .- state.z)
+    if real((state.w ⋅ state.x - state.w ⋅ state.z) / state.γ - state.w ⋅ state.res) < 0
+      solver.verbose && println("Gradient restart at iter $(state.iteration)")
+      state.σ = 1
+      state.theta = 1
     else # decreasing γ
-      solver.σ *= solver.σ_fac
+      state.σ *= state.σ_fac
     end
-    solver.w .= solver.ρ / solver.γ .* (solver.z .- solver.x) .- solver.y
+    state.w .= state.ρ / state.γ .* (state.z .- state.x) .- state.y
   end
 
-  # return the residual-norm as item and iteration number as state
-  return solver, iteration + 1
+  state.iteration += 1
+  # return the current iterate as item and the state as iteration state
+  return state.x, state
 end
 
-@inline converged(solver::POGM) = (solver.rel_res_norm < solver.relTol)
+@inline converged(solver::POGM, state::POGMState) = (state.rel_res_norm < state.relTol)
 
-@inline done(solver::POGM, iteration) = converged(solver) || iteration >= solver.iterations
+@inline done(solver::POGM, state::POGMState) = converged(solver, state) || state.iteration >= solver.iterations
\ No newline at end of file
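A usage sketch for the restart machinery, which is selected purely via constructor keywords that `createLinearSolver` forwards to POGM (values illustrative):

```julia
using RegularizedLeastSquares

A = randn(Float32, 64, 32)
solver = createLinearSolver(POGM, A; iterations = 50, restart = :gradient, sigma_fac = 0.9)
x = solve!(solver, randn(Float32, 64))
```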
diff --git a/src/Regularization/PlugAndPlayRegularization.jl b/src/Regularization/PlugAndPlayRegularization.jl
index 2772afb2..6bb482ad 100644
--- a/src/Regularization/PlugAndPlayRegularization.jl
+++ b/src/Regularization/PlugAndPlayRegularization.jl
@@ -26,9 +26,9 @@ PlugAndPlayRegularization(model, shape; kwargs...) = PlugAndPlayRegularization(o
 function prox!(self::PlugAndPlayRegularization, x::AbstractArray{Complex{T}}, λ::T) where {T <: Real}
   if self.ignoreIm
-    x[:] = prox!(self, real.(x), λ) + imag.(x) * one(T)im
+    copyto!(x, prox!(self, real.(x), λ) + imag.(x) * one(T)im)
   else
-    x[:] = prox!(self, real.(x), λ) + prox!(self, imag.(x), λ) * one(T)im
+    copyto!(x, prox!(self, real.(x), λ) + prox!(self, imag.(x), λ) * one(T)im)
   end
   return x
 end
@@ -50,7 +50,7 @@ function prox!(self::PlugAndPlayRegularization, x::AbstractArray{T}, λ::T) wher
   out = out - λ * (out - self.model(out))
   out = RegularizedLeastSquares.inverse_transform(tf, out)
 
-  x[:] = vec(out)
+  copyto!(x, vec(out))
   return x
 end
diff --git a/src/Regularization/TransformedRegularization.jl b/src/Regularization/TransformedRegularization.jl
index 8bd98d20..1f07b592 100644
--- a/src/Regularization/TransformedRegularization.jl
+++ b/src/Regularization/TransformedRegularization.jl
@@ -28,7 +28,7 @@ innerreg(reg::TransformedRegularization) = reg.reg
 function prox!(reg::TransformedRegularization, x::AbstractArray, args...)
   z = reg.trafo * x
   result = prox!(reg.reg, z, args...)
-  x[:] = adjoint(reg.trafo) * result
+  copyto!(x, adjoint(reg.trafo) * result)
   return x
 end
 function norm(reg::TransformedRegularization, x::AbstractArray, args...)
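Both regularization files switch from indexed assignment to `copyto!`. The result is identical; `copyto!` is presumably preferred here because GPU array types ship specialized `copyto!` methods, whereas `x[:] = ...` goes through the more generic `setindex!` path. Minimal equivalence sketch:

```julia
x, y = rand(4), rand(4)
x1 = copy(x); x1[:] = y       # indexed assignment
x2 = copy(x); copyto!(x2, y)  # explicit in-place copy
@assert x1 == x2
```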
+ include("Utils.jl") include("Kaczmarz.jl") -include("DAXKaczmarz.jl") -include("DAXConstrained.jl") +#include("DAXKaczmarz.jl") +#include("DAXConstrained.jl") include("CGNR.jl") include("Direct.jl") include("FISTA.jl") @@ -177,7 +183,7 @@ include("OptISTA.jl") include("POGM.jl") include("ADMM.jl") include("SplitBregman.jl") -include("PrimalDualSolver.jl") +#include("PrimalDualSolver.jl") include("Callbacks.jl") @@ -187,7 +193,8 @@ include("deprecated.jl") Return a list of all available linear solvers """ function linearSolverList() - filter(s -> s ∉ [DaxKaczmarz, DaxConstrained, PrimalDualSolver], linearSolverListReal()) + #filter(s -> s ∉ [DaxKaczmarz, DaxConstrained, PrimalDualSolver], linearSolverListReal()) + linearSolverListReal() end function linearSolverListReal() @@ -239,12 +246,12 @@ See also [`isapplicable`](@ref), [`linearSolverList`](@ref). """ applicableSolverList(args...) = filter(solver -> isapplicable(solver, args...), linearSolverListReal()) -function filterKwargs(T::Type, kwargs) +function filterKwargs(T::Type, kwargWarning, kwargs) table = methods(T) keywords = union(Base.kwarg_decl.(table)...) filtered = filter(in(keywords), keys(kwargs)) - if length(filtered) < length(kwargs) + if length(filtered) < length(kwargs) && kwargWarning filteredout = filter(!in(keywords), keys(kwargs)) @warn "The following arguments were passed but filtered out: $(join(filteredout, ", ")). Please watch closely if this introduces unexpected behaviour in your code." end @@ -260,12 +267,12 @@ regularized linear systems. All solvers return an approximate solution to Ax = b TODO: give a hint what solvers are available """ -function createLinearSolver(solver::Type{T}, A; kwargs...) where {T<:AbstractLinearSolver} - return solver(A; filterKwargs(T, kwargs)...) +function createLinearSolver(solver::Type{T}, A; kwargWarning::Bool = true, kwargs...) where {T<:AbstractLinearSolver} + return solver(A; filterKwargs(T,kwargWarning,kwargs)...) end -function createLinearSolver(solver::Type{T}; AHA, kwargs...) where {T<:AbstractLinearSolver} - return solver(; filterKwargs(T, kwargs)..., AHA = AHA) +function createLinearSolver(solver::Type{T}; AHA, kwargWarning::Bool = true, kwargs...)
where {T<:AbstractLinearSolver} + return solver(; filterKwargs(T,kwargWarning,kwargs)..., AHA = AHA) end end \ No newline at end of file diff --git a/src/SplitBregman.jl b/src/SplitBregman.jl index f665e240..8b4602fd 100644 --- a/src/SplitBregman.jl +++ b/src/SplitBregman.jl @@ -1,14 +1,26 @@ export SplitBregman -mutable struct SplitBregman{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: AbstractPrimalDualSolver +mutable struct SplitBregman{matT,opT,R,ropT,P,preconT} <: AbstractPrimalDualSolver # operators and regularization A::matT reg::Vector{R} regTrafo::Vector{ropT} proj::Vector{P} - y::vecT # fields and operators for x update AHA::opT + # other parameters + precon::preconT + normalizeReg::AbstractRegularizationNormalization + verbose::Bool + iterations::Int64 + iterationsInner::Int64 + iterationsCG::Int64 + state::AbstractSolverState{<:SplitBregman} +end + +mutable struct SplitBregmanState{rT <: Real, rvecT <: AbstractVector{rT}, vecT <: Union{AbstractVector{rT}, AbstractVector{Complex{rT}}}} <: AbstractSolverState{SplitBregman} + y::vecT + # fields and operators for x update β::vecT β_y::vecT # fields for primal & dual variables @@ -16,12 +28,10 @@ mutable struct SplitBregman{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: Abstract z::Vector{vecT} zᵒˡᵈ::Vector{vecT} u::Vector{vecT} - # other parameters - precon::preconT + # other parameters ρ::rvecT - iterationsOuter::Int64 - iterationsInner::Int64 - iterationsCG::Int64 + iteration::Int64 + iter_cnt::Int64 # state variables for CG cgStateVars::CGStateVariables # convergence parameters @@ -33,15 +43,11 @@ mutable struct SplitBregman{matT,opT,R,ropT,P,vecT,rvecT,preconT,rT} <: Abstract absTol::rT relTol::rT tolInner::rT - #counter for internal iterations - iter_cnt::Int64 - normalizeReg::AbstractRegularizationNormalization - verbose::Bool end """ - SplitBregman(A; AHA = A'*A, precon = Identity(), reg = L1Regularization(zero(real(eltype(AHA)))), regTrafo = opEye(eltype(AHA), size(AHA,1)), normalizeReg = NoNormalization(), rho = 1e-1, iterationsOuter = 10, iterationsInner = 10, iterationsCG = 10, absTol = eps(real(eltype(AHA))), relTol = eps(real(eltype(AHA))), tolInner = 1e-5, verbose = false) - SplitBregman( ; AHA = , precon = Identity(), reg = L1Regularization(zero(real(eltype(AHA)))), regTrafo = opEye(eltype(AHA), size(AHA,1)), normalizeReg = NoNormalization(), rho = 1e-1, iterationsOuter = 10, iterationsInner = 10, iterationsCG = 10, absTol = eps(real(eltype(AHA))), relTol = eps(real(eltype(AHA))), tolInner = 1e-5, verbose = false) + SplitBregman(A; AHA = A'*A, precon = Identity(), reg = L1Regularization(zero(real(eltype(AHA)))), regTrafo = opEye(eltype(AHA), size(AHA,1)), normalizeReg = NoNormalization(), rho = 1e-1, iterations = 10, iterationsInner = 10, iterationsCG = 10, absTol = eps(real(eltype(AHA))), relTol = eps(real(eltype(AHA))), tolInner = 1e-5, verbose = false) + SplitBregman( ; AHA = , precon = Identity(), reg = L1Regularization(zero(real(eltype(AHA)))), regTrafo = opEye(eltype(AHA), size(AHA,1)), normalizeReg = NoNormalization(), rho = 1e-1, iterations = 10, iterationsInner = 10, iterationsCG = 10, absTol = eps(real(eltype(AHA))), relTol = eps(real(eltype(AHA))), tolInner = 1e-5, verbose = false) Creates a `SplitBregman` object for the forward operator `A` or normal operator `AHA`. @@ -57,7 +63,7 @@ Creates a `SplitBregman` object for the forward operator `A` or normal operator * `regTrafo` - transformation to a space in which `reg` is applied; if `reg` is a vector, `regTrafo` has to be a vector of the same length.
Use `opEye(eltype(AHA), size(AHA,1))` if no transformation is desired. * `normalizeReg::AbstractRegularizationNormalization` - regularization normalization scheme; options are `NoNormalization()`, `MeasurementBasedNormalization()`, `SystemMatrixBasedNormalization()` * `rho::Real` - weights for condition on regularized variables; can also be a vector for multiple regularization terms - * `iterationsOuter::Int` - maximum number of outer iterations. Set to 1 for unconstraint split Bregman (equivalent to ADMM) + * `iterations::Int` - maximum number of outer iterations. Set to 1 for unconstrained split Bregman (equivalent to ADMM) * `iterationsInner::Int` - maximum number of inner iterations * `iterationsCG::Int` - maximum number of (inner) CG iterations * `absTol::Real` - absolute tolerance for stopping criterion @@ -65,7 +71,7 @@ Creates a `SplitBregman` object for the forward operator `A` or normal operator * `tolInner::Real` - relative tolerance for CG stopping criterion * `verbose::Bool` - print residual in each iteration -This algorithm solves the constraint problem (Eq. (4.7) in [Tom Goldstein and Stanley Osher](https://doi.org/10.1137/080725891)), i.e. `||R(x)||₁` such that `||Ax -b||₂² < σ²`. In order to solve the unconstraint problem (Eq. (4.8) in [Tom Goldstein and Stanley Osher](https://doi.org/10.1137/080725891)), i.e. `||Ax -b||₂² + λ ||R(x)||₁`, you can either set `iterationsOuter=1` or use ADMM instead, which is equivalent (`iterationsOuter=1` in SplitBregman in implied in ADMM and the SplitBregman variable `iterationsInner` is simply called `iterations` in ADMM) +This algorithm solves the constrained problem (Eq. (4.7) in [Tom Goldstein and Stanley Osher](https://doi.org/10.1137/080725891)), i.e. `||R(x)||₁` such that `||Ax -b||₂² < σ²`. In order to solve the unconstrained problem (Eq. (4.8) in [Tom Goldstein and Stanley Osher](https://doi.org/10.1137/080725891)), i.e. `||Ax -b||₂² + λ ||R(x)||₁`, you can either set `iterations=1` or use ADMM instead, which is equivalent (`iterations=1` in SplitBregman is implied in ADMM and the SplitBregman variable `iterationsInner` is simply called `iterations` in ADMM) Like ADMM, SplitBregman differs from ISTA-type algorithms in the sense that the proximal operation is applied separately from the transformation to the space in which the penalty is applied. This is reflected by the interface which has `reg` and `regTrafo` as separate arguments. E.g., for a TV penalty, you should NOT set `reg=TVRegularization`, but instead use `reg=L1Regularization(λ), regTrafo=RegularizedLeastSquares.GradientOp(Float64; shape=(Nx,Ny,Nz))`.
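To make the renamed parameter concrete, a minimal usage sketch of the constrained TV-flavoured setup described above (operator size, λ, and rho values are illustrative assumptions):

    using RegularizedLeastSquares
    Nx, Ny = 16, 16
    A = rand(ComplexF64, 512, Nx * Ny)
    b = A * rand(ComplexF64, Nx * Ny)
    solver = createLinearSolver(SplitBregman, A;
                                reg = [L1Regularization(2e-3)],
                                regTrafo = [RegularizedLeastSquares.GradientOp(ComplexF64; shape = (Nx, Ny))],
                                iterations = 10, iterationsInner = 10, rho = 1.0)
    x_approx = solve!(solver, b)

Setting `iterations = 1` in this sketch recovers the unconstrained, ADMM-equivalent variant discussed above.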
@@ -77,10 +83,10 @@ function SplitBregman(A ; AHA = A'*A , precon = Identity() , reg = L1Regularization(zero(real(eltype(AHA)))) - , regTrafo = opEye(eltype(AHA), size(AHA,1)) + , regTrafo = opEye(eltype(AHA), size(AHA,1), S = LinearOperators.storage_type(AHA)) , normalizeReg::AbstractRegularizationNormalization = NoNormalization() , rho = 1e-1 - , iterationsOuter::Int = 10 + , iterations::Int = 10 , iterationsInner::Int = 10 , iterationsCG::Int = 10 , absTol::Real = eps(real(eltype(AHA))) @@ -128,13 +134,32 @@ function SplitBregman(A ɛᵖʳⁱ = similar(rᵏ) ɛᵈᵘᵃ = similar(rᵏ) - iter_cnt = 1 - # normalization parameters reg = normalize(SplitBregman, normalizeReg, reg, A, nothing) - return SplitBregman(A,reg,regTrafo,proj,y,AHA,β,β_y,x,z,zᵒˡᵈ,u,precon,rho,iterationsOuter,iterationsInner,iterationsCG,cgStateVars,rᵏ,sᵏ,ɛᵖʳⁱ,ɛᵈᵘᵃ,rT(0),rT(absTol),rT(relTol),rT(tolInner),iter_cnt,normalizeReg,verbose) + state = SplitBregmanState(y, β, β_y, x, z, zᵒˡᵈ, u, rho, 1, 1, cgStateVars,rᵏ,sᵏ,ɛᵖʳⁱ,ɛᵈᵘᵃ,rT(0),rT(absTol),rT(relTol),rT(tolInner)) + + return SplitBregman(A,reg,regTrafo,proj,AHA,precon,normalizeReg,verbose,iterations,iterationsInner,iterationsCG,state) +end + +function init!(solver::SplitBregman, state::SplitBregmanState{rT, rvecT, vecT}, b::otherT; kwargs...) where {rT, rvecT, vecT, otherT} + y = similar(b, size(state.y)...) + x = similar(b, size(state.x)...) + β = similar(b, size(state.β)...) + β_y = similar(b, size(state.β_y)...) + + z = [similar(b, size(state.z[i])...) for i ∈ eachindex(solver.reg)] + zᵒˡᵈ = [similar(b, size(state.zᵒˡᵈ[i])...) for i ∈ eachindex(solver.reg)] + u = [similar(b, size(state.u[i])...) for i ∈ eachindex(solver.reg)] + + cgStateVars = CGStateVariables(zero(x),similar(x),similar(x)) + + state = SplitBregmanState(y, β, β_y, x, z, zᵒˡᵈ, u, state.ρ, state.iteration, state.iter_cnt, cgStateVars, + state.rᵏ, state.sᵏ, state.ɛᵖʳⁱ, state.ɛᵈᵘᵃ, state.σᵃᵇˢ, state.absTol, state.relTol, state.tolInner) + + solver.state = state + init!(solver, state, b; kwargs...) 
end """ @@ -142,112 +167,114 @@ end """ (re-) initializes the SplitBregman iterator """ -function init!(solver::SplitBregman, b; x0 = 0) - solver.x .= x0 +function init!(solver::SplitBregman, state::SplitBregmanState{rT, rvecT, vecT}, b::vecT; x0 = 0) where {rT, rvecT, vecT} + state.x .= x0 # right hand side for the x-update if solver.A === nothing - solver.β_y .= b + state.β_y .= b else - mul!(solver.β_y, adjoint(solver.A), b) + mul!(state.β_y, adjoint(solver.A), b) end - solver.y .= solver.β_y + state.y .= state.β_y # primal and dual variables for i ∈ eachindex(solver.reg) - solver.z[i] .= solver.regTrafo[i]*solver.x - solver.u[i] .= 0 + state.z[i] .= solver.regTrafo[i]*state.x + state.u[i] .= 0 end # convergence parameter - solver.rᵏ .= Inf - solver.sᵏ .= Inf - solver.ɛᵖʳⁱ .= 0 - solver.ɛᵈᵘᵃ .= 0 - solver.σᵃᵇˢ = sqrt(length(b)) * solver.absTol + state.rᵏ .= Inf + state.sᵏ .= Inf + state.ɛᵖʳⁱ .= 0 + state.ɛᵈᵘᵃ .= 0 + state.σᵃᵇˢ = sqrt(length(b)) * state.absTol # normalization of regularization parameters solver.reg = normalize(solver, solver.normalizeReg, solver.reg, solver.A, b) # reset iteration counter - solver.iter_cnt = 1 + state.iter_cnt = 1 + state.iteration = 1 end -solverconvergence(solver::SplitBregman) = (; :primal => solver.rᵏ, :dual => solver.sᵏ) +solverconvergence(state::SplitBregmanState) = (; :primal => state.rᵏ, :dual => state.sᵏ) -function iterate(solver::SplitBregman, iteration=1) - if done(solver, iteration) return nothing end - solver.verbose && println("SplitBregman Iteration #$iteration – Outer iteration $(solver.iter_cnt)") +function iterate(solver::SplitBregman, state=solver.state) + if done(solver, state) return nothing end + solver.verbose && println("SplitBregman Iteration #$(state.iteration) – Outer iteration $(state.iter_cnt)") # update x - solver.β .= solver.β_y + state.β .= state.β_y AHA = solver.AHA for i ∈ eachindex(solver.reg) - mul!(solver.β, adjoint(solver.regTrafo[i]), solver.z[i], solver.ρ[i], 1) - mul!(solver.β, adjoint(solver.regTrafo[i]), solver.u[i], -solver.ρ[i], 1) - AHA += solver.ρ[i] * adjoint(solver.regTrafo[i]) * solver.regTrafo[i] + mul!(state.β, adjoint(solver.regTrafo[i]), state.z[i], state.ρ[i], 1) + mul!(state.β, adjoint(solver.regTrafo[i]), state.u[i], -state.ρ[i], 1) + AHA += state.ρ[i] * adjoint(solver.regTrafo[i]) * solver.regTrafo[i] end solver.verbose && println("conjugated gradients: ") - cg!(solver.x, AHA, solver.β, Pl = solver.precon, maxiter = solver.iterationsCG, reltol = solver.tolInner, statevars = solver.cgStateVars, verbose = solver.verbose) + cg!(state.x, AHA, state.β, Pl = solver.precon, maxiter = solver.iterationsCG, reltol = state.tolInner, statevars = state.cgStateVars, verbose = solver.verbose) for proj in solver.proj - prox!(proj, solver.x) + prox!(proj, state.x) end # proximal map for regularization terms for i ∈ eachindex(solver.reg) # swap z and zᵒˡᵈ w/o copying data - tmp = solver.zᵒˡᵈ[i] - solver.zᵒˡᵈ[i] = solver.z[i] - solver.z[i] = tmp + tmp = state.zᵒˡᵈ[i] + state.zᵒˡᵈ[i] = state.z[i] + state.z[i] = tmp # 2. update z using the proximal map of 1/ρ*g(x) - mul!(solver.z[i], solver.regTrafo[i], solver.x) - solver.z[i] .+= solver.u[i] - if solver.ρ[i] != 0 - prox!(solver.reg[i], solver.z[i], λ(solver.reg[i])/2solver.ρ[i]) # λ is divided by 2 to match the ISTA-type algorithms + mul!(state.z[i], solver.regTrafo[i], state.x) + state.z[i] .+= state.u[i] + if state.ρ[i] != 0 + prox!(solver.reg[i], state.z[i], λ(solver.reg[i])/state.ρ[i]) # λ is scaled by 1/ρ end # 3.
update u - mul!(solver.u[i], solver.regTrafo[i], solver.x, 1, 1) - solver.u[i] .-= solver.z[i] + mul!(state.u[i], solver.regTrafo[i], state.x, 1, 1) + state.u[i] .-= state.z[i] # update convergence criteria (one for each constraint) - solver.rᵏ[i] = norm(solver.regTrafo[i] * solver.x - solver.z[i]) # primal residual (x-z) - solver.sᵏ[i] = norm(solver.ρ[i] * adjoint(solver.regTrafo[i]) * (solver.z[i] .- solver.zᵒˡᵈ[i])) # dual residual (concerning f(x)) + state.rᵏ[i] = norm(solver.regTrafo[i] * state.x - state.z[i]) # primal residual (x-z) + state.sᵏ[i] = norm(state.ρ[i] * adjoint(solver.regTrafo[i]) * (state.z[i] .- state.zᵒˡᵈ[i])) # dual residual (concerning f(x)) - solver.ɛᵖʳⁱ[i] = max(norm(solver.regTrafo[i] * solver.x), norm(solver.z[i])) - solver.ɛᵈᵘᵃ[i] = norm(solver.ρ[i] * adjoint(solver.regTrafo[i]) * solver.u[i]) + state.ɛᵖʳⁱ[i] = max(norm(solver.regTrafo[i] * state.x), norm(state.z[i])) + state.ɛᵈᵘᵃ[i] = norm(state.ρ[i] * adjoint(solver.regTrafo[i]) * state.u[i]) if solver.verbose - println("rᵏ[$i]/ɛᵖʳⁱ[$i] = $(solver.rᵏ[i]/solver.ɛᵖʳⁱ[i])") - println("sᵏ[$i]/ɛᵈᵘᵃ[$i] = $(solver.sᵏ[i]/solver.ɛᵈᵘᵃ[i])") + println("rᵏ[$i]/ɛᵖʳⁱ[$i] = $(state.rᵏ[i]/state.ɛᵖʳⁱ[i])") + println("sᵏ[$i]/ɛᵈᵘᵃ[$i] = $(state.sᵏ[i]/state.ɛᵈᵘᵃ[i])") flush(stdout) end end - if converged(solver) || iteration >= solver.iterationsInner - solver.β_y .+= solver.y - mul!(solver.β_y, solver.AHA, solver.x, -1, 1) + if converged(solver, state) || state.iteration >= solver.iterationsInner + state.β_y .+= state.y + mul!(state.β_y, solver.AHA, state.x, -1, 1) # reset z and b for i ∈ eachindex(solver.reg) - mul!(solver.z[i], solver.regTrafo[i], solver.x) - solver.u[i] .= 0 + mul!(state.z[i], solver.regTrafo[i], state.x) + state.u[i] .= 0 end - solver.iter_cnt += 1 - iteration = 0 + state.iter_cnt += 1 + state.iteration = 0 end - return solver.rᵏ, iteration+1 + state.iteration += 1 + return state.x, state end -function converged(solver::SplitBregman) +function converged(solver::SplitBregman, state) for i ∈ eachindex(solver.reg) - (solver.rᵏ[i] >= solver.σᵃᵇˢ + solver.relTol * solver.ɛᵖʳⁱ[i]) && return false - (solver.sᵏ[i] >= solver.σᵃᵇˢ + solver.relTol * solver.ɛᵈᵘᵃ[i]) && return false + (state.rᵏ[i] >= state.σᵃᵇˢ + state.relTol * state.ɛᵖʳⁱ[i]) && return false + (state.sᵏ[i] >= state.σᵃᵇˢ + state.relTol * state.ɛᵈᵘᵃ[i]) && return false end return true end -@inline done(solver::SplitBregman,iteration::Int) = converged(solver) || (iteration == 1 && solver.iter_cnt > solver.iterationsOuter) \ No newline at end of file +@inline done(solver::SplitBregman,state) = converged(solver, state) || (state.iteration == 1 && state.iter_cnt > solver.iterations) \ No newline at end of file diff --git a/src/Utils.jl b/src/Utils.jl index 98f317a6..a593b78b 100644 --- a/src/Utils.jl +++ b/src/Utils.jl @@ -99,7 +99,7 @@ function dot_with_matrix_row(B::Transpose{T,S}, tmp end -function dot_with_matrix_row(prod::ProdOp{T, <:WeightingOp, matT}, x::Vector{T}, k) where {T, matT} +function dot_with_matrix_row(prod::ProdOp{T, <:WeightingOp, matT}, x::AbstractVector{T}, k) where {T, matT} A = prod.B return prod.A.weights[k]*dot_with_matrix_row(A, x, k) end @@ -111,35 +111,35 @@ end """ This function enforces the constraint of a real solution. 
""" -function enfReal!(x::AbstractArray{T}, mask=ones(Bool, length(x))) where {T<:Complex} +function enfReal!(x::AbstractArray{T}) where {T<:Complex} #Returns x as complex vector with imaginary part set to zero @simd for i in 1:length(x) - @inbounds mask[i] && (x[i] = complex(x[i].re)) + @inbounds (x[i] = complex(x[i].re)) end end """ This function enforces the constraint of a real solution. """ -enfReal!(x::AbstractArray{T}, mask=ones(Bool, length(x))) where {T<:Real} = nothing +enfReal!(x::AbstractArray{T}) where {T<:Real} = nothing """ This function enforces positivity constraints on its input. """ -function enfPos!(x::AbstractArray{T}, mask=ones(Bool, length(x))) where {T<:Complex} +function enfPos!(x::AbstractArray{T}) where {T<:Complex} #Return x as complex vector with negative parts projected onto 0 @simd for i in 1:length(x) - @inbounds (x[i].re < 0 && mask[i]) && (x[i] = im*x[i].im) + @inbounds (x[i].re < 0) && (x[i] = im*x[i].im) end end """ This function enforces positivity constraints on its input. """ -function enfPos!(x::AbstractArray{T}, mask=ones(Bool, length(x))) where {T<:Real} +function enfPos!(x::AbstractArray{T}) where {T<:Real} #Return x as complex vector with negative parts projected onto 0 @simd for i in 1:length(x) - @inbounds (x[i] < 0 && mask[i]) && (x[i] = zero(T)) + @inbounds (x[i] < 0) && (x[i] = zero(T)) end end @@ -245,9 +245,11 @@ end power_iterations(AᴴA; rtol=1e-3, maxiter=30, verbose=false) Power iterations to determine the maximum eigenvalue of a normal operator or square matrix. +For custom AᴴA which are not an abstract array or an `AbstractLinearOperator` one can pass a vector `b` of `size(AᴴA, 2)` to be used during the computation. # Arguments * `AᴴA` - operator or matrix; has to be square +* b - (optional), vector to be used during computation # Keyword Arguments * `rtol=1e-3` - relative tolerance; function terminates if the change of the max. eigenvalue is smaller than this values @@ -257,8 +259,11 @@ Power iterations to determine the maximum eigenvalue of a normal operator or squ # Output maximum eigenvalue of the operator """ -function power_iterations(AᴴA; rtol=1e-3, maxiter=30, verbose=false) - b = randn(eltype(AᴴA), size(AᴴA,2)) +power_iterations(AᴴA::AbstractArray; kwargs...) = power_iterations(AᴴA, similar(AᴴA, size(AᴴA, 2)); kwargs...) +power_iterations(AᴴA::AbstractLinearOperator; kwargs...) = power_iterations(AᴴA, similar(LinearOperators.storage_type(AᴴA), size(AᴴA, 2)); kwargs...) 
+function power_iterations(AᴴA, b; rtol=1e-3, maxiter=30, verbose=false) + copyto!(b, randn(eltype(b), size(AᴴA, 2))) + bᵒˡᵈ = similar(b) λ = Inf diff --git a/src/proximalMaps/ProxL21.jl b/src/proximalMaps/ProxL21.jl index 4452a9f4..d02d6379 100644 --- a/src/proximalMaps/ProxL21.jl +++ b/src/proximalMaps/ProxL21.jl @@ -30,7 +30,7 @@ end function proxL21!(x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T, slices::Int64) where T sliceLength = div(length(x),slices) groupNorm = [norm(x[i:sliceLength:end]) for i=1:sliceLength] - x[:] = [ x[i]*max( (groupNorm[mod1(i,sliceLength)]-λ)/groupNorm[mod1(i,sliceLength)],0 ) for i=1:length(x)] + copyto!(x, [ x[i]*max( (groupNorm[mod1(i,sliceLength)]-λ)/groupNorm[mod1(i,sliceLength)],0 ) for i=1:length(x)]) return x end diff --git a/src/proximalMaps/ProxLLR.jl b/src/proximalMaps/ProxLLR.jl index 79880ebb..46e47ec7 100644 --- a/src/proximalMaps/ProxLLR.jl +++ b/src/proximalMaps/ProxLLR.jl @@ -39,7 +39,7 @@ end performs the proximal map for LLR regularization using singular-value-thresholding on non-overlapping blocks """ -function proxLLRNonOverlapping!(reg::LLRRegularization{TR, N, TI}, x::AbstractArray{Tc}, λ::T) where {TR, N, TI, T, Tc <: Union{T, Complex{T}}} +function proxLLRNonOverlapping!(reg::LLRRegularization{TR, N, TI}, x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T) where {TR, N, TI, T} shape = reg.shape blockSize = reg.blockSize randshift = reg.randshift @@ -59,7 +59,8 @@ function proxLLRNonOverlapping!(reg::LLRRegularization{TR, N, TI}, x::AbstractAr ext = mod.(shape, blockSize) pad = mod.(blockSize .- ext, blockSize) if any(pad .!= 0) - xp = zeros(Tc, (shape .+ pad)..., K) + xp = similar(x, eltype(x), (shape .+ pad)..., K) + fill!(xp, zero(eltype(x))) xp[CartesianIndices(x)] .= xs else xp = xs @@ -68,15 +69,16 @@ function proxLLRNonOverlapping!(reg::LLRRegularization{TR, N, TI}, x::AbstractAr bthreads = BLAS.get_num_threads() try BLAS.set_num_threads(1) - xᴸᴸᴿ = [Array{Tc}(undef, prod(blockSize), K) for _ = 1:Threads.nthreads()] + blocks = CartesianIndices(StepRange.(TI(0), blockSize, shape .- 1)) + xᴸᴸᴿ = [similar(x, prod(blockSize), K) for _ = 1:length(blocks)] let xp = xp # Avoid boxing error - @floop for i ∈ CartesianIndices(StepRange.(TI(0), blockSize, shape .- 1)) - @views xᴸᴸᴿ[Threads.threadid()] .= reshape(xp[i.+block_idx, :], :, K) - ub = sqrt(norm(xᴸᴸᴿ[Threads.threadid()]' * xᴸᴸᴿ[Threads.threadid()], Inf)) #upper bound on singular values given by matrix infinity norm + @floop for (id, i) ∈ enumerate(blocks) + @views xᴸᴸᴿ[id] .= reshape(xp[i.+block_idx, :], :, K) + ub = sqrt(norm(xᴸᴸᴿ[id]' * xᴸᴸᴿ[id], Inf)) #upper bound on singular values given by matrix infinity norm if λ >= ub #save time by skipping the SVT as recommended by Ong/Lustig, IEEE 2016 xp[i.+block_idx, :] .= 0 else # threshold singular values - SVDec = svd!(xᴸᴸᴿ[Threads.threadid()]) + SVDec = svd!(xᴸᴸᴿ[id]) prox!(L1Regularization, SVDec.S, λ) xp[i.+block_idx, :] .= reshape(SVDec.U * Diagonal(SVDec.S) * SVDec.Vt, blockSize..., :) end @@ -168,7 +170,7 @@ proxLLROverlapping!(reg::LLRRegularization, x, λ) performs the proximal map for LLR regularization using singular-value-thresholding with fully overlapping blocks """ -function proxLLROverlapping!(reg::LLRRegularization{TR, N, TI}, x::AbstractArray{Tc}, λ::T) where {TR, N, TI, T, Tc <: Union{T, Complex{T}}} +function proxLLROverlapping!(reg::LLRRegularization{TR, N, TI}, x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T) where {TR, N, TI, T} shape = reg.shape blockSize = reg.blockSize @@ 
-180,7 +182,7 @@ function proxLLROverlapping!(reg::LLRRegularization{TR, N, TI}, x::AbstractArray ext = mod.(shape, blockSize) pad = mod.(blockSize .- ext, blockSize) if any(pad .!= 0) - xp = zeros(Tc, (shape .+ pad)..., K) + xp = zeros(eltype(x), (shape .+ pad)..., K) xp[CartesianIndices(x)] .= x else xp = copy(x) diff --git a/src/proximalMaps/ProxNuclear.jl b/src/proximalMaps/ProxNuclear.jl index e14898dc..f8e7c14d 100644 --- a/src/proximalMaps/ProxNuclear.jl +++ b/src/proximalMaps/ProxNuclear.jl @@ -26,7 +26,7 @@ performs singular value soft-thresholding - i.e. the proximal map for the nuclea function prox!(reg::NuclearRegularization, x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T) where {T <: Real} U,S,V = svd(reshape(x, reg.svtShape)) prox!(L1Regularization, S, λ) - x[:] = vec(U*Matrix(Diagonal(S))*V') + copyto!(x, vec(U*Diagonal(S)*V')) return x end diff --git a/src/proximalMaps/ProxProj.jl b/src/proximalMaps/ProxProj.jl index 4a19abca..6a6bc99b 100644 --- a/src/proximalMaps/ProxProj.jl +++ b/src/proximalMaps/ProxProj.jl @@ -5,14 +5,14 @@ struct ProjectionRegularization <: AbstractProjectionRegularization end ProjectionRegularization(; projFunc::Function=x->x, kargs...) = ProjectionRegularization(projFunc) -function prox!(reg::ProjectionRegularization, x::Vector{Tc}) where {T, Tc <: Union{T, Complex{T}}} - x[:] = reg.projFunc(x) +function prox!(reg::ProjectionRegularization, x::AbstractArray{Tc}) where {T, Tc <: Union{T, Complex{T}}} + copyto!(x, reg.projFunc(x)) return x end -function norm(reg::ProjectionRegularization, x::Vector{Tc}) where {T, Tc <: Union{T, Complex{T}}} +function norm(reg::ProjectionRegularization, x::AbstractArray{Tc}) where {T, Tc <: Union{T, Complex{T}}} y = copy(x) - y[:] = prox!(reg, y) + copyto!(y, prox!(reg, y)) if y != x return Inf end diff --git a/src/proximalMaps/ProxReal.jl b/src/proximalMaps/ProxReal.jl index af898ab5..c083ae32 100644 --- a/src/proximalMaps/ProxReal.jl +++ b/src/proximalMaps/ProxReal.jl @@ -13,7 +13,7 @@ end enforce realness of solution `x`. """ -function prox!(::RealRegularization, x::Vector{T}) where T +function prox!(::RealRegularization, x::AbstractArray{T}) where T enfReal!(x) return x end @@ -23,7 +23,7 @@ end returns the value of the characteristic function of real, Real numbers. """ -function norm(reg::RealRegularization, x::Vector{T}) where T +function norm(reg::RealRegularization, x::AbstractArray{T}) where T y = copy(x) prox!(reg, y) if y != x diff --git a/src/proximalMaps/ProxTV.jl b/src/proximalMaps/ProxTV.jl index a17d21f0..e319e8d5 100644 --- a/src/proximalMaps/ProxTV.jl +++ b/src/proximalMaps/ProxTV.jl @@ -1,5 +1,13 @@ export TVRegularization +mutable struct TVParams{Tc,vecTc <: AbstractVector{Tc}, matT} + pq::vecTc + rs::vecTc + pqOld::vecTc + xTmp::vecTc + ∇::matT +end + """ TVRegularization @@ -21,29 +29,21 @@ and Deblurring Problems", IEEE Trans. Image Process. 18(11), 2009 * `dims` - Dimension to perform the TV along. If `Integer`, the Condat algorithm is called, and the FGP algorithm otherwise. * `iterationsTV=10` - number of FGP iterations """ -struct TVRegularization{T,N,TI} <: AbstractParameterizedRegularization{T} where {N,TI<:Integer} +mutable struct TVRegularization{T,N,TI} <: AbstractParameterizedRegularization{T} where {N,TI<:Integer} λ::T dims shape::NTuple{N,TI} iterationsTV::Int64 + params::Union{TVParams, Nothing} end -TVRegularization(λ; shape=(0,), dims=1:length(shape), iterationsTV=10, kargs...)
= TVRegularization(λ, dims, shape, iterationsTV) - - -mutable struct TVParams{Tc,matT} - pq::Vector{Tc} - rs::Vector{Tc} - pqOld::Vector{Tc} - xTmp::Vector{Tc} - ∇::matT -end +TVRegularization(λ; shape=(0,), dims=1:length(shape), iterationsTV=10, kargs...) = TVRegularization(λ, dims, shape, iterationsTV, nothing) function TVParams(shape, T::Type=Float64; dims=1:length(shape)) return TVParams(Vector{T}(undef, prod(shape)); shape=shape, dims=dims) end function TVParams(x::AbstractVector{Tc}; shape, dims=1:length(shape)) where {Tc} - ∇ = GradientOp(Tc; shape, dims) + ∇ = GradientOp(Tc; shape, dims, S = typeof(x)) # allocate storage xTmp = similar(x) @@ -61,12 +61,13 @@ end Proximal map for TV regularization. Calculated with the Condat algorithm if the TV is calculated only along one dimension and with the Fast Gradient Projection algorithm otherwise. """ -prox!(reg::TVRegularization, x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T) where {T <: Real} = proxTV!(x, λ, shape=reg.shape, dims=reg.dims, iterationsTV=reg.iterationsTV) +prox!(reg::TVRegularization, x::Union{AbstractArray{T}, AbstractArray{Complex{T}}}, λ::T) where {T <: Real} = proxTV!(reg, x, λ, shape=reg.shape, dims=reg.dims, iterationsTV=reg.iterationsTV) -function proxTV!(x, λ; shape, dims=1:length(shape), kwargs...) # use kwargs for shape and dims - return proxTV!(x, λ, shape, dims; kwargs...) # define shape and dims w/o kwargs to enable multiple dispatch on dims +function proxTV!(reg, x, λ; shape, dims=1:length(shape), kwargs...) # use kwargs for shape and dims - return proxTV!(reg, x, λ, shape, dims; kwargs...) # define shape and dims w/o kwargs to enable multiple dispatch on dims end +proxTV!(reg, x, λ, shape, dims::Integer; kwargs...) = proxTV!(x, λ, shape, dims; kwargs...) function proxTV!(x::AbstractVector{T}, λ::T, shape, dims::Integer; kwargs...) where {T<:Real} x_ = reshape(x, shape) i = CartesianIndices((ones(Int, dims - 1)..., 0:shape[dims]-1, ones(Int, length(shape) - dims)...)) @@ -77,12 +78,19 @@ function proxTV!(x::AbstractVector{T}, λ::T, shape, dims::Integer; kwargs...) w return x end -function proxTV!(x::AbstractVector{Tc}, λ::T, shape, dims; iterationsTV=10, tvpar=TVParams(x; shape=shape, dims=dims), kwargs...) where {T<:Real,Tc<:Union{T,Complex{T}}} - return proxTV!(x, λ, tvpar; iterationsTV=iterationsTV) +# Reuse TVParams if possible +function proxTV!(reg, x::AbstractVector{Tc}, λ::T, shape, dims; iterationsTV=10, kwargs...) where {T<:Real,Tc<:Union{T,Complex{T}}} + if isnothing(reg.params) || length(x) != length(reg.params.xTmp) || typeof(x) != typeof(reg.params.xTmp) + reg.params = TVParams(x; shape = shape, dims = dims) + end + return proxTV!(x, λ, reg.params; iterationsTV=iterationsTV) end function proxTV!(x::AbstractVector{Tc}, λ::T, p::TVParams{Tc}; iterationsTV=10, kwargs...)
where {T<:Real,Tc<:Union{T,Complex{T}}} @assert length(p.xTmp) == length(x) + @assert length(p.rs) == length(p.pq) + # initialize dual variables p.xTmp .= 0 p.pq .= 0 @@ -96,13 +104,11 @@ function proxTV!(x::AbstractVector{Tc}, λ::T, p::TVParams{Tc}; iterationsTV=10, p.pq = p.rs # gradient projection step for dual variables - Threads.@threads for i ∈ eachindex(p.xTmp, x) - @inbounds p.xTmp[i] = x[i] - end + tv_copy!(p.xTmp, x) mul!(p.xTmp, transpose(p.∇), p.rs, -λ, 1) # xtmp = x-λ*transpose(∇)*rs mul!(p.pq, p.∇, p.xTmp, 1 / (8λ), 1) # rs = ∇*xTmp/(8λ) - restrictMagnitude!(p.pq) + tv_restrictMagnitude!(p.pq) # form linear combination of old and new estimates tOld = t @@ -111,22 +117,33 @@ function proxTV!(x::AbstractVector{Tc}, λ::T, p::TVParams{Tc}; iterationsTV=10, t3 = 1 + t2 p.rs = pqTmp - Threads.@threads for i ∈ eachindex(p.rs, p.pq, p.pqOld) - @inbounds p.rs[i] = t3 * p.pq[i] - t2 * p.pqOld[i] - end + tv_linearcomb!(p.rs, t3, p.pq, t2, p.pqOld) end mul!(x, transpose(p.∇), p.pq, -λ, one(Tc)) # x .-= λ*transpose(∇)*pq return x end +tv_copy!(dest, src) = copyto!(dest, src) +function tv_copy!(dest::Vector{T}, src::Vector{T}) where T + Threads.@threads for i ∈ eachindex(dest, src) + @inbounds dest[i] = src[i] + end +end + # restrict x to a magnitude of at most one -function restrictMagnitude!(x) +function tv_restrictMagnitude!(x) Threads.@threads for i in eachindex(x) @inbounds x[i] /= max(1, abs(x[i])) end end +function tv_linearcomb!(rs, t3, pq, t2, pqOld) + Threads.@threads for i ∈ eachindex(rs, pq, pqOld) + @inbounds rs[i] = t3 * pq[i] - t2 * pqOld[i] + end +end + """ norm(reg::TVRegularization, x, λ) diff --git a/src/proximalMaps/ProxTVCondat.jl b/src/proximalMaps/ProxTVCondat.jl index a4cc0e71..0f2dd854 100644 --- a/src/proximalMaps/ProxTVCondat.jl +++ b/src/proximalMaps/ProxTVCondat.jl @@ -14,7 +14,7 @@ function proxTVCondat!(x::Vector{T}, λ::Float64; shape=[], kargs...) where T tv_denoise_3d_condat!(y_, nhood[d,:], λ*omega[d]) y .+= y_ ./ length(omega) end - x[:] = y[:] + copyto!(x, y) return y end diff --git a/test/gpu/cuda.jl b/test/gpu/cuda.jl new file mode 100644 index 00000000..e7d0eb2c --- /dev/null +++ b/test/gpu/cuda.jl @@ -0,0 +1,5 @@ +using CUDA + +arrayTypes = [CuArray] + +include(joinpath(@__DIR__(), "..", "runtests.jl")) \ No newline at end of file diff --git a/test/gpu/rocm.jl b/test/gpu/rocm.jl new file mode 100644 index 00000000..ebf32fb3 --- /dev/null +++ b/test/gpu/rocm.jl @@ -0,0 +1,5 @@ +using AMDGPU + +arrayTypes = [ROCArray] + +include(joinpath(@__DIR__(), "..", "runtests.jl")) \ No newline at end of file diff --git a/test/runtests.jl b/test/runtests.jl index 00d5f82d..ddb6ad34 100644 --- a/test/runtests.jl +++ b/test/runtests.jl @@ -2,6 +2,10 @@ using RegularizedLeastSquares, LinearAlgebra, RegularizedLeastSquares.LinearOper # Packages for testing only using Random, Test using FFTW +using JLArrays + +areTypesDefined = @isdefined arrayTypes +arrayTypes = areTypesDefined ?
arrayTypes : [Array, JLArray] @testset "RegularizedLeastSquares" begin include("testCreation.jl") diff --git a/test/testCallbacks.jl b/test/testCallbacks.jl new file mode 100644 index 00000000..4d4f57f4 --- /dev/null +++ b/test/testCallbacks.jl @@ -0,0 +1,58 @@ +@testset "Test Callbacks" begin + A = rand(32, 32) + x = rand(32) + b = A * x + + iterations = 10 + solver = createLinearSolver(CGNR, A; iterations = iterations, relTol = 0.0) + + @testset "Store Solution Callback" begin + cbk = StoreSolutionCallback() + x_approx = solve!(solver, b; callbacks = cbk) + + @test length(cbk.solutions) == iterations + 1 + @test cbk.solutions[end] == x_approx + end + + @testset "Compare Solution Callback" begin + cbk = CompareSolutionCallback(x) + x_approx = solve!(solver, b; callbacks = cbk) + + @test length(cbk.results) == iterations + 1 + @test cbk.results[1] > cbk.results[end] + end + + @testset "Store Convergence Callback" begin + cbk = StoreConvergenceCallback() + x_approx = solve!(solver, b; callbacks = cbk) + + @test length(first(values(cbk.convMeas))) == iterations + 1 + conv = solverconvergence(solver) + @test cbk.convMeas[keys(conv)[1]][end] == conv[1] + end + + @testset "Do-Syntax Callback" begin + counter = 0 + + solve!(solver, b) do solver, it + counter += 1 + end + + @test counter == iterations + 1 + end + + @testset "Multiple Callbacks" begin + callbacks = [StoreSolutionCallback(), StoreConvergenceCallback()] + + x_approx = solve!(solver, b; callbacks) + + cbk = callbacks[1] + @test length(cbk.solutions) == iterations + 1 + @test cbk.solutions[end] == x_approx + + cbk = callbacks[2] + @test length(first(values(cbk.convMeas))) == iterations + 1 + conv = solverconvergence(solver) + @test cbk.convMeas[keys(conv)[1]][end] == conv[1] + end +end \ No newline at end of file diff --git a/test/testKaczmarz.jl b/test/testKaczmarz.jl index 0e85c8c9..1d8a3f50 100644 --- a/test/testKaczmarz.jl +++ b/test/testKaczmarz.jl @@ -1,119 +1,123 @@ Random.seed!(12345) -@testset "test Kaczmarz update" begin - for T in [Float32,Float64,ComplexF32,ComplexF64] - # set up - M = 127 - N = 16 - - A = rand(T,M,N) - Aᵀ = transpose(A) - b = zeros(T,M) - β = rand(T) - k = rand(1:N) - # end set up - - RegularizedLeastSquares.kaczmarz_update!(Aᵀ,b,k,β) - @test b ≈ β*conj(A[:,k]) +@testset "Test Kaczmarz" begin + for arrayType in arrayTypes + @testset "$arrayType" begin + + for T in [Float32, Float64, ComplexF32, ComplexF64] + @testset "test Kaczmarz update $T" begin + # set up + M = 127 + N = 16 + + A = arrayType(rand(T, M, N)) + Aᵀ = transpose(A) + b = arrayType(zeros(T, M)) + β = rand(T) + k = rand(1:N) + # end set up + + RegularizedLeastSquares.kaczmarz_update!(Aᵀ, b, k, β) + @test Array(b) ≈ β * conj(Array(A[:, k])) + + # set up + M = 127 + N = 16 + + A = arrayType(rand(T, N, M)) + b = arrayType(zeros(T, M)) + β = rand(T) + k = rand(1:N) + # end set up + + RegularizedLeastSquares.kaczmarz_update!(A, b, k, β) + @test Array(b) ≈ β * conj(Array(A[k, :])) + end + end + + # Test Tikhonov regularization matrix + @testset "Kaczmarz Tikhonov matrix" begin + A = rand(3, 2) + im * rand(3, 2) + x = rand(2) + im * rand(2) + b = A * x + + regMatrix = rand(2) # Tikhonov matrix + + solver = Kaczmarz + S = createLinearSolver(solver, arrayType(A), iterations=200, reg=[L2Regularization(arrayType(regMatrix))]) + x_approx = Array(solve!(S, arrayType(b))) + #@info "Testing solver $solver ...: $x == $x_approx" + @test norm(x - x_approx) / norm(x) ≈ 0 atol = 0.1 + + ## Test spatial regularization + M = 12 + N = 8 + A = rand(M, N) + im * rand(M,
N) + x = rand(N) + im * rand(N) + b = A * x + + # regularization + λ = rand(1) + regMatrix = rand(N) + + # @show A, x, regMatrix + # use regularization matrix + + S = createLinearSolver(solver, arrayType(A), iterations=100, reg=[L2Regularization(arrayType(regMatrix))]) + x_matrix = Array(solve!(S, arrayType(b))) + + # use standard reconstruction + S = createLinearSolver(solver, arrayType(A * Diagonal(1 ./ sqrt.(regMatrix))), iterations=100) + x_approx = Array(solve!(S, arrayType(b))) ./ sqrt.(regMatrix) + + # test + #@info "Testing solver $solver ...: $x_matrix == $x_approx" + @test norm(x_approx - x_matrix) / norm(x_approx) ≈ 0 atol = 0.1 + end + + @testset "Kaczmarz Weighting Matrix" begin + # TODO does not work on GPU atm, see https://github.com/JuliaGPU/GPUArrays.jl/issues/543 + M = 12 + N = 8 + A = rand(M, N) + im * rand(M, N) + x = rand(N) + im * rand(N) + b = A * x + w = WeightingOp(rand(M)) + d = diagm(w.weights) + + reg = L2Regularization(rand()) + + solver = Kaczmarz + S = createLinearSolver(solver, d * A, iterations=200, reg=reg) + S_weighted = createLinearSolver(solver, *(ProdOp, w, A), iterations=200, reg=reg) + x_approx = solve!(S, d * b) + x_weighted = solve!(S_weighted, d * b) + #@info "Testing solver $solver ...: $x == $x_approx" + @test isapprox(x_approx, x_weighted) + end + + + # Test Kaczmarz parameters + @testset "Kaczmarz parameters" begin + M = 12 + N = 8 + A = rand(M, N) + im * rand(M, N) + x = rand(N) + im * rand(N) + b = A * x + + solver = Kaczmarz + S = createLinearSolver(solver, arrayType(A), iterations=200) + x_approx = Array(solve!(S, arrayType(b))) + @test norm(x - x_approx) / norm(x) ≈ 0 atol = 0.1 + + S = createLinearSolver(solver, arrayType(A), iterations=200, shuffleRows=true) + x_approx = Array(solve!(S, arrayType(b))) + @test norm(x - x_approx) / norm(x) ≈ 0 atol = 0.1 + + S = createLinearSolver(solver, arrayType(A), iterations=2000, randomized=true) + x_approx = Array(solve!(S, arrayType(b))) + @test norm(x - x_approx) / norm(x) ≈ 0 atol = 0.1 + end end - - for T in [Float32,Float64,ComplexF32,ComplexF64] - # set up - M = 127 - N = 16 - - A = rand(T,N,M) - b = zeros(T,M) - β = rand(T) - k = rand(1:N) - # end set up - - RegularizedLeastSquares.kaczmarz_update!(A,b,k,β) - @test b ≈ β*conj(A[k,:]) - end -end - -# Test Tikhonov regularization matrix -@testset "Kaczmarz Tikhonov matrix" begin - A = rand(3,2)+im*rand(3,2) - x = rand(2)+im*rand(2) - b = A*x - - regMatrix = rand(2) # Tikhonov matrix - - solver = Kaczmarz - S = createLinearSolver(solver, A, iterations=200, reg=[L2Regularization(regMatrix)]) - x_approx = solve!(S,b) - #@info "Testing solver $solver ...: $x == $x_approx" - @test norm(x - x_approx) / norm(x) ≈ 0 atol=0.1 - - ## Test spatial regularization - M = 12 - N = 8 - A = rand(M,N)+im*rand(M,N) - x = rand(N)+im*rand(N) - b = A*x - - # regularization - λ = rand(1) - regMatrix = rand(N) - - # @show A, x, regMatrix - # use regularization matrix - - S = createLinearSolver(solver, A, iterations=100, reg=[L2Regularization(regMatrix)]) - x_matrix = solve!(S,b) - - # use standard reconstruction - S = createLinearSolver(solver, A * Diagonal(1 ./ sqrt.(regMatrix)), iterations=100) - x_approx = solve!(S,b) ./ sqrt.(regMatrix) - - # test - #@info "Testing solver $solver ...: $x_matrix == $x_approx" - @test norm(x_approx - x_matrix) / norm(x_approx) ≈ 0 atol=0.1 -end - -@testset "Kaczmarz Weighting Matrix" begin - M = 12 - N = 8 - A = rand(M,N)+im*rand(M,N) - x = rand(N)+im*rand(N) - b = A*x - w = WeightingOp(rand(M)) - d = diagm(w.weights) - - reg = 
L2Regularization(rand()) - - solver = Kaczmarz - S = createLinearSolver(solver, d*A, iterations=200, reg = reg) - S_weighted = createLinearSolver(solver, *(ProdOp, w, A), iterations=200, reg = reg) - x_approx = solve!(S, d*b) - x_weighted = solve!(S_weighted, d*b) - #@info "Testing solver $solver ...: $x == $x_approx" - @test isapprox(x_approx, x_weighted) -end - - -# Test Kaczmarz parameters -@testset "Kaczmarz parameters" begin - M = 12 - N = 8 - A = rand(M,N)+im*rand(M,N) - x = rand(N)+im*rand(N) - b = A*x - - solver = Kaczmarz - S = createLinearSolver(solver, A, iterations=200) - x_approx = solve!(S,b) - @test norm(x - x_approx) / norm(x) ≈ 0 atol=0.1 - - S = createLinearSolver(solver, A, iterations=200, shuffleRows=true) - x_approx = solve!(S,b) - @test norm(x - x_approx) / norm(x) ≈ 0 atol=0.1 - - S = createLinearSolver(solver, A, iterations=2000, randomized=true) - x_approx = solve!(S,b) - @test norm(x - x_approx) / norm(x) ≈ 0 atol=0.1 + end end - - diff --git a/test/testProxMaps.jl b/test/testProxMaps.jl index 788f1148..e98bbfac 100644 --- a/test/testProxMaps.jl +++ b/test/testProxMaps.jl @@ -1,5 +1,5 @@ # check Tikhonov proximal map -function testL2Prox(N=1024; numPeaks=5, λ=0.01) +function testL2Prox(N=256; numPeaks=5, λ=0.01, arrayType = Array) @info "test L2-regularization" Random.seed!(1234) x = zeros(N) @@ -9,14 +9,14 @@ function testL2Prox(N=1024; numPeaks=5, λ=0.01) # x_l2 = 1. / (1. + 2. *λ)*x x_l2 = copy(x) - prox!(L2Regularization, x_l2, λ) + x_l2 = Array(prox!(L2Regularization, arrayType(x_l2), λ)) @test norm(x_l2 - 1.0/(1.0+2.0*λ)*x) / norm(1.0/(1.0+2.0*λ)*x) ≈ 0 atol=0.001 # check decrease of objective function @test 0.5*norm(x-x_l2)^2 + norm(L2Regularization, x_l2, λ) <= norm(L2Regularization, x, λ) end # denoise a signal consisting of a number of delta peaks -function testL1Prox(N=1024; numPeaks=5, σ=0.03) +function testL1Prox(N=256; numPeaks=5, σ=0.03, arrayType = Array) @info "test L1-regularization" Random.seed!(1234) x = zeros(N) @@ -28,7 +28,7 @@ function testL1Prox(N=1024; numPeaks=5, σ=0.03) xNoisy = x .+ σ/sqrt(2.0)*(randn(N)+1im*randn(N)) x_l1 = copy(xNoisy) - prox!(L1Regularization, x_l1, 2*σ) + x_l1 = Array(prox!(L1Regularization, arrayType(x_l1), 2*σ)) # solution should be better than without denoising @info "rel. L1 error : $(norm(x - x_l1)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @@ -41,7 +41,7 @@ end # denoise a signal consisting of multiple slices with delta peaks at the same locations # only the last slices are noisy. # Thus, the first slices serve as a reference to enhance denoising -function testL21Prox(N=1024; numPeaks=5, numSlices=8, noisySlices=2, σ=0.05) +function testL21Prox(N=256; numPeaks=5, numSlices=8, noisySlices=2, σ=0.05, arrayType = Array) @info "test L21-regularization" Random.seed!(1234) x = zeros(ComplexF64,N,numSlices) @@ -59,7 +59,7 @@ function testL21Prox(N=1024; numPeaks=5, numSlices=8, noisySlices=2, σ=0.05) prox!(L1Regularization, x_l1, 2*σ) x_l21 = copy(xNoisy) - prox!(L21Regularization, x_l21, 2*σ,slices=numSlices) + x_l21 = Array(prox!(L21Regularization, arrayType(x_l21), 2*σ,slices=numSlices)) # solution should be better than without denoising and with l1-denoising @info "rel.
L21 error : $(norm(x - x_l21)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @@ -72,7 +72,7 @@ function testL21Prox(N=1024; numPeaks=5, numSlices=8, noisySlices=2, σ=0.05) end # denoise a piece-wise constant signal using TV regularization -function testTVprox(N=1024; numEdges=5, σ=0.05) +function testTVprox(N=256; numEdges=5, σ=0.05, arrayType = Array) @info "test TV-regularization" Random.seed!(1234) x = zeros(ComplexF64,N,N) @@ -91,7 +91,7 @@ function testTVprox(N=1024; numEdges=5, σ=0.05) prox!(L1Regularization, x_l1, 2*σ) x_tv = copy(xNoisy) - prox!(TVRegularization, x_tv, 2*σ, shape=(N,N), dims=1:2) + x_tv = Array(prox!(TVRegularization, arrayType(x_tv), 2*σ, shape=(N,N), dims=1:2)) @info "rel. TV error : $(norm(x - x_tv)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @test norm(x - x_tv) <= norm(x - xNoisy) @@ -103,7 +103,7 @@ function testTVprox(N=1024; numEdges=5, σ=0.05) end # denoise a signal that is piecewise constant along a given direction -function testDirectionalTVprox(N=256; numEdges=5, σ=0.05, T=ComplexF64) +function testDirectionalTVprox(N=256; numEdges=5, σ=0.05, T=ComplexF64, arrayType = Array) x = zeros(T,N,N) for i=1:numEdges idx = rand(0:N-1) @@ -115,7 +115,7 @@ function testDirectionalTVprox(N=256; numEdges=5, σ=0.05, T=ComplexF64) xNoisy .+= (σ/sqrt(2)) .* randn(T, N, N) x_tv = copy(xNoisy) - prox!(TVRegularization, vec(x_tv), 2*σ, shape=(N,N), dims=1) + x_tv = Array(reshape(prox!(TVRegularization, arrayType(vec(x_tv)), 2*σ, shape=(N,N), dims=1), N, N)) x_tv2 = copy(xNoisy) for i=1:N @@ -131,19 +131,19 @@ function testDirectionalTVprox(N=256; numEdges=5, σ=0.05, T=ComplexF64) ## cf. Condat and gradient based algorithm x_tv3 = copy(xNoisy) - prox!(TVRegularization, vec(x_tv3), 2*σ, shape=(N,N), dims=(1,)) + x_tv3 = Array(reshape(prox!(TVRegularization, vec(x_tv3), 2*σ, shape=(N,N), dims=(1,)), N, N)) @test norm(x_tv-x_tv3) / norm(x) ≈ 0 atol=1e-2 end # test enforcement of positivity constraint -function testPositive(N=1024) +function testPositive(N=256; arrayType = Array) @info "test positivity-constraint" Random.seed!(1234) x = randn(N) .+ 1im*randn(N) xPos = real.(x) xPos[findall(x->x<0,xPos)] .= 0 xProj = copy(x) - prox!(PositiveRegularization, xProj) + xProj = Array(prox!(PositiveRegularization, arrayType(xProj))) @test norm(xProj-xPos)/norm(xPos) ≈ 0 atol=1.e-4 # check decrease of objective function @@ -151,20 +151,20 @@ function testPositive(N=1024) end # test enforcement of "realness"-constraint -function testProj(N=1012) +function testProj(N=1012; arrayType = Array) @info "test realness-constraint" Random.seed!(1234) x = randn(N) .+ 1im*randn(N) xReal = real.(x) xProj = copy(x) - prox!(ProjectionRegularization, xProj, projFunc=x->real(x)) + xProj = Array(prox!(ProjectionRegularization, arrayType(xProj), projFunc=x->real(x))) @test norm(xProj-xReal)/norm(xReal) ≈ 0 atol=1.e-4 # check decrease of objective function @test 0.5*norm(x-xProj)^2+norm(ProjectionRegularization, xProj,projFunc=x->real(x)) <= norm(ProjectionRegularization, x,projFunc=x->real(x)) end # test denoising of a low-rank matrix -function testNuclear(N=32,rank=2;σ=0.05) +function testNuclear(N=32,rank=2;σ=0.05, arrayType = Array) @info "test nuclear norm regularization" Random.seed!(1234) x = zeros(ComplexF64,N,N); @@ -183,7 +183,7 @@ function testNuclear(N=32,rank=2;σ=0.05) xNoisy[:] += σ/sqrt(2.0)*(randn(N*N)+1im*randn(N*N)) x_lr = copy(xNoisy) - prox!(NuclearRegularization, x_lr,5*σ,svtShape=(32,32)) + x_lr = Array(prox!(NuclearRegularization, arrayType(x_lr),5*σ,svtShape=(32,32))) @test norm(x - 
x_lr) <= norm(x - xNoisy) @test norm(x - x_lr) / norm(x) ≈ 0 atol=0.05 @info "rel. LR error : $(norm(x - x_lr)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @@ -191,7 +191,7 @@ function testNuclear(N=32,rank=2;σ=0.05) @test 0.5*norm(xNoisy-x_lr)^2+norm(NuclearRegularization, x_lr,5*σ,svtShape=(N,N)) <= norm(NuclearRegularization, xNoisy,5*σ,svtShape=(N,N)) end -function testLLR(shape=(32,32,80),blockSize=(4,4);σ=0.05) +function testLLR(shape=(32,32,80),blockSize=(4,4);σ=0.05, arrayType = Array) @info "test LLR regularization" Random.seed!(1234) x = zeros(ComplexF64,shape); @@ -211,7 +211,7 @@ function testLLR(shape=(32,32,80),blockSize=(4,4);σ=0.05) xNoisy[:] += σ/sqrt(2.0)*(randn(prod(shape))+1im*randn(prod(shape))) x_llr = copy(xNoisy) - prox!(LLRRegularization, x_llr,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) + x_llr = Array(prox!(LLRRegularization, arrayType(x_llr),10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false)) @test norm(x - x_llr) <= norm(x - xNoisy) @test norm(x - x_llr) / norm(x) ≈ 0 atol=0.05 @info "rel. LLR error : $(norm(x - x_llr)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @@ -219,7 +219,7 @@ function testLLR(shape=(32,32,80),blockSize=(4,4);σ=0.05) @test 0.5*norm(xNoisy-x_llr)^2+norm(LLRRegularization, x_llr,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) <= norm(LLRRegularization, xNoisy,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) end -function testLLROverlapping(shape=(32,32,80),blockSize=(4,4);σ=0.05) +function testLLROverlapping(shape=(32,32,80),blockSize=(4,4);σ=0.05, arrayType = Array) @info "test Overlapping LLR regularization" Random.seed!(1234) x = zeros(ComplexF64,shape); @@ -239,15 +239,15 @@ function testLLROverlapping(shape=(32,32,80),blockSize=(4,4);σ=0.05) xNoisy[:] += σ/sqrt(2.0)*(randn(prod(shape))+1im*randn(prod(shape))) x_llr = copy(xNoisy) - proxLLROverlapping!(x_llr,10*σ,shape=shape[1:2],blockSize=blockSize) + prox!(LLRRegularization, x_llr,10*σ,shape=shape[1:2],blockSize=blockSize, fullyOverlapping = true) @test norm(x - x_llr) <= norm(x - xNoisy) @test norm(x - x_llr) / norm(x) ≈ 0 atol=0.05 @info "rel. LLR error : $(norm(x - x_llr)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" # check decrease of objective function - @test 0.5*norm(xNoisy-x_llr)^2+normLLR(x_llr,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) <= normLLR(xNoisy,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) + #@test 0.5*norm(xNoisy-x_llr)^2+normLLR(x_llr,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) <= normLLR(xNoisy,10*σ,shape=shape[1:2],blockSize=blockSize,randshift=false) end -function testLLR_3D(shape=(32,32,32,80),blockSize=(4,4,4);σ=0.05) +function testLLR_3D(shape=(32,32,32,80),blockSize=(4,4,4);σ=0.05, arrayType = Array) @info "test LLR 3D regularization" Random.seed!(1234) x = zeros(ComplexF64,shape) @@ -269,7 +269,7 @@ function testLLR_3D(shape=(32,32,32,80),blockSize=(4,4,4);σ=0.05) xNoisy[:] += σ/sqrt(2.0)*(randn(prod(shape))+1im*randn(prod(shape))) x_llr = copy(xNoisy) - prox!(LLRRegularization, x_llr,10*σ,shape=shape[1:end-1],blockSize=blockSize,randshift=false) + x_llr = Array(prox!(LLRRegularization, arrayType(x_llr),10*σ,shape=shape[1:end-1],blockSize=blockSize,randshift=false)) @test norm(x - x_llr) <= norm(x - xNoisy) @test norm(x - x_llr) / norm(x) ≈ 0 atol=0.05 @info "rel. 
LLR 3D error : $(norm(x - x_llr)/ norm(x)) vs $(norm(x - xNoisy)/ norm(x))" @@ -285,27 +285,33 @@ function testConversion() true catch e false - end skip = in(prox, [LLRRegularization, NuclearRegularization]) + end skip = in(prox, [LLRRegularization]) @test try norm(prox, zeros(xType, 10), lambdaType(0.0); shape=(2, 5), svtShape=(2, 5)) true catch e false - end skip = in(prox, [LLRRegularization, NuclearRegularization]) + end skip = in(prox, [LLRRegularization]) end end end @testset "Proximal Maps" begin - @testset "L2 Prox" testL2Prox() - @testset "L1 Prox" testL1Prox() - @testset "L21 Prox" testL21Prox() - @testset "TV Prox" testTVprox() - @testset "TV Prox Directional" testDirectionalTVprox() - @testset "Positive Prox" testPositive() - @testset "Projection Prox" testProj() - @testset "Nuclear Prox" testNuclear() - #@testset "LLR Prox" testLLR() - #@testset "LLR Prox Overlapping" #testLLROverlapping() - #@testset "LLR Prox 3D" testLLR_3D() + for arrayType in arrayTypes + @testset "$arrayType" begin + @testset "L2 Prox" testL2Prox(;arrayType) + @testset "L1 Prox" testL1Prox(;arrayType) + @testset "L21 Prox" testL21Prox(;arrayType) + @testset "TV Prox" testTVprox(;arrayType) + @testset "TV Prox Directional" testDirectionalTVprox(;arrayType) + @testset "Positive Prox" testPositive(;arrayType) + @testset "Projection Prox" testProj(;arrayType) + if !areTypesDefined # Don't run these tests on GPUs/buildkite, since svd can fail + @testset "Nuclear Prox" testNuclear(;arrayType) + @testset "LLR Prox: $arrayType" testLLR(;arrayType) + @testset "LLR Prox Overlapping: $arrayType" testLLROverlapping(;arrayType) + @testset "LLR Prox 3D: $arrayType" testLLR_3D(;arrayType) + end + end + end @testset "Prox Lambda Conversion" testConversion() end diff --git a/test/testRegularization.jl b/test/testRegularization.jl index 12eecd1e..28525fb6 100644 --- a/test/testRegularization.jl +++ b/test/testRegularization.jl @@ -3,17 +3,17 @@ model(x) = x # reduced constructor, checking defaults pnp_reg = PnPRegularization(model, [2]) - @assert pnp_reg.λ == 1.0 - @assert pnp_reg.model == model - @assert pnp_reg.shape == [2] - @assert pnp_reg.input_transform == RegularizedLeastSquares.MinMaxTransform - @assert pnp_reg.ignoreIm == false + @test pnp_reg.λ == 1.0 + @test pnp_reg.model == model + @test pnp_reg.shape == [2] + @test pnp_reg.input_transform == RegularizedLeastSquares.MinMaxTransform + @test pnp_reg.ignoreIm == false # full constructor pnp_reg = PnPRegularization(0.1; model=model, shape=[2], input_transform=x -> x, ignoreIm=true) # full constructor defaults pnp_reg = PnPRegularization(0.1; model=model, shape=[2]) - @assert pnp_reg.input_transform == RegularizedLeastSquares.MinMaxTransform - @assert pnp_reg.ignoreIm == false + @test pnp_reg.input_transform == RegularizedLeastSquares.MinMaxTransform + @test pnp_reg.ignoreIm == false # unnecessary kwargs are ignored pnp_reg = PnPRegularization(0.1; model=model, shape=[2], input_transform=x -> x, ignoreIm=true, sMtHeLsE=1) end @@ -27,9 +27,14 @@ end b = A * x for solver in supported_solvers - S = createLinearSolver(solver, A, iterations=2; reg=[pnp_reg]) - x_approx = solve!(S, b) - @info "PnP Regularization and $solver Compatibility" + @test try + S = createLinearSolver(solver, A, iterations=2; reg=[pnp_reg]) + x_approx = solve!(S, b) + @info "PnP Regularization and $solver Compatibility" + true + catch ex + false + end end end @@ -38,7 +43,7 @@ end pnp_reg = PnPRegularization(0.1; model=x -> zeros(eltype(x), size(x)), shape=[2], 
input_transform=RegularizedLeastSquares.IdentityTransform) out = prox!(pnp_reg, [1.0, 2.0], 0.1) @info out - @assert out == [0.9, 1.8] + @test out == [0.9, 1.8] end @@ -49,8 +54,8 @@ end input_transform=RegularizedLeastSquares.IdentityTransform ) out = prox!(pnp_reg, [1.0 + 1.0im, 2.0 + 2.0im], 0.1) - @assert real(out) == [0.9, 1.8] - @assert imag(out) == [0.9, 1.8] + @test real(out) == [0.9, 1.8] + @test imag(out) == [0.9, 1.8] # ignoreIm = true pnp_reg = PnPRegularization( 0.1; model=x -> zeros(eltype(x), size(x)), shape=[2], @@ -58,15 +63,15 @@ end ignoreIm=true ) out = prox!(pnp_reg, [1.0 + 1.0im, 2.0 + 2.0im], 0.1) - @assert real(out) == [0.9, 1.8] - @assert imag(out) == [1.0, 2.0] + @test real(out) == [0.9, 1.8] + @test imag(out) == [1.0, 2.0] end @testset "PnP Prox λ clipping" begin pnp_reg = PnPRegularization(0.1; model=x -> zeros(eltype(x), size(x)), shape=[2], input_transform=RegularizedLeastSquares.IdentityTransform) out = @test_warn "$(typeof(pnp_reg)) was given λ with value 1.5. Valid range is [0, 1]. λ changed to temp" prox!(pnp_reg, [1.0, 2.0], 1.5) - @assert out == [0.0, 0.0] + @test out == [0.0, 0.0] out = @test_warn "$(typeof(pnp_reg)) was given λ with value -1.5. Valid range is [0, 1]. λ changed to temp" prox!(pnp_reg, [1.0, 2.0], -1.5) - @assert out == [1.0, 2.0] + @test out == [1.0, 2.0] end \ No newline at end of file diff --git a/test/testSolvers.jl b/test/testSolvers.jl index 553ec496..09a9bb84 100644 --- a/test/testSolvers.jl +++ b/test/testSolvers.jl @@ -1,52 +1,70 @@ Random.seed!(12345) -@testset "Real Linear Solver" begin - A = rand(3, 2) - x = rand(2) +function testRealLinearSolver(; arrayType = Array, elType = Float32) + A = rand(elType, 3, 2) + x = rand(elType, 2) b = A * x solvers = linearSolverListReal() - for solver in solvers - S = createLinearSolver(solver, A, iterations = 200) - x_approx = solve!(S, b) - @info "Testing solver $solver: $x ≈ $x_approx" - @test x_approx ≈ x rtol = 0.1 + @testset for solver in solvers + @test try + S = createLinearSolver(solver, arrayType(A), iterations = 200) + x_approx = Array(solve!(S, arrayType(b))) + @info "Testing solver $solver: $x ≈ $x_approx" + @test x_approx ≈ x rtol = 0.1 + true + catch e + @error e + false + end skip = arrayType != Array && solver <: AbstractDirectSolver # end end -@testset "Complex Linear Solver" begin - A = rand(3, 2) + im * rand(3, 2) - x = rand(2) + im * rand(2) +function testComplexLinearSolver(; arrayType = Array, elType = Float32) + A = rand(elType, 3, 2) + im * rand(elType, 3, 2) + x = rand(elType, 2) + im * rand(elType, 2) b = A * x solvers = linearSolverList() - for solver in solvers - S = createLinearSolver(solver, A, iterations = 100) - x_approx = solve!(S, b) - @info "Testing solver $solver: $x ≈ $x_approx" - @test x_approx ≈ x rtol = 0.1 + @testset for solver in solvers + @test try + S = createLinearSolver(solver, arrayType(A), iterations = 100) + x_approx = Array(solve!(S, arrayType(b))) + @info "Testing solver $solver: $x ≈ $x_approx" + @test x_approx ≈ x rtol = 0.1 + true + catch e + @error e + false + end skip = arrayType != Array && solver <: AbstractDirectSolver end end -@testset "Complex Linear Solver w/ AHA Interface" begin - A = rand(3, 2) + im * rand(3, 2) - x = rand(2) + im * rand(2) +function testComplexLinearAHASolver(; arrayType = Array, elType = Float32) + A = rand(elType, 3, 2) + im * rand(elType, 3, 2) + x = rand(elType, 2) + im * rand(elType, 2) AHA = A'*A b = AHA * x - solvers = filter(s -> s ∉ [DirectSolver, PseudoInverse, DaxKaczmarz, DaxConstrained, Kaczmarz, 
PrimalDualSolver], linearSolverListReal()) - - for solver in solvers - S = createLinearSolver(solver, nothing; AHA=AHA, iterations = 100) - x_approx = solve!(S, b) - @info "Testing solver $solver: $x ≈ $x_approx" - @test x_approx ≈ x rtol = 0.1 + solvers = filter(s -> s ∉ [DirectSolver, PseudoInverse, Kaczmarz], linearSolverListReal()) + + @testset for solver in solvers + @test try + S = createLinearSolver(solver, nothing; AHA=arrayType(AHA), iterations = 100) + x_approx = Array(solve!(S, arrayType(b))) + @info "Testing solver $solver: $x ≈ $x_approx" + @test x_approx ≈ x rtol = 0.1 + true + catch e + @error e + false + end end end -@testset "General Convex Solver" begin +function testConvexLinearSolver(; arrayType = Array, elType = Float32) # fully sampled operator, image and data N = 256 numPeaks = 5 @@ -59,11 +77,11 @@ end # random undersampling idx = sort(unique(rand(1:N, div(N, 2)))) - b = b[idx] - F = F[idx, :] + b = arrayType(b[idx]) + F = arrayType(F[idx, :]) for solver in [POGM, OptISTA, FISTA, ADMM] - reg = L1Regularization(1e-3) + reg = L1Regularization(elType(1e-3)) S = createLinearSolver( solver, F; @@ -71,7 +89,7 @@ end iterations = 200, normalizeReg = NoNormalization(), ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver w/o restart: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 @@ -85,13 +103,13 @@ end normalizeReg = NoNormalization(), restart = :gradient, ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver w/ gradient restart: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 end # test invariance to the maximum eigenvalue - reg = L1Regularization(reg.λ * length(b) / norm(b, 1)) + reg = L1Regularization(elType(reg.λ * length(b) / norm(b, 1))) scale_F = 1e3 S = createLinearSolver( solver, @@ -100,7 +118,7 @@ end iterations = 200, normalizeReg = MeasurementBasedNormalization(), ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) x_approx .*= scale_F @info "Testing solver $solver w/o restart and after re-scaling: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 @@ -108,7 +126,7 @@ end # test ADMM with option vary_rho solver = ADMM - reg = L1Regularization(1.e-3) + reg = L1Regularization(elType(1.e-3)) S = createLinearSolver( solver, F; @@ -119,7 +137,7 @@ end vary_rho = :balance, verbose = false, ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 @@ -133,7 +151,7 @@ end vary_rho = :balance, verbose = false, ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 @@ -148,13 +166,13 @@ end vary_rho = :PnP, verbose = false, ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 ## solver = SplitBregman - reg = L1Regularization(2e-3) + reg = L1Regularization(elType(2e-3)) S = createLinearSolver( solver, F; @@ -164,11 +182,11 @@ end rho = 1.0, normalizeReg = NoNormalization(), ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 - reg = L1Regularization(reg.λ * length(b) / norm(b, 1)) + reg = L1Regularization(elType(reg.λ * length(b) / 
norm(b, 1))) S = createLinearSolver( solver, F; @@ -178,11 +196,11 @@ end rho = 1.0, normalizeReg = MeasurementBasedNormalization(), ) - x_approx = solve!(S, b) + x_approx = Array(solve!(S, b)) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 - ## + #= solver = PrimalDualSolver reg = [L1Regularization(1.e-4), TVRegularization(1.e-4, shape = (0,0))] FR = [real.(F ./ norm(F)); imag.(F ./ norm(F))] @@ -196,4 +214,30 @@ end x_approx = solve!(S, bR) @info "Testing solver $solver: relative error = $(norm(x - x_approx) / norm(x))" @test x ≈ x_approx rtol = 0.1 + =# end + + +@testset "Test Solvers" begin + for arrayType in arrayTypes + @testset "$arrayType" begin + for elType in [Float32, Float64] + @testset "Real Linear Solver: $elType" begin + testRealLinearSolver(; arrayType, elType) + end + + @testset "Complex Linear Solver: $elType" begin + testComplexLinearSolver(; arrayType, elType) + end + + @testset "Complex Linear Solver w/ AHA Interface: $elType" begin + testComplexLinearAHASolver(; arrayType, elType) + end + + @testset "General Convex Solver: $elType" begin + testConvexLinearSolver(; arrayType, elType) + end + end + end + end +end \ No newline at end of file
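Taken together, the state refactor in this patch makes each solver iterable over its own state: `iterate(solver, state)` advances one step and yields the current solution, which is also how the callbacks above observe intermediate iterates. A closing sketch of a manual iteration loop (CGNR is an illustrative choice, assumed to follow the same `(state.x, state)` convention shown for POGM and SplitBregman):

    using RegularizedLeastSquares, LinearAlgebra
    A = rand(32, 16); b = A * rand(16)
    solver = createLinearSolver(CGNR, A; iterations = 20)
    init!(solver, b)
    for (it, x_current) in enumerate(solver)  # stops once done(solver, state) is true
        @info "iteration $it" norm(x_current)
    end
    x_approx = solversolution(solver)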