diff --git a/Project.toml b/Project.toml
index 7e30fd805..9e17a4488 100644
--- a/Project.toml
+++ b/Project.toml
@@ -1,13 +1,16 @@
 name = "TensorKit"
 uuid = "07d1fe3e-3e46-537d-9eac-e9e13d0d4cec"
 authors = ["Jutho Haegeman"]
-version = "0.14.11"
+version = "0.15.0"
 
 [deps]
 LRUCache = "8ac3fa9e-de4c-5943-b1dc-09c6b5f20637"
 LinearAlgebra = "37e2e46d-f89d-539d-b4ee-838fcccc9c8e"
+MatrixAlgebraKit = "6c742aac-3347-4629-af66-fc926824e5e4"
+OhMyThreads = "67456a42-1dca-4109-a031-0a68de7e3ad5"
 PackageExtensionCompat = "65ce6f38-6b18-4e1d-a461-8949797d7930"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
+ScopedValues = "7e506255-f358-4e82-b7e4-beb19740aa63"
 Strided = "5e0ebb24-38b0-5f93-81fe-25c709ecae67"
 TensorKitSectors = "13a9c161-d5da-41f0-bcbd-e1a08ae0647f"
 TensorOperations = "6aa20fa7-93e2-5fca-9bc0-fbd0db3c71a2"
@@ -30,8 +33,11 @@ Combinatorics = "1"
 FiniteDifferences = "0.12"
 LRUCache = "1.0.2"
 LinearAlgebra = "1"
+MatrixAlgebraKit = "0.5.0"
+OhMyThreads = "0.8.0"
 PackageExtensionCompat = "1"
 Random = "1"
+ScopedValues = "1.3.0"
 Strided = "2"
 TensorKitSectors = "0.1.4, 0.2"
 TensorOperations = "5.1"
diff --git a/docs/Project.toml b/docs/Project.toml
index bb471e442..fc67550fd 100644
--- a/docs/Project.toml
+++ b/docs/Project.toml
@@ -1,10 +1,9 @@
 [deps]
 Documenter = "e30172f5-a6a5-5a46-863b-614d45cd2de4"
+DocumenterInterLinks = "d12716ef-a0f6-4df4-a9f1-a5a34e75c656"
 Random = "9a3f8284-a2c9-5f02-9a11-845980a1fd5c"
 TensorKit = "07d1fe3e-3e46-537d-9eac-e9e13d0d4cec"
-TensorKitSectors = "13a9c161-d5da-41f0-bcbd-e1a08ae0647f"
 
 [compat]
 Documenter = "1"
 Random = "1"
-TensorKitSectors = "0.1"
diff --git a/docs/make.jl b/docs/make.jl
index 2dab6cbdd..1ad55321d 100644
--- a/docs/make.jl
+++ b/docs/make.jl
@@ -1,6 +1,12 @@
 using Documenter
 using Random
-using TensorKit, TensorKitSectors
+using TensorKit
+using TensorKit.TensorKitSectors
+using TensorKit.MatrixAlgebraKit
+using DocumenterInterLinks
+
+links = InterLinks("MatrixAlgebraKit" => "https://quantumkithub.github.io/MatrixAlgebraKit.jl/stable/",
+                   "TensorOperations" => "https://quantumkithub.github.io/TensorOperations.jl/stable/")
 
 pages = ["Home" => "index.md",
          "Manual" => ["man/intro.md", "man/tutorial.md", "man/categories.md",
@@ -15,6 +21,7 @@ makedocs(; modules=[TensorKit, TensorKitSectors],
          format=Documenter.HTML(; prettyurls=true, mathengine=MathJax(),
                                 assets=["assets/custom.css"]),
          pages=pages,
-         pagesonly=true)
+         pagesonly=true,
+         plugins=[links])
 
 deploydocs(; repo="github.com/QuantumKitHub/TensorKit.jl.git", push_preview=true)
diff --git a/docs/src/lib/spaces.md b/docs/src/lib/spaces.md
index 83350156d..205301d83 100644
--- a/docs/src/lib/spaces.md
+++ b/docs/src/lib/spaces.md
@@ -90,6 +90,7 @@ dual
 conj
 flip
 ⊕
+⊖
 zero(::ElementarySpace)
 oneunit
 supremum
diff --git a/docs/src/lib/tensors.md b/docs/src/lib/tensors.md
index 51b9bcf13..4d1c5c9cc 100644
--- a/docs/src/lib/tensors.md
+++ b/docs/src/lib/tensors.md
@@ -214,26 +214,21 @@ contract!
 
 ## `TensorMap` factorizations
 
-The factorisation methods come in two flavors, namely a non-destructive version where you
-can specify an additional permutation of the domain and codomain indices before the
-factorisation is performed (provided that `sectorstyle(t)` has a symmetric braiding) as
-well as a destructive version The non-destructive methods are given first:
+The factorisation methods are powered by [MatrixAlgebraKit.jl](https://github.com/QuantumKitHub/MatrixAlgebraKit.jl)
+and all follow the same strategy. The idea is that the `TensorMap` is interpreted as a linear
+map based on the current partition of indices between `domain` and `codomain`, and then the
+entire range of MatrixAlgebraKit functions can be called.
+Factorizing a tensor according to a different partition of the indices is possible
+by prepending the factorization step with an explicit call to [`permute`](@ref) or [`transpose`](@ref).
 
-```@docs
-leftorth
-rightorth
-leftnull
-rightnull
-tsvd
-eigh
-eig
-eigen
-isposdef
-```
+For the full list of factorizations, see [Decompositions](@extref MatrixAlgebraKit).
 
-The corresponding destructive methods have an exclamation mark at the end of their name,
-and only accept the `TensorMap` object as well as the method-specific algorithm and keyword
-arguments.
+Additionally, it is possible to obtain truncated versions of some of these factorizations
+through the [`MatrixAlgebraKit.TruncationStrategy`](@ref) objects.
 
+The exact truncation strategy can be controlled through the strategies defined in [Truncations](@extref MatrixAlgebraKit),
+but for `TensorMap`s there is also the special-purpose scheme:
 
-TODO: document svd truncation types
+```@docs
+truncspace
+```
diff --git a/ext/TensorKitChainRulesCoreExt/TensorKitChainRulesCoreExt.jl b/ext/TensorKitChainRulesCoreExt/TensorKitChainRulesCoreExt.jl
index 16c7583d1..e89f79b55 100644
--- a/ext/TensorKitChainRulesCoreExt/TensorKitChainRulesCoreExt.jl
+++ b/ext/TensorKitChainRulesCoreExt/TensorKitChainRulesCoreExt.jl
@@ -3,6 +3,7 @@ module TensorKitChainRulesCoreExt
 using TensorOperations
 using VectorInterface
 using TensorKit
+using TensorKit: foreachblock
 using ChainRulesCore
 using LinearAlgebra
 using TupleTools
@@ -15,6 +16,5 @@ include("utility.jl")
 include("constructors.jl")
 include("linalg.jl")
 include("tensoroperations.jl")
-include("factorizations.jl")
 
 end
diff --git a/ext/TensorKitChainRulesCoreExt/factorizations.jl b/ext/TensorKitChainRulesCoreExt/factorizations.jl
index abfb724bc..a104f408a 100644
--- a/ext/TensorKitChainRulesCoreExt/factorizations.jl
+++ b/ext/TensorKitChainRulesCoreExt/factorizations.jl
@@ -1,481 +1,2 @@
 # Factorizations rules
 # --------------------
-function ChainRulesCore.rrule(::typeof(TensorKit.tsvd!), t::AbstractTensorMap;
-                              trunc::TensorKit.TruncationScheme=TensorKit.NoTruncation(),
-                              p::Real=2,
-                              alg::Union{TensorKit.SVD,TensorKit.SDD}=TensorKit.SDD())
-    U, Σ, V⁺, truncerr = tsvd(t; trunc=TensorKit.NoTruncation(), p=p, alg=alg)
-
-    if !(trunc isa TensorKit.NoTruncation) && !isempty(blocksectors(t))
-        Σdata = TensorKit.SectorDict(c => diag(b) for (c, b) in blocks(Σ))
-
-        truncdim = TensorKit._compute_truncdim(Σdata, trunc, p)
-        truncerr = TensorKit._compute_truncerr(Σdata, truncdim, p)
-
-        SVDdata = TensorKit.SectorDict(c => (block(U, c), Σc, block(V⁺, c))
-                                       for (c, Σc) in Σdata)
-
-        Ũ, Σ̃, Ṽ⁺ = TensorKit._create_svdtensors(t, SVDdata, truncdim)
-    else
-        Ũ, Σ̃, Ṽ⁺ = U, Σ, V⁺
-    end
-
-    function tsvd!_pullback(ΔUSVϵ)
-        ΔU, ΔΣ, ΔV⁺, = unthunk.(ΔUSVϵ)
-        Δt = similar(t)
-        for (c, b) in blocks(Δt)
-            Uc, Σc, V⁺c = block(U, c), block(Σ, c), block(V⁺, c)
-            ΔUc, ΔΣc, ΔV⁺c = block(ΔU, c), block(ΔΣ, c), block(ΔV⁺, c)
-            Σdc = view(Σc, diagind(Σc))
-            ΔΣdc = (ΔΣc isa AbstractZero) ? ΔΣc : view(ΔΣc, diagind(ΔΣc))
-            svd_pullback!(b, Uc, Σdc, V⁺c, ΔUc, ΔΣdc, ΔV⁺c)
-        end
-        return NoTangent(), Δt
-    end
-    function tsvd!_pullback(::Tuple{ZeroTangent,ZeroTangent,ZeroTangent})
-        return NoTangent(), ZeroTangent()
-    end
-
-    return (Ũ, Σ̃, Ṽ⁺, truncerr), tsvd!_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(LinearAlgebra.svdvals!), t::AbstractTensorMap)
-    U, S, V⁺ = tsvd(t)
-    s = diag(S)
-    project_t = ProjectTo(t)
-
-    function svdvals_pullback(Δs′)
-        Δs = unthunk(Δs′)
-        ΔS = diagm(codomain(S), domain(S), Δs)
-        return NoTangent(), project_t(U * ΔS * V⁺)
-    end
-
-    return s, svdvals_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(TensorKit.eig!), t::AbstractTensorMap; kwargs...)
-    D, V = eig(t; kwargs...)
-
-    function eig!_pullback((_ΔD, _ΔV))
-        ΔD, ΔV = unthunk(_ΔD), unthunk(_ΔV)
-        Δt = similar(t)
-        for (c, b) in blocks(Δt)
-            Dc, Vc = block(D, c), block(V, c)
-            ΔDc, ΔVc = block(ΔD, c), block(ΔV, c)
-            Ddc = view(Dc, diagind(Dc))
-            ΔDdc = (ΔDc isa AbstractZero) ? ΔDc : view(ΔDc, diagind(ΔDc))
-            eig_pullback!(b, Ddc, Vc, ΔDdc, ΔVc)
-        end
-        return NoTangent(), Δt
-    end
-    function eig!_pullback(::Tuple{ZeroTangent,ZeroTangent})
-        return NoTangent(), ZeroTangent()
-    end
-
-    return (D, V), eig!_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(TensorKit.eigh!), t::AbstractTensorMap; kwargs...)
-    D, V = eigh(t; kwargs...)
-
-    function eigh!_pullback((_ΔD, _ΔV))
-        ΔD, ΔV = unthunk(_ΔD), unthunk(_ΔV)
-        Δt = similar(t)
-        for (c, b) in blocks(Δt)
-            Dc, Vc = block(D, c), block(V, c)
-            ΔDc, ΔVc = block(ΔD, c), block(ΔV, c)
-            Ddc = view(Dc, diagind(Dc))
-            ΔDdc = (ΔDc isa AbstractZero) ? ΔDc : view(ΔDc, diagind(ΔDc))
-            eigh_pullback!(b, Ddc, Vc, ΔDdc, ΔVc)
-        end
-        return NoTangent(), Δt
-    end
-    function eigh!_pullback(::Tuple{ZeroTangent,ZeroTangent})
-        return NoTangent(), ZeroTangent()
-    end
-
-    return (D, V), eigh!_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(LinearAlgebra.eigvals!), t::AbstractTensorMap;
-                              sortby=nothing, kwargs...)
-    @assert sortby === nothing "only `sortby=nothing` is supported"
-    (D, _), eig_pullback = rrule(TensorKit.eig!, t; kwargs...)
-    d = diag(D)
-    project_t = ProjectTo(t)
-    function eigvals_pullback(Δd′)
-        Δd = unthunk(Δd′)
-        ΔD = diagm(codomain(D), domain(D), Δd)
-        return NoTangent(), project_t(eig_pullback((ΔD, ZeroTangent()))[2])
-    end
-
-    return d, eigvals_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(leftorth!), t::AbstractTensorMap; alg=QRpos())
-    alg isa TensorKit.QR || alg isa TensorKit.QRpos ||
-        error("only `alg=QR()` and `alg=QRpos()` are supported")
-    Q, R = leftorth(t; alg)
-    function leftorth!_pullback((_ΔQ, _ΔR))
-        ΔQ, ΔR = unthunk(_ΔQ), unthunk(_ΔR)
-        Δt = similar(t)
-        for (c, b) in blocks(Δt)
-            qr_pullback!(b, block(Q, c), block(R, c), block(ΔQ, c), block(ΔR, c))
-        end
-        return NoTangent(), Δt
-    end
-    leftorth!_pullback(::Tuple{ZeroTangent,ZeroTangent}) = NoTangent(), ZeroTangent()
-    return (Q, R), leftorth!_pullback
-end
-
-function ChainRulesCore.rrule(::typeof(rightorth!), t::AbstractTensorMap; alg=LQpos())
-    alg isa TensorKit.LQ || alg isa TensorKit.LQpos ||
-        error("only `alg=LQ()` and `alg=LQpos()` are supported")
-    L, Q = rightorth(t; alg)
-    function rightorth!_pullback((_ΔL, _ΔQ))
-        ΔL, ΔQ = unthunk(_ΔL), unthunk(_ΔQ)
-        Δt = similar(t)
-        for (c, b) in blocks(Δt)
-            lq_pullback!(b, block(L, c), block(Q, c), block(ΔL, c), block(ΔQ, c))
-        end
-        return NoTangent(), Δt
-    end
-    rightorth!_pullback(::Tuple{ZeroTangent,ZeroTangent}) = NoTangent(), ZeroTangent()
-    return (L, Q), rightorth!_pullback
-end
-
-# Corresponding matrix factorisations: implemented as mutating methods
-# ---------------------------------------------------------------------
-# helper routines
-safe_inv(a, tol) = abs(a) < tol ? zero(a) : inv(a)
-
-function lowertriangularind(A::AbstractMatrix)
-    m, n = size(A)
-    I = Vector{Int}(undef, div(m * (m - 1), 2) + m * (n - m))
-    offset = 0
-    for j in 1:n
-        r = (j + 1):m
-        I[offset .- j .+ r] = (j - 1) * m .+ r
-        offset += length(r)
-    end
-    return I
-end
-
-function uppertriangularind(A::AbstractMatrix)
-    m, n = size(A)
-    I = Vector{Int}(undef, div(m * (m - 1), 2) + m * (n - m))
-    offset = 0
-    for i in 1:m
-        r = (i + 1):n
-        I[offset .- i .+ r] = i .+ m .* (r .- 1)
-        offset += length(r)
-    end
-    return I
-end
-
-# SVD_pullback: pullback implementation for general (possibly truncated) SVD
-#
-# Arguments are U, S and Vd of full (non-truncated, but still thin) SVD, as well as
-# cotangent ΔU, ΔS, ΔVd variables of truncated SVD
-# 
-# Checks whether the cotangent variables are such that they would couple to gauge-dependent
-# degrees of freedom (phases of singular vectors), and prints a warning if this is the case
-#
-# An implementation that only uses U, S, and Vd from truncated SVD is also possible, but
-# requires solving a Sylvester equation, which does not seem to be supported on GPUs.
-#
-# Other implementation considerations for GPU compatibility:
-# no scalar indexing, lots of broadcasting and views
-#
-function svd_pullback!(ΔA::AbstractMatrix, U::AbstractMatrix, S::AbstractVector,
-                       Vd::AbstractMatrix, ΔU, ΔS, ΔVd;
-                       tol::Real=default_pullback_gaugetol(S))
-
-    # Basic size checks and determination
-    m, n = size(U, 1), size(Vd, 2)
-    size(U, 2) == size(Vd, 1) == length(S) == min(m, n) || throw(DimensionMismatch())
-    p = -1
-    if !(ΔU isa AbstractZero)
-        m == size(ΔU, 1) || throw(DimensionMismatch())
-        p = size(ΔU, 2)
-    end
-    if !(ΔVd isa AbstractZero)
-        n == size(ΔVd, 2) || throw(DimensionMismatch())
-        if p == -1
-            p = size(ΔVd, 1)
-        else
-            p == size(ΔVd, 1) || throw(DimensionMismatch())
-        end
-    end
-    if !(ΔS isa AbstractZero)
-        if p == -1
-            p = length(ΔS)
-        else
-            p == length(ΔS) || throw(DimensionMismatch())
-        end
-    end
-    Up = view(U, :, 1:p)
-    Vp = view(Vd, 1:p, :)'
-    Sp = view(S, 1:p)
-
-    # rank
-    r = searchsortedlast(S, tol; rev=true)
-
-    # compute antihermitian part of projection of ΔU and ΔV onto U and V
-    # also already subtract this projection from ΔU and ΔV
-    if !(ΔU isa AbstractZero)
-        UΔU = Up' * ΔU
-        aUΔU = rmul!(UΔU - UΔU', 1 / 2)
-        if m > p
-            ΔU -= Up * UΔU
-        end
-    else
-        aUΔU = fill!(similar(U, (p, p)), 0)
-    end
-    if !(ΔVd isa AbstractZero)
-        VΔV = Vp' * ΔVd'
-        aVΔV = rmul!(VΔV - VΔV', 1 / 2)
-        if n > p
-            ΔVd -= VΔV' * Vp'
-        end
-    else
-        aVΔV = fill!(similar(Vd, (p, p)), 0)
-    end
-
-    # check whether cotangents arise from gauge-invariance objective function
-    mask = abs.(Sp' .- Sp) .< tol
-    Δgauge = norm(view(aUΔU, mask) + view(aVΔV, mask), Inf)
-    if p > r
-        rprange = (r + 1):p
-        Δgauge = max(Δgauge, norm(view(aUΔU, rprange, rprange), Inf))
-        Δgauge = max(Δgauge, norm(view(aVΔV, rprange, rprange), Inf))
-    end
-    Δgauge < tol ||
-        @warn "`svd` cotangents sensitive to gauge choice: (|Δgauge| = $Δgauge)"
-
-    UdΔAV = (aUΔU .+ aVΔV) .* safe_inv.(Sp' .- Sp, tol) .+
-            (aUΔU .- aVΔV) .* safe_inv.(Sp' .+ Sp, tol)
-    if !(ΔS isa ZeroTangent)
-        UdΔAV[diagind(UdΔAV)] .+= real.(ΔS)
-        # in principle, ΔS is real, but maybe not if coming from an anyonic tensor
-    end
-    mul!(ΔA, Up, UdΔAV * Vp')
-
-    if r > p # contribution from truncation
-        Ur = view(U, :, (p + 1):r)
-        Vr = view(Vd, (p + 1):r, :)'
-        Sr = view(S, (p + 1):r)
-
-        if !(ΔU isa AbstractZero)
-            UrΔU = Ur' * ΔU
-            if m > r
-                ΔU -= Ur * UrΔU # subtract this part from ΔU
-            end
-        else
-            UrΔU = fill!(similar(U, (r - p, p)), 0)
-        end
-        if !(ΔVd isa AbstractZero)
-            VrΔV = Vr' * ΔVd'
-            if n > r
-                ΔVd -= VrΔV' * Vr' # subtract this part from ΔV
-            end
-        else
-            VrΔV = fill!(similar(Vd, (r - p, p)), 0)
-        end
-
-        X = (1 // 2) .* ((UrΔU .+ VrΔV) .* safe_inv.(Sp' .- Sr, tol) .+
-                         (UrΔU .- VrΔV) .* safe_inv.(Sp' .+ Sr, tol))
-        Y = (1 // 2) .* ((UrΔU .+ VrΔV) .* safe_inv.(Sp' .- Sr, tol) .-
-                         (UrΔU .- VrΔV) .* safe_inv.(Sp' .+ Sr, tol))
-
-        # ΔA += Ur * X * Vp' + Up * Y' * Vr'
-        mul!(ΔA, Ur, X * Vp', 1, 1)
-        mul!(ΔA, Up * Y', Vr', 1, 1)
-    end
-
-    if m > max(r, p) && !(ΔU isa AbstractZero) # remaining ΔU is already orthogonal to U[:,1:max(p,r)]
-        # ΔA += (ΔU .* safe_inv.(Sp', tol)) * Vp'
-        mul!(ΔA, ΔU .* safe_inv.(Sp', tol), Vp', 1, 1)
-    end
-    if n > max(r, p) && !(ΔVd isa AbstractZero) # remaining ΔV is already orthogonal to V[:,1:max(p,r)]
-        # ΔA += U * (safe_inv.(Sp, tol) .* ΔVd)
-        mul!(ΔA, Up, safe_inv.(Sp, tol) .* ΔVd, 1, 1)
-    end
-    return ΔA
-end
-
-function eig_pullback!(ΔA::AbstractMatrix, D::AbstractVector, V::AbstractMatrix, ΔD, ΔV;
-                       tol::Real=default_pullback_gaugetol(D))
-
-    # Basic size checks and determination
-    n = LinearAlgebra.checksquare(V)
-    n == length(D) || throw(DimensionMismatch())
-
-    if !(ΔV isa AbstractZero)
-        VdΔV = V' * ΔV
-
-        mask = abs.(transpose(D) .- D) .< tol
-        Δgauge = norm(view(VdΔV, mask), Inf)
-        Δgauge < tol ||
-            @warn "`eig` cotangents sensitive to gauge choice: (|Δgauge| = $Δgauge)"
-
-        VdΔV .*= conj.(safe_inv.(transpose(D) .- D, tol))
-
-        if !(ΔD isa AbstractZero)
-            view(VdΔV, diagind(VdΔV)) .+= ΔD
-        end
-        PΔV = V' \ VdΔV
-        if eltype(ΔA) <: Real
-            ΔAc = mul!(VdΔV, PΔV, V') # recycle VdΔV memory
-            ΔA .= real.(ΔAc)
-        else
-            mul!(ΔA, PΔV, V')
-        end
-    else
-        PΔV = V' \ Diagonal(ΔD)
-        if eltype(ΔA) <: Real
-            ΔAc = PΔV * V'
-            ΔA .= real.(ΔAc)
-        else
-            mul!(ΔA, PΔV, V')
-        end
-    end
-    return ΔA
-end
-
-function eigh_pullback!(ΔA::AbstractMatrix, D::AbstractVector, V::AbstractMatrix, ΔD, ΔV;
-                        tol::Real=default_pullback_gaugetol(D))
-
-    # Basic size checks and determination
-    n = LinearAlgebra.checksquare(V)
-    n == length(D) || throw(DimensionMismatch())
-
-    if !(ΔV isa AbstractZero)
-        VdΔV = V' * ΔV
-        aVdΔV = rmul!(VdΔV - VdΔV', 1 / 2)
-
-        mask = abs.(D' .- D) .< tol
-        Δgauge = norm(view(aVdΔV, mask))
-        Δgauge < tol ||
-            @warn "`eigh` cotangents sensitive to gauge choice: (|Δgauge| = $Δgauge)"
-
-        aVdΔV .*= safe_inv.(D' .- D, tol)
-
-        if !(ΔD isa AbstractZero)
-            view(aVdΔV, diagind(aVdΔV)) .+= real.(ΔD)
-            # in principle, ΔD is real, but maybe not if coming from an anyonic tensor
-        end
-        # recylce VdΔV space
-        mul!(ΔA, mul!(VdΔV, V, aVdΔV), V')
-    else
-        mul!(ΔA, V * Diagonal(ΔD), V')
-    end
-    return ΔA
-end
-
-function qr_pullback!(ΔA::AbstractMatrix, Q::AbstractMatrix, R::AbstractMatrix, ΔQ, ΔR;
-                      tol::Real=default_pullback_gaugetol(R))
-    Rd = view(R, diagind(R))
-    p = something(findlast(≥(tol) ∘ abs, Rd), 0)
-    m, n = size(R)
-
-    Q1 = view(Q, :, 1:p)
-    R1 = view(R, 1:p, :)
-    R11 = view(R, 1:p, 1:p)
-
-    ΔA1 = view(ΔA, :, 1:p)
-    ΔQ1 = view(ΔQ, :, 1:p)
-    ΔR1 = view(ΔR, 1:p, :)
-
-    M = similar(R, (p, p))
-    ΔR isa AbstractZero || mul!(M, ΔR1, R1')
-    ΔQ isa AbstractZero || mul!(M, Q1', ΔQ1, -1, !(ΔR isa AbstractZero))
-    view(M, lowertriangularind(M)) .= conj.(view(M, uppertriangularind(M)))
-    if eltype(M) <: Complex
-        Md = view(M, diagind(M))
-        Md .= real.(Md)
-    end
-
-    ΔA1 .= ΔQ1
-    mul!(ΔA1, Q1, M, +1, 1)
-
-    if n > p
-        R12 = view(R, 1:p, (p + 1):n)
-        ΔA2 = view(ΔA, :, (p + 1):n)
-        ΔR12 = view(ΔR, 1:p, (p + 1):n)
-
-        if ΔR isa AbstractZero
-            ΔA2 .= zero(eltype(ΔA))
-        else
-            mul!(ΔA2, Q1, ΔR12)
-            mul!(ΔA1, ΔA2, R12', -1, 1)
-        end
-    end
-    if m > p && !(ΔQ isa AbstractZero) # case where R is not full rank
-        Q2 = view(Q, :, (p + 1):m)
-        ΔQ2 = view(ΔQ, :, (p + 1):m)
-        Q1dΔQ2 = Q1' * ΔQ2
-        Δgauge = norm(mul!(copy(ΔQ2), Q1, Q1dΔQ2, -1, 1), Inf)
-        Δgauge < tol ||
-            @warn "`qr` cotangents sensitive to gauge choice: (|Δgauge| = $Δgauge)"
-        mul!(ΔA1, Q2, Q1dΔQ2', -1, 1)
-    end
-    rdiv!(ΔA1, UpperTriangular(R11)')
-    return ΔA
-end
-
-function lq_pullback!(ΔA::AbstractMatrix, L::AbstractMatrix, Q::AbstractMatrix, ΔL, ΔQ;
-                      tol::Real=default_pullback_gaugetol(L))
-    Ld = view(L, diagind(L))
-    p = something(findlast(≥(tol) ∘ abs, Ld), 0)
-    m, n = size(L)
-
-    L1 = view(L, :, 1:p)
-    L11 = view(L, 1:p, 1:p)
-    Q1 = view(Q, 1:p, :)
-
-    ΔA1 = view(ΔA, 1:p, :)
-    ΔQ1 = view(ΔQ, 1:p, :)
-    ΔL1 = view(ΔL, :, 1:p)
-
-    M = similar(L, (p, p))
-    ΔL isa AbstractZero || mul!(M, L1', ΔL1)
-    ΔQ isa AbstractZero || mul!(M, ΔQ1, Q1', -1, !(ΔL isa AbstractZero))
-    view(M, uppertriangularind(M)) .= conj.(view(M, lowertriangularind(M)))
-    if eltype(M) <: Complex
-        Md = view(M, diagind(M))
-        Md .= real.(Md)
-    end
-
-    ΔA1 .= ΔQ1
-    mul!(ΔA1, M, Q1, +1, 1)
-
-    if m > p
-        L21 = view(L, (p + 1):m, 1:p)
-        ΔA2 = view(ΔA, (p + 1):m, :)
-        ΔL21 = view(ΔL, (p + 1):m, 1:p)
-
-        if ΔL isa AbstractZero
-            ΔA2 .= zero(eltype(ΔA))
-        else
-            mul!(ΔA2, ΔL21, Q1)
-            mul!(ΔA1, L21', ΔA2, -1, 1)
-        end
-    end
-    if n > p && !(ΔQ isa AbstractZero) # case where R is not full rank
-        Q2 = view(Q, (p + 1):n, :)
-        ΔQ2 = view(ΔQ, (p + 1):n, :)
-        ΔQ2Q1d = ΔQ2 * Q1'
-        Δgauge = norm(mul!(copy(ΔQ2), ΔQ2Q1d, Q1, -1, 1))
-        Δgauge < tol ||
-            @warn "`lq` cotangents sensitive to gauge choice: (|Δgauge| = $Δgauge)"
-        mul!(ΔA1, ΔQ2Q1d', Q2, -1, 1)
-    end
-    ldiv!(LowerTriangular(L11)', ΔA1)
-    return ΔA
-end
-
-function default_pullback_gaugetol(a)
-    n = norm(a, Inf)
-    return eps(eltype(n))^(3 / 4) * max(n, one(n))
-end
diff --git a/src/TensorKit.jl b/src/TensorKit.jl
index 96a579e25..ce6c7697b 100644
--- a/src/TensorKit.jl
+++ b/src/TensorKit.jl
@@ -31,7 +31,7 @@ export TruncationScheme
 export SpaceMismatch, SectorMismatch, IndexError # error types
 
 # general vector space methods
-export space, field, dual, dim, reduceddim, dims, fuse, flip, isdual, oplus,
+export space, field, dual, dim, reduceddim, dims, fuse, flip, isdual, oplus, ominus,
        insertleftunit, insertrightunit, removeunit
 
 # partial order for vector spaces
@@ -47,7 +47,7 @@ export ZNSpace, SU2Irrep, U1Irrep, CU1Irrep
 #        bendleft, bendright, foldleft, foldright, cycleclockwise, cycleanticlockwise
 
 # some unicode
-export ⊕, ⊗, ×, ⊠, ℂ, ℝ, ℤ, ←, →, ≾, ≿, ≅, ≺, ≻
+export ⊕, ⊗, ⊖, ×, ⊠, ℂ, ℝ, ℤ, ←, →, ≾, ≿, ≅, ≺, ≻
 export ℤ₂, ℤ₃, ℤ₄, U₁, SU, SU₂, CU₁
 export fℤ₂, fU₁, fSU₂
 export ℤ₂Space, ℤ₃Space, ℤ₄Space, U₁Space, CU₁Space, SU₂Space
@@ -70,23 +70,28 @@ export inner, dot, norm, normalize, normalize!, tr
 
 # factorizations
 export mul!, lmul!, rmul!, adjoint!, pinv, axpy!, axpby!
-export leftorth, rightorth, leftnull, rightnull,
-       leftorth!, rightorth!, leftnull!, rightnull!,
-       tsvd!, tsvd, eigen, eigen!, eig, eig!, eigh, eigh!, exp, exp!,
-       isposdef, isposdef!, ishermitian, sylvester, rank, cond
+export left_orth, right_orth, left_null, right_null,
+       left_orth!, right_orth!, left_null!, right_null!,
+       left_polar, left_polar!, right_polar, right_polar!,
+       qr_full, qr_compact, qr_null, lq_full, lq_compact, lq_null,
+       qr_full!, qr_compact!, qr_null!, lq_full!, lq_compact!, lq_null!,
+       svd_compact!, svd_full!, svd_trunc!, svd_compact, svd_full, svd_trunc,
+       exp, exp!,
+       eigh_full!, eigh_full, eigh_trunc!, eigh_trunc, eig_full!, eig_full, eig_trunc!,
+       eig_trunc,
+       eigh_vals!, eigh_vals, eig_vals!, eig_vals,
+       isposdef, isposdef!, ishermitian, isisometry, isunitary, sylvester, rank, cond
+
 export braid, braid!, permute, permute!, transpose, transpose!, twist, twist!, repartition,
        repartition!
 export catdomain, catcodomain, absorb, absorb!
 
-export OrthogonalFactorizationAlgorithm, QR, QRpos, QL, QLpos, LQ, LQpos, RQ, RQpos,
-       SVD, SDD, Polar
-
 # tensor operations
 export @tensor, @tensoropt, @ncon, ncon, @planar, @plansor
 export scalar, add!, contract!
 
 # truncation schemes
-export notrunc, truncerr, truncdim, truncspace, truncbelow
+export notrunc, truncrank, trunctol, truncfilter, truncspace, truncerror
 
 # cache management
 export empty_globalcaches!
@@ -104,7 +109,11 @@ using TensorOperations: TensorOperations, @tensor, @tensoropt, @ncon, ncon
 using TensorOperations: IndexTuple, Index2Tuple, linearize, AbstractBackend
 const TO = TensorOperations
 
+using MatrixAlgebraKit
+
 using LRUCache
+using OhMyThreads
+using ScopedValues
 
 using TensorKitSectors
 import TensorKitSectors: dim, BraidingStyle, FusionStyle, ⊠, ⊗
@@ -117,7 +126,7 @@ using Base: @boundscheck, @propagate_inbounds, @constprop,
             SizeUnknown, HasLength, HasShape, IsInfinite, EltypeUnknown, HasEltype
 using Base.Iterators: product, filter
 
-using LinearAlgebra: LinearAlgebra
+using LinearAlgebra: LinearAlgebra, BlasFloat
 using LinearAlgebra: norm, dot, normalize, normalize!, tr,
                      axpy!, axpby!, lmul!, rmul!, mul!, ldiv!, rdiv!,
                      adjoint, adjoint!, transpose, transpose!,
@@ -125,6 +134,7 @@ using LinearAlgebra: norm, dot, normalize, normalize!, tr,
                      eigen, eigen!, svd, svd!,
                      isposdef, isposdef!, ishermitian, rank, cond,
                      Diagonal, Hermitian
+using MatrixAlgebraKit
 
 import Base.Meta
 
@@ -138,7 +148,6 @@ include("auxiliary/auxiliary.jl")
 include("auxiliary/caches.jl")
 include("auxiliary/dicts.jl")
 include("auxiliary/iterators.jl")
-include("auxiliary/linalg.jl")
 include("auxiliary/random.jl")
 
 #--------------------------------------------------------------------
@@ -202,6 +211,7 @@ end
 #-------------------------------------
 # general definitions
 include("tensors/abstracttensor.jl")
+include("tensors/backends.jl")
 include("tensors/blockiterator.jl")
 include("tensors/tensor.jl")
 include("tensors/adjoint.jl")
@@ -211,10 +221,11 @@ include("tensors/tensoroperations.jl")
 include("tensors/treetransformers.jl")
 include("tensors/indexmanipulations.jl")
 include("tensors/diagonal.jl")
-include("tensors/truncation.jl")
-include("tensors/factorizations.jl")
 include("tensors/braidingtensor.jl")
 
+include("factorizations/factorizations.jl")
+using .Factorizations
+
 # # Planar macros and related functionality
 # #-----------------------------------------
 @nospecialize
diff --git a/src/auxiliary/deprecate.jl b/src/auxiliary/deprecate.jl
index fa7667b2b..5853cad01 100644
--- a/src/auxiliary/deprecate.jl
+++ b/src/auxiliary/deprecate.jl
@@ -1,29 +1,6 @@
 import Base: transpose
 
 #! format: off
-Base.@deprecate(permute(t::AbstractTensorMap, p1::IndexTuple, p2::IndexTuple; copy::Bool=false),
-                permute(t, (p1, p2); copy=copy))
-Base.@deprecate(transpose(t::AbstractTensorMap, p1::IndexTuple, p2::IndexTuple; copy::Bool=false),
-                transpose(t, (p1, p2); copy=copy))
-Base.@deprecate(braid(t::AbstractTensorMap, p1::IndexTuple, p2::IndexTuple, levels; copy::Bool=false),
-                braid(t, (p1, p2), levels; copy=copy))
-
-Base.@deprecate(tsvd(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                tsvd(t, (p₁, p₂); kwargs...))
-Base.@deprecate(leftorth(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                leftorth(t, (p₁, p₂); kwargs...))
-Base.@deprecate(rightorth(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                rightorth(t, (p₁, p₂); kwargs...))
-Base.@deprecate(leftnull(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                leftnull(t, (p₁, p₂); kwargs...))
-Base.@deprecate(rightnull(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                rightnull(t, (p₁, p₂); kwargs...))
-Base.@deprecate(LinearAlgebra.eigen(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                LinearAlgebra.eigen(t, (p₁, p₂); kwargs...), false)
-Base.@deprecate(eig(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                eig(t, (p₁, p₂); kwargs...))
-Base.@deprecate(eigh(t::AbstractTensorMap, p₁::IndexTuple, p₂::IndexTuple; kwargs...),
-                eigh(t, (p₁, p₂); kwargs...))
 
 for f in (:rand, :randn, :zeros, :ones)
     @eval begin
@@ -58,4 +35,165 @@ Base.@deprecate EuclideanProduct() EuclideanInnerProduct()
 
 Base.@deprecate insertunit(P::ProductSpace, args...; kwargs...) insertleftunit(args...; kwargs...)
 
+# Factorization structs
+@deprecate QR() MatrixAlgebraKit.LAPACK_HouseholderQR()
+@deprecate QRpos() MatrixAlgebraKit.LAPACK_HouseholderQR(; positive=true)
+
+@deprecate QL() MatrixAlgebraKit.LAPACK_HouseholderQL()
+@deprecate QLpos() MatrixAlgebraKit.LAPACK_HouseholderQL(; positive=true)
+
+@deprecate LQ() MatrixAlgebraKit.LAPACK_HouseholderLQ()
+@deprecate LQpos() MatrixAlgebraKit.LAPACK_HouseholderLQ(; positive=true)
+
+@deprecate RQ() MatrixAlgebraKit.LAPACK_HouseholderRQ()
+@deprecate RQpos() MatrixAlgebraKit.LAPACK_HouseholderRQ(; positive=true)
+
+@deprecate SDD() MatrixAlgebraKit.LAPACK_DivideAndConquer()
+@deprecate SVD() MatrixAlgebraKit.LAPACK_QRIteration()
+
+@deprecate Polar() MatrixAlgebraKit.PolarViaSVD(MatrixAlgebraKit.LAPACK_DivideAndConquer())
+
+# truncations
+const TruncationScheme = MatrixAlgebraKit.TruncationStrategy
+@deprecate truncdim(d::Int) truncrank(d)
+@deprecate truncbelow(ϵ::Real) trunctol(ϵ)
+
+# factorizations
+# --------------
+_kindof(::MatrixAlgebraKit.LAPACK_HouseholderQR) = :qr
+_kindof(::MatrixAlgebraKit.LAPACK_HouseholderLQ) = :lq
+_kindof(::MatrixAlgebraKit.LAPACK_SVDAlgorithm) = :svd
+_kindof(::MatrixAlgebraKit.PolarViaSVD) = :polar
+_kindof(::DiagonalAlgorithm) = :svd # shouldn't really matter
+
+_drop_alg(; alg=nothing, kwargs...) = kwargs
+_drop_p(; p=nothing, kwargs...) = kwargs
+
+function permutedcopy_oftype(t::AbstractTensorMap, T::Type{<:Number}, p::Index2Tuple)
+    return permute!(similar(t, T, permute(space(t), p)), t, p)
+end
+
+# orthogonalization
+export leftorth, leftorth!, rightorth, rightorth!
+function leftorth(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
+    Base.depwarn("`leftorth` is deprecated, use `left_orth` instead", :leftorth)
+    return leftorth!(permutedcopy_oftype(t, factorisation_scalartype(leftorth, t), p); kwargs...)
+end
+function rightorth(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
+    Base.depwarn("`rightorth` is deprecated, use `right_orth` instead", :rightorth)
+    return rightorth!(permutedcopy_oftype(t, factorisation_scalartype(rightorth, t), p); kwargs...)
+end
+function leftorth(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`leftorth` is deprecated, use `left_orth` instead", :leftorth)
+    return leftorth!(copy_oftype(t, factorisation_scalartype(leftorth, t)); kwargs...)
+end
+function rightorth(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`rightorth` is deprecated, use `right_orth` instead", :rightorth)
+    return rightorth!(copy_oftype(t, factorisation_scalartype(rightorth, t)); kwargs...)
+end
+function leftorth!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`leftorth!` is deprecated, use `left_orth!` instead", :leftorth!)
+    haskey(kwargs, :alg) || return left_orth!(t; kwargs...)
+    alg = kwargs[:alg]
+    kind = _kindof(alg)
+    kind === :svd && return left_orth!(t; kind, alg_svd=alg, _drop_alg(; kwargs...)...)
+    kind === :qr && return left_orth!(t; kind, alg_qr=alg, _drop_alg(; kwargs...)...)
+    kind === :polar && return left_orth!(t; kind, alg_polar=alg, _drop_alg(; kwargs...)...)
+    throw(ArgumentError("invalid leftorth kind"))
+end
+function rightorth!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`rightorth!` is deprecated, use `right_orth!` instead", :rightorth!)
+    haskey(kwargs, :alg) || return right_orth!(t; kwargs...)
+    alg = kwargs[:alg]
+    kind = _kindof(alg)
+    kind === :svd && return right_orth!(t; kind, alg_svd=alg, _drop_alg(; kwargs...)...)
+    kind === :lq && return right_orth!(t; kind, alg_lq=alg, _drop_alg(; kwargs...)...)
+    kind === :polar && return right_orth!(t; kind, alg_polar=alg, _drop_alg(; kwargs...)...)
+    throw(ArgumentError("invalid rightorth kind"))
+end
+
+# nullspaces
+export leftnull, leftnull!, rightnull, rightnull!
+function leftnull(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`leftnull` is deprecated, use `left_null` instead", :leftnull)
+    return leftnull!(copy_oftype(t, factorisation_scalartype(leftnull, t)); kwargs...)
+end
+function leftnull(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
+    Base.depwarn("`leftnull` is deprecated, use `left_null` instead", :leftnull)
+    return leftnull!(permutedcopy_oftype(t, factorisation_scalartype(leftnull, t), p); kwargs...)
+end
+function rightnull(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`rightnull` is deprecated, use `right_null` instead", :rightnull)
+    return rightnull!(copy_oftype(t, factorisation_scalartype(rightnull, t)); kwargs...)
+end
+function rightnull(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
+    Base.depwarn("`rightnull` is deprecated, use `right_null` instead", :rightnull)
+    return rightnull!(permutedcopy_oftype(t, factorisation_scalartype(rightnull, t), p); kwargs...)
+end
+function leftnull!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`left_null!` is deprecated, use `left_null!` instead", :leftnull!)
+    haskey(kwargs, :alg) || return left_null!(t; kwargs...)
+    alg = kwargs[:alg]
+    kind = _kindof(alg)
+    kind === :svd && return left_null!(t; kind, alg_svd=alg, _drop_alg(; kwargs...)...)
+    kind === :qr && return left_null!(t; kind, alg_qr=alg, _drop_alg(; kwargs...)...)
+    throw(ArgumentError("invalid leftnull kind"))
+end
+function rightnull!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`rightnull!` is deprecated, use `right_null!` instead", :rightnull!)
+    haskey(kwargs, :alg) || return right_null!(t; kwargs...)
+    alg = kwargs[:alg]
+    kind = _kindof(alg)
+    kind === :svd && return right_null!(t; kind, alg_svd=alg, _drop_alg(; kwargs...)...)
+    kind === :lq && return right_null!(t; kind, alg_lq=alg, _drop_alg(; kwargs...)...)
+    throw(ArgumentError("invalid rightnull kind"))
+end
+
+# eigen values
+export eig!, eigh!, eigen, eigen!
+@deprecate(eig(t::AbstractTensorMap, p::Index2Tuple; kwargs...),
+           eig!(permutedcopy_oftype(t, factorisation_scalartype(eig, t), p); kwargs...))
+@deprecate(eigh(t::AbstractTensorMap, p::Index2Tuple; kwargs...),
+           eigh!(permutedcopy_oftype(t, factorisation_scalartype(eigen, t), p); kwargs...))
+@deprecate(LinearAlgebra.eigen(t::AbstractTensorMap, p::Index2Tuple; kwargs...),
+           eigen!(permutedcopy_oftype(t, factorisation_scalartype(eigen, t), p); kwargs...),
+           false)
+function eig(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`eig` is deprecated, use `eig_full` or `eig_trunc` instead", :eig)
+    return haskey(kwargs, :trunc) ? eig_trunc(t; kwargs...) : eig_full(t; kwargs...)
+end
+function eig!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`eig!` is deprecated, use `eig_full!` or `eig_trunc!` instead", :eig!)
+    return haskey(kwargs, :trunc) ? eig_trunc!(t; kwargs...) : eig_full!(t; kwargs...)
+end
+function eigh(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`eigh` is deprecated, use `eigh_full` or `eigh_trunc` instead", :eigh)
+    return haskey(kwargs, :trunc) ? eigh_trunc(t; kwargs...) : eigh_full(t; kwargs...)
+end
+function eigh!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`eigh!` is deprecated, use `eigh_full!` or `eigh_trunc!` instead", :eigh!)
+    return haskey(kwargs, :trunc) ? eigh_trunc!(t; kwargs...) : eigh_full!(t; kwargs...)
+end
+
+# singular values
+export tsvd, tsvd!
+@deprecate(tsvd(t::AbstractTensorMap, p::Index2Tuple; kwargs...),
+           tsvd!(permutedcopy_oftype(t, factorisation_scalartype(tsvd, t), p); kwargs...))
+function tsvd(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`tsvd` is deprecated, use `svd_compact`, `svd_full` or `svd_trunc` instead", :tsvd)
+    if haskey(kwargs, :p)
+        Base.depwarn("p is a deprecated kwarg, and should be specified through the truncation strategy", :tsvd)
+        kwargs = _drop_p(; kwargs...)
+    end
+    return haskey(kwargs, :trunc) ? svd_trunc(t; kwargs...) : svd_compact(t; kwargs...)
+end
+function tsvd!(t::AbstractTensorMap; kwargs...)
+    Base.depwarn("`tsvd!` is deprecated, use `svd_compact!`, `svd_full!` or `svd_trunc!` instead", :tsvd!)
+    if haskey(kwargs, :p)
+        Base.depwarn("p is a deprecated kwarg, and should be specified through the truncation strategy", :tsvd!)
+        kwargs = _drop_p(; kwargs...)
+    end
+    return haskey(kwargs, :trunc) ? svd_trunc!(t; kwargs...) : svd_compact!(t; kwargs...)
+end
+
 #! format: on
diff --git a/src/auxiliary/linalg.jl b/src/auxiliary/linalg.jl
deleted file mode 100644
index 82e8600f0..000000000
--- a/src/auxiliary/linalg.jl
+++ /dev/null
@@ -1,386 +0,0 @@
-# Simple reference to getting and setting BLAS threads
-#------------------------------------------------------
-set_num_blas_threads(n::Integer) = LinearAlgebra.BLAS.set_num_threads(n)
-get_num_blas_threads() = LinearAlgebra.BLAS.get_num_threads()
-
-# Factorization algorithms
-#--------------------------
-abstract type FactorizationAlgorithm end
-abstract type OrthogonalFactorizationAlgorithm <: FactorizationAlgorithm end
-
-struct QRpos <: OrthogonalFactorizationAlgorithm
-end
-struct QR <: OrthogonalFactorizationAlgorithm
-end
-struct QL <: OrthogonalFactorizationAlgorithm
-end
-struct QLpos <: OrthogonalFactorizationAlgorithm
-end
-struct LQ <: OrthogonalFactorizationAlgorithm
-end
-struct LQpos <: OrthogonalFactorizationAlgorithm
-end
-struct RQ <: OrthogonalFactorizationAlgorithm
-end
-struct RQpos <: OrthogonalFactorizationAlgorithm
-end
-struct SDD <: OrthogonalFactorizationAlgorithm # lapack's default divide and conquer algorithm
-end
-struct SVD <: OrthogonalFactorizationAlgorithm
-end
-struct Polar <: OrthogonalFactorizationAlgorithm
-end
-
-Base.adjoint(::QRpos) = LQpos()
-Base.adjoint(::QR) = LQ()
-Base.adjoint(::LQpos) = QRpos()
-Base.adjoint(::LQ) = QR()
-
-Base.adjoint(::QLpos) = RQpos()
-Base.adjoint(::QL) = RQ()
-Base.adjoint(::RQpos) = QLpos()
-Base.adjoint(::RQ) = QL()
-
-Base.adjoint(alg::Union{SVD,SDD,Polar}) = alg
-
-const OFA = OrthogonalFactorizationAlgorithm
-const SVDAlg = Union{SVD,SDD}
-
-# Matrix algebra: entrypoint for calling matrix methods from within tensor implementations
-#------------------------------------------------------------------------------------------
-module MatrixAlgebra
-# TODO: all methods that we define here will need an extended version for CuMatrix/ROCMatrix in the
-# CUDA/AMD package extension.
-
-# TODO: other methods to include here:
-# mul! (possibly call matmul! instead)
-# adjoint!
-# sylvester
-# exp!
-# schur!?
-# 
-
-using LinearAlgebra
-using LinearAlgebra: BlasFloat, BlasReal, BlasComplex, checksquare
-
-using ..TensorKit: OrthogonalFactorizationAlgorithm,
-                   QL, QLpos, QR, QRpos, LQ, LQpos, RQ, RQpos, SVD, SDD, Polar
-
-# only defined in >v1.7
-@static if VERSION < v"1.7-"
-    _rf_findmax((fm, im), (fx, ix)) = isless(fm, fx) ? (fx, ix) : (fm, im)
-    _argmax(f, domain) = mapfoldl(x -> (f(x), x), _rf_findmax, domain)[2]
-else
-    _argmax(f, domain) = argmax(f, domain)
-end
-
-# TODO: define for CuMatrix if we support this
-function one!(A::StridedMatrix)
-    length(A) > 0 || return A
-    copyto!(A, LinearAlgebra.I)
-    return A
-end
-
-safesign(s::Real) = ifelse(s < zero(s), -one(s), +one(s))
-safesign(s::Complex) = ifelse(iszero(s), one(s), s / abs(s))
-
-function leftorth!(A::StridedMatrix{<:BlasFloat}, alg::Union{QR,QRpos}, atol::Real)
-    iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-    m, n = size(A)
-    k = min(m, n)
-    A, T = LAPACK.geqrt!(A, min(minimum(size(A)), 36))
-    Q = similar(A, m, k)
-    for j in 1:k
-        for i in 1:m
-            Q[i, j] = i == j
-        end
-    end
-    Q = LAPACK.gemqrt!('L', 'N', A, T, Q)
-    R = triu!(A[1:k, :])
-
-    if isa(alg, QRpos)
-        @inbounds for j in 1:k
-            s = safesign(R[j, j])
-            @simd for i in 1:m
-                Q[i, j] *= s
-            end
-        end
-        @inbounds for j in size(R, 2):-1:1
-            for i in 1:min(k, j)
-                R[i, j] = R[i, j] * conj(safesign(R[i, i]))
-            end
-        end
-    end
-    return Q, R
-end
-
-function leftorth!(A::StridedMatrix{<:BlasFloat}, alg::Union{QL,QLpos}, atol::Real)
-    iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-    m, n = size(A)
-    @assert m >= n
-
-    nhalf = div(n, 2)
-    #swap columns in A
-    @inbounds for j in 1:nhalf, i in 1:m
-        A[i, j], A[i, n + 1 - j] = A[i, n + 1 - j], A[i, j]
-    end
-    Q, R = leftorth!(A, isa(alg, QL) ? QR() : QRpos(), atol)
-
-    #swap columns in Q
-    @inbounds for j in 1:nhalf, i in 1:m
-        Q[i, j], Q[i, n + 1 - j] = Q[i, n + 1 - j], Q[i, j]
-    end
-    #swap rows and columns in R
-    @inbounds for j in 1:nhalf, i in 1:n
-        R[i, j], R[n + 1 - i, n + 1 - j] = R[n + 1 - i, n + 1 - j], R[i, j]
-    end
-    if isodd(n)
-        j = nhalf + 1
-        @inbounds for i in 1:nhalf
-            R[i, j], R[n + 1 - i, j] = R[n + 1 - i, j], R[i, j]
-        end
-    end
-    return Q, R
-end
-
-function leftorth!(A::StridedMatrix{<:BlasFloat}, alg::Union{SVD,SDD,Polar}, atol::Real)
-    U, S, V = alg isa SVD ? LAPACK.gesvd!('S', 'S', A) : LAPACK.gesdd!('S', A)
-    if isa(alg, Union{SVD,SDD})
-        n = count(s -> s .> atol, S)
-        if n != length(S)
-            return U[:, 1:n], lmul!(Diagonal(S[1:n]), V[1:n, :])
-        else
-            return U, lmul!(Diagonal(S), V)
-        end
-    else
-        iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-        # TODO: check Lapack to see if we can recycle memory of A
-        Q = mul!(A, U, V)
-        Sq = map!(sqrt, S, S)
-        SqV = lmul!(Diagonal(Sq), V)
-        R = SqV' * SqV
-        return Q, R
-    end
-end
-
-function leftnull!(A::StridedMatrix{<:BlasFloat}, alg::Union{QR,QRpos}, atol::Real)
-    iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-    m, n = size(A)
-    m >= n || throw(ArgumentError("no null space if less rows than columns"))
-
-    A, T = LAPACK.geqrt!(A, min(minimum(size(A)), 36))
-    N = similar(A, m, max(0, m - n))
-    fill!(N, 0)
-    for k in 1:(m - n)
-        N[n + k, k] = 1
-    end
-    return N = LAPACK.gemqrt!('L', 'N', A, T, N)
-end
-
-function leftnull!(A::StridedMatrix{<:BlasFloat}, alg::Union{SVD,SDD}, atol::Real)
-    size(A, 2) == 0 && return one!(similar(A, (size(A, 1), size(A, 1))))
-    U, S, V = alg isa SVD ? LAPACK.gesvd!('A', 'N', A) : LAPACK.gesdd!('A', A)
-    indstart = count(>(atol), S) + 1
-    return U[:, indstart:end]
-end
-
-function rightorth!(A::StridedMatrix{<:BlasFloat}, alg::Union{LQ,LQpos,RQ,RQpos},
-                    atol::Real)
-    iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-    # TODO: geqrfp seems a bit slower than geqrt in the intermediate region around
-    # matrix size 100, which is the interesting region. => Investigate and fix
-    m, n = size(A)
-    k = min(m, n)
-    At = transpose!(similar(A, n, m), A)
-
-    if isa(alg, RQ) || isa(alg, RQpos)
-        @assert m <= n
-
-        mhalf = div(m, 2)
-        # swap columns in At
-        @inbounds for j in 1:mhalf, i in 1:n
-            At[i, j], At[i, m + 1 - j] = At[i, m + 1 - j], At[i, j]
-        end
-        Qt, Rt = leftorth!(At, isa(alg, RQ) ? QR() : QRpos(), atol)
-
-        @inbounds for j in 1:mhalf, i in 1:n
-            Qt[i, j], Qt[i, m + 1 - j] = Qt[i, m + 1 - j], Qt[i, j]
-        end
-        @inbounds for j in 1:mhalf, i in 1:m
-            Rt[i, j], Rt[m + 1 - i, m + 1 - j] = Rt[m + 1 - i, m + 1 - j], Rt[i, j]
-        end
-        if isodd(m)
-            j = mhalf + 1
-            @inbounds for i in 1:mhalf
-                Rt[i, j], Rt[m + 1 - i, j] = Rt[m + 1 - i, j], Rt[i, j]
-            end
-        end
-        Q = transpose!(A, Qt)
-        R = transpose!(similar(A, (m, m)), Rt) # TODO: efficient in place
-        return R, Q
-    else
-        Qt, Lt = leftorth!(At, alg', atol)
-        if m > n
-            L = transpose!(A, Lt)
-            Q = transpose!(similar(A, (n, n)), Qt) # TODO: efficient in place
-        else
-            Q = transpose!(A, Qt)
-            L = transpose!(similar(A, (m, m)), Lt) # TODO: efficient in place
-        end
-        return L, Q
-    end
-end
-
-function rightorth!(A::StridedMatrix{<:BlasFloat}, alg::Union{SVD,SDD,Polar}, atol::Real)
-    U, S, V = alg isa SVD ? LAPACK.gesvd!('S', 'S', A) : LAPACK.gesdd!('S', A)
-    if isa(alg, Union{SVD,SDD})
-        n = count(s -> s .> atol, S)
-        if n != length(S)
-            return rmul!(U[:, 1:n], Diagonal(S[1:n])), V[1:n, :]
-        else
-            return rmul!(U, Diagonal(S)), V
-        end
-    else
-        iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-        Q = mul!(A, U, V)
-        Sq = map!(sqrt, S, S)
-        USq = rmul!(U, Diagonal(Sq))
-        L = USq * USq'
-        return L, Q
-    end
-end
-
-function rightnull!(A::StridedMatrix{<:BlasFloat}, alg::Union{LQ,LQpos}, atol::Real)
-    iszero(atol) || throw(ArgumentError("nonzero atol not supported by $alg"))
-    m, n = size(A)
-    k = min(m, n)
-    At = adjoint!(similar(A, n, m), A)
-    At, T = LAPACK.geqrt!(At, min(k, 36))
-    N = similar(A, max(n - m, 0), n)
-    fill!(N, 0)
-    for k in 1:(n - m)
-        N[k, m + k] = 1
-    end
-    return N = LAPACK.gemqrt!('R', eltype(At) <: Real ? 'T' : 'C', At, T, N)
-end
-
-function rightnull!(A::StridedMatrix{<:BlasFloat}, alg::Union{SVD,SDD}, atol::Real)
-    size(A, 1) == 0 && return one!(similar(A, (size(A, 2), size(A, 2))))
-    U, S, V = alg isa SVD ? LAPACK.gesvd!('N', 'A', A) : LAPACK.gesdd!('A', A)
-    indstart = count(>(atol), S) + 1
-    return V[indstart:end, :]
-end
-
-function svd!(A::StridedMatrix{T}, alg::Union{SVD,SDD}) where {T<:BlasFloat}
-    # fix another type instability in LAPACK wrappers
-    TT = Tuple{Matrix{T},Vector{real(T)},Matrix{T}}
-    U, S, V = alg isa SVD ? LAPACK.gesvd!('S', 'S', A)::TT : LAPACK.gesdd!('S', A)::TT
-    return U, S, V
-end
-
-function eig!(A::StridedMatrix{T}; permute::Bool=true, scale::Bool=true) where {T<:BlasReal}
-    n = checksquare(A)
-    n == 0 && return zeros(Complex{T}, 0), zeros(Complex{T}, 0, 0)
-
-    A, DR, DI, VL, VR, _ = LAPACK.geevx!(permute ? (scale ? 'B' : 'P') :
-                                         (scale ? 'S' : 'N'), 'N', 'V', 'N', A)
-    D = complex.(DR, DI)
-    V = zeros(Complex{T}, n, n)
-    j = 1
-    while j <= n
-        if DI[j] == 0
-            vr = view(VR, :, j)
-            s = conj(sign(_argmax(abs, vr)))
-            V[:, j] .= s .* vr
-        else
-            vr = view(VR, :, j)
-            vi = view(VR, :, j + 1)
-            s = conj(sign(_argmax(abs, vr))) # vectors coming from lapack have already real absmax component
-            V[:, j] .= s .* (vr .+ im .* vi)
-            V[:, j + 1] .= s .* (vr .- im .* vi)
-            j += 1
-        end
-        j += 1
-    end
-    return D, V
-end
-
-function eig!(A::StridedMatrix{T}; permute::Bool=true,
-              scale::Bool=true) where {T<:BlasComplex}
-    n = checksquare(A)
-    n == 0 && return zeros(T, 0), zeros(T, 0, 0)
-    D, V = LAPACK.geevx!(permute ? (scale ? 'B' : 'P') : (scale ? 'S' : 'N'), 'N', 'V', 'N',
-                         A)[[2, 4]]
-    for j in 1:n
-        v = view(V, :, j)
-        s = conj(sign(_argmax(abs, v)))
-        v .*= s
-    end
-    return D, V
-end
-
-function eigh!(A::StridedMatrix{T}) where {T<:BlasFloat}
-    n = checksquare(A)
-    n == 0 && return zeros(real(T), 0), zeros(T, 0, 0)
-    D, V = LAPACK.syevr!('V', 'A', 'U', A, 0.0, 0.0, 0, 0, -1.0)
-    for j in 1:n
-        v = view(V, :, j)
-        s = conj(sign(_argmax(abs, v)))
-        v .*= s
-    end
-    return D, V
-end
-
-## Old stuff and experiments
-
-# using LinearAlgebra: BlasFloat, Char, BlasInt, LAPACK, LAPACKException,
-#                      DimensionMismatch, SingularException, PosDefException, chkstride1,
-#                      checksquare,
-#                      triu!
-
-# TODO: reconsider the following implementation
-# Unfortunately, geqrfp seems a bit slower than geqrt in the intermediate region
-# around matrix size 100, which is the interesting region. => Investigate and maybe fix
-# function _leftorth!(A::StridedMatrix{<:BlasFloat})
-#     m, n = size(A)
-#     A, τ = geqrfp!(A)
-#     Q = LAPACK.ormqr!('L', 'N', A, τ, eye(eltype(A), m, min(m, n)))
-#     R = triu!(A[1:min(m, n), :])
-#     return Q, R
-# end
-
-# geqrfp!: computes qrpos factorization, missing in Base
-# geqrfp!(A::StridedMatrix{<:BlasFloat}) =
-#     ((m, n) = size(A); geqrfp!(A, similar(A, min(m, n))))
-#
-# for (geqrfp, elty, relty) in
-#     ((:dgeqrfp_, :Float64, :Float64), (:sgeqrfp_, :Float32, :Float32),
-#         (:zgeqrfp_, :ComplexF64, :Float64), (:cgeqrfp_, :ComplexF32, :Float32))
-#     @eval begin
-#         function geqrfp!(A::StridedMatrix{$elty}, tau::StridedVector{$elty})
-#             chkstride1(A, tau)
-#             m, n  = size(A)
-#             if length(tau) != min(m, n)
-#                 throw(DimensionMismatch("tau has length $(length(tau)), but needs length $(min(m, n))"))
-#             end
-#             work  = Vector{$elty}(1)
-#             lwork = BlasInt(-1)
-#             info  = Ref{BlasInt}()
-#             for i = 1:2                # first call returns lwork as work[1]
-#                 ccall((@blasfunc($geqrfp), liblapack), Nothing,
-#                       (Ptr{BlasInt}, Ptr{BlasInt}, Ptr{$elty}, Ptr{BlasInt},
-#                        Ptr{$elty}, Ptr{$elty}, Ptr{BlasInt}, Ptr{BlasInt}),
-#                       Ref(m), Ref(n), A, Ref(max(1, stride(A, 2))),
-#                       tau, work, Ref(lwork), info)
-#                 chklapackerror(info[])
-#                 if i == 1
-#                     lwork = BlasInt(real(work[1]))
-#                     resize!(work, lwork)
-#                 end
-#             end
-#             A, tau
-#         end
-#     end
-# end
-
-end
diff --git a/src/auxiliary/random.jl b/src/auxiliary/random.jl
index bc9df6f65..fe57f585e 100644
--- a/src/auxiliary/random.jl
+++ b/src/auxiliary/random.jl
@@ -20,6 +20,6 @@ function randisometry!(rng::Random.AbstractRNG, A::AbstractMatrix)
     dims = size(A)
     dims[1] >= dims[2] ||
         throw(DimensionMismatch("cannot create isometric matrix with dimensions $dims; isometry needs to be tall or square"))
-    Q, = MatrixAlgebra.leftorth!(Random.randn!(rng, A), QRpos(), 0)
+    Q, = qr_compact!(Random.randn!(rng, A); positive=true)
     return copy!(A, Q)
 end
diff --git a/src/factorizations/adjoint.jl b/src/factorizations/adjoint.jl
new file mode 100644
index 000000000..b4c148788
--- /dev/null
+++ b/src/factorizations/adjoint.jl
@@ -0,0 +1,100 @@
+# AdjointTensorMap
+# ----------------
+# map algorithms to their adjoint counterpart
+# TODO: this probably belongs in MatrixAlgebraKit
+_adjoint(alg::MAK.LAPACK_HouseholderQR) = MAK.LAPACK_HouseholderLQ(; alg.kwargs...)
+_adjoint(alg::MAK.LAPACK_HouseholderLQ) = MAK.LAPACK_HouseholderQR(; alg.kwargs...)
+_adjoint(alg::MAK.LAPACK_HouseholderQL) = MAK.LAPACK_HouseholderRQ(; alg.kwargs...)
+_adjoint(alg::MAK.LAPACK_HouseholderRQ) = MAK.LAPACK_HouseholderQL(; alg.kwargs...)
+_adjoint(alg::MAK.PolarViaSVD) = MAK.PolarViaSVD(_adjoint(alg.svdalg))
+_adjoint(alg::AbstractAlgorithm) = alg
+
+# 1-arg functions
+function MAK.initialize_output(::typeof(left_null!), t::AdjointTensorMap,
+                               alg::AbstractAlgorithm)
+    return adjoint(MAK.initialize_output(right_null!, adjoint(t), _adjoint(alg)))
+end
+function MAK.initialize_output(::typeof(right_null!), t::AdjointTensorMap,
+                               alg::AbstractAlgorithm)
+    return adjoint(MAK.initialize_output(left_null!, adjoint(t), _adjoint(alg)))
+end
+
+function MAK.left_null!(t::AdjointTensorMap, N, alg::AbstractAlgorithm)
+    right_null!(adjoint(t), adjoint(N), _adjoint(alg))
+    return N
+end
+function MAK.right_null!(t::AdjointTensorMap, N, alg::AbstractAlgorithm)
+    left_null!(adjoint(t), adjoint(N), _adjoint(alg))
+    return N
+end
+
+function MAK.is_left_isometry(t::AdjointTensorMap; kwargs...)
+    return is_right_isometry(adjoint(t); kwargs...)
+end
+function MAK.is_right_isometry(t::AdjointTensorMap; kwargs...)
+    return is_left_isometry(adjoint(t); kwargs...)
+end
+
+# 2-arg functions
+for (left_f!, right_f!) in zip((:qr_full!, :qr_compact!, :left_polar!, :left_orth!),
+                               (:lq_full!, :lq_compact!, :right_polar!, :right_orth!))
+    @eval function MAK.copy_input(::typeof($left_f!), t::AdjointTensorMap)
+        return adjoint(MAK.copy_input($right_f!, adjoint(t)))
+    end
+    @eval function MAK.copy_input(::typeof($right_f!), t::AdjointTensorMap)
+        return adjoint(MAK.copy_input($left_f!, adjoint(t)))
+    end
+
+    @eval function MAK.initialize_output(::typeof($left_f!), t::AdjointTensorMap,
+                                         alg::AbstractAlgorithm)
+        return reverse(adjoint.(MAK.initialize_output($right_f!, adjoint(t), _adjoint(alg))))
+    end
+    @eval function MAK.initialize_output(::typeof($right_f!), t::AdjointTensorMap,
+                                         alg::AbstractAlgorithm)
+        return reverse(adjoint.(MAK.initialize_output($left_f!, adjoint(t), _adjoint(alg))))
+    end
+
+    @eval function MAK.$left_f!(t::AdjointTensorMap, F, alg::AbstractAlgorithm)
+        $right_f!(adjoint(t), reverse(adjoint.(F)), _adjoint(alg))
+        return F
+    end
+    @eval function MAK.$right_f!(t::AdjointTensorMap, F, alg::AbstractAlgorithm)
+        $left_f!(adjoint(t), reverse(adjoint.(F)), _adjoint(alg))
+        return F
+    end
+end
+
+# 3-arg functions
+for f! in (:svd_full!, :svd_compact!, :svd_trunc!)
+    @eval function MAK.copy_input(::typeof($f!), t::AdjointTensorMap)
+        return adjoint(MAK.copy_input($f!, adjoint(t)))
+    end
+
+    @eval function MAK.initialize_output(::typeof($f!), t::AdjointTensorMap,
+                                         alg::AbstractAlgorithm)
+        return reverse(adjoint.(MAK.initialize_output($f!, adjoint(t), _adjoint(alg))))
+    end
+    @eval function MAK.$f!(t::AdjointTensorMap, F, alg::AbstractAlgorithm)
+        $f!(adjoint(t), reverse(adjoint.(F)), _adjoint(alg))
+        return F
+    end
+
+    # disambiguate by prohibition
+    @eval function MAK.initialize_output(::typeof($f!), t::AdjointTensorMap,
+                                         alg::DiagonalAlgorithm)
+        throw(MethodError($f!, (t, alg)))
+    end
+end
+# avoid amgiguity
+function MAK.initialize_output(::typeof(svd_trunc!), t::AdjointTensorMap,
+                               alg::TruncatedAlgorithm)
+    return MAK.initialize_output(svd_compact!, t, alg.alg)
+end
+# to fix ambiguity
+function MAK.svd_trunc!(t::AdjointTensorMap, USVᴴ, alg::TruncatedAlgorithm)
+    USVᴴ′ = svd_compact!(t, USVᴴ, alg.alg)
+    return MAK.truncate(svd_trunc!, USVᴴ′, alg.trunc)
+end
+function MAK.svd_compact!(t::AdjointTensorMap, USVᴴ, alg::DiagonalAlgorithm)
+    return MAK.svd_compact!(t, USVᴴ, alg.alg)
+end
diff --git a/src/factorizations/diagonal.jl b/src/factorizations/diagonal.jl
new file mode 100644
index 000000000..8fa33fd20
--- /dev/null
+++ b/src/factorizations/diagonal.jl
@@ -0,0 +1,190 @@
+# DiagonalTensorMap
+# -----------------
+_repack_diagonal(d::DiagonalTensorMap) = Diagonal(d.data)
+
+for f in (:svd_compact, :svd_full, :svd_trunc, :svd_vals, :qr_compact, :qr_full, :qr_null,
+          :lq_compact, :lq_full, :lq_null, :eig_full, :eig_trunc, :eig_vals, :eigh_full,
+          :eigh_trunc, :eigh_vals, :left_polar, :right_polar)
+    @eval MAK.copy_input(::typeof($f), d::DiagonalTensorMap) = copy(d)
+end
+
+for f! in (:eig_full!, :eig_trunc!)
+    @eval function MAK.initialize_output(::typeof($f!), d::AbstractTensorMap,
+                                         ::DiagonalAlgorithm)
+        return d, similar(d)
+    end
+end
+
+for f! in (:eigh_full!, :eigh_trunc!)
+    @eval function MAK.initialize_output(::typeof($f!), d::AbstractTensorMap,
+                                         ::DiagonalAlgorithm)
+        if scalartype(d) <: Real
+            return d, similar(d)
+        else
+            return similar(d, real(scalartype(d))), similar(d)
+        end
+    end
+end
+
+for f! in (:qr_full!, :qr_compact!)
+    @eval function MAK.initialize_output(::typeof($f!), d::AbstractTensorMap,
+                                         ::DiagonalAlgorithm)
+        return d, similar(d)
+    end
+    # to avoid ambiguities
+    @eval function MAK.initialize_output(::typeof($f!), d::AdjointTensorMap,
+                                         ::DiagonalAlgorithm)
+        return d, similar(d)
+    end
+end
+for f! in (:lq_full!, :lq_compact!)
+    @eval function MAK.initialize_output(::typeof($f!), d::AbstractTensorMap,
+                                         ::DiagonalAlgorithm)
+        return similar(d), d
+    end
+    # to avoid ambiguities
+    @eval function MAK.initialize_output(::typeof($f!), d::AdjointTensorMap,
+                                         ::DiagonalAlgorithm)
+        return similar(d), d
+    end
+end
+
+function MAK.initialize_output(::typeof(left_orth!), d::DiagonalTensorMap)
+    return d, similar(d)
+end
+function MAK.initialize_output(::typeof(right_orth!), d::DiagonalTensorMap)
+    return similar(d), d
+end
+
+function MAK.initialize_output(::typeof(svd_full!), t::AbstractTensorMap,
+                               ::DiagonalAlgorithm)
+    V_cod = fuse(codomain(t))
+    V_dom = fuse(domain(t))
+    U = similar(t, codomain(t) ← V_cod)
+    S = DiagonalTensorMap{real(scalartype(t))}(undef, V_cod ← V_dom)
+    Vᴴ = similar(t, V_dom ← domain(t))
+    return U, S, Vᴴ
+end
+
+for f! in
+    (:qr_full!, :qr_compact!, :lq_full!, :lq_compact!, :eig_full!, :eig_trunc!, :eigh_full!,
+     :eigh_trunc!, :right_orth!, :left_orth!)
+    @eval function MAK.$f!(d::DiagonalTensorMap, F, alg::DiagonalAlgorithm)
+        MAK.check_input($f!, d, F, alg)
+        $f!(_repack_diagonal(d), _repack_diagonal.(F), alg)
+        return F
+    end
+end
+
+for f! in (:qr_full!, :qr_compact!)
+    @eval function MAK.check_input(::typeof($f!), d::AbstractTensorMap, QR,
+                                   ::DiagonalAlgorithm)
+        Q, R = QR
+        @assert d isa DiagonalTensorMap
+        @assert Q isa DiagonalTensorMap && R isa DiagonalTensorMap
+        @check_scalar Q d
+        @check_scalar R d
+        @check_space(Q, space(d))
+        @check_space(R, space(d))
+
+        return nothing
+    end
+end
+
+for f! in (:lq_full!, :lq_compact!)
+    @eval function MAK.check_input(::typeof($f!), d::AbstractTensorMap, LQ,
+                                   ::DiagonalAlgorithm)
+        L, Q = LQ
+        @assert d isa DiagonalTensorMap
+        @assert Q isa DiagonalTensorMap && L isa DiagonalTensorMap
+        @check_scalar Q d
+        @check_scalar L d
+        @check_space(Q, space(d))
+        @check_space(L, space(d))
+
+        return nothing
+    end
+end
+
+# disambiguate
+function MAK.svd_compact!(t::AbstractTensorMap, USVᴴ, alg::DiagonalAlgorithm)
+    return svd_full!(t, USVᴴ, alg)
+end
+
+# f_vals
+# ------
+
+for f! in (:eig_vals!, :eigh_vals!, :svd_vals!)
+    @eval function MAK.$f!(d::AbstractTensorMap, V, alg::DiagonalAlgorithm)
+        MAK.check_input($f!, d, V, alg)
+        $f!(_repack_diagonal(d), diagview(_repack_diagonal(V)), alg)
+        return V
+    end
+    @eval function MAK.initialize_output(::typeof($f!), d::DiagonalTensorMap,
+                                         alg::DiagonalAlgorithm)
+        data = MAK.initialize_output($f!, _repack_diagonal(d), alg)
+        return DiagonalTensorMap(data, d.domain)
+    end
+end
+
+function MAK.check_input(::typeof(eig_full!), t::AbstractTensorMap, DV, ::DiagonalAlgorithm)
+    domain(t) == codomain(t) ||
+        throw(ArgumentError("Eigenvalue decomposition requires square input tensor"))
+
+    D, V = DV
+
+    @assert D isa DiagonalTensorMap
+    @assert V isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar D t
+    @check_scalar V t
+
+    # space checks
+    @check_space D space(t)
+    @check_space V space(t)
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(eigh_full!), t::AbstractTensorMap, DV,
+                         ::DiagonalAlgorithm)
+    domain(t) == codomain(t) ||
+        throw(ArgumentError("Eigenvalue decomposition requires square input tensor"))
+
+    D, V = DV
+
+    @assert D isa DiagonalTensorMap
+    @assert V isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar D t real
+    @check_scalar V t
+
+    # space checks
+    @check_space D space(t)
+    @check_space V space(t)
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(eig_vals!), t::AbstractTensorMap, D, ::DiagonalAlgorithm)
+    @assert D isa DiagonalTensorMap
+    @check_scalar D t
+    @check_space D space(t)
+    return nothing
+end
+
+function MAK.check_input(::typeof(eigh_vals!), t::AbstractTensorMap, D, ::DiagonalAlgorithm)
+    @assert D isa DiagonalTensorMap
+    @check_scalar D t real
+    @check_space D space(t)
+    return nothing
+end
+
+function MAK.check_input(::typeof(svd_vals!), t::AbstractTensorMap, D, ::DiagonalAlgorithm)
+    @assert D isa DiagonalTensorMap
+    @check_scalar D t real
+    @check_space D space(t)
+    return nothing
+end
diff --git a/src/factorizations/factorizations.jl b/src/factorizations/factorizations.jl
new file mode 100644
index 000000000..310bf10a2
--- /dev/null
+++ b/src/factorizations/factorizations.jl
@@ -0,0 +1,99 @@
+# Tensor factorization
+#----------------------
+# using submodule here to import MatrixAlgebraKit functions without polluting namespace
+module Factorizations
+
+export copy_oftype, factorisation_scalartype, one!, truncspace
+
+using ..TensorKit
+using ..TensorKit: AdjointTensorMap, SectorDict, blocktype, foreachblock, one!
+
+using LinearAlgebra: LinearAlgebra, BlasFloat, Diagonal, svdvals, svdvals!, eigen, eigen!,
+                     isposdef, isposdef!, ishermitian
+
+using TensorOperations: Index2Tuple
+
+using MatrixAlgebraKit
+import MatrixAlgebraKit as MAK
+using MatrixAlgebraKit: AbstractAlgorithm, TruncatedAlgorithm, DiagonalAlgorithm
+using MatrixAlgebraKit: TruncationStrategy, NoTruncation, TruncationByValue,
+                        TruncationByError, TruncationIntersection, TruncationByFilter,
+                        TruncationByOrder
+using MatrixAlgebraKit: left_orth_polar!, right_orth_polar!, left_orth_svd!,
+                        right_orth_svd!, left_null_svd!, right_null_svd!, diagview
+
+include("utility.jl")
+include("matrixalgebrakit.jl")
+include("truncation.jl")
+include("adjoint.jl")
+include("diagonal.jl")
+include("pullbacks.jl")
+
+TensorKit.one!(A::AbstractMatrix) = MatrixAlgebraKit.one!(A)
+
+function MatrixAlgebraKit.isisometry(t::AbstractTensorMap, (p₁, p₂)::Index2Tuple)
+    t = permute(t, (p₁, p₂); copy=false)
+    return isisometry(t)
+end
+
+#------------------------------#
+# LinearAlgebra overloads
+#------------------------------#
+
+function LinearAlgebra.eigen(t::AbstractTensorMap; kwargs...)
+    return ishermitian(t) ? eigh_full(t; kwargs...) : eig_full(t; kwargs...)
+end
+function LinearAlgebra.eigen!(t::AbstractTensorMap; kwargs...)
+    return ishermitian(t) ? eigh_full!(t; kwargs...) : eig_full!(t; kwargs...)
+end
+
+function LinearAlgebra.eigvals(t::AbstractTensorMap; kwargs...)
+    tcopy = copy_oftype(t, factorisation_scalartype(eigen, t))
+    return LinearAlgebra.eigvals!(tcopy; kwargs...)
+end
+LinearAlgebra.eigvals!(t::AbstractTensorMap; kwargs...) = diagview(eig_vals!(t))
+
+function LinearAlgebra.svdvals(t::AbstractTensorMap)
+    tcopy = copy_oftype(t, factorisation_scalartype(tsvd, t))
+    return LinearAlgebra.svdvals!(tcopy)
+end
+LinearAlgebra.svdvals!(t::AbstractTensorMap) = diagview(svd_vals!(t))
+
+#--------------------------------------------------#
+# Checks for hermiticity and positive definiteness #
+#--------------------------------------------------#
+function LinearAlgebra.ishermitian(t::AbstractTensorMap)
+    domain(t) == codomain(t) || return false
+    InnerProductStyle(t) === EuclideanInnerProduct() || return false # hermiticity only defined for euclidean
+    for (c, b) in blocks(t)
+        ishermitian(b) || return false
+    end
+    return true
+end
+
+function LinearAlgebra.isposdef(t::AbstractTensorMap)
+    return isposdef!(copy_oftype(t, factorisation_scalartype(isposdef, t)))
+end
+function LinearAlgebra.isposdef!(t::AbstractTensorMap)
+    domain(t) == codomain(t) ||
+        throw(SpaceMismatch("`isposdef` requires domain and codomain to be the same"))
+    InnerProductStyle(spacetype(t)) === EuclideanInnerProduct() || return false
+    for (c, b) in blocks(t)
+        isposdef!(b) || return false
+    end
+    return true
+end
+
+# TODO: tolerances are per-block, not global or weighted - does that matter?
+function MatrixAlgebraKit.is_left_isometry(t::AbstractTensorMap; kwargs...)
+    domain(t) ≾ codomain(t) || return false
+    f((c, b)) = MatrixAlgebraKit.is_left_isometry(b; kwargs...)
+    return all(f, blocks(t))
+end
+function MatrixAlgebraKit.is_right_isometry(t::AbstractTensorMap; kwargs...)
+    domain(t) ≿ codomain(t) || return false
+    f((c, b)) = MatrixAlgebraKit.is_right_isometry(b; kwargs...)
+    return all(f, blocks(t))
+end
+
+end
diff --git a/src/factorizations/matrixalgebrakit.jl b/src/factorizations/matrixalgebrakit.jl
new file mode 100644
index 000000000..e67290603
--- /dev/null
+++ b/src/factorizations/matrixalgebrakit.jl
@@ -0,0 +1,681 @@
+# Algorithm selection
+# -------------------
+for f in
+    [:svd_compact, :svd_full, :svd_trunc, :svd_vals, :qr_compact, :qr_full, :qr_null,
+     :lq_compact, :lq_full, :lq_null, :eig_full, :eig_trunc, :eig_vals, :eigh_full,
+     :eigh_trunc, :eigh_vals, :left_polar, :right_polar]
+    f! = Symbol(f, :!)
+    @eval function MAK.default_algorithm(::typeof($f!), ::Type{T};
+                                         kwargs...) where {T<:AbstractTensorMap}
+        return MAK.default_algorithm($f!, blocktype(T); kwargs...)
+    end
+    @eval function MAK.copy_input(::typeof($f), t::AbstractTensorMap)
+        return copy_oftype(t, factorisation_scalartype($f, t))
+    end
+end
+
+_select_truncation(f, ::AbstractTensorMap, trunc::TruncationStrategy) = trunc
+function _select_truncation(::typeof(left_null!), ::AbstractTensorMap, trunc::NamedTuple)
+    return MAK.null_truncation_strategy(; trunc...)
+end
+
+# Generic Implementations
+# -----------------------
+for f! in (:qr_compact!, :qr_full!,
+           :lq_compact!, :lq_full!,
+           :eig_full!, :eigh_full!,
+           :svd_compact!, :svd_full!,
+           :left_polar!, :left_orth_polar!,
+           :right_polar!, :right_orth_polar!,
+           :left_orth!, :right_orth!)
+    @eval function MAK.$f!(t::AbstractTensorMap, F, alg::AbstractAlgorithm)
+        MAK.check_input($f!, t, F, alg)
+
+        foreachblock(t, F...) do _, bs
+            factors = Base.tail(bs)
+            factors′ = $f!(first(bs), factors, alg)
+            # deal with the case where the output is not in-place
+            for (f′, f) in zip(factors′, factors)
+                f′ === f || copy!(f, f′)
+            end
+            return nothing
+        end
+
+        return F
+    end
+end
+
+# Handle these separately because single output instead of tuple
+for f! in (:qr_null!, :lq_null!)
+    @eval function MAK.$f!(t::AbstractTensorMap, N, alg::AbstractAlgorithm)
+        MAK.check_input($f!, t, N, alg)
+
+        foreachblock(t, N) do _, (b, n)
+            n′ = $f!(b, n, alg)
+            # deal with the case where the output is not the same as the input
+            n === n′ || copy!(n, n′)
+            return nothing
+        end
+
+        return N
+    end
+end
+
+# Handle these separately because single output instead of tuple
+for f! in (:svd_vals!, :eig_vals!, :eigh_vals!)
+    @eval function MAK.$f!(t::AbstractTensorMap, N, alg::AbstractAlgorithm)
+        MAK.check_input($f!, t, N, alg)
+
+        foreachblock(t, N) do _, (b, n)
+            n′ = $f!(b, diagview(n), alg)
+            # deal with the case where the output is not the same as the input
+            diagview(n) === n′ || copy!(diagview(n), n′)
+            return nothing
+        end
+
+        return N
+    end
+end
+
+# Singular value decomposition
+# ----------------------------
+function MAK.check_input(::typeof(svd_full!), t::AbstractTensorMap, USVᴴ,
+                         ::AbstractAlgorithm)
+    U, S, Vᴴ = USVᴴ
+
+    # type checks
+    @assert U isa AbstractTensorMap
+    @assert S isa AbstractTensorMap
+    @assert Vᴴ isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar U t
+    @check_scalar S t real
+    @check_scalar Vᴴ t
+
+    # space checks
+    V_cod = fuse(codomain(t))
+    V_dom = fuse(domain(t))
+    @check_space(U, codomain(t) ← V_cod)
+    @check_space(S, V_cod ← V_dom)
+    @check_space(Vᴴ, V_dom ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(svd_compact!), t::AbstractTensorMap, USVᴴ,
+                         ::AbstractAlgorithm)
+    U, S, Vᴴ = USVᴴ
+
+    # type checks
+    @assert U isa AbstractTensorMap
+    @assert S isa DiagonalTensorMap
+    @assert Vᴴ isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar U t
+    @check_scalar S t real
+    @check_scalar Vᴴ t
+
+    # space checks
+    V_cod = V_dom = infimum(fuse(codomain(t)), fuse(domain(t)))
+    @check_space(U, codomain(t) ← V_cod)
+    @check_space(S, V_cod ← V_dom)
+    @check_space(Vᴴ, V_dom ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(svd_vals!), t::AbstractTensorMap, D, ::AbstractAlgorithm)
+    @check_scalar D t real
+    @assert D isa DiagonalTensorMap
+    V_cod = V_dom = infimum(fuse(codomain(t)), fuse(domain(t)))
+    @check_space(D, V_cod ← V_dom)
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(svd_full!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_cod = fuse(codomain(t))
+    V_dom = fuse(domain(t))
+    U = similar(t, codomain(t) ← V_cod)
+    S = similar(t, real(scalartype(t)), V_cod ← V_dom)
+    Vᴴ = similar(t, V_dom ← domain(t))
+    return U, S, Vᴴ
+end
+
+function MAK.initialize_output(::typeof(svd_compact!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_cod = V_dom = infimum(fuse(codomain(t)), fuse(domain(t)))
+    U = similar(t, codomain(t) ← V_cod)
+    S = DiagonalTensorMap{real(scalartype(t))}(undef, V_cod)
+    Vᴴ = similar(t, V_dom ← domain(t))
+    return U, S, Vᴴ
+end
+
+# TODO: remove this once `AbstractMatrix` specialization is removed in MatrixAlgebraKit
+function MAK.initialize_output(::typeof(svd_trunc!), t::AbstractTensorMap,
+                               alg::TruncatedAlgorithm)
+    return MAK.initialize_output(svd_compact!, t, alg.alg)
+end
+
+function MAK.initialize_output(::typeof(svd_vals!), t::AbstractTensorMap,
+                               alg::AbstractAlgorithm)
+    V_cod = infimum(fuse(codomain(t)), fuse(domain(t)))
+    return DiagonalTensorMap{real(scalartype(t))}(undef, V_cod)
+end
+
+# Eigenvalue decomposition
+# ------------------------
+function MAK.check_input(::typeof(eigh_full!), t::AbstractTensorMap, DV,
+                         ::AbstractAlgorithm)
+    domain(t) == codomain(t) ||
+        throw(ArgumentError("Eigenvalue decomposition requires square input tensor"))
+
+    D, V = DV
+
+    # type checks
+    @assert D isa DiagonalTensorMap
+    @assert V isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar D t real
+    @check_scalar V t
+
+    # space checks
+    V_D = fuse(domain(t))
+    @check_space(D, V_D ← V_D)
+    @check_space(V, codomain(t) ← V_D)
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(eig_full!), t::AbstractTensorMap, DV, ::AbstractAlgorithm)
+    domain(t) == codomain(t) ||
+        throw(ArgumentError("Eigenvalue decomposition requires square input tensor"))
+
+    D, V = DV
+
+    # type checks
+    @assert D isa DiagonalTensorMap
+    @assert V isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar D t complex
+    @check_scalar V t complex
+
+    # space checks
+    V_D = fuse(domain(t))
+    @check_space(D, V_D ← V_D)
+    @check_space(V, codomain(t) ← V_D)
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(eigh_vals!), t::AbstractTensorMap, D, ::AbstractAlgorithm)
+    @check_scalar D t real
+    @assert D isa DiagonalTensorMap
+    V_D = fuse(domain(t))
+    @check_space(D, V_D ← V_D)
+    return nothing
+end
+
+function MAK.check_input(::typeof(eig_vals!), t::AbstractTensorMap, D, ::AbstractAlgorithm)
+    @check_scalar D t complex
+    @assert D isa DiagonalTensorMap
+    V_D = fuse(domain(t))
+    @check_space(D, V_D ← V_D)
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(eigh_full!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_D = fuse(domain(t))
+    T = real(scalartype(t))
+    D = DiagonalTensorMap{T}(undef, V_D)
+    V = similar(t, codomain(t) ← V_D)
+    return D, V
+end
+
+function MAK.initialize_output(::typeof(eig_full!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_D = fuse(domain(t))
+    Tc = complex(scalartype(t))
+    D = DiagonalTensorMap{Tc}(undef, V_D)
+    V = similar(t, Tc, codomain(t) ← V_D)
+    return D, V
+end
+
+function MAK.initialize_output(::typeof(eigh_vals!), t::AbstractTensorMap,
+                               alg::AbstractAlgorithm)
+    V_D = fuse(domain(t))
+    T = real(scalartype(t))
+    return D = DiagonalTensorMap{Tc}(undef, V_D)
+end
+
+function MAK.initialize_output(::typeof(eig_vals!), t::AbstractTensorMap,
+                               alg::AbstractAlgorithm)
+    V_D = fuse(domain(t))
+    Tc = complex(scalartype(t))
+    return D = DiagonalTensorMap{Tc}(undef, V_D)
+end
+
+# QR decomposition
+# ----------------
+function MAK.check_input(::typeof(qr_full!), t::AbstractTensorMap, QR, ::AbstractAlgorithm)
+    Q, R = QR
+
+    # type checks
+    @assert Q isa AbstractTensorMap
+    @assert R isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar Q t
+    @check_scalar R t
+
+    # space checks
+    V_Q = fuse(codomain(t))
+    @check_space(Q, codomain(t) ← V_Q)
+    @check_space(R, V_Q ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(qr_compact!), t::AbstractTensorMap, QR,
+                         ::AbstractAlgorithm)
+    Q, R = QR
+
+    # type checks
+    @assert Q isa AbstractTensorMap
+    @assert R isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar Q t
+    @check_scalar R t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    @check_space(Q, codomain(t) ← V_Q)
+    @check_space(R, V_Q ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(qr_null!), t::AbstractTensorMap, N, ::AbstractAlgorithm)
+    # scalartype checks
+    @check_scalar N t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(codomain(t)), V_Q)
+    @check_space(N, codomain(t) ← V_N)
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(qr_full!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = fuse(codomain(t))
+    Q = similar(t, codomain(t) ← V_Q)
+    R = similar(t, V_Q ← domain(t))
+    return Q, R
+end
+
+function MAK.initialize_output(::typeof(qr_compact!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    Q = similar(t, codomain(t) ← V_Q)
+    R = similar(t, V_Q ← domain(t))
+    return Q, R
+end
+
+function MAK.initialize_output(::typeof(qr_null!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(codomain(t)), V_Q)
+    N = similar(t, codomain(t) ← V_N)
+    return N
+end
+
+# LQ decomposition
+# ----------------
+function MAK.check_input(::typeof(lq_full!), t::AbstractTensorMap, LQ, ::AbstractAlgorithm)
+    L, Q = LQ
+
+    # type checks
+    @assert L isa AbstractTensorMap
+    @assert Q isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar L t
+    @check_scalar Q t
+
+    # space checks
+    V_Q = fuse(domain(t))
+    @check_space(L, codomain(t) ← V_Q)
+    @check_space(Q, V_Q ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(lq_compact!), t::AbstractTensorMap, LQ,
+                         ::AbstractAlgorithm)
+    L, Q = LQ
+
+    # type checks
+    @assert L isa AbstractTensorMap
+    @assert Q isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar L t
+    @check_scalar Q t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    @check_space(L, codomain(t) ← V_Q)
+    @check_space(Q, V_Q ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(lq_null!), t::AbstractTensorMap, N, ::AbstractAlgorithm)
+    # scalartype checks
+    @check_scalar N t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(domain(t)), V_Q)
+    @check_space(N, V_N ← domain(t))
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(lq_full!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = fuse(domain(t))
+    L = similar(t, codomain(t) ← V_Q)
+    Q = similar(t, V_Q ← domain(t))
+    return L, Q
+end
+
+function MAK.initialize_output(::typeof(lq_compact!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    L = similar(t, codomain(t) ← V_Q)
+    Q = similar(t, V_Q ← domain(t))
+    return L, Q
+end
+
+function MAK.initialize_output(::typeof(lq_null!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(domain(t)), V_Q)
+    N = similar(t, V_N ← domain(t))
+    return N
+end
+
+# Polar decomposition
+# -------------------
+function MAK.check_input(::typeof(left_polar!), t::AbstractTensorMap, WP,
+                         ::AbstractAlgorithm)
+    codomain(t) ≿ domain(t) ||
+        throw(ArgumentError("Polar decomposition requires `codomain(t) ≿ domain(t)`"))
+
+    W, P = WP
+    @assert W isa AbstractTensorMap
+    @assert P isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar W t
+    @check_scalar P t
+
+    # space checks
+    @check_space(W, space(t))
+    @check_space(P, domain(t) ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(left_orth_polar!), t::AbstractTensorMap, WP,
+                         ::AbstractAlgorithm)
+    codomain(t) ≿ domain(t) ||
+        throw(ArgumentError("Polar decomposition requires `codomain(t) ≿ domain(t)`"))
+
+    W, P = WP
+    @assert W isa AbstractTensorMap
+    @assert P isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar W t
+    @check_scalar P t
+
+    # space checks
+    VW = fuse(domain(t))
+    @check_space(W, codomain(t) ← VW)
+    @check_space(P, VW ← domain(t))
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(left_polar!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    W = similar(t, space(t))
+    P = similar(t, domain(t) ← domain(t))
+    return W, P
+end
+
+function MAK.check_input(::typeof(right_polar!), t::AbstractTensorMap, PWᴴ,
+                         ::AbstractAlgorithm)
+    codomain(t) ≾ domain(t) ||
+        throw(ArgumentError("Polar decomposition requires `domain(t) ≿ codomain(t)`"))
+
+    P, Wᴴ = PWᴴ
+    @assert P isa AbstractTensorMap
+    @assert Wᴴ isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar P t
+    @check_scalar Wᴴ t
+
+    # space checks
+    @check_space(P, codomain(t) ← codomain(t))
+    @check_space(Wᴴ, space(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(right_orth_polar!), t::AbstractTensorMap, PWᴴ,
+                         ::AbstractAlgorithm)
+    codomain(t) ≾ domain(t) ||
+        throw(ArgumentError("Polar decomposition requires `domain(t) ≿ codomain(t)`"))
+
+    P, Wᴴ = PWᴴ
+    @assert P isa AbstractTensorMap
+    @assert Wᴴ isa AbstractTensorMap
+
+    # scalartype checks
+    @check_scalar P t
+    @check_scalar Wᴴ t
+
+    # space checks
+    VW = fuse(codomain(t))
+    @check_space(P, codomain(t) ← VW)
+    @check_space(Wᴴ, VW ← domain(t))
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(right_polar!), t::AbstractTensorMap,
+                               ::AbstractAlgorithm)
+    P = similar(t, codomain(t) ← codomain(t))
+    Wᴴ = similar(t, space(t))
+    return P, Wᴴ
+end
+
+# Orthogonalization
+# -----------------
+function MAK.check_input(::typeof(left_orth!), t::AbstractTensorMap, VC,
+                         ::AbstractAlgorithm)
+    V, C = VC
+
+    # scalartype checks
+    @check_scalar V t
+    isnothing(C) || @check_scalar C t
+
+    # space checks
+    V_C = infimum(fuse(codomain(t)), fuse(domain(t)))
+    @check_space(V, codomain(t) ← V_C)
+    isnothing(C) || @check_space(C, V_C ← domain(t))
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(right_orth!), t::AbstractTensorMap, CVᴴ,
+                         ::AbstractAlgorithm)
+    C, Vᴴ = CVᴴ
+
+    # scalartype checks
+    isnothing(C) || @check_scalar C t
+    @check_scalar Vᴴ t
+
+    # space checks
+    V_C = infimum(fuse(codomain(t)), fuse(domain(t)))
+    isnothing(C) || @check_space(C, codomain(t) ← V_C)
+    @check_space(Vᴴ, V_C ← domain(t))
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(left_orth!), t::AbstractTensorMap)
+    V_C = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V = similar(t, codomain(t) ← V_C)
+    C = similar(t, V_C ← domain(t))
+    return V, C
+end
+
+function MAK.initialize_output(::typeof(right_orth!), t::AbstractTensorMap)
+    V_C = infimum(fuse(codomain(t)), fuse(domain(t)))
+    C = similar(t, codomain(t) ← V_C)
+    Vᴴ = similar(t, V_C ← domain(t))
+    return C, Vᴴ
+end
+
+# This is a rework of the dispatch logic in order to avoid having to deal with having to
+# allocate the output before knowing the kind of decomposition. In particular, here I disable
+# providing output arguments for left_ and right_orth.
+# This is mainly because polar decompositions have different shapes, and SVD for Diagonal
+# also does
+function MAK.left_orth!(t::AbstractTensorMap;
+                        trunc::TruncationStrategy=notrunc(),
+                        kind=trunc == notrunc() ? :qr : :svd,
+                        alg_qr=(; positive=true), alg_polar=(;), alg_svd=(;))
+    trunc == notrunc() || kind === :svd ||
+        throw(ArgumentError("truncation not supported for left_orth with kind = $kind"))
+
+    return if kind === :qr
+        alg_qr isa NamedTuple ? qr_compact!(t; alg_qr...) : qr_compact!(t; alg=alg_qr)
+    elseif kind === :polar
+        alg_polar isa NamedTuple ? left_orth_polar!(t; alg_polar...) :
+        left_orth_polar!(t; alg=alg_polar)
+    elseif kind === :svd
+        alg_svd isa NamedTuple ? left_orth_svd!(t; trunc, alg_svd...) :
+        left_orth_svd!(t; trunc, alg=alg_svd)
+    else
+        throw(ArgumentError(lazy"`left_orth!` received unknown value `kind = $kind`"))
+    end
+end
+function MAK.right_orth!(t::AbstractTensorMap;
+                         trunc::TruncationStrategy=notrunc(),
+                         kind=trunc == notrunc() ? :lq : :svd,
+                         alg_lq=(; positive=true), alg_polar=(;), alg_svd=(;))
+    trunc == notrunc() || kind === :svd ||
+        throw(ArgumentError("truncation not supported for right_orth with kind = $kind"))
+
+    return if kind === :lq
+        alg_lq isa NamedTuple ? lq_compact!(t; alg_lq...) : lq_compact!(t; alg=alg_lq)
+    elseif kind === :polar
+        alg_polar isa NamedTuple ? right_orth_polar!(t; alg_polar...) :
+        right_orth_polar!(t; alg=alg_polar)
+    elseif kind === :svd
+        alg_svd isa NamedTuple ? right_orth_svd!(t; trunc, alg_svd...) :
+        right_orth_svd!(t; trunc, alg=alg_svd)
+    else
+        throw(ArgumentError(lazy"`right_orth!` received unknown value `kind = $kind`"))
+    end
+end
+
+function MAK.left_orth_polar!(t::AbstractTensorMap; alg=nothing, kwargs...)
+    alg′ = MAK.select_algorithm(left_polar!, t, alg; kwargs...)
+    VC = MAK.initialize_output(left_orth!, t)
+    return left_orth_polar!(t, VC, alg′)
+end
+function MAK.left_orth_polar!(t::AbstractTensorMap, VC, alg)
+    alg′ = MAK.select_algorithm(left_polar!, t, alg)
+    return left_orth_polar!(t, VC, alg′)
+end
+function MAK.right_orth_polar!(t::AbstractTensorMap; alg=nothing, kwargs...)
+    alg′ = MAK.select_algorithm(right_polar!, t, alg; kwargs...)
+    CVᴴ = MAK.initialize_output(right_orth!, t)
+    return right_orth_polar!(t, CVᴴ, alg′)
+end
+function MAK.right_orth_polar!(t::AbstractTensorMap, CVᴴ, alg)
+    alg′ = MAK.select_algorithm(right_polar!, t, alg)
+    return right_orth_polar!(t, CVᴴ, alg′)
+end
+
+function MAK.left_orth_svd!(t::AbstractTensorMap; trunc=notrunc(), kwargs...)
+    U, S, Vᴴ = trunc == notrunc() ? svd_compact!(t; kwargs...) :
+               svd_trunc!(t; trunc, kwargs...)
+    return U, lmul!(S, Vᴴ)
+end
+function MAK.right_orth_svd!(t::AbstractTensorMap; trunc=notrunc(), kwargs...)
+    U, S, Vᴴ = trunc == notrunc() ? svd_compact!(t; kwargs...) :
+               svd_trunc!(t; trunc, kwargs...)
+    return rmul!(U, S), Vᴴ
+end
+
+# Nullspace
+# ---------
+function MAK.check_input(::typeof(left_null!), t::AbstractTensorMap, N, ::AbstractAlgorithm)
+    # scalartype checks
+    @check_scalar N t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(codomain(t)), V_Q)
+    @check_space(N, codomain(t) ← V_N)
+
+    return nothing
+end
+
+function MAK.check_input(::typeof(right_null!), t::AbstractTensorMap, N,
+                         ::AbstractAlgorithm)
+    @check_scalar N t
+
+    # space checks
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(domain(t)), V_Q)
+    @check_space(N, V_N ← domain(t))
+
+    return nothing
+end
+
+function MAK.initialize_output(::typeof(left_null!), t::AbstractTensorMap)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(codomain(t)), V_Q)
+    N = similar(t, codomain(t) ← V_N)
+    return N
+end
+
+function MAK.initialize_output(::typeof(right_null!), t::AbstractTensorMap)
+    V_Q = infimum(fuse(codomain(t)), fuse(domain(t)))
+    V_N = ⊖(fuse(domain(t)), V_Q)
+    N = similar(t, V_N ← domain(t))
+    return N
+end
+
+for (f!, f_svd!) in zip((:left_null!, :right_null!), (:left_null_svd!, :right_null_svd!))
+    @eval function MAK.$f_svd!(t::AbstractTensorMap, N, alg, ::Nothing=nothing)
+        return $f!(t, N; alg_svd=alg)
+    end
+end
diff --git a/src/factorizations/pullbacks.jl b/src/factorizations/pullbacks.jl
new file mode 100644
index 000000000..392304bd5
--- /dev/null
+++ b/src/factorizations/pullbacks.jl
@@ -0,0 +1,53 @@
+for pullback! in (:qr_pullback!, :lq_pullback!,
+                  :left_polar_pullback!, :right_polar_pullback!)
+    @eval function MAK.$pullback!(Δt::AbstractTensorMap, t::AbstractTensorMap,
+                                  F, ΔF; kwargs...)
+        foreachblock(Δt, t) do c, (Δb, b)
+            Fc = block.(F, Ref(c))
+            ΔFc = block.(ΔF, Ref(c))
+            return MAK.$pullback!(Δb, b, Fc, ΔFc; kwargs...)
+        end
+        return Δt
+    end
+end
+for pullback! in (:qr_null_pullback!, :lq_null_pullback!)
+    @eval function MAK.$pullback!(Δt::AbstractTensorMap, t::AbstractTensorMap,
+                                  F, ΔF; kwargs...)
+        foreachblock(Δt, t) do c, (Δb, b)
+            Fc = block(F, c)
+            ΔFc = block(ΔF, c)
+            return MAK.$pullback!(Δb, b, Fc, ΔFc; kwargs...)
+        end
+        return Δt
+    end
+end
+
+_notrunc_ind(t) = SectorDict(c => Colon() for c in blocksectors(t))
+
+for pullback! in (:svd_pullback!, :eig_pullback!, :eigh_pullback!)
+    @eval function MAK.$pullback!(Δt::AbstractTensorMap, t::AbstractTensorMap,
+                                  F, ΔF, inds=_notrunc_ind(t);
+                                  kwargs...)
+        for (c, ind) in inds
+            Δb = block(Δt, c)
+            b = block(t, c)
+            Fc = block.(F, Ref(c))
+            ΔFc = block.(ΔF, Ref(c))
+            MAK.$pullback!(Δb, b, Fc, ΔFc, ind; kwargs...)
+        end
+        return Δt
+    end
+end
+
+for pullback_trunc! in (:svd_trunc_pullback!, :eig_trunc_pullback!, :eigh_trunc_pullback!)
+    @eval function MAK.$pullback_trunc!(Δt::AbstractTensorMap,
+                                        t::AbstractTensorMap,
+                                        F, ΔF; kwargs...)
+        foreachblock(Δt, t) do c, (Δb, b)
+            Fc = block.(F, Ref(c))
+            ΔFc = block.(ΔF, Ref(c))
+            return MAK.$pullback_trunc!(Δb, b, Fc, ΔFc; kwargs...)
+        end
+        return Δt
+    end
+end
diff --git a/src/factorizations/truncation.jl b/src/factorizations/truncation.jl
new file mode 100644
index 000000000..35ae0df44
--- /dev/null
+++ b/src/factorizations/truncation.jl
@@ -0,0 +1,230 @@
+# Strategies
+# ----------
+"""
+    TruncationSpace(V::ElementarySpace, by::Function, rev::Bool)
+
+Truncation strategy to keep the first values for each sector when sorted according to `by` and `rev`,
+such that the resulting vector space is no greater than `V`.
+
+See also [`truncspace`](@ref).
+"""
+struct TruncationSpace{S<:ElementarySpace,F} <: TruncationStrategy
+    space::S
+    by::F
+    rev::Bool
+end
+
+"""
+    truncspace(space::ElementarySpace; by=abs, rev::Bool=true)
+
+Truncation strategy to keep the first values for each sector when sorted according to `by` and `rev`,
+such that the resulting vector space is no greater than `V`.
+"""
+function truncspace(space::ElementarySpace; by=abs, rev::Bool=true)
+    isdual(space) && throw(ArgumentError("resulting vector space is never dual"))
+    return TruncationSpace(space, by, rev)
+end
+
+# truncate!
+# ---------
+_blocklength(d::Integer, ind) = _blocklength(Base.OneTo(d), ind)
+_blocklength(ax, ind) = length(ax[ind])
+function truncate_space(V::ElementarySpace, inds)
+    return spacetype(V)(c => _blocklength(dim(V, c), ind) for (c, ind) in inds)
+end
+
+function truncate_domain!(tdst::AbstractTensorMap, tsrc::AbstractTensorMap, inds)
+    for (c, b) in blocks(tdst)
+        I = get(inds, c, nothing)
+        @assert !isnothing(I)
+        copy!(b, @view(block(tsrc, c)[:, I]))
+    end
+    return tdst
+end
+function truncate_codomain!(tdst::AbstractTensorMap, tsrc::AbstractTensorMap, inds)
+    for (c, b) in blocks(tdst)
+        I = get(inds, c, nothing)
+        @assert !isnothing(I)
+        copy!(b, @view(block(tsrc, c)[I, :]))
+    end
+    return tdst
+end
+function truncate_diagonal!(Ddst::DiagonalTensorMap, Dsrc::DiagonalTensorMap, inds)
+    for (c, b) in blocks(Ddst)
+        I = get(inds, c, nothing)
+        @assert !isnothing(I)
+        copy!(diagview(b), view(diagview(block(Dsrc, c)), I))
+    end
+    return Ddst
+end
+
+function MAK.truncate(::typeof(svd_trunc!), (U, S, Vᴴ)::NTuple{3,AbstractTensorMap},
+                      strategy::TruncationStrategy)
+    ind = MAK.findtruncated_svd(diagview(S), strategy)
+    V_truncated = truncate_space(space(S, 1), ind)
+
+    Ũ = similar(U, codomain(U) ← V_truncated)
+    truncate_domain!(Ũ, U, ind)
+    S̃ = DiagonalTensorMap{scalartype(S)}(undef, V_truncated)
+    truncate_diagonal!(S̃, S, ind)
+    Ṽᴴ = similar(Vᴴ, V_truncated ← domain(Vᴴ))
+    truncate_codomain!(Ṽᴴ, Vᴴ, ind)
+
+    return (Ũ, S̃, Ṽᴴ), ind
+end
+
+function MAK.truncate(::typeof(left_null!),
+                      (U, S)::Tuple{AbstractTensorMap,AbstractTensorMap},
+                      strategy::MatrixAlgebraKit.TruncationStrategy)
+    extended_S = SectorDict(c => vcat(diagview(b),
+                                      zeros(eltype(b), max(0, size(b, 2) - size(b, 1))))
+                            for (c, b) in blocks(S))
+    ind = MAK.findtruncated(extended_S, strategy)
+    V_truncated = truncate_space(space(S, 1), ind)
+    Ũ = similar(U, codomain(U) ← V_truncated)
+    truncate_domain!(Ũ, U, ind)
+    return Ũ, ind
+end
+
+for f! in (:eig_trunc!, :eigh_trunc!)
+    @eval function MAK.truncate(::typeof($f!),
+                                (D, V)::Tuple{DiagonalTensorMap,AbstractTensorMap},
+                                strategy::TruncationStrategy)
+        ind = MAK.findtruncated(diagview(D), strategy)
+        V_truncated = truncate_space(space(D, 1), ind)
+
+        D̃ = DiagonalTensorMap{scalartype(D)}(undef, V_truncated)
+        truncate_diagonal!(D̃, D, ind)
+
+        Ṽ = similar(V, codomain(V) ← V_truncated)
+        truncate_domain!(Ṽ, V, ind)
+
+        return (D̃, Ṽ), ind
+    end
+end
+
+# Find truncation
+# ---------------
+# auxiliary functions
+rtol_to_atol(S, p, atol, rtol) = rtol > 0 ? max(atol, TensorKit._norm(S, p) * rtol) : atol
+
+function _compute_truncerr(Σdata, truncdim, p=2)
+    I = keytype(Σdata)
+    S = scalartype(valtype(Σdata))
+    return TensorKit._norm((c => @view(v[(get(truncdim, c, 0) + 1):end])
+                            for (c, v) in Σdata),
+                           p, zero(S))
+end
+
+function _findnexttruncvalue(S, truncdim::SectorDict{I,Int}; by=identity,
+                             rev::Bool=true) where {I<:Sector}
+    # early return
+    (isempty(S) || all(iszero, values(truncdim))) && return nothing
+    if rev
+        σmin, imin = findmin(keys(truncdim)) do c
+            d = truncdim[c]
+            return by(S[c][d])
+        end
+        return σmin, keys(truncdim)[imin]
+    else
+        σmax, imax = findmax(keys(truncdim)) do c
+            d = truncdim[c]
+            return by(S[c][d])
+        end
+        return σmax, keys(truncdim)[imax]
+    end
+end
+
+# findtruncated
+# -------------
+# Generic fallback
+function MAK.findtruncated_svd(values::SectorDict, strategy::TruncationStrategy)
+    return MAK.findtruncated(values, strategy)
+end
+
+function MAK.findtruncated(values::SectorDict, ::NoTruncation)
+    return SectorDict(c => Colon() for (c, b) in values)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationByOrder)
+    perms = SectorDict(c => (sortperm(d; strategy.by, strategy.rev)) for (c, d) in values)
+    values_sorted = SectorDict(c => d[perms[c]] for (c, d) in values)
+    inds = MAK.findtruncated_svd(values_sorted, truncrank(strategy.howmany))
+    return SectorDict(c => perms[c][I] for (c, I) in inds)
+end
+function MAK.findtruncated_svd(values::SectorDict, strategy::TruncationByOrder)
+    I = keytype(values)
+    truncdim = SectorDict{I,Int}(c => length(d) for (c, d) in values)
+    totaldim = sum(dim(c) * d for (c, d) in truncdim; init=0)
+    while true
+        next = _findnexttruncvalue(values, truncdim; strategy.by, strategy.rev)
+        isnothing(next) && break
+        _, cmin = next
+        truncdim[cmin] -= 1
+        totaldim -= dim(cmin)
+        truncdim[cmin] == 0 && delete!(truncdim, cmin)
+        totaldim <= strategy.howmany && break
+    end
+    return SectorDict(c => Base.OneTo(d) for (c, d) in truncdim)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationByFilter)
+    return SectorDict(c => findall(strategy.filter, d) for (c, d) in values)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationByValue)
+    atol = rtol_to_atol(values, strategy.p, strategy.atol, strategy.rtol)
+    strategy′ = trunctol(; atol, strategy.by, strategy.keep_below)
+    return SectorDict(c => MAK.findtruncated(d, strategy′) for (c, d) in values)
+end
+function MAK.findtruncated_svd(values::SectorDict, strategy::TruncationByValue)
+    atol = rtol_to_atol(values, strategy.p, strategy.atol, strategy.rtol)
+    strategy′ = trunctol(; atol, strategy.by, strategy.keep_below)
+    return SectorDict(c => MAK.findtruncated_svd(d, strategy′) for (c, d) in values)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationByError)
+    perms = SectorDict(c => sortperm(d; by=abs, rev=true) for (c, d) in values)
+    values_sorted = SectorDict(c => d[perms[c]] for (c, d) in Sd)
+    inds = MAK.findtruncated_svd(values_sorted, truncrank(strategy.howmany))
+    return SectorDict(c => perms[c][I] for (c, I) in inds)
+end
+function MAK.findtruncated_svd(values::SectorDict, strategy::TruncationByError)
+    I = keytype(values)
+    truncdim = SectorDict{I,Int}(c => length(d) for (c, d) in values)
+    by(c, v) = abs(v)^strategy.p * dim(c)
+    Nᵖ = sum(((c, v),) -> sum(Base.Fix1(by, c), v), values)
+    ϵᵖ = max(strategy.atol^strategy.p, strategy.rtol^strategy.p * Nᵖ)
+    truncerrᵖ = zero(real(scalartype(valtype(values))))
+    next = _findnexttruncvalue(values, truncdim)
+    while !isnothing(next)
+        σmin, cmin = next
+        truncerrᵖ += by(cmin, σmin)
+        truncerrᵖ >= ϵᵖ && break
+        (truncdim[cmin] -= 1) == 0 && delete!(truncdim, cmin)
+        next = _findnexttruncvalue(values, truncdim)
+    end
+    return SectorDict{I,Base.OneTo{Int}}(c => Base.OneTo(d) for (c, d) in truncdim)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationSpace)
+    blockstrategy(c) = truncrank(dim(strategy.space, c); strategy.by, strategy.rev)
+    return SectorDict(c => MAK.findtruncated(d, blockstrategy(c)) for (c, d) in values)
+end
+function MAK.findtruncated_svd(values::SectorDict, strategy::TruncationSpace)
+    blockstrategy(c) = truncrank(dim(strategy.space, c); strategy.by, strategy.rev)
+    return SectorDict(c => MAK.findtruncated_svd(d, blockstrategy(c)) for (c, d) in values)
+end
+
+function MAK.findtruncated(values::SectorDict, strategy::TruncationIntersection)
+    inds = map(Base.Fix1(MAK.findtruncated, values), strategy)
+    return SectorDict(c => mapreduce(Base.Fix2(getindex, c), _ind_intersect, inds;
+                                     init=trues(length(values[c])))
+                      for c in intersect(map(keys, inds)...))
+end
+function MAK.findtruncated_svd(Sd::SectorDict, strategy::TruncationIntersection)
+    inds = map(Base.Fix1(MAK.findtruncated_svd, Sd), strategy)
+    return SectorDict(c => mapreduce(Base.Fix2(getindex, c), _ind_intersect, inds;
+                                     init=trues(length(values[c])))
+                      for c in intersect(map(keys, inds)...))
+end
diff --git a/src/factorizations/utility.jl b/src/factorizations/utility.jl
new file mode 100644
index 000000000..46e88c8a9
--- /dev/null
+++ b/src/factorizations/utility.jl
@@ -0,0 +1,26 @@
+# convenience to set default
+macro check_space(x, V)
+    return esc(:($MatrixAlgebraKit.@check_size($x, $V, $space)))
+end
+macro check_scalar(x, y, op=:identity, eltype=:scalartype)
+    return esc(:($MatrixAlgebraKit.@check_scalar($x, $y, $op, $eltype)))
+end
+
+function factorisation_scalartype(t::AbstractTensorMap)
+    T = scalartype(t)
+    return promote_type(Float32, typeof(zero(T) / sqrt(abs2(one(T)))))
+end
+factorisation_scalartype(f, t) = factorisation_scalartype(t)
+
+function copy_oftype(t::AbstractTensorMap, T::Type{<:Number})
+    return copy!(similar(t, T, space(t)), t)
+end
+
+function _reverse!(t::AbstractTensorMap; dims=:)
+    for (c, b) in blocks(t)
+        reverse!(b; dims)
+    end
+    return t
+end
+
+MAK.diagview(t::AbstractTensorMap) = SectorDict(c => diagview(b) for (c, b) in blocks(t))
diff --git a/src/spaces/cartesianspace.jl b/src/spaces/cartesianspace.jl
index f29ed263d..fe12f3dc6 100644
--- a/src/spaces/cartesianspace.jl
+++ b/src/spaces/cartesianspace.jl
@@ -49,7 +49,13 @@ sectortype(::Type{CartesianSpace}) = Trivial
 
 Base.oneunit(::Type{CartesianSpace}) = CartesianSpace(1)
 Base.zero(::Type{CartesianSpace}) = CartesianSpace(0)
+
 ⊕(V₁::CartesianSpace, V₂::CartesianSpace) = CartesianSpace(V₁.d + V₂.d)
+function ⊖(V::CartesianSpace, W::CartesianSpace)
+    V ≿ W || throw(ArgumentError("$(W) is not a subspace of $(V)"))
+    return CartesianSpace(dim(V) - dim(W))
+end
+
 fuse(V₁::CartesianSpace, V₂::CartesianSpace) = CartesianSpace(V₁.d * V₂.d)
 flip(V::CartesianSpace) = V
 
diff --git a/src/spaces/complexspace.jl b/src/spaces/complexspace.jl
index ff05888b8..1031db614 100644
--- a/src/spaces/complexspace.jl
+++ b/src/spaces/complexspace.jl
@@ -50,11 +50,18 @@ Base.conj(V::ComplexSpace) = ComplexSpace(dim(V), !isdual(V))
 
 Base.oneunit(::Type{ComplexSpace}) = ComplexSpace(1)
 Base.zero(::Type{ComplexSpace}) = ComplexSpace(0)
+
 function ⊕(V₁::ComplexSpace, V₂::ComplexSpace)
     return isdual(V₁) == isdual(V₂) ?
            ComplexSpace(dim(V₁) + dim(V₂), isdual(V₁)) :
            throw(SpaceMismatch("Direct sum of a vector space and its dual does not exist"))
 end
+function ⊖(V::ComplexSpace, W::ComplexSpace)
+    (V ≿ W && isdual(V) == isdual(W)) ||
+        throw(ArgumentError("$(W) is not a subspace of $(V)"))
+    return ComplexSpace(dim(V) - dim(W), isdual(V))
+end
+
 fuse(V₁::ComplexSpace, V₂::ComplexSpace) = ComplexSpace(V₁.d * V₂.d)
 flip(V::ComplexSpace) = dual(V)
 
diff --git a/src/spaces/gradedspace.jl b/src/spaces/gradedspace.jl
index 63903a1ac..568b13475 100644
--- a/src/spaces/gradedspace.jl
+++ b/src/spaces/gradedspace.jl
@@ -149,6 +149,13 @@ function ⊕(V₁::GradedSpace{I}, V₂::GradedSpace{I}) where {I<:Sector}
     return typeof(V₁)(dims; dual=dual1)
 end
 
+function ⊖(V::GradedSpace{I}, W::GradedSpace{I}) where {I<:Sector}
+    dual = isdual(V)
+    V ≿ W && dual == isdual(W) ||
+        throw(SpaceMismatch("$(W) is not a subspace of $(V)"))
+    return typeof(V)(c => dim(V, c) - dim(W, c) for c in sectors(V); dual)
+end
+
 function flip(V::GradedSpace{I}) where {I<:Sector}
     if isdual(V)
         typeof(V)(c => dim(V, c) for c in sectors(V))
diff --git a/src/spaces/vectorspaces.jl b/src/spaces/vectorspaces.jl
index 844da081f..847182536 100644
--- a/src/spaces/vectorspaces.jl
+++ b/src/spaces/vectorspaces.jl
@@ -150,6 +150,17 @@ function ⊕ end
 ⊕(V::Vararg{ElementarySpace}) = foldl(⊕, V)
 const oplus = ⊕
 
+"""
+    ⊖(V::ElementarySpace, W::ElementarySpace) -> X::ElementarySpace
+    ominus(V::ElementarySpace, W::ElementarySpace) -> X::ElementarySpace
+
+Return a space that is equivalent to the orthogonal complement of `W` in `V`,
+i.e. an instance `X::ElementarySpace` such that `V = W ⊕ X`.
+"""
+⊖(V₁::S, V₂::S) where {S<:ElementarySpace}
+⊖(V₁::VectorSpace, V₂::VectorSpace) = ⊖(promote(V₁, V₂)...)
+const ominus = ⊖
+
 """
     ⊗(V₁::S, V₂::S, V₃::S...) where {S<:ElementarySpace} -> S
 
diff --git a/src/tensors/backends.jl b/src/tensors/backends.jl
new file mode 100644
index 000000000..0fc8f99f6
--- /dev/null
+++ b/src/tensors/backends.jl
@@ -0,0 +1,32 @@
+# Scheduler implementation
+# ------------------------
+function select_scheduler(scheduler=OhMyThreads.Implementation.NotGiven(); kwargs...)
+    return if scheduler == OhMyThreads.Implementation.NotGiven() && isempty(kwargs)
+        Threads.nthreads() == 1 ? SerialScheduler() : DynamicScheduler()
+    else
+        OhMyThreads.Implementation._scheduler_from_userinput(scheduler; kwargs...)
+    end
+end
+
+"""
+    const blockscheduler = ScopedValue{Scheduler}(SerialScheduler())
+
+The default scheduler used when looping over different blocks in the matrix representation of a
+tensor.
+For controlling this value, see also [`set_blockscheduler`](@ref) and [`with_blockscheduler`](@ref).
+"""
+const blockscheduler = ScopedValue{Scheduler}(SerialScheduler())
+
+"""
+    with_blockscheduler(f, [scheduler]; kwargs...)
+
+Run `f` in a scope where the `blockscheduler` is determined by `scheduler' and `kwargs...`.
+"""
+@inline function with_blockscheduler(f, scheduler=OhMyThreads.Implementation.NotGiven();
+                                     kwargs...)
+    @with blockscheduler => select_scheduler(scheduler; kwargs...) f()
+end
+
+# TODO: disable for trivial symmetry or small tensors?
+default_blockscheduler(t::AbstractTensorMap) = default_blockscheduler(typeof(t))
+default_blockscheduler(::Type{T}) where {T<:AbstractTensorMap} = blockscheduler[]
diff --git a/src/tensors/blockiterator.jl b/src/tensors/blockiterator.jl
index 7929b5d19..edbaa27c8 100644
--- a/src/tensors/blockiterator.jl
+++ b/src/tensors/blockiterator.jl
@@ -12,3 +12,35 @@ Base.IteratorSize(::BlockIterator) = Base.HasLength()
 Base.IteratorEltype(::BlockIterator) = Base.HasEltype()
 Base.eltype(::Type{<:BlockIterator{T}}) where {T} = Pair{sectortype(T),blocktype(T)}
 Base.length(iter::BlockIterator) = length(iter.structure)
+Base.isdone(iter::BlockIterator, state...) = Base.isdone(iter.structure, state...)
+
+# TODO: fast-path when structures are the same?
+# TODO: implement scheduler
+"""
+    foreachblock(f, ts::AbstractTensorMap...; [scheduler])
+
+Apply `f` to each block of `t` and the corresponding blocks of `ts`.
+Optionally, `scheduler` can be used to parallelize the computation.
+This function is equivalent to the following loop:
+
+```julia
+for c in union(blocksectors.(ts)...)
+    bs = map(t -> block(t, c), ts)
+    f(c, bs)
+end
+```
+"""
+function foreachblock(f, t::AbstractTensorMap, ts::AbstractTensorMap...; scheduler=nothing)
+    tensors = (t, ts...)
+    allsectors = union(blocksectors.(tensors)...)
+    foreach(allsectors) do c
+        return f(c, block.(tensors, Ref(c)))
+    end
+    return nothing
+end
+function foreachblock(f, t::AbstractTensorMap; scheduler=nothing)
+    foreach(blocks(t)) do (c, b)
+        return f(c, (b,))
+    end
+    return nothing
+end
diff --git a/src/tensors/diagonal.jl b/src/tensors/diagonal.jl
index 88d0c3b25..7ab300ca0 100644
--- a/src/tensors/diagonal.jl
+++ b/src/tensors/diagonal.jl
@@ -76,6 +76,11 @@ function DiagonalTensorMap(t::AbstractTensorMap{T,S,1,1}) where {T,S}
     return d
 end
 
+Base.similar(d::DiagonalTensorMap) = DiagonalTensorMap(similar(d.data), d.domain)
+function Base.similar(d::DiagonalTensorMap, ::Type{T}) where {T<:Number}
+    return DiagonalTensorMap(similar(d.data, T), d.domain)
+end
+
 # TODO: more constructors needed?
 
 # Special case adjoint:
@@ -94,7 +99,7 @@ function Base.copy!(t::AbstractTensorMap, d::DiagonalTensorMap)
     end
     return t
 end
-TensorMap(d::DiagonalTensorMap) = copy!(similar(d), d)
+TensorMap(d::DiagonalTensorMap) = copy!(similar(d, scalartype(d), space(d)), d)
 Base.convert(::Type{TensorMap}, d::DiagonalTensorMap) = TensorMap(d)
 
 function Base.convert(D::Type{<:DiagonalTensorMap}, d::DiagonalTensorMap)
@@ -277,16 +282,16 @@ end
 
 function LinearAlgebra.lmul!(D::DiagonalTensorMap, t::AbstractTensorMap)
     domain(D) == codomain(t) || throw(SpaceMismatch())
-    for (c, b) in blocks(t)
-        lmul!(block(D, c), b)
+    foreachblock(D, t) do c, bs
+        return lmul!(bs...)
     end
     return t
 end
 
 function LinearAlgebra.rmul!(t::AbstractTensorMap, D::DiagonalTensorMap)
     codomain(D) == domain(t) || throw(SpaceMismatch())
-    for (c, b) in blocks(t)
-        rmul!(b, block(D, c))
+    foreachblock(t, D) do c, bs
+        return rmul!(bs...)
     end
     return t
 end
@@ -317,65 +322,6 @@ function LinearAlgebra.isposdef(d::DiagonalTensorMap)
     return all(isposdef, d.data)
 end
 
-function eig!(d::DiagonalTensorMap)
-    return d, one(d)
-end
-function eigh!(d::DiagonalTensorMap{<:Real})
-    return d, one(d)
-end
-function eigh!(d::DiagonalTensorMap{<:Complex})
-    # TODO: should this test for hermiticity? `eigh!(::TensorMap)` also does not do this.
-    return DiagonalTensorMap(real(d.data), d.domain), one(d)
-end
-
-function leftorth!(d::DiagonalTensorMap; alg=QR(), kwargs...)
-    @assert alg isa Union{QR,QL}
-    return one(d), d # TODO: this is only correct for `alg = QR()` or `alg = QL()`
-end
-function rightorth!(d::DiagonalTensorMap; alg=LQ(), kwargs...)
-    @assert alg isa Union{LQ,RQ}
-    return d, one(d) # TODO: this is only correct for `alg = LQ()` or `alg = RQ()`
-end
-# not much to do here:
-leftnull!(d::DiagonalTensorMap; kwargs...) = leftnull!(TensorMap(d); kwargs...)
-rightnull!(d::DiagonalTensorMap; kwargs...) = rightnull!(TensorMap(d); kwargs...)
-
-function tsvd!(d::DiagonalTensorMap; trunc=NoTruncation(), p::Real=2, alg=SDD())
-    return _tsvd!(d, alg, trunc, p)
-end
-# helper function
-function _compute_svddata!(d::DiagonalTensorMap, alg::Union{SVD,SDD})
-    InnerProductStyle(d) === EuclideanInnerProduct() || throw_invalid_innerproduct(:tsvd!)
-    I = sectortype(d)
-    dims = SectorDict{I,Int}()
-    generator = Base.Iterators.map(blocks(d)) do (c, b)
-        lb = length(b.diag)
-        U = zerovector!(similar(b.diag, lb, lb))
-        V = zerovector!(similar(b.diag, lb, lb))
-        p = sortperm(b.diag; by=abs, rev=true)
-        for (i, pi) in enumerate(p)
-            U[pi, i] = MatrixAlgebra.safesign(b.diag[pi])
-            V[i, pi] = 1
-        end
-        Σ = abs.(view(b.diag, p))
-        dims[c] = lb
-        return c => (U, Σ, V)
-    end
-    SVDdata = SectorDict(generator)
-    return SVDdata, dims
-end
-
-function LinearAlgebra.svdvals(d::DiagonalTensorMap)
-    return SectorDict(c => LinearAlgebra.svdvals(b) for (c, b) in blocks(d))
-end
-function LinearAlgebra.eigvals(d::DiagonalTensorMap)
-    return SectorDict(c => LinearAlgebra.eigvals(b) for (c, b) in blocks(d))
-end
-
-function LinearAlgebra.cond(d::DiagonalTensorMap, p::Real=2)
-    return LinearAlgebra.cond(Diagonal(d.data), p)
-end
-
 # matrix functions
 for f in
     (:exp, :cos, :sin, :tan, :cot, :cosh, :sinh, :tanh, :coth, :atan, :acot, :asinh, :sqrt,
diff --git a/src/tensors/factorizations.jl b/src/tensors/factorizations.jl
deleted file mode 100644
index 9a6bf5dd1..000000000
--- a/src/tensors/factorizations.jl
+++ /dev/null
@@ -1,685 +0,0 @@
-# Tensor factorization
-#----------------------
-function factorisation_scalartype(t::AbstractTensorMap)
-    T = scalartype(t)
-    return promote_type(Float32, typeof(zero(T) / sqrt(abs2(one(T)))))
-end
-factorisation_scalartype(f, t) = factorisation_scalartype(t)
-
-function permutedcopy_oftype(t::AbstractTensorMap, T::Type{<:Number}, p::Index2Tuple)
-    return permute!(similar(t, T, permute(space(t), p)), t, p)
-end
-function copy_oftype(t::AbstractTensorMap, T::Type{<:Number})
-    return copy!(similar(t, T), t)
-end
-
-"""
-    tsvd(t::AbstractTensorMap, (leftind, rightind)::Index2Tuple;
-        trunc::TruncationScheme = notrunc(), p::Real = 2, alg::Union{SVD, SDD} = SDD())
-        -> U, S, V, ϵ
-
-Compute the (possibly truncated) singular value decomposition such that
-`norm(permute(t, (leftind, rightind)) - U * S * V) ≈ ϵ`, where `ϵ` thus represents the truncation error.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in
-`t` to be destroyed/overwritten, by using `tsvd!(t, trunc = notrunc(), p = 2)`.
-
-A truncation parameter `trunc` can be specified for the new internal dimension, in which
-case a truncated singular value decomposition will be computed. Choices are:
-*   `notrunc()`: no truncation (default);
-*   `truncerr(η::Real)`: truncates such that the p-norm of the truncated singular values is
-    smaller than `η`;
-*   `truncdim(χ::Int)`: truncates such that the equivalent total dimension of the internal
-    vector space is no larger than `χ`;
-*   `truncspace(V)`: truncates such that the dimension of the internal vector space is no
-    greater than that of `V` in any sector.
-*   `truncbelow(η::Real)`: truncates such that every singular value is larger then `η` ;
-
-Truncation options can also be combined using `&`, i.e. `truncbelow(η) & truncdim(χ)` will
-choose the truncation space such that every singular value is larger than `η`, and the
-equivalent total dimension of the internal vector space is no larger than `χ`.
-
-The method `tsvd` also returns the truncation error `ϵ`, computed as the `p` norm of the
-singular values that were truncated.
-
-THe keyword `alg` can be equal to `SVD()` or `SDD()`, corresponding to the underlying LAPACK
-algorithm that computes the decomposition (`_gesvd` or `_gesdd`).
-
-Orthogonality requires `InnerProductStyle(t) <: HasInnerProduct`, and `tsvd(!)`
-is currently only implemented for `InnerProductStyle(t) === EuclideanInnerProduct()`.
-"""
-function tsvd(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(tsvd, t), p)
-    return tsvd!(tcopy; kwargs...)
-end
-
-function LinearAlgebra.svdvals(t::AbstractTensorMap)
-    tcopy = copy_oftype(t, factorisation_scalartype(tsvd, t))
-    return LinearAlgebra.svdvals!(tcopy)
-end
-
-"""
-    leftorth(t::AbstractTensorMap, (leftind, rightind)::Index2Tuple;
-                alg::OrthogonalFactorizationAlgorithm = QRpos()) -> Q, R
-
-Create orthonormal basis `Q` for indices in `leftind`, and remainder `R` such that
-`permute(t, (leftind, rightind)) = Q*R`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in `t`
-to be destroyed/overwritten, by using `leftorth!(t, alg = QRpos())`.
-
-Different algorithms are available, namely `QR()`, `QRpos()`, `SVD()` and `Polar()`. `QR()`
-and `QRpos()` use a standard QR decomposition, producing an upper triangular matrix `R`.
-`Polar()` produces a Hermitian and positive semidefinite `R`. `QRpos()` corrects the
-standard QR decomposition such that the diagonal elements of `R` are positive. Only
-`QRpos()` and `Polar()` are unique (no residual freedom) so that they always return the same
-result for the same input tensor `t`.
-
-Orthogonality requires `InnerProductStyle(t) <: HasInnerProduct`, and
-`leftorth(!)` is currently only implemented for 
-    `InnerProductStyle(t) === EuclideanInnerProduct()`.
-"""
-function leftorth(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(leftorth, t), p)
-    return leftorth!(tcopy; kwargs...)
-end
-
-"""
-    rightorth(t::AbstractTensorMap, (leftind, rightind)::Index2Tuple;
-                alg::OrthogonalFactorizationAlgorithm = LQpos()) -> L, Q
-
-Create orthonormal basis `Q` for indices in `rightind`, and remainder `L` such that
-`permute(t, (leftind, rightind)) = L*Q`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in `t`
-to be destroyed/overwritten, by using `rightorth!(t, alg = LQpos())`.
-
-Different algorithms are available, namely `LQ()`, `LQpos()`, `RQ()`, `RQpos()`, `SVD()` and
-`Polar()`. `LQ()` and `LQpos()` produce a lower triangular matrix `L` and are computed using
-a QR decomposition of the transpose. `RQ()` and `RQpos()` produce an upper triangular
-remainder `L` and only works if the total left dimension is smaller than or equal to the
-total right dimension. `LQpos()` and `RQpos()` add an additional correction such that the
-diagonal elements of `L` are positive. `Polar()` produces a Hermitian and positive
-semidefinite `L`. Only `LQpos()`, `RQpos()` and `Polar()` are unique (no residual freedom)
-so that they always return the same result for the same input tensor `t`.
-
-Orthogonality requires `InnerProductStyle(t) <: HasInnerProduct`, and
-`rightorth(!)` is currently only implemented for 
-`InnerProductStyle(t) === EuclideanInnerProduct()`.
-"""
-function rightorth(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(rightorth, t), p)
-    return rightorth!(tcopy; kwargs...)
-end
-
-"""
-    leftnull(t::AbstractTensor, (leftind, rightind)::Index2Tuple;
-                alg::OrthogonalFactorizationAlgorithm = QRpos()) -> N
-
-Create orthonormal basis for the orthogonal complement of the support of the indices in
-`leftind`, such that `N' * permute(t, (leftind, rightind)) = 0`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in `t`
-to be destroyed/overwritten, by using `leftnull!(t, alg = QRpos())`.
-
-Different algorithms are available, namely `QR()` (or equivalently, `QRpos()`), `SVD()` and
-`SDD()`. The first assumes that the matrix is full rank and requires `iszero(atol)` and
-`iszero(rtol)`. With `SVD()` and `SDD()`, `rightnull` will use the corresponding singular
-value decomposition, and one can specify an absolute or relative tolerance for which
-singular values are to be considered zero, where `max(atol, norm(t)*rtol)` is used as upper
-bound.
-
-Orthogonality requires `InnerProductStyle(t) <: HasInnerProduct`, and
-`leftnull(!)` is currently only implemented for 
-`InnerProductStyle(t) === EuclideanInnerProduct()`.
-"""
-function leftnull(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(leftnull, t), p)
-    return leftnull!(tcopy; kwargs...)
-end
-
-"""
-    rightnull(t::AbstractTensor, (leftind, rightind)::Index2Tuple;
-                alg::OrthogonalFactorizationAlgorithm = LQ(),
-                atol::Real = 0.0,
-                rtol::Real = eps(real(float(one(scalartype(t)))))*iszero(atol)) -> N
-
-Create orthonormal basis for the orthogonal complement of the support of the indices in
-`rightind`, such that `permute(t, (leftind, rightind))*N' = 0`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in `t`
-to be destroyed/overwritten, by using `rightnull!(t, alg = LQpos())`.
-
-Different algorithms are available, namely `LQ()` (or equivalently, `LQpos`), `SVD()` and
-`SDD()`. The first assumes that the matrix is full rank and requires `iszero(atol)` and
-`iszero(rtol)`. With `SVD()` and `SDD()`, `rightnull` will use the corresponding singular
-value decomposition, and one can specify an absolute or relative tolerance for which
-singular values are to be considered zero, where `max(atol, norm(t)*rtol)` is used as upper
-bound.
-
-Orthogonality requires `InnerProductStyle(t) <: HasInnerProduct`, and
-`rightnull(!)` is currently only implemented for 
-`InnerProductStyle(t) === EuclideanInnerProduct()`.
-"""
-function rightnull(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(rightnull, t), p)
-    return rightnull!(tcopy; kwargs...)
-end
-
-"""
-    eigen(t::AbstractTensor, (leftind, rightind)::Index2Tuple; kwargs...) -> D, V
-
-Compute eigenvalue factorization of tensor `t` as linear map from `rightind` to `leftind`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in `t`
-to be destroyed/overwritten, by using `eigen!(t)`. Note that the permuted tensor on which
-`eigen!` is called should have equal domain and codomain, as otherwise the eigenvalue
-decomposition is meaningless and cannot satisfy
-```
-permute(t, (leftind, rightind)) * V = V * D
-```
-
-Accepts the same keyword arguments `scale` and `permute` as `eigen` of dense
-matrices. See the corresponding documentation for more information.
-
-See also `eig` and `eigh`
-"""
-function LinearAlgebra.eigen(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(eigen, t), p)
-    return eigen!(tcopy; kwargs...)
-end
-
-function LinearAlgebra.eigvals(t::AbstractTensorMap; kwargs...)
-    tcopy = copy_oftype(t, factorisation_scalartype(eigen, t))
-    return LinearAlgebra.eigvals!(tcopy; kwargs...)
-end
-
-"""
-    eig(t::AbstractTensor, (leftind, rightind)::Index2Tuple; kwargs...) -> D, V
-
-Compute eigenvalue factorization of tensor `t` as linear map from `rightind` to `leftind`.
-The function `eig` assumes that the linear map is not hermitian and returns type stable
-complex valued `D` and `V` tensors for both real and complex valued `t`. See `eigh` for
-hermitian linear maps
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in
-`t` to be destroyed/overwritten, by using `eig!(t)`. Note that the permuted tensor on
-which `eig!` is called should have equal domain and codomain, as otherwise the eigenvalue
-decomposition is meaningless and cannot satisfy
-```
-permute(t, (leftind, rightind)) * V = V * D
-```
-
-Accepts the same keyword arguments `scale` and `permute` as `eigen` of dense
-matrices. See the corresponding documentation for more information.
-
-See also `eigen` and `eigh`.
-"""
-function eig(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(eig, t), p)
-    return eig!(tcopy; kwargs...)
-end
-
-"""
-    eigh(t::AbstractTensorMap, (leftind, rightind)::Index2Tuple) -> D, V
-
-Compute eigenvalue factorization of tensor `t` as linear map from `rightind` to `leftind`.
-The function `eigh` assumes that the linear map is hermitian and `D` and `V` tensors with
-the same `scalartype` as `t`. See `eig` and `eigen` for non-hermitian tensors. Hermiticity
-requires that the tensor acts on inner product spaces, and the current implementation
-requires `InnerProductStyle(t) === EuclideanInnerProduct()`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in
-`t` to be destroyed/overwritten, by using `eigh!(t)`. Note that the permuted tensor on
-which `eigh!` is called should have equal domain and codomain, as otherwise the eigenvalue
-decomposition is meaningless and cannot satisfy
-```
-permute(t, (leftind, rightind)) * V = V * D
-```
-
-See also `eigen` and `eig`.
-"""
-function eigh(t::AbstractTensorMap, p::Index2Tuple; kwargs...)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(eigh, t), p)
-    return eigh!(tcopy; kwargs...)
-end
-
-"""
-    isposdef(t::AbstractTensor, (leftind, rightind)::Index2Tuple) -> ::Bool
-
-Test whether a tensor `t` is positive definite as linear map from `rightind` to `leftind`.
-
-If `leftind` and `rightind` are not specified, the current partition of left and right
-indices of `t` is used. In that case, less memory is allocated if one allows the data in
-`t` to be destroyed/overwritten, by using `isposdef!(t)`. Note that the permuted tensor on
-which `isposdef!` is called should have equal domain and codomain, as otherwise it is
-meaningless.
-"""
-function LinearAlgebra.isposdef(t::AbstractTensorMap, (p₁, p₂)::Index2Tuple)
-    tcopy = permutedcopy_oftype(t, factorisation_scalartype(isposdef, t), p)
-    return isposdef!(tcopy)
-end
-
-function tsvd(t::AbstractTensorMap; kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return tsvd!(tcopy; kwargs...)
-end
-function leftorth(t::AbstractTensorMap; alg::OFA=QRpos(), kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return leftorth!(tcopy; alg=alg, kwargs...)
-end
-function rightorth(t::AbstractTensorMap; alg::OFA=LQpos(), kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return rightorth!(tcopy; alg=alg, kwargs...)
-end
-function leftnull(t::AbstractTensorMap; alg::OFA=QR(), kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return leftnull!(tcopy; alg=alg, kwargs...)
-end
-function rightnull(t::AbstractTensorMap; alg::OFA=LQ(), kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return rightnull!(tcopy; alg=alg, kwargs...)
-end
-function LinearAlgebra.eigen(t::AbstractTensorMap; kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return eigen!(tcopy; kwargs...)
-end
-function eig(t::AbstractTensorMap; kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return eig!(tcopy; kwargs...)
-end
-function eigh(t::AbstractTensorMap; kwargs...)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return eigh!(tcopy; kwargs...)
-end
-function LinearAlgebra.isposdef(t::AbstractTensorMap)
-    tcopy = copy_oftype(t, float(scalartype(t)))
-    return isposdef!(tcopy)
-end
-
-# Orthogonal factorizations (mutation for recycling memory):
-# only possible if scalar type is floating point
-# only correct if Euclidean inner product
-#------------------------------------------------------------------------------------------
-const RealOrComplexFloat = Union{AbstractFloat,Complex{<:AbstractFloat}}
-
-function leftorth!(t::TensorMap{<:RealOrComplexFloat};
-                   alg::Union{QR,QRpos,QL,QLpos,SVD,SDD,Polar}=QRpos(),
-                   atol::Real=zero(float(real(scalartype(t)))),
-                   rtol::Real=(alg ∉ (SVD(), SDD())) ? zero(float(real(scalartype(t)))) :
-                              eps(real(float(one(scalartype(t))))) * iszero(atol))
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:leftorth!)
-    if !iszero(rtol)
-        atol = max(atol, rtol * norm(t))
-    end
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-
-    # compute QR factorization for each block
-    if !isempty(blocks(t))
-        generator = Base.Iterators.map(blocks(t)) do (c, b)
-            Qc, Rc = MatrixAlgebra.leftorth!(b, alg, atol)
-            dims[c] = size(Qc, 2)
-            return c => (Qc, Rc)
-        end
-        QRdata = SectorDict(generator)
-    end
-
-    # construct new space
-    S = spacetype(t)
-    V = S(dims)
-    if alg isa Polar
-        @assert V ≅ domain(t)
-        W = domain(t)
-    elseif length(domain(t)) == 1 && domain(t) ≅ V
-        W = domain(t)
-    elseif length(codomain(t)) == 1 && codomain(t) ≅ V
-        W = codomain(t)
-    else
-        W = ProductSpace(V)
-    end
-
-    # construct output tensors
-    T = float(scalartype(t))
-    Q = similar(t, T, codomain(t) ← W)
-    R = similar(t, T, W ← domain(t))
-    if !isempty(blocks(t))
-        for (c, (Qc, Rc)) in QRdata
-            copy!(block(Q, c), Qc)
-            copy!(block(R, c), Rc)
-        end
-    end
-    return Q, R
-end
-
-function leftnull!(t::TensorMap{<:RealOrComplexFloat};
-                   alg::Union{QR,QRpos,SVD,SDD}=QRpos(),
-                   atol::Real=zero(float(real(scalartype(t)))),
-                   rtol::Real=(alg ∉ (SVD(), SDD())) ? zero(float(real(scalartype(t)))) :
-                              eps(real(float(one(scalartype(t))))) * iszero(atol))
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:leftnull!)
-    if !iszero(rtol)
-        atol = max(atol, rtol * norm(t))
-    end
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-
-    # compute QR factorization for each block
-    V = codomain(t)
-    if !isempty(blocksectors(V))
-        generator = Base.Iterators.map(blocksectors(V)) do c
-            Nc = MatrixAlgebra.leftnull!(block(t, c), alg, atol)
-            dims[c] = size(Nc, 2)
-            return c => Nc
-        end
-        Ndata = SectorDict(generator)
-    end
-
-    # construct new space
-    S = spacetype(t)
-    W = S(dims)
-
-    # construct output tensor
-    T = float(scalartype(t))
-    N = similar(t, T, V ← W)
-    if !isempty(blocksectors(V))
-        for (c, Nc) in Ndata
-            copy!(block(N, c), Nc)
-        end
-    end
-    return N
-end
-
-function rightorth!(t::TensorMap{<:RealOrComplexFloat};
-                    alg::Union{LQ,LQpos,RQ,RQpos,SVD,SDD,Polar}=LQpos(),
-                    atol::Real=zero(float(real(scalartype(t)))),
-                    rtol::Real=(alg ∉ (SVD(), SDD())) ? zero(float(real(scalartype(t)))) :
-                               eps(real(float(one(scalartype(t))))) * iszero(atol))
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:rightorth!)
-    if !iszero(rtol)
-        atol = max(atol, rtol * norm(t))
-    end
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-
-    # compute LQ factorization for each block
-    if !isempty(blocks(t))
-        generator = Base.Iterators.map(blocks(t)) do (c, b)
-            Lc, Qc = MatrixAlgebra.rightorth!(b, alg, atol)
-            dims[c] = size(Qc, 1)
-            return c => (Lc, Qc)
-        end
-        LQdata = SectorDict(generator)
-    end
-
-    # construct new space
-    S = spacetype(t)
-    V = S(dims)
-    if alg isa Polar
-        @assert V ≅ codomain(t)
-        W = codomain(t)
-    elseif length(codomain(t)) == 1 && codomain(t) ≅ V
-        W = codomain(t)
-    elseif length(domain(t)) == 1 && domain(t) ≅ V
-        W = domain(t)
-    else
-        W = ProductSpace(V)
-    end
-
-    # construct output tensors
-    T = float(scalartype(t))
-    L = similar(t, T, codomain(t) ← W)
-    Q = similar(t, T, W ← domain(t))
-    if !isempty(blocks(t))
-        for (c, (Lc, Qc)) in LQdata
-            copy!(block(L, c), Lc)
-            copy!(block(Q, c), Qc)
-        end
-    end
-    return L, Q
-end
-
-function rightnull!(t::TensorMap{<:RealOrComplexFloat};
-                    alg::Union{LQ,LQpos,SVD,SDD}=LQpos(),
-                    atol::Real=zero(float(real(scalartype(t)))),
-                    rtol::Real=(alg ∉ (SVD(), SDD())) ? zero(float(real(scalartype(t)))) :
-                               eps(real(float(one(scalartype(t))))) * iszero(atol))
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:rightnull!)
-    if !iszero(rtol)
-        atol = max(atol, rtol * norm(t))
-    end
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-
-    # compute LQ factorization for each block
-    V = domain(t)
-    if !isempty(blocksectors(V))
-        generator = Base.Iterators.map(blocksectors(V)) do c
-            Nc = MatrixAlgebra.rightnull!(block(t, c), alg, atol)
-            dims[c] = size(Nc, 1)
-            return c => Nc
-        end
-        Ndata = SectorDict(generator)
-    end
-
-    # construct new space
-    S = spacetype(t)
-    W = S(dims)
-
-    # construct output tensor
-    T = float(scalartype(t))
-    N = similar(t, T, W ← V)
-    if !isempty(blocksectors(V))
-        for (c, Nc) in Ndata
-            copy!(block(N, c), Nc)
-        end
-    end
-    return N
-end
-
-function leftorth!(t::AdjointTensorMap; alg::OFA=QRpos())
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:leftorth!)
-    return map(adjoint, reverse(rightorth!(adjoint(t); alg=alg')))
-end
-
-function rightorth!(t::AdjointTensorMap; alg::OFA=LQpos())
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:rightorth!)
-    return map(adjoint, reverse(leftorth!(adjoint(t); alg=alg')))
-end
-
-function leftnull!(t::AdjointTensorMap; alg::OFA=QR(), kwargs...)
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:leftnull!)
-    return adjoint(rightnull!(adjoint(t); alg=alg', kwargs...))
-end
-
-function rightnull!(t::AdjointTensorMap; alg::OFA=LQ(), kwargs...)
-    InnerProductStyle(t) === EuclideanInnerProduct() ||
-        throw_invalid_innerproduct(:rightnull!)
-    return adjoint(leftnull!(adjoint(t); alg=alg', kwargs...))
-end
-
-#------------------------------#
-# Singular value decomposition #
-#------------------------------#
-function LinearAlgebra.svdvals!(t::TensorMap{<:RealOrComplexFloat})
-    return SectorDict(c => LinearAlgebra.svdvals!(b) for (c, b) in blocks(t))
-end
-LinearAlgebra.svdvals!(t::AdjointTensorMap) = svdvals!(adjoint(t))
-
-function tsvd!(t::TensorMap{<:RealOrComplexFloat};
-               trunc=NoTruncation(), p::Real=2, alg=SDD())
-    return _tsvd!(t, alg, trunc, p)
-end
-function tsvd!(t::AdjointTensorMap; trunc=NoTruncation(), p::Real=2, alg=SDD())
-    u, s, vt, err = tsvd!(adjoint(t); trunc=trunc, p=p, alg=alg)
-    return adjoint(vt), adjoint(s), adjoint(u), err
-end
-
-# implementation dispatches on algorithm
-function _tsvd!(t::TensorMap{<:RealOrComplexFloat}, alg::Union{SVD,SDD},
-                trunc::TruncationScheme, p::Real=2)
-    # early return
-    if isempty(blocksectors(t))
-        truncerr = zero(real(scalartype(t)))
-        return _empty_svdtensors(t)..., truncerr
-    end
-
-    # compute SVD factorization for each block
-    S = spacetype(t)
-    SVDdata, dims = _compute_svddata!(t, alg)
-    Σdata = SectorDict(c => Σ for (c, (U, Σ, V)) in SVDdata)
-    truncdim = _compute_truncdim(Σdata, trunc, p)
-    truncerr = _compute_truncerr(Σdata, truncdim, p)
-
-    # construct output tensors
-    U, Σ, V⁺ = _create_svdtensors(t, SVDdata, truncdim)
-    return U, Σ, V⁺, truncerr
-end
-
-# helper functions
-function _compute_svddata!(t::TensorMap, alg::Union{SVD,SDD})
-    InnerProductStyle(t) === EuclideanInnerProduct() || throw_invalid_innerproduct(:tsvd!)
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-    generator = Base.Iterators.map(blocks(t)) do (c, b)
-        U, Σ, V = MatrixAlgebra.svd!(b, alg)
-        dims[c] = length(Σ)
-        return c => (U, Σ, V)
-    end
-    SVDdata = SectorDict(generator)
-    return SVDdata, dims
-end
-
-function _create_svdtensors(t::TensorMap{<:RealOrComplexFloat}, SVDdata, dims)
-    T = scalartype(t)
-    S = spacetype(t)
-    W = S(dims)
-
-    Tr = real(T)
-    A = similarstoragetype(t, Tr)
-    Σ = DiagonalTensorMap{Tr,S,A}(undef, W)
-
-    U = similar(t, codomain(t) ← W)
-    V⁺ = similar(t, W ← domain(t))
-    for (c, (Uc, Σc, V⁺c)) in SVDdata
-        r = Base.OneTo(dims[c])
-        copy!(block(U, c), view(Uc, :, r))
-        copy!(block(Σ, c), Diagonal(view(Σc, r)))
-        copy!(block(V⁺, c), view(V⁺c, r, :))
-    end
-    return U, Σ, V⁺
-end
-
-function _empty_svdtensors(t::TensorMap{<:RealOrComplexFloat})
-    T = scalartype(t)
-    S = spacetype(t)
-    I = sectortype(t)
-    dims = SectorDict{I,Int}()
-    W = S(dims)
-
-    Tr = real(T)
-    A = similarstoragetype(t, Tr)
-    Σ = DiagonalTensorMap{Tr,S,A}(undef, W)
-
-    U = similar(t, codomain(t) ← W)
-    V⁺ = similar(t, W ← domain(t))
-    return U, Σ, V⁺
-end
-
-#--------------------------#
-# Eigenvalue decomposition #
-#--------------------------#
-function LinearAlgebra.eigen!(t::TensorMap{<:RealOrComplexFloat})
-    return ishermitian(t) ? eigh!(t) : eig!(t)
-end
-
-function LinearAlgebra.eigvals!(t::TensorMap{<:RealOrComplexFloat}; kwargs...)
-    return SectorDict(c => complex(LinearAlgebra.eigvals!(b; kwargs...))
-                      for (c, b) in blocks(t))
-end
-function LinearAlgebra.eigvals!(t::AdjointTensorMap{<:RealOrComplexFloat}; kwargs...)
-    return SectorDict(c => conj!(complex(LinearAlgebra.eigvals!(b; kwargs...)))
-                      for (c, b) in blocks(t))
-end
-
-function eigh!(t::TensorMap{<:RealOrComplexFloat})
-    InnerProductStyle(t) === EuclideanInnerProduct() || throw_invalid_innerproduct(:eigh!)
-    domain(t) == codomain(t) ||
-        throw(SpaceMismatch("`eigh!` requires domain and codomain to be the same"))
-
-    T = scalartype(t)
-    I = sectortype(t)
-    S = spacetype(t)
-    dims = SectorDict{I,Int}(c => size(b, 1) for (c, b) in blocks(t))
-    W = S(dims)
-
-    Tr = real(T)
-    A = similarstoragetype(t, Tr)
-    D = DiagonalTensorMap{Tr,S,A}(undef, W)
-    V = similar(t, domain(t) ← W)
-    for (c, b) in blocks(t)
-        values, vectors = MatrixAlgebra.eigh!(b)
-        copy!(block(D, c), Diagonal(values))
-        copy!(block(V, c), vectors)
-    end
-    return D, V
-end
-
-function eig!(t::TensorMap{<:RealOrComplexFloat}; kwargs...)
-    domain(t) == codomain(t) ||
-        throw(SpaceMismatch("`eig!` requires domain and codomain to be the same"))
-
-    T = scalartype(t)
-    I = sectortype(t)
-    S = spacetype(t)
-    dims = SectorDict{I,Int}(c => size(b, 1) for (c, b) in blocks(t))
-    W = S(dims)
-
-    Tc = complex(T)
-    A = similarstoragetype(t, Tc)
-    D = DiagonalTensorMap{Tc,S,A}(undef, W)
-    V = similar(t, Tc, domain(t) ← W)
-    for (c, b) in blocks(t)
-        values, vectors = MatrixAlgebra.eig!(b; kwargs...)
-        copy!(block(D, c), Diagonal(values))
-        copy!(block(V, c), vectors)
-    end
-    return D, V
-end
-
-#--------------------------------------------------#
-# Checks for hermiticity and positive definiteness #
-#--------------------------------------------------#
-function LinearAlgebra.ishermitian(t::TensorMap)
-    domain(t) == codomain(t) || return false
-    InnerProductStyle(t) === EuclideanInnerProduct() || return false # hermiticity only defined for euclidean
-    for (c, b) in blocks(t)
-        ishermitian(b) || return false
-    end
-    return true
-end
-
-function LinearAlgebra.isposdef!(t::TensorMap)
-    domain(t) == codomain(t) ||
-        throw(SpaceMismatch("`isposdef` requires domain and codomain to be the same"))
-    InnerProductStyle(spacetype(t)) === EuclideanInnerProduct() || return false
-    for (c, b) in blocks(t)
-        isposdef!(b) || return false
-    end
-    return true
-end
diff --git a/src/tensors/linalg.jl b/src/tensors/linalg.jl
index 5eba8414c..7ab6c2988 100644
--- a/src/tensors/linalg.jl
+++ b/src/tensors/linalg.jl
@@ -59,7 +59,7 @@ function one!(t::AbstractTensorMap)
     domain(t) == codomain(t) ||
         throw(SectorMismatch("no identity if domain and codomain are different"))
     for (c, b) in blocks(t)
-        MatrixAlgebra.one!(b)
+        one!(b)
     end
     return t
 end
@@ -106,7 +106,7 @@ function isomorphism!(t::AbstractTensorMap)
     domain(t) ≅ codomain(t) ||
         throw(SpaceMismatch(lazy"domain and codomain are not isomorphic: $(space(t))"))
     for (_, b) in blocks(t)
-        MatrixAlgebra.one!(b)
+        one!(b)
     end
     return t
 end
@@ -155,7 +155,7 @@ function isometry!(t::AbstractTensorMap)
     domain(t) ≾ codomain(t) ||
         throw(SpaceMismatch(lazy"domain and codomain are not isometrically embeddable: $(space(t))"))
     for (_, b) in blocks(t)
-        MatrixAlgebra.one!(b)
+        one!(b)
     end
     return t
 end
@@ -179,7 +179,6 @@ end
 
 # Diagonal tensors
 # ----------------
-# TODO: consider adding a specialised DiagonalTensorMap type
 function LinearAlgebra.diag(t::AbstractTensorMap)
     return SectorDict(c => LinearAlgebra.diag(b) for (c, b) in blocks(t))
 end
@@ -288,12 +287,19 @@ end
 
 _default_rtol(t) = eps(real(float(scalartype(t)))) * min(dim(domain(t)), dim(codomain(t)))
 
-function LinearAlgebra.rank(t::AbstractTensorMap; atol::Real=0,
-                            rtol::Real=atol > 0 ? 0 : _default_rtol(t))
-    dim(t) == 0 && return 0
+function LinearAlgebra.rank(t::AbstractTensorMap;
+                            atol::Real=0, rtol::Real=atol > 0 ? 0 : _default_rtol(t))
+    r = dim(one(sectortype(t))) * 0
+    dim(t) == 0 && return r
     S = LinearAlgebra.svdvals(t)
     tol = max(atol, rtol * maximum(first, values(S)))
-    return sum(cs -> dim(cs[1]) * count(>(tol), cs[2]), S)
+    for (c, b) in S
+        if !isempty(b)
+            r += dim(c) * count(>(tol), b)
+        end
+    end
+    return r
+    # return sum(((c, b),) -> dim(c) * count(>(tol), b), S; init)
 end
 
 function LinearAlgebra.cond(t::AbstractTensorMap, p::Real=2)
@@ -377,7 +383,7 @@ function Base.inv(t::AbstractTensorMap)
     T = float(scalartype(t))
     tinv = similar(t, T, dom ← cod)
     for (c, b) in blocks(t)
-        binv = MatrixAlgebra.one!(block(tinv, c))
+        binv = one!(block(tinv, c))
         ldiv!(lu(b), binv)
     end
     return tinv
@@ -449,11 +455,11 @@ for f in (:cos, :sin, :tan, :cot, :cosh, :sinh, :tanh, :coth, :atan, :acot, :asi
         tf = similar(t, T)
         if T <: Real
             for (c, b) in blocks(t)
-                copy!(block(tf, c), real(MatrixAlgebra.$f(b)))
+                copy!(block(tf, c), real(MatrixAlgebraKit.$f(b)))
             end
         else
             for (c, b) in blocks(t)
-                copy!(block(tf, c), MatrixAlgebra.$f(b))
+                copy!(block(tf, c), MatrixAlgebraKit.$f(b))
             end
         end
         return tf
diff --git a/src/tensors/truncation.jl b/src/tensors/truncation.jl
deleted file mode 100644
index e49cdc94d..000000000
--- a/src/tensors/truncation.jl
+++ /dev/null
@@ -1,163 +0,0 @@
-# truncation.jl
-#
-# Implements truncation schemes for truncating a tensor with svd, leftorth or rightorth
-abstract type TruncationScheme end
-
-struct NoTruncation <: TruncationScheme
-end
-notrunc() = NoTruncation()
-
-struct TruncationError{T<:Real} <: TruncationScheme
-    ϵ::T
-end
-truncerr(epsilon::Real) = TruncationError(epsilon)
-
-struct TruncationDimension <: TruncationScheme
-    dim::Int
-end
-truncdim(d::Int) = TruncationDimension(d)
-
-struct TruncationSpace{S<:ElementarySpace} <: TruncationScheme
-    space::S
-end
-truncspace(space::ElementarySpace) = TruncationSpace(space)
-
-struct TruncationCutoff{T<:Real} <: TruncationScheme
-    ϵ::T
-    add_back::Int
-end
-truncbelow(epsilon::Real, add_back::Int=0) = TruncationCutoff(epsilon, add_back)
-
-# Compute the total truncation error given truncation dimensions
-function _compute_truncerr(Σdata, truncdim, p=2)
-    I = keytype(Σdata)
-    S = scalartype(valtype(Σdata))
-    return _norm((c => view(v, (truncdim[c] + 1):length(v)) for (c, v) in Σdata), p,
-                 zero(S))
-end
-
-# Compute truncation dimensions
-function _compute_truncdim(Σdata, ::NoTruncation, p=2)
-    I = keytype(Σdata)
-    truncdim = SectorDict{I,Int}(c => length(v) for (c, v) in Σdata)
-    return truncdim
-end
-function _compute_truncdim(Σdata, trunc::TruncationError, p=2)
-    I = keytype(Σdata)
-    S = real(eltype(valtype(Σdata)))
-    truncdim = SectorDict{I,Int}(c => length(Σc) for (c, Σc) in Σdata)
-    truncerr = zero(S)
-    while true
-        cmin = _findnexttruncvalue(Σdata, truncdim, p)
-        isnothing(cmin) && break
-        truncdim[cmin] -= 1
-        truncerr = _compute_truncerr(Σdata, truncdim, p)
-        if truncerr > trunc.ϵ
-            truncdim[cmin] += 1
-            break
-        end
-    end
-    return truncdim
-end
-function _compute_truncdim(Σdata, trunc::TruncationDimension, p=2)
-    I = keytype(Σdata)
-    truncdim = SectorDict{I,Int}(c => length(v) for (c, v) in Σdata)
-    while sum(dim(c) * d for (c, d) in truncdim) > trunc.dim
-        cmin = _findnexttruncvalue(Σdata, truncdim, p)
-        isnothing(cmin) && break
-        truncdim[cmin] -= 1
-    end
-    return truncdim
-end
-function _compute_truncdim(Σdata, trunc::TruncationSpace, p=2)
-    I = keytype(Σdata)
-    truncdim = SectorDict{I,Int}(c => min(length(v), dim(trunc.space, c))
-                                 for (c, v) in Σdata)
-    return truncdim
-end
-
-function _compute_truncdim(Σdata, trunc::TruncationCutoff, p=2)
-    I = keytype(Σdata)
-    truncdim = SectorDict{I,Int}(c => length(v) for (c, v) in Σdata)
-    for (c, v) in Σdata
-        newdim = findlast(Base.Fix2(>, trunc.ϵ), v)
-        if newdim === nothing
-            truncdim[c] = 0
-        else
-            truncdim[c] = newdim
-        end
-    end
-    for i in 1:(trunc.add_back)
-        cmax = _findnextgrowvalue(Σdata, truncdim, p)
-        isnothing(cmax) && break
-        truncdim[cmax] += 1
-    end
-    return truncdim
-end
-
-# Combine truncations
-struct MultipleTruncation{T<:Tuple{Vararg{TruncationScheme}}} <: TruncationScheme
-    truncations::T
-end
-function Base.:&(a::MultipleTruncation, b::MultipleTruncation)
-    return MultipleTruncation((a.truncations..., b.truncations...))
-end
-function Base.:&(a::MultipleTruncation, b::TruncationScheme)
-    return MultipleTruncation((a.truncations..., b))
-end
-function Base.:&(a::TruncationScheme, b::MultipleTruncation)
-    return MultipleTruncation((a, b.truncations...))
-end
-Base.:&(a::TruncationScheme, b::TruncationScheme) = MultipleTruncation((a, b))
-
-function _compute_truncdim(Σdata, trunc::MultipleTruncation, p::Real=2)
-    truncdim = _compute_truncdim(Σdata, trunc.truncations[1], p)
-    for k in 2:length(trunc.truncations)
-        truncdimₖ = _compute_truncdim(Σdata, trunc.truncations[k], p)
-        for (c, d) in truncdim
-            truncdim[c] = min(d, truncdimₖ[c])
-        end
-    end
-    return truncdim
-end
-
-# auxiliary function
-function _findnexttruncvalue(Σdata, truncdim::SectorDict{I,Int}, p::Real) where {I<:Sector}
-    # early return
-    (isempty(Σdata) || all(iszero, values(truncdim))) && return nothing
-
-    # find some suitable starting candidate
-    cmin = findfirst(>(0), truncdim)
-    σmin = Σdata[cmin][truncdim[cmin]]
-
-    # find the actual minimum singular value
-    for (c, σs) in Σdata
-        if truncdim[c] > 0
-            σ = σs[truncdim[c]]
-            if σ < σmin
-                cmin, σmin = c, σ
-            end
-        end
-    end
-    return cmin
-end
-function _findnextgrowvalue(Σdata, truncdim::SectorDict{I,Int}, p::Real) where {I<:Sector}
-    istruncated = SectorDict{I,Bool}(c => (d < length(Σdata[c])) for (c, d) in truncdim)
-    # early return
-    (isempty(Σdata) || !any(values(istruncated))) && return nothing
-
-    # find some suitable starting candidate
-    cmax = findfirst(istruncated)
-    σmax = Σdata[cmax][truncdim[cmax] + 1]
-
-    # find the actual maximal singular value
-    for (c, σs) in Σdata
-        if istruncated[c]
-            σ = σs[truncdim[c] + 1]
-            if σ > σmax
-                cmax, σmax = c, σ
-            end
-        end
-    end
-    return cmax
-end
diff --git a/src/tensors/vectorinterface.jl b/src/tensors/vectorinterface.jl
index 92faa23be..f9eb0b6d1 100644
--- a/src/tensors/vectorinterface.jl
+++ b/src/tensors/vectorinterface.jl
@@ -68,7 +68,7 @@ function VectorInterface.add(ty::AbstractTensorMap, tx::AbstractTensorMap,
                              α::Number, β::Number)
     space(ty) == space(tx) || throw(SpaceMismatch("$(space(ty)) ≠ $(space(tx))"))
     T = VectorInterface.promote_add(ty, tx, α, β)
-    return add!(scale!(similar(ty, T), ty, β), tx, α)
+    return add!(scale!(zerovector(ty, T), ty, β), tx, α)
 end
 function VectorInterface.add!(ty::AbstractTensorMap, tx::AbstractTensorMap,
                               α::Number, β::Number)
diff --git a/test/ad.jl b/test/ad.jl
index e5e2d884d..ddd419db1 100644
--- a/test/ad.jl
+++ b/test/ad.jl
@@ -1,9 +1,11 @@
 using ChainRulesCore
 using ChainRulesTestUtils
-using FiniteDifferences: FiniteDifferences
+using FiniteDifferences: FiniteDifferences, central_fdm, forward_fdm
 using Random
 using LinearAlgebra
 using Zygote
+using MatrixAlgebraKit
+using MatrixAlgebraKit: LAPACK_HouseholderQR, LAPACK_HouseholderLQ, diagview
 
 const _repartition = @static if isdefined(Base, :get_extension)
     Base.get_extension(TensorKit, :TensorKitChainRulesCoreExt)._repartition
@@ -26,6 +28,7 @@ function ChainRulesTestUtils.test_approx(actual::AbstractTensorMap,
     for (c, b) in blocks(actual)
         ChainRulesTestUtils.@test_msg msg isapprox(b, block(expected, c); kwargs...)
     end
+    return nothing
 end
 
 # make sure that norms are computed correctly:
@@ -50,8 +53,8 @@ function FiniteDifferences.to_vec(t::TensorKit.SectorDict)
 end
 
 # Float32 and finite differences don't mix well
-precision(::Type{<:Union{Float32,Complex{Float32}}}) = 1e-2
-precision(::Type{<:Union{Float64,Complex{Float64}}}) = 1e-6
+precision(::Type{<:Union{Float32,Complex{Float32}}}) = 1.0e-2
+precision(::Type{<:Union{Float64,Complex{Float64}}}) = 1.0e-6
 
 function randindextuple(N::Int, k::Int=rand(0:N))
     @assert 0 ≤ k ≤ N
@@ -59,414 +62,559 @@ function randindextuple(N::Int, k::Int=rand(0:N))
     return (tuple(_p[1:k]...), tuple(_p[(k + 1):end]...))
 end
 
-# rrules for functions that destroy inputs
-# ----------------------------------------
-function ChainRulesCore.rrule(::typeof(TensorKit.tsvd), args...; kwargs...)
-    return ChainRulesCore.rrule(tsvd!, args...; kwargs...)
+function test_ad_rrule(f, args...; check_inferred=false, kwargs...)
+    test_rrule(Zygote.ZygoteRuleConfig(), f, args...;
+               rrule_f=rrule_via_ad, check_inferred, kwargs...)
+    return nothing
 end
-function ChainRulesCore.rrule(::typeof(LinearAlgebra.svdvals), args...; kwargs...)
-    return ChainRulesCore.rrule(svdvals!, args...; kwargs...)
-end
-function ChainRulesCore.rrule(::typeof(TensorKit.eig), args...; kwargs...)
-    return ChainRulesCore.rrule(eig!, args...; kwargs...)
-end
-function ChainRulesCore.rrule(::typeof(TensorKit.eigh), args...; kwargs...)
-    return ChainRulesCore.rrule(eigh!, args...; kwargs...)
-end
-function ChainRulesCore.rrule(::typeof(LinearAlgebra.eigvals), args...; kwargs...)
-    return ChainRulesCore.rrule(eigvals!, args...; kwargs...)
+
+# Gauge fixing tangents
+# ---------------------
+function remove_qrgauge_dependence!(ΔQ, t, Q)
+    for (c, b) in blocks(ΔQ)
+        m, n = size(block(t, c))
+        minmn = min(m, n)
+        Qc = block(Q, c)
+        Q1 = view(Qc, 1:m, 1:minmn)
+        ΔQ2 = view(b, :, (minmn + 1):m)
+        mul!(ΔQ2, Q1, Q1' * ΔQ2)
+    end
+    return ΔQ
 end
-function ChainRulesCore.rrule(::typeof(TensorKit.leftorth), args...; kwargs...)
-    return ChainRulesCore.rrule(leftorth!, args...; kwargs...)
+
+function remove_lqgauge_dependence!(ΔQ, t, Q)
+    for (c, b) in blocks(ΔQ)
+        m, n = size(block(t, c))
+        minmn = min(m, n)
+        Qc = block(Q, c)
+        Q1 = view(Qc, 1:minmn, 1:n)
+        ΔQ2 = view(b, (minmn + 1):n, :)
+        mul!(ΔQ2, ΔQ2 * Q1', Q1)
+    end
+    return ΔQ
 end
-function ChainRulesCore.rrule(::typeof(TensorKit.rightorth), args...; kwargs...)
-    return ChainRulesCore.rrule(rightorth!, args...; kwargs...)
+function remove_eiggauge_dependence!(ΔV, D, V;
+                                     degeneracy_atol=MatrixAlgebraKit.default_pullback_gaugetol(D))
+    gaugepart = V' * ΔV
+    for (c, b) in blocks(gaugepart)
+        Dc = diagview(block(D, c))
+        # for some reason this fails only on tests, and I cannot reproduce it in an
+        # interactive session.
+        # b[abs.(transpose(diagview(Dc)) .- diagview(Dc)) .>= degeneracy_atol] .= 0
+        for j in axes(b, 2), i in axes(b, 1)
+            abs(Dc[i] - Dc[j]) >= degeneracy_atol && (b[i, j] = 0)
+        end
+    end
+    mul!(ΔV, V / (V' * V), gaugepart, -1, 1)
+    return ΔV
 end
-
-# eigh′: make argument of eigh explicitly Hermitian
-#---------------------------------------------------
-eigh′(t::AbstractTensorMap) = eigh(scale!(t + t', 1 / 2))
-
-function ChainRulesCore.rrule(::typeof(eigh′), args...; kwargs...)
-    return ChainRulesCore.rrule(eigh!, args...; kwargs...)
+function remove_eighgauge_dependence!(ΔV, D, V;
+                                      degeneracy_atol=MatrixAlgebraKit.default_pullback_gaugetol(D))
+    gaugepart = V' * ΔV
+    gaugepart = (gaugepart - gaugepart') / 2
+    for (c, b) in blocks(gaugepart)
+        Dc = diagview(block(D, c))
+        # for some reason this fails only on tests, and I cannot reproduce it in an
+        # interactive session.
+        # b[abs.(transpose(diagview(Dc)) .- diagview(Dc)) .>= degeneracy_atol] .= 0
+        for j in axes(b, 2), i in axes(b, 1)
+            abs(Dc[i] - Dc[j]) >= degeneracy_atol && (b[i, j] = 0)
+        end
+    end
+    mul!(ΔV, V / (V' * V), gaugepart, -1, 1)
+    return ΔV
 end
-
-# complex-valued svd?
-# -------------------
-function remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-    # simple implementation, assumes no degeneracies or zeros in singular values
-    gaugepart = U' * ΔU + V * ΔV'
+function remove_svdgauge_dependence!(ΔU, ΔVᴴ, U, S, Vᴴ;
+                                     degeneracy_atol=MatrixAlgebraKit.default_pullback_gaugetol(S))
+    gaugepart = U' * ΔU + Vᴴ * ΔVᴴ'
+    gaugepart = (gaugepart - gaugepart') / 2
     for (c, b) in blocks(gaugepart)
-        mul!(block(ΔU, c), block(U, c), Diagonal(imag(diag(b))), -im, 1)
+        Sd = diagview(block(S, c))
+        # for some reason this fails only on tests, and I cannot reproduce it in an
+        # interactive session.
+        # b[abs.(transpose(diagview(Sc)) .- diagview(Sc)) .>= degeneracy_atol] .= 0
+        for j in axes(b, 2), i in axes(b, 1)
+            abs(Sd[i] - Sd[j]) >= degeneracy_atol && (b[i, j] = 0)
+        end
     end
-    return ΔU, ΔV
+    mul!(ΔU, U, gaugepart, -1, 1)
+    return ΔU, ΔVᴴ
 end
 
+project_hermitian(A) = (A + A') / 2
+
 # Tests
 # -----
 
 ChainRulesTestUtils.test_method_tables()
 
-Vlist = ((ℂ^2, (ℂ^3)', ℂ^3, ℂ^2, (ℂ^2)'),
-         (ℂ[Z2Irrep](0 => 1, 1 => 1),
-          ℂ[Z2Irrep](0 => 1, 1 => 2)',
-          ℂ[Z2Irrep](0 => 3, 1 => 2)',
-          ℂ[Z2Irrep](0 => 2, 1 => 3),
-          ℂ[Z2Irrep](0 => 2, 1 => 2)),
-         (ℂ[FermionParity](0 => 1, 1 => 1),
-          ℂ[FermionParity](0 => 1, 1 => 2)',
-          ℂ[FermionParity](0 => 2, 1 => 2)',
-          ℂ[FermionParity](0 => 2, 1 => 3),
-          ℂ[FermionParity](0 => 2, 1 => 2)),
-         (ℂ[U1Irrep](0 => 2, 1 => 1, -1 => 1),
-          ℂ[U1Irrep](0 => 3, 1 => 1, -1 => 1),
-          ℂ[U1Irrep](0 => 2, 1 => 2, -1 => 1)',
-          ℂ[U1Irrep](0 => 1, 1 => 1, -1 => 2),
-          ℂ[U1Irrep](0 => 1, 1 => 2, -1 => 1)'),
-         (ℂ[SU2Irrep](0 => 2, 1 // 2 => 1),
-          ℂ[SU2Irrep](0 => 1, 1 => 1),
-          ℂ[SU2Irrep](1 // 2 => 1, 1 => 1)',
-          ℂ[SU2Irrep](1 // 2 => 2),
-          ℂ[SU2Irrep](0 => 1, 1 // 2 => 1, 3 // 2 => 1)'),
-         (ℂ[FibonacciAnyon](:I => 1, :τ => 1),
-          ℂ[FibonacciAnyon](:I => 1, :τ => 2)',
-          ℂ[FibonacciAnyon](:I => 3, :τ => 2)',
-          ℂ[FibonacciAnyon](:I => 2, :τ => 3),
-          ℂ[FibonacciAnyon](:I => 2, :τ => 2)))
-
-@timedtestset "Automatic Differentiation with spacetype $(TensorKit.type_repr(eltype(V)))" verbose = true for V in
-                                                                                                              Vlist
+spacelist = ((ℂ^2, (ℂ^3)', ℂ^3, ℂ^2, (ℂ^2)'),
+             (Vect[Z2Irrep](0 => 1, 1 => 1),
+              Vect[Z2Irrep](0 => 1, 1 => 2)',
+              Vect[Z2Irrep](0 => 2, 1 => 2)',
+              Vect[Z2Irrep](0 => 2, 1 => 3),
+              Vect[Z2Irrep](0 => 2, 1 => 2)),
+             (Vect[FermionParity](0 => 1, 1 => 1),
+              Vect[FermionParity](0 => 1, 1 => 2)',
+              Vect[FermionParity](0 => 2, 1 => 1)',
+              Vect[FermionParity](0 => 2, 1 => 3),
+              Vect[FermionParity](0 => 2, 1 => 2)),
+             (Vect[U1Irrep](0 => 2, 1 => 1, -1 => 1),
+              Vect[U1Irrep](0 => 2, 1 => 1, -1 => 1),
+              Vect[U1Irrep](0 => 2, 1 => 2, -1 => 1)',
+              Vect[U1Irrep](0 => 1, 1 => 1, -1 => 2),
+              Vect[U1Irrep](0 => 1, 1 => 2, -1 => 1)'),
+             (Vect[SU2Irrep](0 => 2, 1 // 2 => 1),
+              Vect[SU2Irrep](0 => 1, 1 => 1),
+              Vect[SU2Irrep](1 // 2 => 1, 1 => 1)',
+              Vect[SU2Irrep](1 // 2 => 2),
+              Vect[SU2Irrep](0 => 1, 1 // 2 => 1, 3 // 2 => 1)'),
+             (Vect[FibonacciAnyon](:I => 1, :τ => 1),
+              Vect[FibonacciAnyon](:I => 1, :τ => 2)',
+              Vect[FibonacciAnyon](:I => 2, :τ => 2)',
+              Vect[FibonacciAnyon](:I => 2, :τ => 3),
+              Vect[FibonacciAnyon](:I => 2, :τ => 2)))
+
+for V in spacelist
+    I = sectortype(eltype(V))
+    Istr = TensorKit.type_repr(I)
     eltypes = isreal(sectortype(eltype(V))) ? (Float64, ComplexF64) : (ComplexF64,)
     symmetricbraiding = BraidingStyle(sectortype(eltype(V))) isa SymmetricBraiding
+    println("---------------------------------------")
+    println("Auto-diff with symmetry: $Istr")
+    println("---------------------------------------")
+    @timedtestset "AD with symmetry $Istr" verbose = true begin
+        V1, V2, V3, V4, V5 = V
+        W = V1 ⊗ V2
+        @timedtestset "Basic utility" begin
+            T1 = randn(Float64, V[1] ⊗ V[2] ← V[3] ⊗ V[4])
+            T2 = randn(ComplexF64, V[1] ⊗ V[2] ← V[3] ⊗ V[4])
+
+            P1 = ProjectTo(T1)
+            @test P1(T1) == T1
+            @test P1(T2) == real(T2)
+
+            test_rrule(copy, T1)
+            test_rrule(copy, T2)
+            test_rrule(TensorKit.copy_oftype, T1, ComplexF64)
+            if symmetricbraiding
+                test_rrule(TensorKit.permutedcopy_oftype, T1, ComplexF64,
+                           ((3, 1), (2, 4)))
+
+                test_rrule(convert, Array, T1)
+                test_rrule(TensorMap, convert(Array, T1), codomain(T1), domain(T1);
+                           fkwargs=(; tol=Inf))
+            end
 
-    @timedtestset "Basic utility" begin
-        T1 = randn(Float64, V[1] ⊗ V[2] ← V[3] ⊗ V[4])
-        T2 = randn(ComplexF64, V[1] ⊗ V[2] ← V[3] ⊗ V[4])
-
-        P1 = ProjectTo(T1)
-        @test P1(T1) == T1
-        @test P1(T2) == real(T2)
-
-        test_rrule(copy, T1)
-        test_rrule(copy, T2)
-        test_rrule(TensorKit.copy_oftype, T1, ComplexF64)
-        if symmetricbraiding
-            test_rrule(TensorKit.permutedcopy_oftype, T1, ComplexF64, ((3, 1), (2, 4)))
-
-            test_rrule(convert, Array, T1)
-            test_rrule(TensorMap, convert(Array, T1), codomain(T1), domain(T1);
-                       fkwargs=(; tol=Inf))
+            test_rrule(Base.getproperty, T1, :data)
+            test_rrule(TensorMap{scalartype(T1)}, T1.data, T1.space)
+            test_rrule(Base.getproperty, T2, :data)
+            test_rrule(TensorMap{scalartype(T2)}, T2.data, T2.space)
         end
 
-        test_rrule(Base.getproperty, T1, :data)
-        test_rrule(TensorMap{scalartype(T1)}, T1.data, T1.space)
-        test_rrule(Base.getproperty, T2, :data)
-        test_rrule(TensorMap{scalartype(T2)}, T2.data, T2.space)
-    end
-
-    @timedtestset "Basic utility (DiagonalTensor)" begin
-        for v in V
-            rdim = reduceddim(v)
-            D1 = DiagonalTensorMap(randn(rdim), v)
-            D2 = DiagonalTensorMap(randn(rdim), v)
-            D = D1 + im * D2
-            T1 = TensorMap(D1)
-            T2 = TensorMap(D2)
-            T = T1 + im * T2
-
-            # real -> real
-            P1 = ProjectTo(D1)
-            @test P1(D1) == D1
-            @test P1(T1) == D1
-
-            # complex -> complex
-            P2 = ProjectTo(D)
-            @test P2(D) == D
-            @test P2(T) == D
-
-            # real -> complex 
-            @test P2(D1) == D1 + 0 * im * D1
-            @test P2(T1) == D1 + 0 * im * D1
-
-            # complex -> real
-            @test P1(D) == D1
-            @test P1(T) == D1
-
-            test_rrule(DiagonalTensorMap, D1.data, D1.domain)
-            test_rrule(DiagonalTensorMap, D.data, D.domain)
-            test_rrule(Base.getproperty, D, :data)
-            test_rrule(Base.getproperty, D1, :data)
-
-            test_rrule(DiagonalTensorMap, rand!(T1))
-            test_rrule(DiagonalTensorMap, randn!(T))
+        @timedtestset "Basic utility (DiagonalTensor)" begin
+            for v in V
+                rdim = reduceddim(v)
+                D1 = DiagonalTensorMap(randn(rdim), v)
+                D2 = DiagonalTensorMap(randn(rdim), v)
+                D = D1 + im * D2
+                T1 = TensorMap(D1)
+                T2 = TensorMap(D2)
+                T = T1 + im * T2
+
+                # real -> real
+                P1 = ProjectTo(D1)
+                @test P1(D1) == D1
+                @test P1(T1) == D1
+
+                # complex -> complex
+                P2 = ProjectTo(D)
+                @test P2(D) == D
+                @test P2(T) == D
+
+                # real -> complex
+                @test P2(D1) == D1 + 0 * im * D1
+                @test P2(T1) == D1 + 0 * im * D1
+
+                # complex -> real
+                @test P1(D) == D1
+                @test P1(T) == D1
+
+                test_rrule(DiagonalTensorMap, D1.data, D1.domain)
+                test_rrule(DiagonalTensorMap, D.data, D.domain)
+                test_rrule(Base.getproperty, D, :data)
+                test_rrule(Base.getproperty, D1, :data)
+
+                test_rrule(DiagonalTensorMap, rand!(T1))
+                test_rrule(DiagonalTensorMap, randn!(T))
+            end
         end
-    end
-
-    @timedtestset "Basic Linear Algebra with scalartype $T" for T in eltypes
-        A = randn(T, V[1] ⊗ V[2] ← V[3] ⊗ V[4] ⊗ V[5])
-        B = randn(T, space(A))
 
-        test_rrule(real, A)
-        test_rrule(imag, A)
+        @timedtestset "Basic Linear Algebra with scalartype $T" for T in eltypes
+            A = randn(T, V[1] ⊗ V[2] ← V[3] ⊗ V[4] ⊗ V[5])
+            B = randn(T, space(A))
 
-        test_rrule(+, A, B)
-        test_rrule(-, A)
-        test_rrule(-, A, B)
+            test_rrule(real, A)
+            test_rrule(imag, A)
 
-        α = randn(T)
-        test_rrule(*, α, A)
-        test_rrule(*, A, α)
+            test_rrule(+, A, B)
+            test_rrule(-, A)
+            test_rrule(-, A, B)
 
-        C = randn(T, domain(A), codomain(A))
-        test_rrule(*, A, C)
+            α = randn(T)
+            test_rrule(*, α, A)
+            test_rrule(*, A, α)
 
-        symmetricbraiding && test_rrule(permute, A, ((1, 3, 2), (5, 4)))
-        test_rrule(twist, A, 1)
-        test_rrule(twist, A, [1, 3])
+            C = randn(T, domain(A), codomain(A))
+            test_rrule(*, A, C)
 
-        test_rrule(flip, A, 1)
-        test_rrule(flip, A, [1, 3, 4])
+            symmetricbraiding && test_rrule(permute, A, ((1, 3, 2), (5, 4)))
+            test_rrule(twist, A, 1)
+            test_rrule(twist, A, [1, 3])
 
-        D = randn(T, V[1] ⊗ V[2] ← V[3])
-        E = randn(T, V[4] ← V[5])
-        symmetricbraiding && test_rrule(⊗, D, E)
-    end
+            test_rrule(flip, A, 1)
+            test_rrule(flip, A, [1, 3, 4])
 
-    @timedtestset "Linear Algebra part II with scalartype $T" for T in eltypes
-        for i in 1:3
-            E = randn(T, ⊗(V[1:i]...) ← ⊗(V[1:i]...))
-            test_rrule(LinearAlgebra.tr, E)
-            test_rrule(exp, E; check_inferred=false)
-            test_rrule(inv, E)
+            D = randn(T, V[1] ⊗ V[2] ← V[3])
+            E = randn(T, V[4] ← V[5])
+            symmetricbraiding && test_rrule(⊗, D, E)
         end
 
-        A = randn(T, V[1] ⊗ V[2] ← V[3] ⊗ V[4] ⊗ V[5])
-        test_rrule(LinearAlgebra.adjoint, A)
-        test_rrule(LinearAlgebra.norm, A, 2)
+        @timedtestset "Linear Algebra part II with scalartype $T" for T in eltypes
+            for i in 1:3
+                E = randn(T, ⊗(V[1:i]...) ← ⊗(V[1:i]...))
+                test_rrule(LinearAlgebra.tr, E)
+                test_rrule(exp, E; check_inferred=false)
+                test_rrule(inv, E)
+            end
 
-        B = randn(T, space(A))
-        test_rrule(LinearAlgebra.dot, A, B)
-    end
+            A = randn(T, V[1] ⊗ V[2] ← V[3] ⊗ V[4] ⊗ V[5])
+            test_rrule(LinearAlgebra.adjoint, A)
+            test_rrule(LinearAlgebra.norm, A, 2)
 
-    @timedtestset "Matrix functions ($T)" for T in eltypes
-        for f in (sqrt, exp)
-            check_inferred = false # !(T <: Real) # not type-stable for real functions
-            t1 = randn(T, V[1] ← V[1])
-            t2 = randn(T, V[2] ← V[2])
-            d = DiagonalTensorMap{T}(undef, V[1])
-            (T <: Real && f === sqrt) ? randexp!(d.data) : randn!(d.data)
-            d2 = DiagonalTensorMap{T}(undef, V[1])
-            (T <: Real && f === sqrt) ? randexp!(d2.data) : randn!(d2.data)
-            test_rrule(f, t1; rrule_f=Zygote.rrule_via_ad, check_inferred)
-            test_rrule(f, t2; rrule_f=Zygote.rrule_via_ad, check_inferred)
-            test_rrule(f, d; check_inferred, output_tangent=d2)
+            B = randn(T, space(A))
+            test_rrule(LinearAlgebra.dot, A, B)
         end
-    end
 
-    symmetricbraiding &&
-        @timedtestset "TensorOperations with scalartype $T" for T in eltypes
-            atol = precision(T)
-            rtol = precision(T)
+        @timedtestset "Matrix functions ($T)" for T in eltypes
+            for f in (sqrt, exp)
+                check_inferred = false # !(T <: Real) # not type-stable for real functions
+                t1 = randn(T, V[1] ← V[1])
+                t2 = randn(T, V[2] ← V[2])
+                d = DiagonalTensorMap{T}(undef, V[1])
+                d2 = DiagonalTensorMap{T}(undef, V[1])
+                d3 = DiagonalTensorMap{T}(undef, V[1])
+                if (T <: Real && f === sqrt)
+                    # ensuring no square root of negative numbers
+                    randexp!(d.data)
+                    d.data .+= 5
+                    randexp!(d2.data)
+                    d2.data .+= 5
+                    randexp!(d3.data)
+                    d3.data .+= 5
+                else
+                    randn!(d.data)
+                    randn!(d2.data)
+                    randn!(d3.data)
+                end
 
-            @timedtestset "tensortrace!" begin
-                for _ in 1:5
-                    k1 = rand(0:3)
-                    k2 = k1 == 3 ? 1 : rand(1:2)
-                    V1 = map(v -> rand(Bool) ? v' : v, rand(V, k1))
-                    V2 = map(v -> rand(Bool) ? v' : v, rand(V, k2))
+                test_rrule(f, t1; rrule_f=Zygote.rrule_via_ad, check_inferred)
+                test_rrule(f, t2; rrule_f=Zygote.rrule_via_ad, check_inferred)
+                test_rrule(f, d ⊢ d2; check_inferred, output_tangent=d3)
+            end
+        end
 
-                    (_p, _q) = randindextuple(k1 + 2 * k2, k1)
-                    p = _repartition(_p, rand(0:k1))
-                    q = _repartition(_q, k2)
-                    ip = _repartition(invperm(linearize((_p, _q))), rand(0:(k1 + 2 * k2)))
-                    A = randn(T, permute(prod(V1) ⊗ prod(V2) ← prod(V2), ip))
+        symmetricbraiding &&
+            @timedtestset "TensorOperations with scalartype $T" for T in eltypes
+                atol = precision(T)
+                rtol = precision(T)
+
+                @timedtestset "tensortrace!" begin
+                    for _ in 1:5
+                        k1 = rand(0:2)
+                        k2 = rand(1:2)
+                        V1 = map(v -> rand(Bool) ? v' : v, rand(V, k1))
+                        V2 = map(v -> rand(Bool) ? v' : v, rand(V, k2))
+
+                        (_p, _q) = randindextuple(k1 + 2 * k2, k1)
+                        p = _repartition(_p, rand(0:k1))
+                        q = _repartition(_q, k2)
+                        ip = _repartition(invperm(linearize((_p, _q))),
+                                          rand(0:(k1 + 2 * k2)))
+                        A = randn(T, permute(prod(V1) ⊗ prod(V2) ← prod(V2), ip))
+
+                        α = randn(T)
+                        β = randn(T)
+                        for conjA in (false, true)
+                            C = randn!(TensorOperations.tensoralloc_add(T, A, p, conjA,
+                                                                        Val(false)))
+                            test_rrule(tensortrace!, C, A, p, q, conjA, α, β; atol, rtol)
+                        end
+                    end
+                end
 
+                @timedtestset "tensoradd!" begin
+                    A = randn(T, V[1] ⊗ V[2] ← V[4] ⊗ V[5])
                     α = randn(T)
                     β = randn(T)
-                    for conjA in (false, true)
-                        C = randn!(TensorOperations.tensoralloc_add(T, A, p, conjA,
-                                                                    Val(false)))
-                        test_rrule(tensortrace!, C, A, p, q, conjA, α, β; atol, rtol)
-                    end
-                end
-            end
 
-            @timedtestset "tensoradd!" begin
-                A = randn(T, V[1] ⊗ V[2] ⊗ V[3] ← V[4] ⊗ V[5])
-                α = randn(T)
-                β = randn(T)
+                    # repeat a couple times to get some distribution of arrows
+                    for _ in 1:5
+                        p = randindextuple(numind(A))
 
-                # repeat a couple times to get some distribution of arrows
-                for _ in 1:5
-                    p = randindextuple(length(V))
+                        C1 = randn!(TensorOperations.tensoralloc_add(T, A, p, false,
+                                                                     Val(false)))
+                        test_rrule(tensoradd!, C1, A, p, false, α, β; atol, rtol)
 
-                    C1 = randn!(TensorOperations.tensoralloc_add(T, A, p, false,
-                                                                 Val(false)))
-                    test_rrule(tensoradd!, C1, A, p, false, α, β; atol, rtol)
+                        C2 = randn!(TensorOperations.tensoralloc_add(T, A, p, true,
+                                                                     Val(false)))
+                        test_rrule(tensoradd!, C2, A, p, true, α, β; atol, rtol)
+
+                        A = rand(Bool) ? C1 : C2
+                    end
+                end
 
-                    C2 = randn!(TensorOperations.tensoralloc_add(T, A, p, true, Val(false)))
-                    test_rrule(tensoradd!, C2, A, p, true, α, β; atol, rtol)
+                @timedtestset "tensorcontract!" begin
+                    for _ in 1:5
+                        d = 0
+                        local V1, V2, V3
+                        # retry a couple times to make sure there are at least some nonzero elements
+                        for _ in 1:10
+                            k1 = rand(0:3)
+                            k2 = rand(0:2)
+                            k3 = rand(0:2)
+                            V1 = prod(v -> rand(Bool) ? v' : v, rand(V, k1); init=one(V[1]))
+                            V2 = prod(v -> rand(Bool) ? v' : v, rand(V, k2); init=one(V[1]))
+                            V3 = prod(v -> rand(Bool) ? v' : v, rand(V, k3); init=one(V[1]))
+                            d = min(dim(V1 ← V2), dim(V1' ← V2), dim(V2 ← V3),
+                                    dim(V2' ← V3))
+                            d > 0 && break
+                        end
+                        ipA = randindextuple(length(V1) + length(V2))
+                        pA = _repartition(invperm(linearize(ipA)), length(V1))
+                        ipB = randindextuple(length(V2) + length(V3))
+                        pB = _repartition(invperm(linearize(ipB)), length(V2))
+                        pAB = randindextuple(length(V1) + length(V3))
+
+                        α = randn(T)
+                        β = randn(T)
+                        V2_conj = prod(conj, V2; init=one(V[1]))
+
+                        for conjA in (false, true), conjB in (false, true)
+                            A = randn(T, permute(V1 ← (conjA ? V2_conj : V2), ipA))
+                            B = randn(T, permute((conjB ? V2_conj : V2) ← V3, ipB))
+                            C = randn!(TensorOperations.tensoralloc_contract(T, A, pA,
+                                                                             conjA,
+                                                                             B, pB, conjB,
+                                                                             pAB,
+                                                                             Val(false)))
+                            test_rrule(tensorcontract!, C,
+                                       A, pA, conjA, B, pB, conjB, pAB,
+                                       α, β; atol, rtol)
+                        end
+                    end
+                end
 
-                    A = rand(Bool) ? C1 : C2
+                @timedtestset "tensorscalar" begin
+                    A = randn(T, ProductSpace{typeof(V[1]),0}())
+                    test_rrule(tensorscalar, A)
                 end
             end
 
-            @timedtestset "tensorcontract!" begin
-                for _ in 1:5
-                    d = 0
-                    local V1, V2, V3
-                    # retry a couple times to make sure there are at least some nonzero elements
-                    for _ in 1:10
-                        k1 = rand(0:3)
-                        k2 = rand(0:2)
-                        k3 = rand(0:2)
-                        V1 = prod(v -> rand(Bool) ? v' : v, rand(V, k1); init=one(V[1]))
-                        V2 = prod(v -> rand(Bool) ? v' : v, rand(V, k2); init=one(V[1]))
-                        V3 = prod(v -> rand(Bool) ? v' : v, rand(V, k3); init=one(V[1]))
-                        d = min(dim(V1 ← V2), dim(V1' ← V2), dim(V2 ← V3), dim(V2' ← V3))
-                        d > 0 && break
+        @timedtestset "Factorizations" begin
+            W = V[1] ⊗ V[2]
+            @testset "QR" begin
+                for T in eltypes,
+                    t in (randn(T, W, W), randn(T, W, W)',
+                          randn(T, W, V[1]), randn(T, V[1], W),
+                          randn(T, W, V[1])', randn(T, V[1], W)',
+                          DiagonalTensorMap(randn(T, reduceddim(V[1])), V[1]))
+
+                    atol = rtol = precision(T) * dim(space(t))
+                    fkwargs = (; positive=true) # make FiniteDifferences happy
+
+                    test_ad_rrule(qr_compact, t; fkwargs, atol, rtol)
+                    test_ad_rrule(first ∘ qr_compact, t; fkwargs, atol, rtol)
+                    test_ad_rrule(last ∘ qr_compact, t; fkwargs, atol, rtol)
+
+                    # qr_full/qr_null requires being careful with gauges
+                    Q, R = qr_full(t)
+                    ΔQ = rand_tangent(Q)
+                    ΔR = rand_tangent(R)
+
+                    if fuse(domain(t)) ≺ fuse(codomain(t))
+                        _, full_pb = Zygote.pullback(qr_full, t)
+                        @test_logs (:warn, r"^`qr") match_mode = :any full_pb((ΔQ, ΔR))
                     end
-                    ipA = randindextuple(length(V1) + length(V2))
-                    pA = _repartition(invperm(linearize(ipA)), length(V1))
-                    ipB = randindextuple(length(V2) + length(V3))
-                    pB = _repartition(invperm(linearize(ipB)), length(V2))
-                    pAB = randindextuple(length(V1) + length(V3))
 
-                    α = randn(T)
-                    β = randn(T)
-                    V2_conj = prod(conj, V2; init=one(V[1]))
-
-                    for conjA in (false, true), conjB in (false, true)
-                        A = randn(T, permute(V1 ← (conjA ? V2_conj : V2), ipA))
-                        B = randn(T, permute((conjB ? V2_conj : V2) ← V3, ipB))
-                        C = randn!(TensorOperations.tensoralloc_contract(T, A, pA,
-                                                                         conjA,
-                                                                         B, pB, conjB, pAB,
-                                                                         Val(false)))
-                        test_rrule(tensorcontract!, C,
-                                   A, pA, conjA, B, pB, conjB, pAB,
-                                   α, β; atol, rtol)
-                    end
+                    remove_qrgauge_dependence!(ΔQ, t, Q)
+
+                    test_ad_rrule(qr_full, t; fkwargs, atol, rtol, output_tangent=(ΔQ, ΔR))
+                    test_ad_rrule(first ∘ qr_full, t; fkwargs, atol, rtol,
+                                  output_tangent=ΔQ)
+                    test_ad_rrule(last ∘ qr_full, t; fkwargs, atol, rtol, output_tangent=ΔR)
+
+                    # TODO: figure out the following:
+                    # N = qr_null(t)
+                    # ΔN = Q * rand(T, domain(Q) ← domain(N))
+                    # test_ad_rrule(qr_null, t; fkwargs, atol, rtol, output_tangent=ΔN)
+
+                    # if fuse(domain(t)) ≺ fuse(codomain(t))
+                    #     _, null_pb = Zygote.pullback(qr_null, t)
+                    #     @test_logs (:warn, r"^`qr") match_mode = :any null_pb(rand_tangent(N))
+                    # end
                 end
             end
 
-            @timedtestset "tensorscalar" begin
-                A = randn(T, ProductSpace{typeof(V[1]),0}())
-                test_rrule(tensorscalar, A)
-            end
-        end
+            @testset "LQ" begin
+                for T in eltypes,
+                    t in (randn(T, W, W), randn(T, W, W)',
+                          randn(T, W, V[1]), randn(T, V[1], W),
+                          randn(T, W, V[1])', randn(T, V[1], W)',
+                          DiagonalTensorMap(randn(T, reduceddim(V[1])), V[1]))
+
+                    atol = rtol = precision(T) * dim(space(t))
+                    fkwargs = (; positive=true) # make FiniteDifferences happy
+
+                    test_ad_rrule(lq_compact, t; fkwargs, atol, rtol)
+                    test_ad_rrule(first ∘ lq_compact, t; fkwargs, atol, rtol)
+                    test_ad_rrule(last ∘ lq_compact, t; fkwargs, atol, rtol)
+
+                    # lq_full/lq_null requires being careful with gauges
+                    L, Q = lq_full(t)
+                    ΔQ = rand_tangent(Q)
+                    ΔL = rand_tangent(L)
+
+                    if fuse(codomain(t)) ≺ fuse(domain(t))
+                        _, full_pb = Zygote.pullback(lq_full, t)
+                        # broken due to typo in MAK
+                        # @test_logs (:warn, r"^`lq") match_mode = :any full_pb((ΔL, ΔQ))
+                    end
 
-    @timedtestset "Factorizations with scalartype $T" for T in eltypes
-        A = randn(T, V[1] ⊗ V[2] ← V[3] ⊗ V[4] ⊗ V[5])
-        B = randn(T, space(A)')
-        C = randn(T, V[1] ⊗ V[2] ← V[1] ⊗ V[2])
-        H = randn(T, V[3] ⊗ V[4] ← V[3] ⊗ V[4])
-        H = (H + H') / 2
-        atol = precision(T)
-
-        for alg in (TensorKit.QR(), TensorKit.QRpos())
-            test_rrule(leftorth, A; fkwargs=(; alg=alg), atol)
-            test_rrule(leftorth, B; fkwargs=(; alg=alg), atol)
-            test_rrule(leftorth, C; fkwargs=(; alg=alg), atol)
-        end
+                    remove_lqgauge_dependence!(ΔQ, t, Q)
 
-        for alg in (TensorKit.LQ(), TensorKit.LQpos())
-            test_rrule(rightorth, A; fkwargs=(; alg=alg), atol)
-            test_rrule(rightorth, B; fkwargs=(; alg=alg), atol)
-            test_rrule(rightorth, C; fkwargs=(; alg=alg), atol)
-        end
+                    test_ad_rrule(lq_full, t; fkwargs, atol, rtol, output_tangent=(ΔL, ΔQ))
+                    test_ad_rrule(first ∘ lq_full, t; fkwargs, atol, rtol,
+                                  output_tangent=ΔL)
+                    test_ad_rrule(last ∘ lq_full, t; fkwargs, atol, rtol, output_tangent=ΔQ)
 
-        let (D, V) = eig(C)
-            ΔD = randn(scalartype(D), space(D))
-            ΔV = randn(scalartype(V), space(V))
-            gaugepart = V' * ΔV
-            for (c, b) in blocks(gaugepart)
-                mul!(block(ΔV, c), inv(block(V, c))', Diagonal(diag(b)), -1, 1)
-            end
-            test_rrule(eig, C; atol, output_tangent=(ΔD, ΔV))
-        end
+                    # TODO: figure out the following
+                    # Nᴴ = lq_null(t)
+                    # ΔN = rand(T, codomain(Nᴴ) ← codomain(Q)) * Q
+                    # test_ad_rrule(lq_null, t; fkwargs, atol, rtol, output_tangent=Nᴴ)
 
-        let (D, U) = eigh′(H)
-            ΔD = randn(scalartype(D), space(D))
-            ΔU = randn(scalartype(U), space(U))
-            if T <: Complex
-                gaugepart = U' * ΔU
-                for (c, b) in blocks(gaugepart)
-                    mul!(block(ΔU, c), block(U, c), Diagonal(imag(diag(b))), -im, 1)
+                    # if fuse(codomain(t)) ≺ fuse(domain(t))
+                    #     _, null_pb = Zygote.pullback(lq_null, t)
+                    #     # broken due to typo in MAK
+                    #     # @test_logs (:warn, r"^`lq") match_mode = :any null_pb(rand_tangent(Nᴴ))
+                    # end
                 end
             end
-            test_rrule(eigh′, H; atol, output_tangent=(ΔD, ΔU))
-        end
 
-        let (U, S, V, ϵ) = tsvd(A)
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            if T <: Complex # remove gauge dependent components
-                gaugepart = U' * ΔU + V * ΔV'
-                for (c, b) in blocks(gaugepart)
-                    mul!(block(ΔU, c), block(U, c), Diagonal(imag(diag(b))), -im, 1)
+            @testset "Eigenvalue decomposition" begin
+                for T in eltypes,
+                    t in (rand(T, V[1], V[1]), rand(T, W, W), rand(T, W, W)',
+                          DiagonalTensorMap(rand(T, reduceddim(V[1])), V[1]))
+
+                    atol = rtol = precision(T) * dim(space(t))
+
+                    d, v = eig_full(t)
+                    Δv = rand_tangent(v)
+                    Δd = rand_tangent(d)
+                    Δd2 = randn!(similar(d, space(d)))
+                    remove_eiggauge_dependence!(Δv, d, v)
+
+                    test_ad_rrule(eig_full, t; output_tangent=(Δd, Δv), atol, rtol)
+                    test_ad_rrule(first ∘ eig_full, t; output_tangent=Δd, atol, rtol)
+                    test_ad_rrule(last ∘ eig_full, t; output_tangent=Δv, atol, rtol)
+                    test_ad_rrule(eig_full, t; output_tangent=(Δd2, Δv), atol, rtol)
+
+                    t += t'
+                    d, v = eigh_full(t)
+                    Δv = rand_tangent(v)
+                    Δd = rand_tangent(d)
+                    Δd2 = randn!(similar(d, space(d)))
+                    remove_eighgauge_dependence!(Δv, d, v)
+
+                    # necessary for FiniteDifferences to not complain
+                    eigh_full′ = eigh_full ∘ project_hermitian
+
+                    test_ad_rrule(eigh_full′, t; output_tangent=(Δd, Δv), atol, rtol)
+                    test_ad_rrule(first ∘ eigh_full′, t; output_tangent=Δd, atol, rtol)
+                    test_ad_rrule(last ∘ eigh_full′, t; output_tangent=Δv, atol, rtol)
+                    test_ad_rrule(eigh_full′, t; output_tangent=(Δd2, Δv), atol, rtol)
                 end
             end
-            test_rrule(tsvd, A; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0))
-
-            allS = mapreduce(x -> diag(x[2]), vcat, blocks(S))
-            truncval = (maximum(allS) + minimum(allS)) / 2
-            U, S, V, ϵ = tsvd(A; trunc=truncerr(truncval))
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            T <: Complex && remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-            test_rrule(tsvd, A; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0),
-                       fkwargs=(; trunc=truncerr(truncval)))
-        end
-
-        let (U, S, V, ϵ) = tsvd(B)
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            T <: Complex && remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-            test_rrule(tsvd, B; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0))
-
-            Vtrunc = spacetype(S)(TensorKit.SectorDict(c => ceil(Int, size(b, 1) / 2)
-                                                       for (c, b) in blocks(S)))
-
-            U, S, V, ϵ = tsvd(B; trunc=truncspace(Vtrunc))
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            T <: Complex && remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-            test_rrule(tsvd, B; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0),
-                       fkwargs=(; trunc=truncspace(Vtrunc)))
-        end
 
-        let (U, S, V, ϵ) = tsvd(C)
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            T <: Complex && remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-            test_rrule(tsvd, C; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0))
-
-            c, = TensorKit.MatrixAlgebra._argmax(x -> sqrt(dim(x[1])) * maximum(diag(x[2])),
-                                                 blocks(S))
-            trunc = truncdim(round(Int, 2 * dim(c)))
-            U, S, V, ϵ = tsvd(C; trunc)
-            ΔU = randn(scalartype(U), space(U))
-            ΔS = randn(scalartype(S), space(S))
-            ΔV = randn(scalartype(V), space(V))
-            T <: Complex && remove_svdgauge_depence!(ΔU, ΔV, U, S, V)
-            test_rrule(tsvd, C; atol, output_tangent=(ΔU, ΔS, ΔV, 0.0), fkwargs=(; trunc))
-        end
+            @testset "Singular value decomposition" begin
+                for T in eltypes,
+                    t in (randn(T, V[1], V[1]), randn(T, W, W), randn(T, W, W))
+                    # TODO: fix diagonaltensormap case
+                    #   DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                    atol = rtol = degeneracy_atol = precision(T) * dim(space(t))
+                    USVᴴ = svd_compact(t)
+                    ΔU, ΔS, ΔVᴴ = rand_tangent.(USVᴴ)
+                    ΔS2 = randn!(similar(ΔS, space(ΔS)))
+                    ΔU, ΔVᴴ = remove_svdgauge_dependence!(ΔU, ΔVᴴ, USVᴴ...; degeneracy_atol)
+
+                    test_ad_rrule(svd_full, t; output_tangent=(ΔU, ΔS, ΔVᴴ), atol, rtol)
+                    test_ad_rrule(svd_full, t; output_tangent=(ΔU, ΔS2, ΔVᴴ), atol, rtol)
+                    test_ad_rrule(svd_compact, t; output_tangent=(ΔU, ΔS, ΔVᴴ), atol, rtol)
+                    test_ad_rrule(svd_compact, t; output_tangent=(ΔU, ΔS2, ΔVᴴ), atol, rtol)
+
+                    # TODO: I'm not sure how to properly test with spaces that might change
+                    # with the finite-difference methods, as then the jacobian is ill-defined.
+
+                    trunc = truncrank(round(Int, min(dim(domain(t)), dim(codomain(t))) ÷ 2))
+                    USVᴴ_trunc = svd_trunc(t; trunc)
+                    ΔUSVᴴ_trunc = rand_tangent.(USVᴴ_trunc)
+                    remove_svdgauge_dependence!(ΔUSVᴴ_trunc[1], ΔUSVᴴ_trunc[3],
+                                                USVᴴ_trunc...;
+                                                degeneracy_atol)
+                    # test_ad_rrule(svd_trunc, t;
+                    #               fkwargs=(; trunc), output_tangent=ΔUSVᴴ_trunc, atol, rtol)
+
+                    trunc = truncspace(space(USVᴴ_trunc[2], 1))
+                    USVᴴ_trunc = svd_trunc(t; trunc)
+                    ΔUSVᴴ_trunc = rand_tangent.(USVᴴ_trunc)
+                    remove_svdgauge_dependence!(ΔUSVᴴ_trunc[1], ΔUSVᴴ_trunc[3],
+                                                USVᴴ_trunc...;
+                                                degeneracy_atol)
+                    test_ad_rrule(svd_trunc, t;
+                                  fkwargs=(; trunc), output_tangent=ΔUSVᴴ_trunc, atol, rtol)
+
+                    # ϵ = norm(*(USVᴴ_trunc...) - t)
+                    # trunc = truncerror(; atol=ϵ)
+                    # USVᴴ_trunc = svd_trunc(t; trunc)
+                    # ΔUSVᴴ_trunc = rand_tangent.(USVᴴ_trunc)
+                    # remove_svdgauge_dependence!(ΔUSVᴴ_trunc[1], ΔUSVᴴ_trunc[3], USVᴴ_trunc...;
+                    #                            degeneracy_atol)
+                    # test_ad_rrule(svd_trunc, t;
+                    #               fkwargs=(; trunc), output_tangent=ΔUSVᴴ_trunc, atol, rtol)
+
+                    tol = minimum(((c, b),) -> minimum(diagview(b)), blocks(USVᴴ_trunc[2]))
+                    trunc = trunctol(; atol=10 * tol)
+                    USVᴴ_trunc = svd_trunc(t; trunc)
+                    ΔUSVᴴ_trunc = rand_tangent.(USVᴴ_trunc)
+                    remove_svdgauge_dependence!(ΔUSVᴴ_trunc[1], ΔUSVᴴ_trunc[3],
+                                                USVᴴ_trunc...;
+                                                degeneracy_atol)
+                    test_ad_rrule(svd_trunc, t;
+                                  fkwargs=(; trunc), output_tangent=ΔUSVᴴ_trunc, atol, rtol)
+                end
+            end
 
-        let D = LinearAlgebra.eigvals(C)
-            ΔD = diag(randn(complex(scalartype(C)), space(C)))
-            test_rrule(LinearAlgebra.eigvals, C; atol, output_tangent=ΔD,
-                       fkwargs=(; sortby=nothing))
-        end
+            # let D = LinearAlgebra.eigvals(C)
+            #     ΔD = diag(randn(complex(scalartype(C)), space(C)))
+            #     test_rrule(LinearAlgebra.eigvals, C; atol, output_tangent=ΔD,
+            #                fkwargs=(; sortby=nothing))
+            # end
 
-        let S = LinearAlgebra.svdvals(C)
-            ΔS = diag(randn(real(scalartype(C)), space(C)))
-            test_rrule(LinearAlgebra.svdvals, C; atol, output_tangent=ΔS)
+            # let S = LinearAlgebra.svdvals(C)
+            #     ΔS = diag(randn(real(scalartype(C)), space(C)))
+            #     test_rrule(LinearAlgebra.svdvals, C; atol, output_tangent=ΔS)
+            # end
         end
     end
 end
diff --git a/test/bugfixes.jl b/test/bugfixes.jl
index fb2f0f45c..3b93f998a 100644
--- a/test/bugfixes.jl
+++ b/test/bugfixes.jl
@@ -47,7 +47,7 @@
     # https://github.com/quantumkithub/TensorKit.jl/issues/201
     @testset "Issue #201" begin
         function f(A::AbstractTensorMap)
-            U, S, V, = tsvd(A)
+            U, S, V, = svd_compact(A)
             return tr(S)
         end
         function f(A::AbstractMatrix)
@@ -60,7 +60,7 @@
         @test convert(Array, grad1) ≈ grad2
 
         function g(A::AbstractTensorMap)
-            U, S, V, = tsvd(A)
+            U, S, V, = svd_compact(A)
             return tr(U * V)
         end
         function g(A::AbstractMatrix)
diff --git a/test/diagonal.jl b/test/diagonal.jl
index e5fcaa430..8d20c6ca0 100644
--- a/test/diagonal.jl
+++ b/test/diagonal.jl
@@ -49,7 +49,9 @@ diagspacelist = ((ℂ^4)', ℂ[Z2Irrep](0 => 2, 1 => 3),
             @test norm(zerovector!(t)) == 0
             @test norm(one!(t)) ≈ sqrt(dim(V))
             @test one!(t) == id(V)
-            @test norm(one!(t) - id(V)) == 0
+            if T != BigFloat # seems broken for now
+                @test norm(one!(t) - id(V)) == 0
+            end
 
             t1 = DiagonalTensorMap(rand(T, reduceddim(V)), V)
             t2 = DiagonalTensorMap(rand(T, reduceddim(V)), V)
@@ -183,58 +185,6 @@ diagspacelist = ((ℂ^4)', ℂ[Z2Irrep](0 => 2, 1 => 3),
         @planar E2[-1 -2 -3; -4 -5] = B[-1 -2 1; -4 -5] * t'[-3; 1]
         @test E1 ≈ E2
     end
-    @timedtestset "Factorization" begin
-        for T in (Float32, ComplexF64)
-            t = DiagonalTensorMap(rand(T, reduceddim(V)), V)
-            @testset "eig" begin
-                D, W = @constinferred eig(t)
-                @test t * W ≈ W * D
-                t2 = t + t'
-                D2, V2 = @constinferred eigh(t2)
-                VdV2 = V2' * V2
-                @test VdV2 ≈ one(VdV2)
-                @test t2 * V2 ≈ V2 * D2
-
-                @test rank(D) ≈ rank(t)
-                @test cond(D) ≈ cond(t)
-                @test all(((s, t),) -> isapprox(s, t),
-                          zip(values(LinearAlgebra.eigvals(D)),
-                              values(LinearAlgebra.eigvals(t))))
-            end
-            @testset "leftorth with $alg" for alg in (TensorKit.QR(), TensorKit.QL())
-                Q, R = @constinferred leftorth(t; alg=alg)
-                QdQ = Q' * Q
-                @test QdQ ≈ one(QdQ)
-                @test Q * R ≈ t
-                if alg isa Polar
-                    @test isposdef(R)
-                end
-            end
-            @testset "rightorth with $alg" for alg in (TensorKit.RQ(), TensorKit.LQ())
-                L, Q = @constinferred rightorth(t; alg=alg)
-                QQd = Q * Q'
-                @test QQd ≈ one(QQd)
-                @test L * Q ≈ t
-                if alg isa Polar
-                    @test isposdef(L)
-                end
-            end
-            @testset "tsvd with $alg" for alg in (TensorKit.SVD(), TensorKit.SDD())
-                U, S, Vᴴ = @constinferred tsvd(t; alg=alg)
-                UdU = U' * U
-                @test UdU ≈ one(UdU)
-                VdV = Vᴴ * Vᴴ'
-                @test VdV ≈ one(VdV)
-                @test U * S * Vᴴ ≈ t
-
-                @test rank(S) ≈ rank(t)
-                @test cond(S) ≈ cond(t)
-                @test all(((s, t),) -> isapprox(s, t),
-                          zip(values(LinearAlgebra.svdvals(S)),
-                              values(LinearAlgebra.svdvals(t))))
-            end
-        end
-    end
     @timedtestset "Tensor functions" begin
         for T in (Float64, ComplexF64)
             d = DiagonalTensorMap(rand(T, reduceddim(V)), V)
diff --git a/test/factorizations.jl b/test/factorizations.jl
new file mode 100644
index 000000000..4022ff3e6
--- /dev/null
+++ b/test/factorizations.jl
@@ -0,0 +1,343 @@
+spacelist = try
+    if ENV["CI"] == "true"
+        println("Detected running on CI")
+        if Sys.iswindows()
+            (Vtr, Vℤ₃, VU₁, VfU₁, VCU₁, VSU₂)
+        elseif Sys.isapple()
+            (Vtr, Vℤ₃, VfU₁, VfSU₂)
+        else
+            (Vtr, VU₁, VCU₁, VSU₂, VfSU₂)
+        end
+    else
+        (Vtr, Vℤ₃, VU₁, VfU₁, VCU₁, VSU₂, VfSU₂)
+    end
+catch
+    (Vtr, Vℤ₃, VU₁, VfU₁, VCU₁, VSU₂, VfSU₂)
+end
+
+eltypes = (Float32, ComplexF64)
+
+for V in spacelist
+    I = sectortype(first(V))
+    Istr = TensorKit.type_repr(I)
+    println("---------------------------------------")
+    println("Factorizations with symmetry: $Istr")
+    println("---------------------------------------")
+    @timedtestset "Factorizations with symmetry: $Istr" verbose = true begin
+        V1, V2, V3, V4, V5 = V
+        W = V1 ⊗ V2
+
+        @testset "QR decomposition" begin
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)', rand(T, W, V1), rand(T, V1, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                Q, R = @constinferred qr_full(t)
+                @test Q * R ≈ t
+                @test isunitary(Q)
+
+                Q, R = @constinferred qr_compact(t)
+                @test Q * R ≈ t
+                @test isisometry(Q)
+
+                Q, R = @constinferred left_orth(t; kind=:qr)
+                @test Q * R ≈ t
+                @test isisometry(Q)
+
+                N = @constinferred qr_null(t)
+                @test isisometry(N)
+                @test norm(N' * t) ≈ 0 atol = 100 * eps(norm(t))
+
+                N = @constinferred left_null(t; kind=:qr)
+                @test isisometry(N)
+                @test norm(N' * t) ≈ 0 atol = 100 * eps(norm(t))
+            end
+
+            # empty tensor
+            for T in eltypes
+                t = rand(T, V1 ⊗ V2, zero(V1))
+
+                Q, R = @constinferred qr_full(t)
+                @test Q * R ≈ t
+                @test isunitary(Q)
+                @test dim(R) == dim(t) == 0
+
+                Q, R = @constinferred qr_compact(t)
+                @test Q * R ≈ t
+                @test isisometry(Q)
+                @test dim(Q) == dim(R) == dim(t)
+
+                Q, R = @constinferred left_orth(t; kind=:qr)
+                @test Q * R ≈ t
+                @test isisometry(Q)
+                @test dim(Q) == dim(R) == dim(t)
+
+                N = @constinferred qr_null(t)
+                @test isunitary(N)
+                @test norm(N' * t) ≈ 0 atol = 100 * eps(norm(t))
+            end
+        end
+
+        @testset "LQ decomposition" begin
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)', rand(T, W, V1), rand(T, V1, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                L, Q = @constinferred lq_full(t)
+                @test L * Q ≈ t
+                @test isunitary(Q)
+
+                L, Q = @constinferred lq_compact(t)
+                @test L * Q ≈ t
+                @test isisometry(Q; side=:right)
+
+                L, Q = @constinferred right_orth(t; kind=:lq)
+                @test L * Q ≈ t
+                @test isisometry(Q; side=:right)
+
+                Nᴴ = @constinferred lq_null(t)
+                @test isisometry(Nᴴ; side=:right)
+                @test norm(t * Nᴴ') ≈ 0 atol = 100 * eps(norm(t))
+            end
+
+            for T in eltypes
+                # empty tensor
+                t = rand(T, zero(V1), V1 ⊗ V2)
+
+                L, Q = @constinferred lq_full(t)
+                @test L * Q ≈ t
+                @test isunitary(Q)
+                @test dim(L) == dim(t) == 0
+
+                L, Q = @constinferred lq_compact(t)
+                @test L * Q ≈ t
+                @test isisometry(Q; side=:right)
+                @test dim(Q) == dim(L) == dim(t)
+
+                L, Q = @constinferred right_orth(t; kind=:lq)
+                @test L * Q ≈ t
+                @test isisometry(Q; side=:right)
+                @test dim(Q) == dim(L) == dim(t)
+
+                Nᴴ = @constinferred lq_null(t)
+                @test isunitary(Nᴴ)
+                @test norm(t * Nᴴ') ≈ 0 atol = 100 * eps(norm(t))
+            end
+        end
+
+        @testset "Polar decomposition" begin
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)', rand(T, W, V1), rand(T, V1, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                @assert domain(t) ≾ codomain(t)
+                w, p = @constinferred left_polar(t)
+                @test w * p ≈ t
+                @test isisometry(w)
+                @test isposdef(p)
+
+                w, p = @constinferred left_orth(t; kind=:polar)
+                @test w * p ≈ t
+                @test isisometry(w)
+            end
+
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)', rand(T, V1, W), rand(T, W, V1)')
+
+                @assert codomain(t) ≾ domain(t)
+                p, wᴴ = @constinferred right_polar(t)
+                @test p * wᴴ ≈ t
+                @test isisometry(wᴴ; side=:right)
+                @test isposdef(p)
+
+                p, wᴴ = @constinferred right_orth(t; kind=:polar)
+                @test p * wᴴ ≈ t
+                @test isisometry(wᴴ; side=:right)
+            end
+        end
+
+        @testset "SVD" begin
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)',
+                      rand(T, W, V1), rand(T, V1, W),
+                      rand(T, W, V1)', rand(T, V1, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                u, s, vᴴ = @constinferred svd_full(t)
+                @test u * s * vᴴ ≈ t
+                @test isunitary(u)
+                @test isunitary(vᴴ)
+
+                u, s, vᴴ = @constinferred svd_compact(t)
+                @test u * s * vᴴ ≈ t
+                @test isisometry(u)
+                @test isposdef(s)
+                @test isisometry(vᴴ; side=:right)
+
+                s′ = LinearAlgebra.diag(s)
+                for (c, b) in LinearAlgebra.svdvals(t)
+                    @test b ≈ s′[c]
+                end
+
+                v, c = @constinferred left_orth(t; kind=:svd)
+                @test v * c ≈ t
+                @test isisometry(v)
+
+                N = @constinferred left_null(t; kind=:svd)
+                @test isisometry(N)
+                @test norm(N' * t) ≈ 0 atol = 100 * eps(norm(t))
+
+                Nᴴ = @constinferred right_null(t; kind=:svd)
+                @test isisometry(Nᴴ; side=:right)
+                @test norm(t * Nᴴ') ≈ 0 atol = 100 * eps(norm(t))
+            end
+
+            # empty tensor
+            for T in eltypes, t in (rand(T, W, zero(V1)), rand(T, zero(V1), W))
+                U, S, Vᴴ = @constinferred svd_full(t)
+                @test U * S * Vᴴ ≈ t
+                @test isunitary(U)
+                @test isunitary(Vᴴ)
+
+                U, S, Vᴴ = @constinferred svd_compact(t)
+                @test U * S * Vᴴ ≈ t
+                @test dim(U) == dim(S) == dim(Vᴴ) == dim(t) == 0
+            end
+        end
+
+        @testset "truncated SVD" begin
+            for T in eltypes,
+                t in (randn(T, W, W), randn(T, W, W)',
+                      randn(T, W, V1), randn(T, V1, W),
+                      randn(T, W, V1)', randn(T, V1, W)',
+                      DiagonalTensorMap(randn(T, reduceddim(V1)), V1))
+
+                @constinferred normalize!(t)
+
+                U, S, Vᴴ = @constinferred svd_trunc(t; trunc=notrunc())
+                @test U * S * Vᴴ ≈ t
+                @test isisometry(U)
+                @test isisometry(Vᴴ; side=:right)
+
+                trunc = truncrank(dim(domain(S)) ÷ 2)
+                U1, S1, Vᴴ1 = @constinferred svd_trunc(t; trunc)
+                @test t * Vᴴ1' ≈ U1 * S1
+                @test isisometry(U1)
+                @test isisometry(Vᴴ1; side=:right)
+                @test dim(domain(S1)) <= trunc.howmany
+
+                λ = minimum(minimum, values(LinearAlgebra.diag(S1)))
+                trunc = trunctol(; atol=λ - 10eps(λ))
+                U2, S2, Vᴴ2 = @constinferred svd_trunc(t; trunc)
+                @test t * Vᴴ2' ≈ U2 * S2
+                @test isisometry(U2)
+                @test isisometry(Vᴴ2; side=:right)
+                @test minimum(minimum, values(LinearAlgebra.diag(S1))) >= λ
+                @test U2 ≈ U1
+                @test S2 ≈ S1
+                @test Vᴴ2 ≈ Vᴴ1
+
+                trunc = truncspace(space(S2, 1))
+                U3, S3, Vᴴ3 = @constinferred svd_trunc(t; trunc)
+                @test t * Vᴴ3' ≈ U3 * S3
+                @test isisometry(U3)
+                @test isisometry(Vᴴ3; side=:right)
+                @test space(S3, 1) ≾ space(S2, 1)
+
+                trunc = truncerror(; atol=0.5)
+                U4, S4, Vᴴ4 = @constinferred svd_trunc(t; trunc)
+                @test t * Vᴴ4' ≈ U4 * S4
+                @test isisometry(U4)
+                @test isisometry(Vᴴ4; side=:right)
+                @test norm(t - U4 * S4 * Vᴴ4) <= 0.5
+            end
+        end
+
+        @testset "Eigenvalue decomposition" begin
+            for T in eltypes,
+                t in (rand(T, V1, V1), rand(T, W, W), rand(T, W, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                d, v = @constinferred eig_full(t)
+                @test t * v ≈ v * d
+
+                d′ = LinearAlgebra.diag(d)
+                for (c, b) in LinearAlgebra.eigvals(t)
+                    @test sort(b; by=abs) ≈ sort(d′[c]; by=abs)
+                end
+
+                vdv = v' * v
+                vdv = (vdv + vdv') / 2
+                @test @constinferred isposdef(vdv)
+                t isa DiagonalTensorMap || @test !isposdef(t) # unlikely for non-hermitian map
+
+                d, v = @constinferred eig_trunc(t; trunc=truncrank(dim(domain(t)) ÷ 2))
+                @test t * v ≈ v * d
+                @test dim(domain(d)) ≤ dim(domain(t)) ÷ 2
+
+                t2 = (t + t')
+                D, V = eigen(t2)
+                @test isisometry(V)
+                D̃, Ṽ = @constinferred eigh_full(t2)
+                @test D ≈ D̃
+                @test V ≈ Ṽ
+                λ = minimum(minimum(real(LinearAlgebra.diag(b)))
+                            for (c, b) in blocks(D))
+                @test cond(Ṽ) ≈ one(real(T))
+                @test isposdef(t2) == isposdef(λ)
+                @test isposdef(t2 - λ * one(t2) + 0.1 * one(t2))
+                @test !isposdef(t2 - λ * one(t2) - 0.1 * one(t2))
+
+                add!(t, t')
+
+                d, v = @constinferred eigh_full(t)
+                @test t * v ≈ v * d
+                @test isunitary(v)
+
+                λ = minimum(minimum(real(LinearAlgebra.diag(b))) for (c, b) in blocks(d))
+                @test cond(v) ≈ one(real(T))
+                @test isposdef(t) == isposdef(λ)
+                @test isposdef(t - λ * one(t) + 0.1 * one(t))
+                @test !isposdef(t - λ * one(t) - 0.1 * one(t))
+
+                d, v = @constinferred eigh_trunc(t; trunc=truncrank(dim(domain(t)) ÷ 2))
+                @test t * v ≈ v * d
+                @test dim(domain(d)) ≤ dim(domain(t)) ÷ 2
+            end
+        end
+
+        @testset "Condition number and rank" begin
+            for T in eltypes,
+                t in (rand(T, W, W), rand(T, W, W)',
+                      rand(T, W, V1), rand(T, V1, W),
+                      rand(T, W, V1)', rand(T, V1, W)',
+                      DiagonalTensorMap(rand(T, reduceddim(V1)), V1))
+
+                d1, d2 = dim(codomain(t)), dim(domain(t))
+                @test rank(t) == min(d1, d2)
+                M = left_null(t)
+                @test @constinferred(rank(M)) + rank(t) == d1
+                Mᴴ = right_null(t)
+                @test rank(Mᴴ) + rank(t) == d2
+            end
+            for T in eltypes
+                u = unitary(T, V1 ⊗ V2, V1 ⊗ V2)
+                @test @constinferred(cond(u)) ≈ one(real(T))
+                @test @constinferred(rank(u)) == dim(V1 ⊗ V2)
+
+                t = rand(T, zero(V1), W)
+                @test rank(t) == 0
+                t2 = rand(T, zero(V1) * zero(V2), zero(V1) * zero(V2))
+                @test rank(t2) == 0
+                @test cond(t2) == 0.0
+            end
+            for T in eltypes, t in (rand(T, W, W), rand(T, W, W)')
+                add!(t, t')
+                vals = @constinferred LinearAlgebra.eigvals(t)
+                λmax = maximum(s -> maximum(abs, s), values(vals))
+                λmin = minimum(s -> minimum(abs, s), values(vals))
+                @test cond(t) ≈ λmax / λmin
+            end
+        end
+    end
+end
diff --git a/test/runtests.jl b/test/runtests.jl
index 9fafa1d9f..f9829c237 100644
--- a/test/runtests.jl
+++ b/test/runtests.jl
@@ -59,11 +59,7 @@ sectorlist = (Z2Irrep, Z3Irrep, Z4Irrep, Z3Irrep ⊠ Z4Irrep,
               Z2Irrep ⊠ FibonacciAnyon ⊠ FibonacciAnyon)
 
 # spaces
-Vtr = (ℂ^3,
-       (ℂ^4)',
-       ℂ^5,
-       ℂ^6,
-       (ℂ^7)')
+Vtr = (ℂ^2, (ℂ^3)', ℂ^4, ℂ^3, (ℂ^2)')
 Vℤ₂ = (ℂ[Z2Irrep](0 => 1, 1 => 1),
        ℂ[Z2Irrep](0 => 1, 1 => 2)',
        ℂ[Z2Irrep](0 => 3, 1 => 2)',
@@ -71,12 +67,12 @@ Vℤ₂ = (ℂ[Z2Irrep](0 => 1, 1 => 1),
        ℂ[Z2Irrep](0 => 2, 1 => 5))
 Vfℤ₂ = (ℂ[FermionParity](0 => 1, 1 => 1),
         ℂ[FermionParity](0 => 1, 1 => 2)',
-        ℂ[FermionParity](0 => 3, 1 => 2)',
+        ℂ[FermionParity](0 => 2, 1 => 1)',
         ℂ[FermionParity](0 => 2, 1 => 3),
         ℂ[FermionParity](0 => 2, 1 => 5))
-Vℤ₃ = (ℂ[Z3Irrep](0 => 1, 1 => 2, 2 => 2),
-       ℂ[Z3Irrep](0 => 3, 1 => 1, 2 => 1),
-       ℂ[Z3Irrep](0 => 2, 1 => 2, 2 => 1)',
+Vℤ₃ = (ℂ[Z3Irrep](0 => 1, 1 => 2, 2 => 1),
+       ℂ[Z3Irrep](0 => 2, 1 => 1, 2 => 1),
+       ℂ[Z3Irrep](0 => 1, 1 => 2, 2 => 1)',
        ℂ[Z3Irrep](0 => 1, 1 => 2, 2 => 3),
        ℂ[Z3Irrep](0 => 1, 1 => 3, 2 => 3)')
 VU₁ = (ℂ[U1Irrep](0 => 1, 1 => 2, -1 => 2),
@@ -110,24 +106,24 @@ VSU₂U₁ = (Vect[SU2Irrep ⊠ U1Irrep]((0, 0) => 1, (1 // 2, -1) => 1),
           Vect[SU2Irrep ⊠ U1Irrep]((1 // 2, 1) => 1, (1, -2) => 1)',
           Vect[SU2Irrep ⊠ U1Irrep]((0, 0) => 2, (0, 2) => 1, (1 // 2, 1) => 1),
           Vect[SU2Irrep ⊠ U1Irrep]((0, 0) => 1, (1 // 2, 1) => 1)')
-# VSU₃ = (ℂ[SU3Irrep]((0, 0, 0) => 3, (1, 0, 0) => 1),
-#     ℂ[SU3Irrep]((0, 0, 0) => 3, (2, 0, 0) => 1)',
-#     ℂ[SU3Irrep]((1, 1, 0) => 1, (2, 1, 0) => 1),
-#     ℂ[SU3Irrep]((1, 0, 0) => 1, (2, 0, 0) => 1),
-#     ℂ[SU3Irrep]((0, 0, 0) => 1, (1, 0, 0) => 1, (1, 1, 0) => 1)')
+Vfib = (Vect[FibonacciAnyon](:I => 1, :τ => 1),
+        Vect[FibonacciAnyon](:I => 1, :τ => 2)',
+        Vect[FibonacciAnyon](:I => 3, :τ => 2)',
+        Vect[FibonacciAnyon](:I => 2, :τ => 3),
+        Vect[FibonacciAnyon](:I => 2, :τ => 2))
 
 if !is_buildkite
     Ti = time()
-    include("fusiontrees.jl")
-    include("spaces.jl")
-    include("tensors.jl")
-    include("diagonal.jl")
-    include("planar.jl")
-    # TODO: remove once we know AD is slow on macOS CI
+    @time include("fusiontrees.jl")
+    @time include("spaces.jl")
+    @time include("tensors.jl")
+    @time include("factorizations.jl")
+    @time include("diagonal.jl")
+    @time include("planar.jl")
     if !(Sys.isapple() && get(ENV, "CI", "false") == "true") && isempty(VERSION.prerelease)
-        include("ad.jl")
+        @time include("ad.jl")
     end
-    include("bugfixes.jl")
+    @time include("bugfixes.jl")
     Tf = time()
     printstyled("Finished all tests in ",
                 string(round((Tf - Ti) / 60; sigdigits=3)),
diff --git a/test/tensors.jl b/test/tensors.jl
index 30526f2c1..f60de0d1b 100644
--- a/test/tensors.jl
+++ b/test/tensors.jl
@@ -1,9 +1,3 @@
-for V in (Vtr, Vℤ₂, Vfℤ₂, Vℤ₃, VU₁, VfU₁, VCU₁, VSU₂, VfSU₂, VSU₂U₁)#, VSU₃)
-    V1, V2, V3, V4, V5 = V
-    @assert V3 * V4 * V2 ≿ V1' * V5' # necessary for leftorth tests
-    @assert V3 * V4 ≾ V1' * V2' * V5' # necessary for rightorth tests
-end
-
 spacelist = try
     if ENV["CI"] == "true"
         println("Detected running on CI")
@@ -369,9 +363,8 @@ for V in spacelist
             for T in (Float64, ComplexF64)
                 t1 = randisometry(T, W1, W2)
                 t2 = randisometry(T, W2 ← W2)
-                @test t1' * t1 ≈ one(t2)
-                @test t2' * t2 ≈ one(t2)
-                @test t2 * t2' ≈ one(t2)
+                @test isisometry(t1)
+                @test isunitary(t2)
                 P = t1 * t1'
                 @test P * P ≈ P
             end
@@ -439,204 +432,6 @@ for V in spacelist
             @test LinearAlgebra.isdiag(D)
             @test LinearAlgebra.diag(D) == d
         end
-        @timedtestset "Factorization" begin
-            W = V1 ⊗ V2 ⊗ V3 ⊗ V4 ⊗ V5
-            for T in (Float32, ComplexF64)
-                # Test both a normal tensor and an adjoint one.
-                ts = (rand(T, W), rand(T, W)')
-                for t in ts
-                    @testset "leftorth with $alg" for alg in
-                                                      (TensorKit.QR(), TensorKit.QRpos(),
-                                                       TensorKit.QL(), TensorKit.QLpos(),
-                                                       TensorKit.Polar(), TensorKit.SVD(),
-                                                       TensorKit.SDD())
-                        Q, R = @constinferred leftorth(t, ((3, 4, 2), (1, 5)); alg=alg)
-                        QdQ = Q' * Q
-                        @test QdQ ≈ one(QdQ)
-                        @test Q * R ≈ permute(t, ((3, 4, 2), (1, 5)))
-                        if alg isa Polar
-                            @test isposdef(R)
-                            @test domain(R) == codomain(R) == space(t, 1)' ⊗ space(t, 5)'
-                        end
-                    end
-                    @testset "leftnull with $alg" for alg in
-                                                      (TensorKit.QR(), TensorKit.SVD(),
-                                                       TensorKit.SDD())
-                        N = @constinferred leftnull(t, ((3, 4, 2), (1, 5)); alg=alg)
-                        NdN = N' * N
-                        @test NdN ≈ one(NdN)
-                        @test norm(N' * permute(t, ((3, 4, 2), (1, 5)))) <
-                              100 * eps(norm(t))
-                    end
-                    @testset "rightorth with $alg" for alg in
-                                                       (TensorKit.RQ(), TensorKit.RQpos(),
-                                                        TensorKit.LQ(), TensorKit.LQpos(),
-                                                        TensorKit.Polar(), TensorKit.SVD(),
-                                                        TensorKit.SDD())
-                        L, Q = @constinferred rightorth(t, ((3, 4), (2, 1, 5)); alg=alg)
-                        QQd = Q * Q'
-                        @test QQd ≈ one(QQd)
-                        @test L * Q ≈ permute(t, ((3, 4), (2, 1, 5)))
-                        if alg isa Polar
-                            @test isposdef(L)
-                            @test domain(L) == codomain(L) == space(t, 3) ⊗ space(t, 4)
-                        end
-                    end
-                    @testset "rightnull with $alg" for alg in
-                                                       (TensorKit.LQ(), TensorKit.SVD(),
-                                                        TensorKit.SDD())
-                        M = @constinferred rightnull(t, ((3, 4), (2, 1, 5)); alg=alg)
-                        MMd = M * M'
-                        @test MMd ≈ one(MMd)
-                        @test norm(permute(t, ((3, 4), (2, 1, 5))) * M') <
-                              100 * eps(norm(t))
-                    end
-                    @testset "tsvd with $alg" for alg in (TensorKit.SVD(), TensorKit.SDD())
-                        U, S, V = @constinferred tsvd(t, ((3, 4, 2), (1, 5)); alg=alg)
-                        UdU = U' * U
-                        @test UdU ≈ one(UdU)
-                        VVd = V * V'
-                        @test VVd ≈ one(VVd)
-                        t2 = permute(t, ((3, 4, 2), (1, 5)))
-                        @test U * S * V ≈ t2
-
-                        s = LinearAlgebra.svdvals(t2)
-                        s′ = LinearAlgebra.diag(S)
-                        for (c, b) in s
-                            @test b ≈ s′[c]
-                        end
-                    end
-                    @testset "cond and rank" begin
-                        t2 = permute(t, ((3, 4, 2), (1, 5)))
-                        d1 = dim(codomain(t2))
-                        d2 = dim(domain(t2))
-                        @test rank(t2) == min(d1, d2)
-                        M = leftnull(t2)
-                        @test rank(M) == max(d1, d2) - min(d1, d2)
-                        t3 = unitary(T, V1 ⊗ V2, V1 ⊗ V2)
-                        @test cond(t3) ≈ one(real(T))
-                        @test rank(t3) == dim(V1 ⊗ V2)
-                        t4 = randn(T, V1 ⊗ V2, V1 ⊗ V2)
-                        t4 = (t4 + t4') / 2
-                        vals = LinearAlgebra.eigvals(t4)
-                        λmax = maximum(s -> maximum(abs, s), values(vals))
-                        λmin = minimum(s -> minimum(abs, s), values(vals))
-                        @test cond(t4) ≈ λmax / λmin
-                    end
-                end
-                @testset "empty tensor" begin
-                    t = randn(T, V1 ⊗ V2, zero(V1))
-                    @testset "leftorth with $alg" for alg in
-                                                      (TensorKit.QR(), TensorKit.QRpos(),
-                                                       TensorKit.QL(), TensorKit.QLpos(),
-                                                       TensorKit.Polar(), TensorKit.SVD(),
-                                                       TensorKit.SDD())
-                        Q, R = @constinferred leftorth(t; alg=alg)
-                        @test Q == t
-                        @test dim(Q) == dim(R) == 0
-                    end
-                    @testset "leftnull with $alg" for alg in
-                                                      (TensorKit.QR(), TensorKit.SVD(),
-                                                       TensorKit.SDD())
-                        N = @constinferred leftnull(t; alg=alg)
-                        @test N' * N ≈ id(domain(N))
-                        @test N * N' ≈ id(codomain(N))
-                    end
-                    @testset "rightorth with $alg" for alg in
-                                                       (TensorKit.RQ(), TensorKit.RQpos(),
-                                                        TensorKit.LQ(), TensorKit.LQpos(),
-                                                        TensorKit.Polar(), TensorKit.SVD(),
-                                                        TensorKit.SDD())
-                        L, Q = @constinferred rightorth(copy(t'); alg=alg)
-                        @test Q == t'
-                        @test dim(Q) == dim(L) == 0
-                    end
-                    @testset "rightnull with $alg" for alg in
-                                                       (TensorKit.LQ(), TensorKit.SVD(),
-                                                        TensorKit.SDD())
-                        M = @constinferred rightnull(copy(t'); alg=alg)
-                        @test M * M' ≈ id(codomain(M))
-                        @test M' * M ≈ id(domain(M))
-                    end
-                    @testset "tsvd with $alg" for alg in (TensorKit.SVD(), TensorKit.SDD())
-                        U, S, V = @constinferred tsvd(t; alg=alg)
-                        @test U == t
-                        @test dim(U) == dim(S) == dim(V)
-                    end
-                    @testset "cond and rank" begin
-                        @test rank(t) == 0
-                        W2 = zero(V1) * zero(V2)
-                        t2 = rand(W2, W2)
-                        @test rank(t2) == 0
-                        @test cond(t2) == 0.0
-                    end
-                end
-                t = rand(T, V1 ⊗ V1' ⊗ V2 ⊗ V2')
-                @testset "eig and isposdef" begin
-                    D, V = eigen(t, ((1, 3), (2, 4)))
-                    t2 = permute(t, ((1, 3), (2, 4)))
-                    @test t2 * V ≈ V * D
-
-                    d = LinearAlgebra.eigvals(t2; sortby=nothing)
-                    d′ = LinearAlgebra.diag(D)
-                    for (c, b) in d
-                        @test b ≈ d′[c]
-                    end
-
-                    # Somehow moving these test before the previous one gives rise to errors
-                    # with T=Float32 on x86 platforms. Is this an OpenBLAS issue? 
-                    VdV = V' * V
-                    VdV = (VdV + VdV') / 2
-                    @test isposdef(VdV)
-
-                    @test !isposdef(t2) # unlikely for non-hermitian map
-                    t2 = (t2 + t2')
-                    D, V = eigen(t2)
-                    VdV = V' * V
-                    @test VdV ≈ one(VdV)
-                    D̃, Ṽ = @constinferred eigh(t2)
-                    @test D ≈ D̃
-                    @test V ≈ Ṽ
-                    λ = minimum(minimum(real(LinearAlgebra.diag(b)))
-                                for (c, b) in blocks(D))
-                    @test cond(Ṽ) ≈ one(real(T))
-                    @test isposdef(t2) == isposdef(λ)
-                    @test isposdef(t2 - λ * one(t2) + 0.1 * one(t2))
-                    @test !isposdef(t2 - λ * one(t2) - 0.1 * one(t2))
-                end
-            end
-        end
-        @timedtestset "Tensor truncation" begin
-            for T in (Float32, ComplexF64)
-                for p in (1, 2, 3, Inf)
-                    # Test both a normal tensor and an adjoint one.
-                    ts = (randn(T, V1 ⊗ V2 ⊗ V3, V4 ⊗ V5),
-                          randn(T, V4 ⊗ V5, V1 ⊗ V2 ⊗ V3)')
-                    for t in ts
-                        U₀, S₀, V₀, = tsvd(t)
-                        t = rmul!(t, 1 / norm(S₀, p))
-                        U, S, V, ϵ = @constinferred tsvd(t; trunc=truncerr(5e-1), p=p)
-                        # @show p, ϵ
-                        # @show domain(S)
-                        # @test min(space(S,1), space(S₀,1)) != space(S₀,1)
-                        U′, S′, V′, ϵ′ = tsvd(t; trunc=truncerr(nextfloat(ϵ)), p=p)
-                        @test (U, S, V, ϵ) == (U′, S′, V′, ϵ′)
-                        U′, S′, V′, ϵ′ = tsvd(t; trunc=truncdim(ceil(Int, dim(domain(S)))),
-                                              p=p)
-                        @test (U, S, V, ϵ) == (U′, S′, V′, ϵ′)
-                        U′, S′, V′, ϵ′ = tsvd(t; trunc=truncspace(space(S, 1)), p=p)
-                        @test (U, S, V, ϵ) == (U′, S′, V′, ϵ′)
-                        # results with truncationcutoff cannot be compared because they don't take degeneracy into account, and thus truncate differently
-                        U, S, V, ϵ = tsvd(t; trunc=truncbelow(1 / dim(domain(S₀))), p=p)
-                        # @show p, ϵ
-                        # @show domain(S)
-                        # @test min(space(S,1), space(S₀,1)) != space(S₀,1)
-                        U′, S′, V′, ϵ′ = tsvd(t; trunc=truncspace(space(S, 1)), p=p)
-                        @test (U, S, V, ϵ) == (U′, S′, V′, ϵ′)
-                    end
-                end
-            end
-        end
         if BraidingStyle(I) isa Bosonic && hasfusiontensor(I)
             @timedtestset "Tensor functions" begin
                 W = V1 ⊗ V2
@@ -691,8 +486,8 @@ for V in spacelist
             for T in (Float32, ComplexF64)
                 tA = rand(T, V1 ⊗ V3, V1 ⊗ V3)
                 tB = rand(T, V2 ⊗ V4, V2 ⊗ V4)
-                tA = 3 // 2 * leftorth(tA; alg=Polar())[1]
-                tB = 1 // 5 * leftorth(tB; alg=Polar())[1]
+                tA = 3 // 2 * left_polar(tA)[1]
+                tB = 1 // 5 * left_polar(tB)[1]
                 tC = rand(T, V1 ⊗ V3, V2 ⊗ V4)
                 t = @constinferred sylvester(tA, tB, tC)
                 @test codomain(t) == V1 ⊗ V3