The source files for all examples can be found in /examples.

Signal Decomposition

This example uses the GenericSolver to solve a signal decomposition problem with custom proximal operators. The goal is to decompose an observed signal into a sum of several components.

using GeNIOS
using Random, LinearAlgebra, SparseArrays
using Plots
using ProximalOperators: TotalVariation1D, prox!
using BandedMatrices
using LinearMaps

Generating the problem data

Random.seed!(1)
T, K = 200, 3
t = range(0, 1000, T)

# component 2: sine wave
s2 = @. sin(2π * t * 1/500)

# component 3: square wave
square(x) = x % 2π < π ? 1 : -1
s3 = @. square(2π  * t * 1/450)

# component 1: noise
s1 = 0.1 * randn(T)

# observed signal
X = hcat(s1, s2, s3)
y = sum(X, dims=2) |> vec

sig_plt = plot(
    t,
    y,
    lw=1,
    label="observed signal",
    xlabel="time",
    ylabel="signal",
    legend=:topright,
    dpi=300,
    marker=:circle,
    ls=:dash,
    color=:royalblue
)
plot!(sig_plt,
    t,
    sum(X[:, 2:end], dims=2) |> vec,
    label="true signal",
    lw=3,
    color=:royalblue
)
[Figure: observed signal and underlying true signal]

Defining the problem

We will separate the observed signal $y$ into a sum of $K=3$ components $x^k$. The first is mean-square small (noise). The second is second-order smooth (it has a smooth derivative). The third has sparse first differences (it is piecewise constant). This problem can be phrased as

\[\begin{array}{ll} \text{minimize} & (1/T)\|y - x^2 - x^3\|_2^2 + \gamma_2 \phi_2(x^2) + \gamma_3 \phi_3(x^3), \end{array}\]

where

\[\phi_2(x) = \frac{1}{T-2}\sum_{t=2}^{T-1} (x_{t+1} - 2x_t + x_{t-1})^2\]

and

\[\phi_3(x) = \frac{1}{T-1}\sum_{t=1}^{T-1} \lvert x_{t+1} - x_t \rvert.\]

We will solve this problem using the generic solver interface, with the first term as $f(x)$ and the second and third terms as $g(z)$. Specifically, this problem can be rephrased as

\[\begin{array}{ll} \text{minimize} & (1/T)\|x^1\|_2^2 + I_{\{0\}}(z^1) + \gamma_2 \phi_2(z^2) + \gamma_3 \phi_3(z^3) \\ \text{subject to} & x^1 + x^2 + x^3 - z^1 = y \\ & x^2 - z^2 = 0 \\ & x^3 - z^3 = 0, \end{array}\]

where $I_{\{0\}}(z^1)$ is the indicator function of the zero vector. Note that the proximal operator of $g$ is separable across the three blocks, so its evaluation can be parallelized.

First we define $f(x)$, which is just a quadratic.

params = (; T=T)

f(x, p) = sum(abs2, x[1:p.T]) / p.T

function grad_f!(g, x, p)
    @. g[1:p.T] = 2/p.T * x[1:p.T]
    g[p.T+1:end] .= zero(eltype(x))
    return nothing
end
grad_f! (generic function with 1 method)

The HessianOperator here is block diagonal: a $T \times T$ block equal to $(2/T)I$, followed by two $T \times T$ zero blocks.

struct HessianSignal <: HessianOperator end
function LinearAlgebra.mul!(y, ::HessianSignal, x)
    T = length(x) ÷ 3
    @. y[1:T] = 2/T * x[1:T]
    y[T+1:end] .= zero(eltype(x))
    return nothing
end
update!(::HessianSignal, ::Solver) = nothing
Hf = HessianSignal()
Main.HessianSignal()
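
Since $f$ is quadratic, its gradient is linear, so grad_f! and the HessianOperator should agree when applied to the same point. A quick illustrative consistency check (xtest, gtest, and htest are scratch names used only for this sketch):

# Illustrative check: for a quadratic f, ∇f(x) = Hf * x everywhere.
xtest = randn(3T)
gtest, htest = similar(xtest), similar(xtest)
grad_f!(gtest, xtest, params)
mul!(htest, Hf, xtest)
@assert gtest ≈ htest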

A custom proximal operator

Now, we define $g$ and its proximal operator. Here, we take advantage of parallelization, since the proximal operator is separable across the three components. Further performance improvements are possible for these proximal operators, but we omit them for simplicity.

We use ProximalOperators.jl to help construct the proximal operator.

function g(z, p)
    @views z1, z2, z3 = z[1:p.T], z[p.T+1:2p.T], z[2p.T+1:end]
    any(.!iszero.(z1)) && return Inf

    gz2 = sum(t->(z2[t+1] - 2z2[t] + z2[t-1])^2, 2:p.T-1)
    gz3 = sum(abs, diff(z3)) / (p.T-1)
    return gz2 + gz3
end

# the prox operator for g, using ProximalOperators.jl
function prox_g!(v, z, ρ, p)
    @views z1, z2, z3 = z[1:p.T], z[p.T+1:2p.T], z[2p.T+1:end]
    @views v1, v2, v3 = v[1:p.T], v[p.T+1:2p.T], v[2p.T+1:end]

    Threads.@threads for k in 1:3
        if k == 1
            # Prox for z1
            v1 .= zero(eltype(z))
        elseif k == 2
            # Prox for z2
            # g²(z²) = γ₂/T * ||Az²||²
            du = vcat(zeros(1), ones(p.T-2))
            d = vcat(zeros(1), -2*ones(p.T-2), zeros(1))
            dl = vcat(ones(p.T-2), zeros(1))

            # Use banded matrix for O(T) solve time
            A = BandedMatrix(-1 => dl, 0 => d, 1 => du)
            F = cholesky(I + 1e3/(ρ * p.T) * A'*A)
            ldiv!(v2, F, z2)
        else
            # Prox for z3
            ϕ³ = TotalVariation1D(1/p.T)
            prox!(v3, ϕ³, z3, 1/ρ)
        end
    end

    return nothing
end
prox_g! (generic function with 1 method)
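
For reference, the banded linear solve for $z^2$ above follows from the optimality condition of the proximal subproblem. Assuming prox_g! returns the minimizer of $g(w) + (\rho/2)\|w - z\|_2^2$ (consistent with the prox! call above, which passes a step size of $1/\rho$), setting the gradient of $\frac{\gamma_2}{T}\|Aw\|_2^2 + \frac{\rho}{2}\|w - z^2\|_2^2$ to zero gives

\[\left(I + \frac{2\gamma_2}{\rho T} A^T A\right) v^2 = z^2,\]

so the constant 1e3/(ρ * p.T) in the code plays the role of $2\gamma_2/(\rho T)$. Since $A$ is tridiagonal, the system matrix is banded, which is why the factorization and solve take $O(T)$ time.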

The constraints

Note that $M$ is a highly structured matrix. We use LinearMaps.jl to exploit this structure rather than forming $M$ explicitly.

_0 = LinearMap(spzeros(T, T))
M = [
    I   I   I;
    _0  I   _0;
    _0  _0  I
]
c = vcat(y, zeros(T), zeros(T));
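
As a quick illustrative check, applying $M$ to a stacked vector $x = (x^1, x^2, x^3)$ should return $(x^1 + x^2 + x^3,\ x^2,\ x^3)$; the scratch names below (xtest, x1t, x2t, x3t) are used only for this sketch:

# Scratch check: the block LinearMap acts like [I I I; 0 I 0; 0 0 I].
xtest = randn(3T)
x1t, x2t, x3t = xtest[1:T], xtest[T+1:2T], xtest[2T+1:end]
@assert M * xtest ≈ vcat(x1t + x2t + x3t, x2t, x3t)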

Solving the problem

solver = GeNIOS.GenericSolver(
    f, grad_f!, Hf,         # f(x)
    g, prox_g!,             # g(z)
    M, c;                   # M, c: Mx + z = c
    params=params
)
res = solve!(solver, options=GeNIOS.SolverOptions(eps_abs=1e-5, print_iter=100))

x1 = solver.xk[1:T]
x2 = solver.xk[T+1:2T]
x3 = solver.xk[2T+1:end];
Starting setup...
Setup in  0.299s

──────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
    Iteration        Obj Val       r_primal         r_dual              ρ           Time
──────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
            0      0.000e+00            Inf            Inf      1.000e+00         0.000
            1      0.000e+00      2.146e+01      3.716e+01      1.000e+00         1.936
          100      1.034e+02      5.062e-04      8.941e-03      5.000e-01         2.271
          200      1.070e+02      4.418e-04      1.876e-03      1.250e-01         2.449
          300      1.078e+02      3.830e-04      1.075e-03      1.250e-01         2.617
          400      1.072e+02      1.604e-04      6.493e-04      1.250e-01         2.776
          500      1.079e+02      1.081e-04      4.436e-04      1.250e-01         2.940
          585      1.088e+02      8.961e-05      2.570e-04      1.250e-01         3.092

SOLVED in  3.092s, 585 iterations
Total time:  3.392s
──────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────
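
As an optional sanity check, the indicator forces $z^1 \approx 0$ at the solution, so the recovered components should sum to the observed signal up to the primal feasibility tolerance:

# With z¹ ≈ 0 enforced by the indicator, the components should sum to y
# up to the solver's primal tolerance.
@show norm(x1 + x2 + x3 - y)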

Plotting the results

res_plt = plot(
    t,
    y,
    lw=1,
    label="observed signal",
    xlabel="time",
    ylabel="signal",
    legend=:topright,
    dpi=300,
    marker=:circle,
    ls=:dash
)
plot!(res_plt,
    t,
    sum(X[:, 2:end], dims=2) |> vec,
    label="true signal",
    lw=3,
    color=:blue
)
plot!(res_plt,
    t,
    x2 + x3,
    label="reconstructed signal",
    lw=3,
    color=:coral1
)
[Figure: observed, true, and reconstructed signals]

Visualizing each component

p1 = plot(
    t,
    X[:, 1],
    lw=1,
    label="x1 true",
    xlabel="time",
    ylabel="signal",
    legend=:topright,
    dpi=300,
    marker=:circle,
    ls=:dash,
    color=:royalblue
)
plot!(p1,
    t,
    x1,
    label="x1 estimated",
    lw=3,
    color=:coral1
)

p2 = plot(
    t,
    X[:, 2],
    lw=3,
    label="x2 true",
    xlabel="time",
    ylabel="signal",
    legend=:topright,
    dpi=300,
    ls=:dash,
    color=:royalblue
)
plot!(p2,
    t,
    x2,
    label="x2 estimated",
    lw=3,
    color=:coral1
)

p3 = plot(
    t,
    X[:, 3],
    lw=3,
    label="x3 true",
    xlabel="time",
    ylabel="signal",
    legend=:topright,
    dpi=300,
    ls=:dash,
    color=:royalblue
)
plot!(p3,
    t,
    x3,
    label="x3 estimated",
    lw=3,
    color=:coral1
)
decomp_plt = plot(p1, p2, p3, layout=(3,1))
[Figure: true and estimated components $x^1$, $x^2$, $x^3$]

This page was generated using Literate.jl.