Thu, 23 Jan 2025 23:34:05 +0100
Merging adjustments, parameter tuning, etc.
32 | 1 | /*! |
2 | Solver for the point source localisation problem using a sliding | |
3 | forward-backward splitting method. | |
4 | */ | |
5 | ||
6 | use numeric_literals::replace_float_literals; | |
7 | use serde::{Serialize, Deserialize}; | |
8 | //use colored::Colorize; | |
9 | //use nalgebra::{DVector, DMatrix}; | |
10 | use itertools::izip; | |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
11 | use std::iter::Iterator; |
32 | 12 | |
35 | 13 | use alg_tools::iterate::AlgIteratorFactory; |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
14 | use alg_tools::euclidean::Euclidean; |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
15 | use alg_tools::mapping::{Mapping, DifferentiableRealMapping, Instance}; |
35 | 16 | use alg_tools::norms::Norm; |
32 | 17 | use alg_tools::nalgebra_support::ToNalgebraRealField; |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
18 | use alg_tools::norms::L2; |
32 | 19 | |
20 | use crate::types::*; | |
35 | 21 | use crate::measures::{DiscreteMeasure, Radon, RNDM}; |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
22 | use crate::measures::merging::SpikeMerging; |
35 | 23 | use crate::forward_model::{ |
24 | ForwardModel, | |
25 | AdjointProductBoundedBy, | |
26 | LipschitzValues, | |
27 | }; | |
32 | 28 | //use crate::tolerance::Tolerance; |
29 | use crate::plot::{ | |
30 | SeqPlotter, | |
31 | Plotting, | |
32 | PlotLookup | |
33 | }; | |
34 | use crate::fb::*; | |
35 | use crate::regularisation::SlidingRegTerm; | |
36 | use crate::dataterm::{ | |
37 | L2Squared, | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
38 | DataTerm, |
32 | 39 | calculate_residual, |
40 | calculate_residual2, | |
41 | }; | |
35 | 42 | //use crate::transport::TransportLipschitz; |
43 | ||
44 | /// Transport settings for [`pointsource_sliding_fb_reg`]. | |
45 | #[derive(Clone, Copy, Eq, PartialEq, Serialize, Deserialize, Debug)] | |
46 | #[serde(default)] | |
47 | pub struct TransportConfig<F : Float> { | |
48 | /// Transport step length $θ$ normalised to $(0, 1)$. | |
49 | pub θ0 : F, | |
50 | /// Factor in $(0, 1)$ for decreasing transport to adapt to tolerance. | |
51 | pub adaptation : F, | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
52 | /// A priori transport tolerance multiplier (C_pri) |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
53 | pub tolerance_mult_pri : F, |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
54 | /// A posteriori transport tolerance multiplier (C_pos) |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
55 | pub tolerance_mult_pos : F, |
35 | 56 | } |
57 | ||
58 | #[replace_float_literals(F::cast_from(literal))] | |
59 | impl <F : Float> TransportConfig<F> { | |
60 | /// Check that the parameters are ok. Panics if not. | |
61 | pub fn check(&self) { | |
62 | assert!(self.θ0 > 0.0); | |
63 | assert!(0.0 < self.adaptation && self.adaptation < 1.0); | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
64 | assert!(self.tolerance_mult_pri > 0.0); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
65 | assert!(self.tolerance_mult_pos > 0.0); |
35 | 66 | } |
67 | } | |
68 | ||
69 | #[replace_float_literals(F::cast_from(literal))] | |
70 | impl<F : Float> Default for TransportConfig<F> { | |
71 | fn default() -> Self { | |
72 | TransportConfig { | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
73 | θ0 : 0.4, |
35 | 74 | adaptation : 0.9, |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
75 | tolerance_mult_pos : 100.0, |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
76 | tolerance_mult_pri : 1000.0, |
35 | 77 | } |
78 | } | |
79 | } | |
32 | 80 | |
81 | /// Settings for [`pointsource_sliding_fb_reg`]. | |
82 | #[derive(Clone, Copy, Eq, PartialEq, Serialize, Deserialize, Debug)] | |
83 | #[serde(default)] | |
84 | pub struct SlidingFBConfig<F : Float> { | |
85 | /// Step length scaling | |
86 | pub τ0 : F, | |
35 | 87 | /// Transport parameters |
88 | pub transport : TransportConfig<F>, | |
32 | 89 | /// Generic parameters |
90 | pub insertion : FBGenericConfig<F>, | |
91 | } | |
92 | ||
93 | #[replace_float_literals(F::cast_from(literal))] | |
94 | impl<F : Float> Default for SlidingFBConfig<F> { | |
95 | fn default() -> Self { | |
96 | SlidingFBConfig { | |
97 | τ0 : 0.99, | |
35 | 98 | transport : Default::default(), |
32 | 99 | insertion : Default::default() |
100 | } | |
101 | } | |
102 | } | |
103 | ||
35 | 104 | /// Internal type of adaptive transport step length calculation |
105 | pub(crate) enum TransportStepLength<F : Float, G : Fn(F, F) -> F> { | |
106 | /// Fixed, known step length | |
107 | Fixed(F), | |
108 | /// Adaptive step length, only wrt. maximum transport. | |
109 | /// Content of `l` depends on use case, while `g` calculates the step length from `l`. | |
110 | AdaptiveMax{ l : F, max_transport : F, g : G }, | |
111 | /// Adaptive step length. | |
112 | /// Content of `l` depends on use case, while `g` calculates the step length from `l`. | |
113 | FullyAdaptive{ l : F, max_transport : F, g : G }, | |
114 | } | |
115 | ||
116 | /// Constrution and a priori transport adaptation. | |
32 | 117 | #[replace_float_literals(F::cast_from(literal))] |
35 | 118 | pub(crate) fn initial_transport<F, G, D, Observable, const N : usize>( |
119 | γ1 : &mut RNDM<F, N>, | |
120 | μ : &mut RNDM<F, N>, | |
121 | opAapply : impl Fn(&RNDM<F, N>) -> Observable, | |
122 | ε : F, | |
123 | τ : F, | |
124 | θ_or_adaptive : &mut TransportStepLength<F, G>, | |
125 | opAnorm : F, | |
126 | v : D, | |
127 | tconfig : &TransportConfig<F> | |
128 | ) -> (Vec<F>, RNDM<F, N>) | |
129 | where | |
130 | F : Float + ToNalgebraRealField, | |
131 | G : Fn(F, F) -> F, | |
132 | Observable : Euclidean<F, Output=Observable>, | |
133 | for<'a> &'a Observable : Instance<Observable>, | |
134 | //for<'b> A::Preadjoint<'b> : LipschitzValues<FloatType=F>, | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
135 | D : DifferentiableRealMapping<F, N>, |
35 | 136 | { |
137 | ||
138 | use TransportStepLength::*; | |
139 | ||
140 | // Save current base point and shift μ to new positions. Idea is that | |
141 | // μ_base(_masses) = μ^k (vector of masses) | |
142 | // μ_base_minus_γ0 = μ^k - π_♯^0γ^{k+1} | |
143 | // γ1 = π_♯^1γ^{k+1} | |
144 | // μ = μ^{k+1} | |
145 | let μ_base_masses : Vec<F> = μ.iter_masses().collect(); | |
146 | let mut μ_base_minus_γ0 = μ.clone(); // Weights will be set in the loop below. | |
147 | // Construct μ^{k+1} and π_♯^1γ^{k+1} initial candidates | |
148 | //let mut sum_norm_dv = 0.0; | |
149 | let γ_prev_len = γ1.len(); | |
150 | assert!(μ.len() >= γ_prev_len); | |
151 | γ1.extend(μ[γ_prev_len..].iter().cloned()); | |
152 | ||
153 | // Calculate initial transport and step length. | |
154 | // First calculate initial transported weights | |
155 | for (δ, ρ) in izip!(μ.iter_spikes(), γ1.iter_spikes_mut()) { | |
156 | // If old transport has opposing sign, the new transport will be none. | |
157 | ρ.α = if (ρ.α > 0.0 && δ.α < 0.0) || (ρ.α < 0.0 && δ.α > 0.0) { | |
158 | 0.0 | |
159 | } else { | |
160 | δ.α | |
161 | }; | |
162 | }; | |
163 | ||
164 | // A priori transport adaptation based on bounding 2 ‖A‖ ‖A(γ₁-γ₀)‖‖γ‖ by scaling γ. | |
165 | // 1. Calculate transport rays. | |
166 | // If the Lipschitz factor of the values v=∇F(μ) are not known, estimate it. | |
167 | match *θ_or_adaptive { | |
168 | Fixed(θ) => { | |
169 | let θτ = τ * θ; | |
170 | for (δ, ρ) in izip!(μ.iter_spikes(), γ1.iter_spikes_mut()) { | |
171 | ρ.x = δ.x - v.differential(&δ.x) * (ρ.α.signum() * θτ); | |
172 | } | |
173 | }, | |
174 | AdaptiveMax{ l : ℓ_v, ref mut max_transport, g : ref calculate_θ } => { | |
175 | *max_transport = max_transport.max(γ1.norm(Radon)); | |
176 | let θτ = τ * calculate_θ(ℓ_v, *max_transport); | |
177 | for (δ, ρ) in izip!(μ.iter_spikes(), γ1.iter_spikes_mut()) { | |
178 | ρ.x = δ.x - v.differential(&δ.x) * (ρ.α.signum() * θτ); | |
179 | } | |
180 | }, | |
181 | FullyAdaptive{ l : ref mut adaptive_ℓ_v, ref mut max_transport, g : ref calculate_θ } => { | |
182 | *max_transport = max_transport.max(γ1.norm(Radon)); | |
183 | let mut θ = calculate_θ(*adaptive_ℓ_v, *max_transport); | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
184 | // Do two runs through the spikes to update θ, breaking if first run did not cause |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
185 | // a change. |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
186 | for _i in 0..=1 { |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
187 | let mut changes = false; |
35 | 188 | for (δ, ρ) in izip!(μ.iter_spikes(), γ1.iter_spikes_mut()) { |
189 | let dv_x = v.differential(&δ.x); | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
190 | let g = &dv_x * (ρ.α.signum() * θ * τ); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
191 | ρ.x = δ.x - g; |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
192 | let n = g.norm2(); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
193 | if n >= F::EPSILON { |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
194 | // Estimate Lipschitz factor of ∇v |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
195 | let this_ℓ_v = (dv_x - v.differential(&ρ.x)).norm2() / n; |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
196 | *adaptive_ℓ_v = adaptive_ℓ_v.max(this_ℓ_v); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
197 | θ = calculate_θ(*adaptive_ℓ_v, *max_transport); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
198 | changes = true |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
199 | } |
35 | 200 | } |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
201 | if !changes { |
35 | 202 | break |
203 | } | |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
204 | } |
32 | 205 | } |
35 | 206 | } |
207 | ||
208 | // 2. Adjust transport mass, if needed. | |
209 | // This tries to remove the smallest transport masses first. | |
210 | if true { | |
211 | // Alternative 1 : subtract same amount from all transport rays until reaching zero | |
212 | loop { | |
213 | let nr =γ1.norm(Radon); | |
214 | let n = τ * 2.0 * opAnorm * (opAapply(&*γ1)-opAapply(&*μ)).norm2(); | |
215 | if n <= 0.0 || nr <= 0.0 { | |
216 | break | |
217 | } | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
218 | let reduction_needed = nr - (ε * tconfig.tolerance_mult_pri / n); |
35 | 219 | if reduction_needed <= 0.0 { |
220 | break | |
221 | } | |
222 | let (min_nonzero, n_nonzero) = γ1.iter_masses() | |
223 | .map(|α| α.abs()) | |
224 | .filter(|α| *α > F::EPSILON) | |
225 | .fold((F::INFINITY, 0), |(a, n), b| (a.min(b), n+1)); | |
226 | assert!(n_nonzero > 0); | |
227 | // Reduction that can be done in all nonzero spikes simultaneously | |
228 | let h = (reduction_needed / F::cast_from(n_nonzero)).min(min_nonzero); | |
229 | for (δ, ρ) in izip!(μ.iter_spikes_mut(), γ1.iter_spikes_mut()) { | |
230 | ρ.α = ρ.α.signum() * (ρ.α.abs() - h).max(0.0); | |
231 | δ.α = ρ.α; | |
232 | } | |
233 | if min_nonzero * F::cast_from(n_nonzero) >= reduction_needed { | |
234 | break | |
235 | } | |
236 | } | |
237 | } else { | |
238 | // Alternative 2: first reduce transport rays with greater effect based on differential. | |
239 | // This is a an inefficient quick-and-dirty implementation. | |
240 | loop { | |
241 | let nr = γ1.norm(Radon); | |
242 | let a = opAapply(&*γ1)-opAapply(&*μ); | |
243 | let na = a.norm2(); | |
244 | let n = τ * 2.0 * opAnorm * na; | |
245 | if n <= 0.0 || nr <= 0.0 { | |
246 | break | |
247 | } | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
248 | let reduction_needed = nr - (ε * tconfig.tolerance_mult_pri / n); |
35 | 249 | if reduction_needed <= 0.0 { |
250 | break | |
251 | } | |
252 | let mut max_d = 0.0; | |
253 | let mut max_d_ind = 0; | |
254 | for (δ, ρ, i) in izip!(μ.iter_spikes_mut(), γ1.iter_spikes(), 0..) { | |
255 | // Calculate differential of ‖A(γ₁-γ₀)‖‖γ‖ wrt. each spike | |
256 | let s = δ.α.signum(); | |
257 | // TODO: this is very inefficient implementation due to the limitations | |
258 | // of the closure parameters. | |
259 | let δ1 = DiscreteMeasure::from([(ρ.x, s)]); | |
260 | let δ2 = DiscreteMeasure::from([(δ.x, s)]); | |
261 | let a_part = opAapply(&δ1)-opAapply(&δ2); | |
262 | let d = a.dot(&a_part)/na * nr + 2.0 * na; | |
263 | if d > max_d { | |
264 | max_d = d; | |
265 | max_d_ind = i; | |
266 | } | |
267 | } | |
268 | // Just set mass to zero for transport ray with greater differential | |
269 | assert!(max_d > 0.0); | |
270 | γ1[max_d_ind].α = 0.0; | |
271 | μ[max_d_ind].α = 0.0; | |
272 | } | |
273 | } | |
274 | ||
275 | // Set initial guess for μ=μ^{k+1}. | |
276 | for (δ, ρ, &β) in izip!(μ.iter_spikes_mut(), γ1.iter_spikes(), μ_base_masses.iter()) { | |
277 | if ρ.α.abs() > F::EPSILON { | |
278 | δ.x = ρ.x; | |
279 | //δ.α = ρ.α; // already set above | |
280 | } else { | |
281 | δ.α = β; | |
282 | } | |
283 | } | |
284 | // Calculate μ^k-π_♯^0γ^{k+1} and v̆ = A_*(A[μ_transported + μ_transported_base]-b) | |
285 | μ_base_minus_γ0.set_masses(μ_base_masses.iter().zip(γ1.iter_masses()) | |
286 | .map(|(&a,b)| a - b)); | |
287 | (μ_base_masses, μ_base_minus_γ0) | |
288 | } | |
289 | ||
290 | /// A posteriori transport adaptation. | |
291 | #[replace_float_literals(F::cast_from(literal))] | |
292 | pub(crate) fn aposteriori_transport<F, const N : usize>( | |
293 | γ1 : &mut RNDM<F, N>, | |
294 | μ : &mut RNDM<F, N>, | |
295 | μ_base_minus_γ0 : &mut RNDM<F, N>, | |
296 | μ_base_masses : &Vec<F>, | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
297 | extra : Option<F>, |
35 | 298 | ε : F, |
299 | tconfig : &TransportConfig<F> | |
300 | ) -> bool | |
301 | where F : Float + ToNalgebraRealField { | |
302 | ||
303 | // 1. If π_♯^1γ^{k+1} = γ1 has non-zero mass at some point y, but μ = μ^{k+1} does not, | |
304 | // then the ansatz ∇w̃_x(y) = w^{k+1}(y) may not be satisfied. So set the mass of γ1 | |
305 | // at that point to zero, and retry. | |
306 | let mut all_ok = true; | |
307 | for (α_μ, α_γ1) in izip!(μ.iter_masses(), γ1.iter_masses_mut()) { | |
308 | if α_μ == 0.0 && *α_γ1 != 0.0 { | |
309 | all_ok = false; | |
310 | *α_γ1 = 0.0; | |
311 | } | |
312 | } | |
313 | ||
314 | // 2. Through bounding ∫ B_ω(y, z) dλ(x, y, z). | |
315 | // through the estimate ≤ C ‖Δ‖‖γ^{k+1}‖ for Δ := μ^{k+1}-μ^k-(π_♯^1-π_♯^0)γ^{k+1}, | |
316 | // which holds for some some C if the convolution kernel in 𝒟 has Lipschitz gradient. | |
317 | let nγ = γ1.norm(Radon); | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
318 | let nΔ = μ_base_minus_γ0.norm(Radon) + μ.dist_matching(&γ1) + extra.unwrap_or(0.0); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
319 | let t = ε * tconfig.tolerance_mult_pos; |
35 | 320 | if nγ*nΔ > t { |
321 | // Since t/(nγ*nΔ)<1, and the constant tconfig.adaptation < 1, | |
322 | // this will guarantee that eventually ‖γ‖ decreases sufficiently that we | |
323 | // will not enter here. | |
324 | *γ1 *= tconfig.adaptation * t / ( nγ * nΔ ); | |
325 | all_ok = false | |
326 | } | |
327 | ||
328 | if !all_ok { | |
329 | // Update weights for μ_base_minus_γ0 = μ^k - π_♯^0γ^{k+1} | |
330 | μ_base_minus_γ0.set_masses(μ_base_masses.iter().zip(γ1.iter_masses()) | |
331 | .map(|(&a,b)| a - b)); | |
332 | ||
333 | } | |
334 | ||
335 | all_ok | |
32 | 336 | } |
337 | ||
338 | /// Iteratively solve the pointsource localisation problem using sliding forward-backward | |
339 | /// splitting | |
340 | /// | |
35 | 341 | /// The parametrisation is as for [`pointsource_fb_reg`]. |
32 | 342 | /// Inertia is currently not supported. |
343 | #[replace_float_literals(F::cast_from(literal))] | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
344 | pub fn pointsource_sliding_fb_reg<F, I, A, Reg, P, const N : usize>( |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
345 | opA : &A, |
32 | 346 | b : &A::Observable, |
347 | reg : Reg, | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
348 | prox_penalty : &P, |
35 | 349 | config : &SlidingFBConfig<F>, |
32 | 350 | iterator : I, |
351 | mut plotter : SeqPlotter<F, N>, | |
35 | 352 | ) -> RNDM<F, N> |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
353 | where |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
354 | F : Float + ToNalgebraRealField, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
355 | I : AlgIteratorFactory<IterInfo<F, N>>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
356 | A : ForwardModel<RNDM<F, N>, F> |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
357 | + AdjointProductBoundedBy<RNDM<F, N>, P, FloatType=F>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
358 | //+ TransportLipschitz<L2Squared, FloatType=F>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
359 | for<'b> &'b A::Observable : std::ops::Neg<Output=A::Observable> + Instance<A::Observable>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
360 | for<'b> A::Preadjoint<'b> : LipschitzValues<FloatType=F>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
361 | A::PreadjointCodomain : DifferentiableRealMapping<F, N>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
362 | RNDM<F, N> : SpikeMerging<F>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
363 | Reg : SlidingRegTerm<F, N>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
364 | P : ProxPenalty<F, A::PreadjointCodomain, Reg, N>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
365 | PlotLookup : Plotting<N>, |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
366 | { |
32 | 367 | |
35 | 368 | // Check parameters |
369 | assert!(config.τ0 > 0.0, "Invalid step length parameter"); | |
370 | config.transport.check(); | |
32 | 371 | |
372 | // Initialise iterates | |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
373 | let mut μ = DiscreteMeasure::new(); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
374 | let mut γ1 = DiscreteMeasure::new(); |
35 | 375 | let mut residual = -b; // Has to equal $Aμ-b$. |
376 | ||
377 | // Set up parameters | |
378 | let opAnorm = opA.opnorm_bound(Radon, L2); | |
379 | //let max_transport = config.max_transport.scale | |
380 | // * reg.radon_norm_bound(b.norm2_squared() / 2.0); | |
381 | //let ℓ = opA.transport.lipschitz_factor(L2Squared) * max_transport; | |
382 | let ℓ = 0.0; | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
383 | let τ = config.τ0 / opA.adjoint_product_bound(prox_penalty).unwrap(); |
35 | 384 | let calculate_θ = |ℓ_v, _| config.transport.θ0 / (τ*(ℓ + ℓ_v)); |
385 | let mut θ_or_adaptive = match opA.preadjoint().value_diff_unit_lipschitz_factor() { | |
386 | // We only estimate w (the uniform Lipschitz for of v), if we also estimate ℓ_v | |
387 | // (the uniform Lipschitz factor of ∇v). | |
388 | // We assume that the residual is decreasing. | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
389 | Some(ℓ_v0) => TransportStepLength::Fixed(calculate_θ(ℓ_v0 * b.norm2(), 0.0)), |
35 | 390 | None => TransportStepLength::FullyAdaptive { |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
391 | l : 10.0 * F::EPSILON, // Start with something very small to estimate differentials |
35 | 392 | max_transport : 0.0, |
393 | g : calculate_θ | |
394 | }, | |
395 | }; | |
396 | // We multiply tolerance by τ for FB since our subproblems depending on tolerances are scaled | |
397 | // by τ compared to the conditional gradient approach. | |
398 | let tolerance = config.insertion.tolerance * τ * reg.tolerance_scaling(); | |
399 | let mut ε = tolerance.initial(); | |
400 | ||
401 | // Statistics | |
402 | let full_stats = |residual : &A::Observable, | |
403 | μ : &RNDM<F, N>, | |
404 | ε, stats| IterInfo { | |
405 | value : residual.norm2_squared_div2() + reg.apply(μ), | |
406 | n_spikes : μ.len(), | |
407 | ε, | |
408 | // postprocessing: config.insertion.postprocessing.then(|| μ.clone()), | |
409 | .. stats | |
410 | }; | |
32 | 411 | let mut stats = IterInfo::new(); |
412 | ||
413 | // Run the algorithm | |
35 | 414 | for state in iterator.iter_init(|| full_stats(&residual, &μ, ε, stats.clone())) { |
415 | // Calculate initial transport | |
416 | let v = opA.preadjoint().apply(residual); | |
417 | let (μ_base_masses, mut μ_base_minus_γ0) = initial_transport( | |
418 | &mut γ1, &mut μ, |ν| opA.apply(ν), | |
419 | ε, τ, &mut θ_or_adaptive, opAnorm, | |
420 | v, &config.transport, | |
421 | ); | |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
422 | |
32 | 423 | // Solve finite-dimensional subproblem several times until the dual variable for the |
424 | // regularisation term conforms to the assumptions made for the transport above. | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
425 | let (maybe_d, _within_tolerances, mut τv̆) = 'adapt_transport: loop { |
35 | 426 | // Calculate τv̆ = τA_*(A[μ_transported + μ_transported_base]-b) |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
427 | let residual_μ̆ = calculate_residual2(&γ1, &μ_base_minus_γ0, opA, b); |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
428 | let mut τv̆ = opA.preadjoint().apply(residual_μ̆ * τ); |
32 | 429 | |
430 | // Construct μ^{k+1} by solving finite-dimensional subproblems and insert new spikes. | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
431 | let (maybe_d, within_tolerances) = prox_penalty.insert_and_reweigh( |
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
432 | &mut μ, &mut τv̆, &γ1, Some(&μ_base_minus_γ0), |
35 | 433 | τ, ε, &config.insertion, |
434 | ®, &state, &mut stats, | |
32 | 435 | ); |
436 | ||
35 | 437 | // A posteriori transport adaptation. |
438 | if aposteriori_transport( | |
439 | &mut γ1, &mut μ, &mut μ_base_minus_γ0, &μ_base_masses, | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
440 | None, |
35 | 441 | ε, &config.transport |
442 | ) { | |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
443 | break 'adapt_transport (maybe_d, within_tolerances, τv̆) |
32 | 444 | } |
445 | }; | |
446 | ||
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
447 | stats.untransported_fraction = Some({ |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
448 | assert_eq!(μ_base_masses.len(), γ1.len()); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
449 | let (a, b) = stats.untransported_fraction.unwrap_or((0.0, 0.0)); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
450 | let source = μ_base_masses.iter().map(|v| v.abs()).sum(); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
451 | (a + μ_base_minus_γ0.norm(Radon), b + source) |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
452 | }); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
453 | stats.transport_error = Some({ |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
454 | assert_eq!(μ_base_masses.len(), γ1.len()); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
455 | let (a, b) = stats.transport_error.unwrap_or((0.0, 0.0)); |
35 | 456 | (a + μ.dist_matching(&γ1), b + γ1.norm(Radon)) |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
457 | }); |
32 | 458 | |
39
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
459 | // Merge spikes. |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
460 | // This crucially expects the merge routine to be stable with respect to spike locations, |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
461 | // and not to performing any pruning. That is be to done below simultaneously for γ. |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
462 | let ins = &config.insertion; |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
463 | if ins.merge_now(&state) { |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
464 | stats.merged += prox_penalty.merge_spikes( |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
465 | &mut μ, &mut τv̆, &γ1, Some(&μ_base_minus_γ0), τ, ε, ins, ®, |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
466 | Some(|μ̃ : &RNDM<F, N>| L2Squared.calculate_fit_op(μ̃, opA, b)), |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
467 | ); |
6316d68b58af
Merging adjustments, parameter tuning, etc.
Tuomo Valkonen <tuomov@iki.fi>
parents:
37
diff
changeset
|
468 | } |
35 | 469 | |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
470 | // Prune spikes with zero weight. To maintain correct ordering between μ and γ1, also the |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
471 | // latter needs to be pruned when μ is. |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
472 | // TODO: This could do with a two-vector Vec::retain to avoid copies. |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
473 | let μ_new = DiscreteMeasure::from_iter(μ.iter_spikes().filter(|δ| δ.α != F::ZERO).cloned()); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
474 | if μ_new.len() != μ.len() { |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
475 | let mut μ_iter = μ.iter_spikes(); |
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
476 | γ1.prune_by(|_| μ_iter.next().unwrap().α != F::ZERO); |
35 | 477 | stats.pruned += μ.len() - μ_new.len(); |
34
efa60bc4f743
Radon FB + sliding improvements
Tuomo Valkonen <tuomov@iki.fi>
parents:
32
diff
changeset
|
478 | μ = μ_new; |
32 | 479 | } |
480 | ||
481 | // Update residual | |
482 | residual = calculate_residual(&μ, opA, b); | |
483 | ||
35 | 484 | let iter = state.iteration(); |
32 | 485 | stats.this_iters += 1; |
486 | ||
35 | 487 | // Give statistics if requested |
32 | 488 | state.if_verbose(|| { |
37
c5d8bd1a7728
Generic proximal penalty support
Tuomo Valkonen <tuomov@iki.fi>
parents:
35
diff
changeset
|
489 | plotter.plot_spikes(iter, maybe_d.as_ref(), Some(&τv̆), &μ); |
35 | 490 | full_stats(&residual, &μ, ε, std::mem::replace(&mut stats, IterInfo::new())) |
491 | }); | |
32 | 492 | |
35 | 493 | // Update main tolerance for next iteration |
494 | ε = tolerance.update(ε, iter); | |
495 | } | |
496 | ||
497 | postprocess(μ, &config.insertion, L2Squared, opA, b) | |
32 | 498 | } |