Library QBS.showcase.bayesian_regression

From HB Require Import structures.
From mathcomp Require Import all_boot all_algebra reals ereal topology
  classical_sets normedtype numfun measure lebesgue_integral
  lebesgue_integral_fubini lebesgue_stieltjes_measure lebesgue_measure
  probability charge boolp.
From mathcomp.algebra_tactics Require Import ring.
From QBS Require Import quasi_borel probability_qbs pair_qbs_measure
  measure_as_qbs_measure normal_algebra.

Import GRing.Theory Num.Def Num.Theory measurable_realfun.

Set Implicit Arguments.
Unset Strict Implicit.
Unset Printing Implicit Defensive.
Import boolp order.Order.POrderTheory.

Local Open Scope classical_set_scope.

Integration against normal_prob via Radon-Nikodym.

Section integral_normal_prob.
Variable R : realType.
Local Notation mu := (@lebesgue_measure R).
Local Open Scope ring_scope.
Local Open Scope ereal_scope.

Lemma integral_normal_prob (m sigma : R) (hsigma : (sigma != 0)%R)
    f (f_meas : measurable_fun setT f)
    (f_int : (\int[normal_prob m sigma]_x `|f x| < +oo)%E) :
  \int[normal_prob m sigma]_x f x =
  \int[mu]_x (f x × (normal_pdf m sigma x)%:E).
Proof.
rewrite -(Radon_Nikodym_change_of_variables
            (normal_prob_dominates m sigma) measurableT); last first.
  by apply/integrableP; split.
apply: ae_eq_integral ⇒ //.
- apply: emeasurable_funM ⇒ //; apply: (measurable_int mu).
  apply: (integrableS _ _ (@subsetT _ _)) ⇒ //=.
  by apply: Radon_Nikodym_integrable; exact: normal_prob_dominates.
- apply: emeasurable_funM ⇒ //=; apply/measurableT_comp ⇒ //=.
  by apply/measurable_funTS; exact: measurable_normal_pdf.
- apply: ae_eqe_mul2l ⇒ /=.
  rewrite Radon_NikodymE//=; first exact: normal_prob_dominates.
  move⇒ ?.
  case: cid ⇒ /= h [h1 h2 h3].
  apply: integral_ae_eq ⇒ //=.
  + apply/measurable_EFinP; exact: measurable_normal_pdf.
  + by move⇒ E E01 mE; rewrite -h3.
Qed.

End integral_normal_prob.

Part II: Bayesian regression example.

Section bayesian_regression.
Variable R : realType.
Local Notation mR := (measurableTypeR R).
Local Open Scope ring_scope.
Local Open Scope ereal_scope.

Let prior_sigma : R := 3%:R. Let noise_sigma : R := 2%:R^-1.

Lemma prior_sigma_gt0 : (0 < prior_sigma)%R.
Proof. by rewrite /prior_sigma ltr0n. Qed.

Definition slope_prior : qbs_prob (realQ R) :=
@qbs_normal_distribution R (0 : R) prior_sigma prior_sigma_gt0.

Definition intercept_prior : qbs_prob (realQ R) :=
@qbs_normal_distribution R (0 : R) prior_sigma prior_sigma_gt0.

Definition d (mu x : R) : R := normal_pdf mu noise_sigma x.

Lemma d_ge0 (mu x : R) : (0 ≤ d mu x)%R.
Proof. exact: normal_pdf_ge0. Qed.

Observation likelihood: product of 5 normal densities at the data points (1,2.5),...,(5,8.0).

Definition obs (params : realQ R × realQ R) : R :=
  let s := fst params in
  let b := snd params in
  (d (s × 1 + b) (5%:R / 2%:R) ×
   d (s × 2%:R + b) (19%:R / 5%:R) ×
   d (s × 3%:R + b) (9%:R / 2%:R) ×
   d (s × 4%:R + b) (31%:R / 5%:R) ×
   d (s × 5%:R + b) 8%:R)%R.
Lemma obs_ge0 (params : realQ R × realQ R) : (0 ≤ obs params)%R.
Proof.
rewrite /obs.
do 4! (apply: mulr_ge0; last exact: d_ge0).
exact: d_ge0.
Qed.

Marginal likelihood (normalizing constant Z).

Definition evidence : \bar R :=
  qbs_pair_integral slope_prior intercept_prior
    (fun params ⇒ (obs params)%:E).

Lemma evidence_ge0 : 0 ≤ evidence.
Proof.
rewrite /evidence /qbs_pair_integral.
apply: integral_ge0 ⇒ rr _.
rewrite lee_fin; exact: obs_ge0.
Qed.

Lemma evidence_eq
  (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ (obs params)%:E))) :
  evidence =
  qbs_integral _ slope_prior (fun s ⇒
    qbs_integral _ intercept_prior (fun b ⇒
      (obs (s , b ))%:E)).
Proof. rewrite /evidence; exact: qbs_pair_integral_iterated. Qed.

Unnormalized posterior: E_postg = E_priorg × obs / Z.

Definition posterior_density (g : realQ R × realQ R → \bar R) : \bar R :=
  qbs_pair_integral slope_prior intercept_prior
    (fun params ⇒ g params × (obs params)%:E)
   / evidence.

Lemma posterior_density_total
  (hev_pos : 0 < evidence)
  (hev_fin : evidence < +oo) :
  posterior_density (fun _ ⇒ 1) = 1.
Proof.
rewrite /posterior_density.
have → : (fun params : realQ R × realQ R ⇒ 1 × (obs params)%:E) =
          (fun params ⇒ (obs params)%:E).
  by apply: funext ⇒ p; rewrite mul1e.
rewrite -/(evidence).
apply: divee.
- by rewrite gt0_fin_numE.
- by move: hev_pos; rewrite lt0e ⇒ /andP[].
Qed.

Lemma posterior_density_eq (g : realQ R × realQ R → \bar R)
  (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ g params × (obs params)%:E))) :
  posterior_density g =
  qbs_integral _ slope_prior (fun s ⇒
    qbs_integral _ intercept_prior (fun b ⇒
      g (s , b ) × (obs (s , b ))%:E))
   / evidence.
Proof.
rewrite /posterior_density; congr (_ / _).
exact: qbs_pair_integral_iterated.
Qed.

Definition likelihood_single (obs_x : R) :
  prodQ (realQ R) (realQ R) → qbs_prob (realQ R) :=
  fun params ⇒
    @mkQBSProb R (realQ R) idfun
      (normal_prob (fst params × obs_x + snd params)%R noise_sigma
        : probability mR R)
      (@measurable_id _ mR setT).

Lemma likelihood_single_morphism (obs_x : R) :
  qbs_morphism
    (likelihood_single obs_x).
Proof.
move⇒ alpha halpha; rewrite /qbs_Mx /= ⇒ r.
exact: (@measurable_id _ mR setT).
Qed.

Lemma likelihood_single_strong (obs_x : R) :
  qbs_morphism_strong (prodQ (realQ R) (realQ R)) (realQ R)
    (likelihood_single obs_x).
Proof.
move⇒ alpha halpha.
∃ idfun.
∃ (fun r ⇒ normal_prob (fst (alpha r) × obs_x + snd (alpha r))%R
                   noise_sigma : probability mR R).
split; first exact: (@measurable_id _ mR setT).
by split.
Qed.

Definition predictive_integral (obs_x : R) (h : realQ R → \bar R) : \bar R :=
  qbs_pair_integral slope_prior intercept_prior
    (fun params ⇒ qbs_integral _ (likelihood_single obs_x params) h).

Lemma predictive_marginal (obs_x : R) (h : realQ R → \bar R)
  (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ qbs_integral _ (likelihood_single obs_x params) h))) :
  predictive_integral obs_x h =
  qbs_integral _ slope_prior (fun s ⇒
    qbs_integral _ intercept_prior (fun b ⇒
      qbs_integral _ (likelihood_single obs_x (s , b )) h)).
Proof. rewrite /predictive_integral; exact: qbs_pair_integral_iterated. Qed.

Definition prior : qbs_prob (prodQ (realQ R) (realQ R)) :=
  qbs_prob_pair slope_prior intercept_prior.

Lemma prior_inner_diag (s : realQ R) :
  qbs_Mx
    (fun r ⇒ qbs_prob_alpha
      ((fun b ⇒ qbs_return (prodQ (realQ R) (realQ R)) (s , b )
                   (qbs_prob_mu intercept_prior))
       (qbs_prob_alpha intercept_prior r)) r).
Proof.
rewrite /= /qbs_Mx /=; split.
- exact: (qbs_Mx_const s).
- exact: (@measurable_id _ mR setT).
Qed.

Definition prior_inner (s : realQ R) : qbs_prob (prodQ (realQ R) (realQ R)) :=
  qbs_bind (realQ R) (prodQ (realQ R) (realQ R))
    intercept_prior
    (fun b ⇒ qbs_return (prodQ (realQ R) (realQ R)) (s , b )
                (qbs_prob_mu intercept_prior))
    (prior_inner_diag s).

Lemma prior_bind_diag :
  qbs_Mx
    (fun r ⇒ qbs_prob_alpha
      (prior_inner (qbs_prob_alpha slope_prior r)) r).
Proof.
rewrite /= /qbs_Mx /=; split.
- exact: (@measurable_id _ mR setT).
- exact: (@measurable_id _ mR setT).
Qed.

Definition prior_bind : qbs_prob (prodQ (realQ R) (realQ R)) :=
  qbs_bind (realQ R) (prodQ (realQ R) (realQ R))
    slope_prior prior_inner prior_bind_diag.

Definition norm_qbs
    (g : realQ R × realQ R → \bar R)
    (obs_fn : realQ R × realQ R → R)
    : option (realQ R × realQ R → \bar R) :=
  let ev := qbs_pair_integral slope_prior intercept_prior
              (fun p ⇒ (obs_fn p)%:E) in
  if (0 < ev ) && (ev < +oo) then
    Some (fun p ⇒ g p × (obs_fn p)%:E / ev)
  else None.

Lemma norm_qbs_some (g : realQ R × realQ R → \bar R)
  (obs_fn : realQ R × realQ R → R)
  (hev_pos : 0 < qbs_pair_integral slope_prior intercept_prior
               (fun p ⇒ (obs_fn p)%:E))
  (hev_fin : qbs_pair_integral slope_prior intercept_prior
               (fun p ⇒ (obs_fn p)%:E) < +oo) :
  norm_qbs g obs_fn =
  Some (fun p ⇒ g p × (obs_fn p)%:E /
          qbs_pair_integral slope_prior intercept_prior
            (fun p ⇒ (obs_fn p)%:E)).
Proof.
rewrite /norm_qbs.
case: ifPn ⇒ // /negP.
move/negP; rewrite negb_and ⇒ /orP[/negP|/negP]; contradiction.
Qed.

Lemma norm_qbs_none (g : realQ R × realQ R → \bar R)
  (obs_fn : realQ R × realQ R → R)
  (hev : ¬ ((0 < qbs_pair_integral slope_prior intercept_prior
                 (fun p ⇒ (obs_fn p)%:E)) ∧
             (qbs_pair_integral slope_prior intercept_prior
                 (fun p ⇒ (obs_fn p)%:E) < +oo))) :
  norm_qbs g obs_fn = None.
Proof.
rewrite /norm_qbs.
case: ifPn ⇒ // /andP[h1 h2].
by exfalso; apply: hev.
Qed.

Full Bayesian program: normalize prior by obs.

Definition program : option (realQ R × realQ R → \bar R) :=
  norm_qbs (fun _ ⇒ 1) obs.

Lemma program_succeeds
  (hev_pos : 0 < evidence)
  (hev_fin : evidence < +oo) :
  program = Some (fun p ⇒ 1 × (obs p)%:E / evidence).
Proof.
rewrite /program /norm_qbs -/(evidence).
case: ifPn ⇒ // /negP.
move/negP; rewrite negb_and ⇒ /orP[/negP|/negP]; contradiction.
Qed.

Phase 1 integration: integrate out the intercept b.

Definition scalar_of_s (s : R) : R :=

  (normal_peak (sqrtr (3%:R ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_fun 0 (sqrtr (3%:R ^+ 2 + (2%:R^-1 : R) ^+ 2)) (5%:R / 2%:R - s)) ×

  (normal_peak (sqrtr (sqrtr (9%:R / 37%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_fun ((90%:R - 36%:R × s) / 37%:R)
     (sqrtr (sqrtr (9%:R / 37%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2))
     (19%:R / 5%:R - 2%:R × s)) ×

  (normal_peak (sqrtr (sqrtr (9%:R / 73%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_fun ((1134%:R - 540%:R × s) / 365%:R)
     (sqrtr (sqrtr (9%:R / 73%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2))
     (9%:R / 2%:R - 3%:R × s)) ×

  (normal_peak (sqrtr (sqrtr (9%:R / 109%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_fun ((1944%:R - 1080%:R × s) / 545%:R)
     (sqrtr (sqrtr (9%:R / 109%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2))
     (31%:R / 5%:R - 4%:R × s)) ×

  (normal_peak (sqrtr (sqrtr (9%:R / 145%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_fun ((612%:R - 360%:R × s) / 145%:R)
     (sqrtr (sqrtr (9%:R / 145%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2))
     (8%:R - 5%:R × s)).

Lemma scalar_of_s_ge0 (s : R) : (0 ≤ scalar_of_s s)%R.
Proof.
rewrite /scalar_of_s.
apply: mulr_ge0; last first.
  by apply: mulr_ge0; [exact: normal_peak_ge0|
     exact: normal_fun_ge0].
apply: mulr_ge0; last first.
  by apply: mulr_ge0; [exact: normal_peak_ge0|
     exact: normal_fun_ge0].
apply: mulr_ge0; last first.
  by apply: mulr_ge0; [exact: normal_peak_ge0|
     exact: normal_fun_ge0].
apply: mulr_ge0; last first.
  by apply: mulr_ge0; [exact: normal_peak_ge0|
     exact: normal_fun_ge0].
by apply: mulr_ge0; [exact: normal_peak_ge0 | exact: normal_fun_ge0].
Qed.

Let phase1_mu5 (s : R) : R := (900%:R - 540%:R × s) / 181%:R.
Let phase1_sigma5 : R := sqrtr (9%:R / 181%:R).

Lemma phase1_integration (s : R)
  (obs_meas : measurable_fun [set: mR]
    (fun b : mR ⇒ (obs (s , b ))%:E :> \bar R))
  (obs_int : (\int[normal_prob 0 prior_sigma]_b
    `|(obs (s , b ))%:E| < +oo)%E)
  :
  \int[normal_prob (0 : R) prior_sigma]_b (obs (s , b ))%:E =
  (scalar_of_s s)%:E.
Proof.
have h3 : (prior_sigma != 0)%R by rewrite /prior_sigma pnatr_eq0.
rewrite (integral_normal_prob h3) //.
under eq_integral do rewrite -EFinM.
have step1 : ∀ x : R, (obs (s, x ) × normal_pdf 0 prior_sigma x =
  scalar_of_s s × normal_pdf (phase1_mu5 s) phase1_sigma5 x)%R.
  move⇒ x; rewrite mulrC /obs /d /prior_sigma /noise_sigma.
  rewrite (obs_rewrite s x) !mulrA.
  exact: (phase1_combine5 s x).
under eq_integral do rewrite step1.
under eq_integral do rewrite EFinM.
rewrite ge0_integralZl_EFin //.
- rewrite integral_normal_pdf mule1 //.
- move⇒ x _; rewrite lee_fin; exact: normal_pdf_ge0.
- apply/measurableT_comp ⇒ //; exact: measurable_normal_pdf.
- exact: scalar_of_s_ge0.
Qed.

Phase 2 integration: integrate out the slope s.

Lemma scalar_of_s_eq (s : R) :
  scalar_of_s s =
  (gaussian_prod_scalar 0 (5%:R / 2%:R - s) 3%:R (2%:R^-1) ×
  gaussian_prod_scalar ((90%:R - 36%:R × s) / 37%:R)
                       (19%:R / 5%:R - 2%:R × s)
                       (sqrtr (9%:R / 37%:R)) (2%:R^-1) ×
  gaussian_prod_scalar ((1134%:R - 540%:R × s) / 365%:R)
                       (9%:R / 2%:R - 3%:R × s)
                       (sqrtr (9%:R / 73%:R)) (2%:R^-1) ×
  gaussian_prod_scalar ((1944%:R - 1080%:R × s) / 545%:R)
                       (31%:R / 5%:R - 4%:R × s)
                       (sqrtr (9%:R / 109%:R)) (2%:R^-1) ×
  gaussian_prod_scalar ((612%:R - 360%:R × s) / 145%:R)
                       (8%:R - 5%:R × s)
                       (sqrtr (9%:R / 145%:R)) (2%:R^-1))%R.
Proof. by rewrite /scalar_of_s /gaussian_prod_scalar. Qed.

Lemma scalar_of_s_mul_pdf (s : R) :
  (scalar_of_s s × normal_pdf 0 prior_sigma s =
   phase2_const R × normal_pdf (phase2_final_mu R) (phase2_final_sigma R) s)%R.
Proof.
rewrite (scalar_of_s_eq s).
pose proof (phase2_combine5 s) as h.
rewrite /prior_sigma -h; ring.
Qed.

Lemma phase2_integration
  (sos_meas : measurable_fun [set: mR]
    (fun s : mR ⇒ (scalar_of_s s)%:E :> \bar R))
  (sos_int : (\int[normal_prob 0 prior_sigma]_s
    `|(scalar_of_s s)%:E| < +oo)%E) :
  \int[normal_prob (0 : R) prior_sigma]_s (scalar_of_s s)%:E =
  (phase2_const R)%:E.
Proof.
have h3 : (prior_sigma != 0)%R by rewrite /prior_sigma pnatr_eq0.
rewrite (integral_normal_prob h3) //.
under eq_integral do rewrite -EFinM.
under eq_integral do rewrite scalar_of_s_mul_pdf.
under eq_integral do rewrite EFinM.
rewrite ge0_integralZl_EFin //.
- rewrite integral_normal_pdf ?mule1 //; exact: phase2_final_sigma_neq0.
- move⇒ x _; rewrite lee_fin; exact: normal_pdf_ge0.
- apply/measurableT_comp ⇒ //; exact: measurable_normal_pdf.
- have := phase2_const_gt0 R; rewrite lt0r ⇒ /andP[_]; done.
Qed.

Evidence value and unconditional program result.

Evidence equals phase2_const (explicit closed form).

Theorem evidence_value
  (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ (obs params)%:E)))
  (obs_meas : ∀ s, measurable_fun [set: mR]
    (fun b : mR ⇒ (obs (s , b ))%:E :> \bar R))
  (obs_int : ∀ s, (\int[normal_prob 0 prior_sigma]_b
    `|(obs (s , b ))%:E| < +oo)%E)
  (sos_meas : measurable_fun [set: mR]
    (fun s : mR ⇒ (scalar_of_s s)%:E :> \bar R))
  (sos_int : (\int[normal_prob 0 prior_sigma]_s
    `|(scalar_of_s s)%:E| < +oo)%E) :
  evidence = (phase2_const R)%:E.
Proof.
rewrite (evidence_eq hint) /qbs_integral /=.
have inner_eq : ∀ x : R,
  \int[normal_prob 0 prior_sigma]_b (obs (x , b ))%:E = (scalar_of_s x)%:E.
  move⇒ x; apply: phase1_integration;
    [exact: (obs_meas x)|exact: (obs_int x)].
under eq_integral do rewrite inner_eq.
exact: phase2_integration.
Qed.

Lemma evidence_pos
  (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ (obs params)%:E)))
  (obs_meas : ∀ s, measurable_fun [set: mR]
    (fun b : mR ⇒ (obs (s , b ))%:E :> \bar R))
  (obs_int : ∀ s, (\int[normal_prob 0 prior_sigma]_b
    `|(obs (s , b ))%:E| < +oo)%E)
  (sos_meas : measurable_fun [set: mR]
    (fun s : mR ⇒ (scalar_of_s s)%:E :> \bar R))
  (sos_int : (\int[normal_prob 0 prior_sigma]_s
    `|(scalar_of_s s)%:E| < +oo)%E) :
  0 < evidence ∧ evidence < +oo.
Proof.
rewrite (evidence_value hint obs_meas obs_int sos_meas sos_int).
split.
- by rewrite lte_fin; exact: phase2_const_gt0.
- by rewrite ltey.
Qed.

Discharging the measure-theoretic hypotheses.

Lemma noise_sigma_neq0 : (noise_sigma != 0)%R.
Proof. by rewrite /noise_sigma invr_neq0. Qed.

Lemma d_le_peak (mu x : R) : (d mu x ≤ normal_peak noise_sigma)%R.
Proof. rewrite /d; apply: normal_pdf_ub; exact: noise_sigma_neq0. Qed.

Lemma obs_ub (s b : R) : (obs (s , b ) ≤ normal_peak noise_sigma ^+5)%R.
Proof.
have hle : ∀ mu x : R, (d mu x ≤ normal_peak noise_sigma)%R := d_le_peak.
have hge : ∀ mu x : R, (0 ≤ d mu x)%R := d_ge0.
rewrite /obs /= exprSr exprSr exprSr exprSr expr1.
apply: ler_pM; [| | |exact: hle];
  first by repeat (apply: mulr_ge0); exact: hge.
  by exact: hge.
apply: ler_pM; [| | |exact: hle];
  first by repeat (apply: mulr_ge0); exact: hge.
  by exact: hge.
apply: ler_pM; [| | |exact: hle];
  first by repeat (apply: mulr_ge0); exact: hge.
  by exact: hge.
apply: ler_pM; [exact: hge|exact: hge|exact: hle|exact: hle].
Qed.

Lemma obs_meas_proof : ∀ s, measurable_fun [set: mR]
  (fun b : mR ⇒ (obs (s , b ))%:E :> \bar R).
Proof.
move⇒ s; apply/measurable_EFinP; rewrite /obs /d /=.
suff → : (fun b : mR ⇒
  (normal_pdf ((s × 1)%R + b)%R noise_sigma (5%:R / 2%:R) ×
  normal_pdf ((s × 2%:R)%R + b)%R noise_sigma (19%:R / 5%:R) ×
  normal_pdf ((s × 3%:R)%R + b)%R noise_sigma (9%:R / 2%:R) ×
  normal_pdf ((s × 4%:R)%R + b)%R noise_sigma (31%:R / 5%:R) ×
  normal_pdf ((s × 5%:R)%R + b)%R noise_sigma 8%:R)%R) =
  (fun b : mR ⇒ (normal_pdf (5%:R / 2%:R - 1 × s) noise_sigma b ×
  normal_pdf (19%:R / 5%:R - 2%:R × s) noise_sigma b ×
  normal_pdf (9%:R / 2%:R - 3%:R × s) noise_sigma b ×
  normal_pdf (31%:R / 5%:R - 4%:R × s) noise_sigma b ×
  normal_pdf (8%:R - 5%:R × s) noise_sigma b)%R).
  apply: measurable_funM; last exact: (measurable_normal_pdf _ _).
  apply: measurable_funM; last exact: (measurable_normal_pdf _ _).
  apply: measurable_funM; last exact: (measurable_normal_pdf _ _).
  apply: measurable_funM; last exact: (measurable_normal_pdf _ _).
  exact: (measurable_normal_pdf _ _).
apply: funext ⇒ b.
by rewrite !(normal_pdf_recenter _ s _ b noise_sigma_neq0).
Qed.

Lemma obs_int_proof : ∀ s,
  (\int[normal_prob 0 prior_sigma]_b `|(obs (s , b ))%:E| < +oo)%E.
Proof.
move⇒ s; have /integrableP[_ //] : (normal_prob 0 prior_sigma).-integrable setT
  (EFin \o (fun b ⇒ obs (s, b))).
have hbd : [bounded (fun b : mR ⇒ obs (s, b )) b | b in [set: mR]].
  rewrite /bounded_near.
  ∃ (normal_peak noise_sigma ^+ 5)%R; split; first by rewrite num_real.
  move⇒ M hM b _ /=.
  rewrite ger0_norm; last exact: (obs_ge0 (s, b)).
  exact: (le_trans
            (obs_ub s b)
            (ltW hM)).
apply: measurable_bounded_integrable.
- exact: measurableT.
- suff: ((normal_prob 0 prior_sigma : probability _ _) setT < +oo)%E by [].
  by rewrite probability_setT; exact: ltey.
- by move: (obs_meas_proof s) ⇒ /measurable_EFinP.
- exact: hbd.
Qed.

Let d_pair_meas_tac : ∀ k yk : R,
  measurable_fun [set: mR × mR]
    (fun rr : mR × mR ⇒ normal_peak noise_sigma ×
      normal_fun ((rr .1 × k)%R + rr .2)%R noise_sigma yk)%R.
Proof.
move⇒ k yk.
apply: measurable_funM; [exact: measurable_cst|].
rewrite /normal_fun.
apply: measurableT_comp; first exact: measurable_expR.
apply: measurable_funM; [|exact: measurable_cst].
apply: measurable_funN.
apply: (measurableT_comp (exprn_measurable 2)).
apply: measurable_funB; [exact: measurable_cst|].
apply: measurable_funD; [|exact: measurable_snd].
apply: measurable_funM; [|exact: measurable_cst]; exact: measurable_fst.
Qed.

Lemma obs_product_integrable :
  (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
    setT (qbs_pair_fun slope_prior intercept_prior
      (fun params ⇒ (obs params)%:E)).
Proof.
have hfin :
  (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior)
    [set: _] < +oo.
  rewrite (_ : [set: _] = setT `*` setT); last by rewrite setXTT.
  by rewrite product_measure1E //= probability_setT mule1; exact: ltey.
rewrite /qbs_pair_fun /=.
apply: (@measurable_bounded_integrable _ _ _ _ _ setT).
- exact: measurableT.
- exact: hfin.
- rewrite /obs /d /=.
  have hns := noise_sigma_neq0.
  have → : (fun rr : mR × mR ⇒
    (normal_pdf ((rr .1 × 1)%R + rr .2)%R noise_sigma (5%:R / 2%:R) ×
     normal_pdf ((rr .1 × 2%:R)%R + rr .2)%R noise_sigma (19%:R / 5%:R) ×
     normal_pdf ((rr .1 × 3%:R)%R + rr .2)%R noise_sigma (9%:R / 2%:R) ×
     normal_pdf ((rr .1 × 4%:R)%R + rr .2)%R noise_sigma (31%:R / 5%:R) ×
     normal_pdf ((rr .1 × 5%:R)%R + rr .2)%R noise_sigma 8%:R)%R) =
    (fun rr : mR × mR ⇒
    (normal_peak noise_sigma ×
       normal_fun ((rr .1 × 1)%R + rr .2)%R
         noise_sigma (5%:R / 2%:R) ×
    (normal_peak noise_sigma ×
       normal_fun ((rr .1 × 2%:R)%R + rr .2)%R
         noise_sigma (19%:R / 5%:R)) ×
    (normal_peak noise_sigma ×
       normal_fun ((rr .1 × 3%:R)%R + rr .2)%R
         noise_sigma (9%:R / 2%:R)) ×
    (normal_peak noise_sigma ×
       normal_fun ((rr .1 × 4%:R)%R + rr .2)%R
         noise_sigma (31%:R / 5%:R)) ×
    (normal_peak noise_sigma ×
       normal_fun ((rr .1 × 5%:R)%R + rr .2)%R
         noise_sigma 8%:R))%R).
    by apply: funext ⇒ -[s b] /=; rewrite !(normal_pdfE _ hns).
  apply: measurable_funM; last exact: (d_pair_meas_tac 5%:R 8%:R).
  apply: measurable_funM; last exact: (d_pair_meas_tac 4%:R (31%:R / 5%:R)).
  apply: measurable_funM; last exact: (d_pair_meas_tac 3%:R (9%:R / 2%:R)).
  apply: measurable_funM; last exact: (d_pair_meas_tac 2%:R (19%:R / 5%:R)).
  exact: (d_pair_meas_tac 1 (5%:R / 2%:R)).
- rewrite /bounded_near.
  ∃ (normal_peak noise_sigma ^+ 5)%R; split; first by rewrite num_real.
  move⇒ M hM -[s' b'] _ /=.
  rewrite ger0_norm ?obs_ge0 //.
  exact: (le_trans
            (obs_ub s' b')
            (ltW hM)).
Qed.

Lemma sos_meas_proof : measurable_fun [set: mR]
  (fun s : mR ⇒ (scalar_of_s s)%:E :> \bar R).
Proof.
apply/measurable_EFinP.
rewrite /scalar_of_s.
apply: measurable_funM.
apply: measurable_funM.
apply: measurable_funM.
apply: measurable_funM.
- apply: measurable_funM; first exact: measurable_cst.
  rewrite /normal_fun.
  apply: measurableT_comp; first exact: measurable_expR.
  apply: measurable_funM; [|exact: measurable_cst].
  apply: measurable_funN.
  apply: (measurableT_comp (exprn_measurable 2)).
  apply: measurable_funD;
    [apply: measurable_funB; [exact: measurable_cst|exact: measurable_id]|
     exact: measurable_cst].
- apply: measurable_funM; [exact: measurable_cst|].
  rewrite /normal_fun.
  apply: measurableT_comp; first exact: measurable_expR.
  apply: measurable_funM; last exact: measurable_cst.
  apply: measurable_funN.
  apply: (measurableT_comp (exprn_measurable 2)).
  apply: measurable_funB.
  + apply: measurable_funB; [exact: measurable_cst|].
    apply: measurable_funM; [exact: measurable_cst|exact: measurable_id].
  + apply: measurable_funM; last exact: measurable_cst.
    apply: measurable_funB; [exact: measurable_cst|].
    apply: measurable_funM; [exact: measurable_cst|exact: measurable_id].
all: apply: measurable_funM; [exact: measurable_cst|].
all: rewrite /normal_fun.
all: apply: measurableT_comp; first exact: measurable_expR.
all: apply: measurable_funM; last exact: measurable_cst.
all: apply: measurable_funN.
all: apply: (measurableT_comp (exprn_measurable 2)).
all: apply: measurable_funB.
all: try (apply: measurable_funB; [exact: measurable_cst|];
          apply: measurable_funM; [exact: measurable_cst|exact: measurable_id]).
all: try (apply: measurable_funM; last exact: measurable_cst;
          apply: measurable_funB; [exact: measurable_cst|];
          apply: measurable_funM; [exact: measurable_cst|exact: measurable_id]).
Qed.

Lemma sos_int_proof :
  (\int[normal_prob 0 prior_sigma]_s `|(scalar_of_s s)%:E| < +oo)%E.
Proof.
have nf_le1 : ∀ m sigma x : R, (normal_fun m sigma x ≤ 1)%R.
  move⇒ m sigma x; rewrite /normal_fun exp.expR_le1.
  apply: mulr_le0_ge0; first by rewrite oppr_le0; exact: sqr_ge0.
  by rewrite invr_ge0 mulr2n addr_ge0 // sqr_ge0.
set M := (normal_peak (sqrtr (3%:R ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_peak (sqrtr (sqrtr (9%:R / 37%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_peak (sqrtr (sqrtr (9%:R / 73%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_peak (sqrtr (sqrtr (9%:R / 109%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)) ×
   normal_peak (sqrtr (sqrtr (9%:R / 145%:R) ^+ 2 + (2%:R^-1 : R) ^+ 2)))%R.
suff sos_ub : ∀ s : R, (scalar_of_s s ≤ M)%R.
  have /integrableP[_ //] : (normal_prob 0 prior_sigma).-integrable setT
    (EFin \o scalar_of_s).
  apply: (@measurable_bounded_integrable _ _ _ _ _ setT).
  - exact: measurableT.
  - suff: ((normal_prob 0 prior_sigma : probability _ _) setT < +oo)%E by [].
    by rewrite probability_setT; exact: ltey.
  - by move: sos_meas_proof ⇒ /measurable_EFinP.
  - rewrite /bounded_near.
    ∃ M; split; first by rewrite num_real.
    move⇒ M' hM' s _ /=.
    rewrite ger0_norm ?scalar_of_s_ge0 //.
    exact: (le_trans
              (sos_ub s)
              (ltW hM')).
move⇒ s'; rewrite /scalar_of_s /M.
have le1 := nf_le1; have pk := @normal_peak_ge0 R; have nf := @normal_fun_ge0 R.
have hge : ∀ a b c : R, (0 ≤ normal_peak a × normal_fun b a c)%R.
  by move⇒ a b c; exact: (mulr_ge0 (pk _) (nf _ _ _)).
have hle : ∀ a b c : R,
  (normal_peak a × normal_fun b a c ≤ normal_peak a)%R.
  move⇒ a b c; rewrite -[X in (_ ≤ X)%R]mulr1.
  by apply: ler_pM.
apply: ler_pM; [| | |exact: hle].
apply: mulr_ge0; [|exact: hge].
apply: mulr_ge0; [|exact: hge].
apply: mulr_ge0; [exact: hge|exact: hge].
exact: hge.
apply: ler_pM; [| | |exact: hle].
apply: mulr_ge0; [|exact: hge].
apply: mulr_ge0; [exact: hge|exact: hge].
exact: hge.
apply: ler_pM; [| | |exact: hle].
apply: mulr_ge0; [exact: hge|exact: hge].
exact: hge.
apply: ler_pM; [exact: hge|exact: hge|exact: hle|exact: hle].
Qed.

Program succeeds and integrates to 1 (all measure-theoretic side conditions discharged).

Theorem program_integrates_to_1 :
  ∃ density ,
    program = Some density ∧
    posterior_density (fun _ ⇒ 1) = 1.
Proof.
have [hev_pos hev_fin] :=
  evidence_pos obs_product_integrable obs_meas_proof
    obs_int_proof sos_meas_proof sos_int_proof.
∃ (fun p ⇒ 1 × (obs p)%:E / evidence); split.
- rewrite /program /norm_qbs -/(evidence).
  case: ifPn ⇒ // /negP.
  move/negP; rewrite negb_and ⇒ /orP[/negP|/negP]; contradiction.
- exact: posterior_density_total.
Qed.

Posterior expectation formula: E_postg = E_priorg × obs/Z.

Lemma posterior_measure_characterization
    (g : realQ R × realQ R → \bar R)
    (hint : (qbs_prob_mu slope_prior \x qbs_prob_mu intercept_prior).-integrable
      setT (qbs_pair_fun slope_prior intercept_prior
        (fun params ⇒ g params × (obs params)%:E)))
    (obs_meas : ∀ s, measurable_fun [set: mR]
      (fun b : mR ⇒ (obs (s , b ))%:E :> \bar R))
    (obs_int : ∀ s, (\int[normal_prob 0 prior_sigma]_b
      `|(obs (s , b ))%:E| < +oo)%E)
    (sos_meas : measurable_fun [set: mR]
      (fun s : mR ⇒ (scalar_of_s s)%:E :> \bar R))
    (sos_int : (\int[normal_prob 0 prior_sigma]_s
      `|(scalar_of_s s)%:E| < +oo)%E) :
  posterior_density g =
  qbs_pair_integral slope_prior intercept_prior
    (fun params ⇒ g params × ((obs params)%:E / evidence)).
Proof.
rewrite /posterior_density.
have hev := evidence_value obs_product_integrable obs_meas obs_int
              sos_meas sos_int.
rewrite hev.
have hc_neq0 : (phase2_const R != 0)%R by exact: lt0r_neq0 (phase2_const_gt0 R).
rewrite /qbs_pair_integral /=.
have → : (fun rr ⇒
  g (qbs_prob_alpha slope_prior rr .1 , qbs_prob_alpha intercept_prior rr .2 ) ×
  ((obs (qbs_prob_alpha slope_prior rr .1 ,
         qbs_prob_alpha intercept_prior rr .2 ))%:E /
   (phase2_const R)%:E)) =
  (fun rr ⇒
  (g (qbs_prob_alpha slope_prior rr .1 , qbs_prob_alpha intercept_prior rr .2 ) ×
   (obs (qbs_prob_alpha slope_prior rr .1 ,
         qbs_prob_alpha intercept_prior rr .2 ))%:E) × ((phase2_const R)^-1)%:E).
  apply: funext ⇒ rr /=.
  by rewrite inver (negbTE hc_neq0) muleA.
rewrite inver (negbTE hc_neq0).
by rewrite integralZr.
Qed.

End bayesian_regression.