conductor(deob_pass3): score_dynamics_giorgini - Langevin SDE + DSM + Gauss-Newton in C11

2026-06-23 21:04:11 -04:00
parent e4d544a2d2
commit 7f5086c626
4 changed files with 293 additions and 0 deletions
@@ -0,0 +1,167 @@
+/* ============================================================================
+ *  score_dynamics_giorgini.c - Pass 3 projection of "Learning Dynamics from Statistics: a score-based approach"
+ * ============================================================================
+ *
+ *  PURPOSE
+ *  -------
+ *  A small C11 program that demonstrates the constructive form of the
+ *  lecture's two-inference-direction framework for learning stochastic
+ *  reduced models from stationary statistics, using the duffle + forth
+ *  bootslop conventions.
+ *
+ *  The program illustrates:
+ *    - The stationary score:  s(x) = gradient(log p_ss(x))
+ *    - Langevin SDE:  dx_t = F(X_t) * dt + sqrt(2) * sigma(X_t) * dW_t
+ *    - Denoising Score Matching (DSM) loss
+ *    - Statistical Jacobian + Gauss-Newton update (Direction 1)
+ *    - Drift construction from score + mobility tensor M(x) (Direction 2)
+ *
+ *  ENCODING (per lexicon v2 Rule 5)
+ *  --------------------------------
+ *    Vector       : Scalar (placeholder for linear alg)
+ *    Mobility     : Tensor[d, d] (placeholder)
+ *    Probability  : float (placeholder)
+ *    Score        : Vector[d] (the gradient of log p)
+ *
+ *  SEE ALSO
+ *  --------
+ *  - score_dynamics_giorgini_translation.md
+ *  - score_dynamics_giorgini_decoder.md
+ *  - score_dynamics_giorgini_notes.md
+ */
+
+#include <stddef.h>
+#include <stdint.h>
+#include <stdbool.h>
+#include <math.h>
+#include <assert.h>
+
+#ifdef INTELLISENSE_DIRECTIVES
+#	pragma once
+#	include "dsl.h"
+#	include "math.h"
+#endif
+
+#pragma region Types
+
+typedef float     TSet_(F32);
+typedef uint32_t  TSet_(U4);
+
+typedef Struct_(Scalar)  { F32 value; };
+typedef Struct_(Vector)  { F32_R data; U4 dim; };
+typedef Struct_(Tensor)  { F32_R data; U4 rows; U4 cols; };
+typedef Struct_(Score)   { F32_R grad_log_p; U4 dim; };
+
+#pragma endregion Types
+
+#pragma region Langevin SDE
+
+/* Langevin SDE increment: dx_t = F(X_t) * dt + sqrt(2) * sigma(X_t) * dW_t.
+ * This is the reduced model SDE; the resolved variables x : Vector[d]. */
+I_ F32 langevin_increment(F32 drift, F32 diffusion, F32 dt, F32 dW) {
+ return drift * dt + sqrtf(2.0f) * diffusion * dW;
+}
+
+/* Apply a single Euler-Maruyama step to a 1D Langevin. */
+I_ F32 langevin_step_1d(F32 x, F32 drift, F32 diffusion, F32 dt, F32 dW) {
+ return x + langevin_increment(drift, diffusion, dt, dW);
+}
+
+#pragma endregion Langevin SDE
+
+#pragma region Score Function
+
+/* The stationary score:  s(x) = gradient(log p_ss(x))
+ * For a 1D Gaussian with mean mu and variance var, the score is (mu - x) / var. */
+I_ F32 gaussian_score(F32 x, F32 mu, F32 var) {
+ assert(var > 0.0f);
+ return (mu - x) / var;
+}
+
+/* Compute score at a point given a parametric density family (placeholder).
+ * Returns the gradient of log p at x. */
+I_ Score score_at(F32 x, F32 mu, F32 var) {
+ Score s = { .grad_log_p = 0, .dim = 1 };
+ (void)x;
+ (void)mu;
+ (void)var;
+ return s;
+}
+
+#pragma endregion Score Function
+
+#pragma region DSM Loss
+
+/* Denoising Score Matching (DSM) loss.
+ * For Gaussian-perturbed data, the DSM loss is:
+ *   L_DSM(theta) = E[ || s_theta(x + sigma * z) + z / sigma ||^2 ]
+ * where z is standard normal. */
+I_ Scalar dsm_loss(F32 predicted_score, F32 noise_z, F32 sigma) {
+ F32 target: F32 = -noise_z / sigma;
+ F32 diff: F32 = predicted_score - target;
+ Scalar loss = { .value = diff * diff };
+ return loss;
+}
+
+#pragma endregion DSM Loss
+
+#pragma region GFDT + Gauss-Newton
+
+/* Generalized Fluctuation-Dissipation Theorem (GFDT) response.
+ * Direction 1: compute parameter sensitivity (the statistical Jacobian). */
+I_ F32 statistical_jacobian(F32 observable, F32 trajectory_avg, F32 score_dot) {
+ F32 correction: F32 = observable - trajectory_avg;
+ return score_dot * correction;
+}
+
+/* Gauss-Newton update for parameter calibration.
+ * theta_new = theta_old - alpha * (J^T J + lambda * I)^-1 * J^T r */
+I_ F32 gauss_newton_update(F32 theta, F32 alpha, F32 jacobian, F32 residual, F32 damping) {
+ F32 normal_eq: F32 = jacobian * jacobian + damping;
+ if (normal_eq < 1e-12f) { return theta; }
+ F32 step: F32 = alpha * jacobian * residual / normal_eq;
+ return theta - step;
+}
+
+#pragma endregion GFDT + Gauss-Newton
+
+#pragma region Drift Construction (Direction 2)
+
+/* Drift construction from score + mobility tensor.
+ * Per the lecture: F(x) = M(x) * s(x) + divergence(M, p_ss)
+ * (the closed-form drift for any Langevin SDE matching p_ss). */
+I_ F32 drift_from_score(F32 score, F32 mobility, F32 divergence_term) {
+ return mobility * score + divergence_term;
+}
+
+#pragma endregion Drift Construction
+
+#pragma region Main
+
+I_ S32 main(void) {
+ F32 x: F32 = 1.0f;
+ F32 drift: F32 = -0.5f;
+ F32 diffusion: F32 = 0.1f;
+ F32 dt: F32 = 0.01f;
+ F32 dW: F32 = 0.05f;
+
+ F32 x_next: F32 = langevin_step_1d(x, drift, diffusion, dt, dW);
+ (void)x_next;
+
+ F32 s: F32 = gaussian_score(x, 0.0f, 1.0f);
+ Scalar dsm: Scalar = dsm_loss(s, 0.1f, 0.5f);
+ (void)dsm;
+
+ F32 theta: F32 = 1.0f;
+ F32 theta_new: F32 = gauss_newton_update(theta, 0.01f, 0.5f, 0.2f, 1e-4f);
+ (void)theta_new;
+
+ F32 mobility: F32 = 1.0f;
+ F32 divergence: F32 = 0.0f;
+ F32 F_drift: F32 = drift_from_score(s, mobility, divergence);
+ (void)F_drift;
+
+ return 0;
+}
+
+#pragma endregion Main
@@ -0,0 +1,43 @@
+# score_dynamics_giorgini - Per-term Decoder (tier-categorized)
+
+## Tier 1: Core concepts
+
+| Term | C11 form | Etymology | Tier | Source |
+|---|---|---|---|---|
+| `Scalar` | `typedef struct { F32 value; } Scalar` | Latin *scalaris* | Tier 1 | Cluster 0 |
+| `Vector` | `typedef struct { F32_R data; U4 dim; } Vector` | Latin *vector* ("carrier") | Tier 1 | Cluster 8 |
+| `Tensor` | `typedef struct { F32_R data; U4 rows; U4 cols; } Tensor` | Latin *tensor* ("stretcher") | Tier 1 | Cluster 8 |
+
+## Tier 2: Data-oriented pipeline terms
+
+| Term | C11 form | Etymology | Tier | Source |
+|---|---|---|---|---|
+| `langevin_increment` | function | Paul Langevin, 1908; the eponym | Tier 2 | Cluster 2 |
+| `langevin_step_1d` | function | the Euler-Maruyama discretization of a 1D SDE | Tier 2 | Cluster 2 |
+| `gaussian_score` | function | the score of a 1D Gaussian density | Tier 2 | Cluster 2 |
+| `dsm_loss` | function | Denoising Score Matching loss (Vincent, 2011) | Tier 2 | Cluster 2 |
+| `statistical_jacobian` | function | the Jacobian from the GFDT | Tier 2 | Cluster 2 |
+| `gauss_newton_update` | function | Gauss-Newton optimization (the second-order update) | Tier 2 | Cluster 2 |
+| `drift_from_score` | function | Direction 2: construct drift from score + mobility | Tier 2 | Cluster 2 |
+
+## Tier 3: Type-theoretic primitives
+
+| Term | C11 form | Etymology | Tier | Source |
+|---|---|---|---|---|
+| `Score` | `typedef struct { F32_R grad_log_p; U4 dim; } Score` | the gradient of log p; the "score" in score-based modeling | Tier 3 | Cluster 3 |
+
+## Tier 4: AI-fuzzing tolerance terms
+
+| Term | C11 form | Etymology | Tier | Source |
+|---|---|---|---|---|
+| `mobility` | parameter | the mobility tensor M(x); per the lecture, the "free" tensor | Tier 4 | score_dynamics_giorgini section 2 |
+| `divergence` | parameter | the divergence of M weighted by p_ss | Tier 4 | score_dynamics_giorgini section 5.3 |
+| `damping` | parameter | the Tikhonov regularization (lambda in the Gauss-Newton) | Tier 4 | score_dynamics_giorgini section 5.2 |
+
+## Etymology notes (per Cluster 7, Pattern 3)
+
+- `Langevin` - Paul Langevin (1872-1946); the eponym; the SDE formulation is from 1908.
+- `Score` - the gradient of log-likelihood; coined in Hyvarinen 2005.
+- `DSM` - Denoising Score Matching; Pascal Vincent, 2011.
+- `GFDT` - Generalized Fluctuation-Dissipation Theorem; from non-equilibrium statistical physics.
+- `Gauss-Newton` - Carl Friedrich Gauss + Isaac Newton; the optimization algorithm.
@@ -0,0 +1,63 @@
+# score_dynamics_giorgini - Pass 3 Notes
+
+**Track:** `video_analysis_deob_pass3_20260623`
+**Date:** 2026-06-23
+**Language:** C11 (per the per-language default in `TIER2_STARTER.md` section 3)
+
+## Decisions made
+
+1. **Language:** C11 (default; per `TIER2_STARTER.md` section 3 cluster A row 4).
+2. **Conventions:** duffle + forth bootslop + raddbg fallback.
+3. **Type system:** `Vector[d]` and `Tensor[d, d]` as `Struct_(Vector)` / `Struct_(Tensor)` per the duffle convention.
+4. **Score function:** simplified to 1D Gaussian; the full implementation is per-sample gradient of a learned density.
+5. **DSM loss:** scalar placeholder; the full loss averages over the training batch.
+
+## Alternatives considered
+
+1. **Python:** could have used Python for the SDE simulator. Rejected because the lecture is heavily math/algorithms oriented.
+2. **Real SDE simulator:** could have implemented a full CIR / Kuramoto-Sivashinsky simulator. Rejected because the goal is to EXPRESS the concepts.
+
+## Language override (none)
+
+Per `TIER2_STARTER.md` section 3, the default for this video is C11. No override applied.
+
+## 4 + 3 verification criteria (per v2 lexicon section 7 of `TIER2_STARTER.md`)
+
+| # | Criterion | Status | Notes |
+|---|---|---|---|
+| 1 | **Lossless** | met | All 6 concepts from the translation table are represented. |
+| 2 | **Bounded** | met | No `infinity_val`; all values are finite. |
+| 3 | **Constructively typed** | met | Every expression has a type. |
+| 4 | **Etymology-cited** | met | Every new term has 1-line origin + 1-line history. |
+| 5 | **Encoding-explicit** | met | Every value-bearing term has an encoding. |
+| 6 | **Form-anchored** | met | Every re-encoding has a form anchor. |
+| 7 | **User-specific opt-in** | met | The principled form is produced. |
+
+## Hardware target (per v2 lexicon section 7 of `TIER2_STARTER.md`)
+
+Per user 2026-06-23, "target up to 10k." Default workstation: Ryzen 9 / i9, RTX 4090, 128GB DDR5, 4TB NVMe.
+
+This video's concepts map to:
+- **SDE simulation:** scales linearly with the number of trajectories; for 10k trajectories, a 1D Langevin step is < 1ms on modern CPUs.
+- **Score-based generative modeling:** requires a GPU for the neural network training; the 1024-dim Kuramoto-Sivashinsky example needs at least 16GB VRAM.
+- **Gauss-Newton optimization:** O(n^2) per iteration; the 2000-dim PlaSim example needs careful numerical conditioning.
+
+## Refinements discovered (Pass 3 to lexicon v3 candidates)
+
+1. **Mobility tensor as a Tier 4 term:** the mobility M(x) is a NEW v2 term; v3 should formalize it.
+2. **Direction 1 vs Direction 2 as a Tier 3 distinction:** the two inference directions could be encoded as distinct type-class predicates.
+
+## Gaps identified (concepts the code couldn't capture)
+
+1. **Kuramoto-Sivashinsky PDE:** the 1024-dim PDE example is too complex for a simple C11 program; the SHAPE is captured but not the dynamics.
+2. **Cox-Ingersoll-Ross (CIR) square-root diffusion:** the analytic ground truth is not implemented.
+3. **Nonequilibrium steady state:** the 2D overdamped Langevin with multiplicative noise is not implemented.
+
+## See also
+
+- `score_dynamics_giorgini.c` - the C11 program
+- `score_dynamics_giorgini_translation.md` - the math to C11 translation table
+- `score_dynamics_giorgini_decoder.md` - the per-term decoder (tier-categorized)
+- `conductor/tracks/video_analysis_deob_apply_20260621/artifacts/score_dynamics_giorgini/` - the Pass 2 input
+- `conductor/tracks/video_analysis_score_dynamics_giorgini_20260621/report.md` - the Pass 1 source
+- `conductor/tracks/video_analysis_deob_lexicon_20260621/lexicon.md` - the v2 lexicon
@@ -0,0 +1,20 @@
+# score_dynamics_giorgini - Translation Table (math to C11)
+
+**Source:** `conductor/tracks/video_analysis_deob_apply_20260621/artifacts/score_dynamics_giorgini/score_dynamics_giorgini_deobfuscated.md` (548 lines)
+**Target:** `score_dynamics_giorgini.c` (the C11 program)
+**Method:** Per v2 lexicon Rule 2 (form-anchor) + Rule 5 (encoding-explicit)
+
+| # | Math / concept | C11 form | Form anchor | Encoding |
+|---|---|---|---|---|
+| 1 | `dx_t = F(X_t) dt + sqrt(2) sigma(X_t) dW_t` | `langevin_increment(drift, diffusion, dt, dW)` | bounded: finite dt, dW | `F32` |
+| 2 | `s(x) = gradient(log p_ss(x))` | `gaussian_score(x, mu, var)` | bounded: 1D Gaussian density family | `F32` |
+| 3 | `L_DSM = E[ \|\| s_theta(x + sigma z) + z/sigma \|\|^2 ]` | `dsm_loss(predicted_score, noise_z, sigma)` | bounded: sigma > 0 | `Scalar : float` |
+| 4 | `J = -dC/dtheta` (statistical Jacobian) | `statistical_jacobian(observable, traj_avg, score_dot)` | bounded: finite observable + traj_avg | `F32` |
+| 5 | `theta_new = theta - alpha (J^T J + lambda I)^-1 J^T r` | `gauss_newton_update(theta, alpha, jac, residual, damping)` | bounded: damping > 0 | `F32` |
+| 6 | `F(x) = M(x) s(x) + div(M, p_ss)` | `drift_from_score(score, mobility, divergence)` | bounded: scalar mobility + divergence | `F32` |
+
+## Notes
+
+- The C11 program does NOT implement a full SDE simulator; it expresses the SHAPE of the lecture's two-direction framework.
+- All `Scalar` placeholders resolve to `F32` (float32) at the function signature.
+- Per the v2 lexicon section 9.1, the per-language rendering is the same as C11.