gHashTag · June 14, 2026 18:00
diff --git a/README.md b/README.md
diff --git a/Cargo.toml b/Cargo.toml
 [package]
 name = "floor_oracle"
 version = "0.1.0"
 edition = "2021"

 [[bin]]
 name = "floor_oracle"
 path = "src/bin/floor_oracle.rs"

 [[bin]]
 name = "floor_oracle_selftest"
 path = "src/bin/floor_oracle_selftest.rs"

 [profile.release]
 opt-level = 2
diff --git a/core.rs b/core.rs
 // core.rs -- shared deterministic logic for floor_oracle.
 // ASCII-only. No external crates. Integer-exact where it matters.
 // Included via include!() into both the oracle bin and the self-test bin.

 // ---- IGLA-Coder live constants (from src/bin/igla_coder.rs HEAD 4bbd5a946bd4) ----
 pub const VOCAB: u64 = 263;
 pub const MAXSEQ: u64 = 512;
 // dff = 4*d ; heads do not change the parameter count for this arch.

 // Param law, closed form:
 //   params = (VOCAB + MAXSEQ + 1)*d + L*(12*d^2 + 2*d)
 //          = 776*d + L*(12*d^2 + 2*d)
 // The (VOCAB+MAXSEQ+1) term = token embedding (VOCAB*d) + positional (MAXSEQ*d)
 // + final norm/proj scale (d). The per-layer term 12*d^2 covers attention
 // (q,k,v,o = 4*d^2) + MLP (d*dff + dff*d = 8*d^2) and 2*d the layer biases/norms.
 pub fn params_closed(d: u64, l: u64) -> u64 {
    (VOCAB + MAXSEQ + 1) * d + l * (12 * d * d + 2 * d)
 }

 // Independent re-derivation by explicit per-block tensor-shape sum.
 // If this disagrees with params_closed, the law is wrong -> abort upstream.
 pub fn params_tensor_sum(d: u64, l: u64) -> u64 {
    let embed = VOCAB * d;        // token embedding
    let pos = MAXSEQ * d;         // positional embedding
    let final_scale = d;          // final norm scale
    let per_layer_attn = 4 * d * d; // q,k,v,o projections
    let dff = 4 * d;
    let per_layer_mlp = d * dff + dff * d; // up + down = 8*d^2
    let per_layer_bias = 2 * d;   // norm/bias terms
    let per_layer = per_layer_attn + per_layer_mlp + per_layer_bias;
    embed + pos + final_scale + l * per_layer
 }

 pub const ANCHOR_PARAMS: u64 = 493_056; // d=128, L=2, heads=4

 // ---- Published floors (each typed from its paper, carries arXiv id) ----
 pub struct Floor {
    pub name: &'static str,
    pub params: u64,
    pub tokens: u64,
    pub arxiv: &'static str,
    pub pass1_pct: f64, // reported HumanEval pass@1, pretrain
 }

 pub fn floors() -> Vec<Floor> {
    vec![
        Floor { name: "TinyCodeLM-150M", params: 150_000_000, tokens: 72_000_000_000, arxiv: "2410.02749", pass1_pct: 6.1 },
        Floor { name: "TinyCodeLM-400M", params: 400_000_000, tokens: 72_000_000_000, arxiv: "2410.02749", pass1_pct: 6.7 },
        Floor { name: "phi-1-small-350M", params: 350_000_000, tokens: 7_000_000_000, arxiv: "2306.11644", pass1_pct: 45.0 },
        Floor { name: "SmolLM-135M", params: 135_000_000, tokens: 12_000_000_000, arxiv: "2502.02737", pass1_pct: 16.0 },
    ]
 }

 // Multiplicative gap (floor / ours). >1 means we are below the floor.
 pub fn gap(floor_val: u64, our_val: u64) -> f64 {
    floor_val as f64 / our_val as f64
 }

 // ---- Chinchilla deficit (Hoffmann 2022, 20 tok/param) ----
 pub const CHINCHILLA_TOK_PER_PARAM: u64 = 20;
 pub fn chinchilla_optimal_tokens(params: u64) -> u64 {
    CHINCHILLA_TOK_PER_PARAM * params
 }
 pub fn chinchilla_deficit(params: u64, corpus_tokens: u64) -> f64 {
    chinchilla_optimal_tokens(params) as f64 / corpus_tokens as f64
 }

 pub const OUR_CORPUS_TOKENS: u64 = 72_071; // real-corpus-grow run 2026-06-14

 // ---- Wilson 95% upper bound for 0 successes in n trials ----
 // For c=0 the Wilson upper bound has a closed form:
 //   u = z^2 / (n + z^2)   (with p_hat = 0)
 // z = 1.959963985 for 95% two-sided.
 pub const Z95: f64 = 1.959_963_985_0;
 pub fn wilson_zero_success_upper(n: u64) -> f64 {
    let z2 = Z95 * Z95;
    z2 / (n as f64 + z2)
 }

 // ---- pass@k unbiased estimator (Chen 2021): 1 - C(n-c,k)/C(n,k) ----
 // Exact via u128 binomials; pass@1 = c/n.
 pub fn binom_u128(n: u64, k: u64) -> u128 {
    if k > n { return 0; }
    let k = k.min(n - k);
    let mut num: u128 = 1;
    let mut den: u128 = 1;
    for i in 0..k {
        num = num.saturating_mul((n - i) as u128);
        den = den.saturating_mul((i + 1) as u128);
    }
    num / den
 }
 pub fn pass_at_k(n: u64, c: u64, k: u64) -> f64 {
    // c successes among n samples; probability that k random samples include >=1 success.
    if c >= n { return 1.0; }       // all succeed -> always
    if c == 0 { return 0.0; }       // none succeed -> never
    if k > n { return f64::NAN; }
    let fail = binom_u128(n - c, k) as f64 / binom_u128(n, k) as f64;
    1.0 - fail
 }
 pub fn pass_at_1(n: u64, c: u64) -> f64 {
    c as f64 / n as f64
 }

 // Verdict helper: are we below a floor on params?
 pub fn below_floor_params(floor_params: u64, our_params: u64) -> bool {
    our_params < floor_params
 }
diff --git a/floor_oracle.rs b/floor_oracle.rs
 // floor_oracle.rs -- scaling-floor + eval-power calculator for IGLA-Coder.
 // ASCII-only. Deterministic. Emits auditable JSON. RUST-ONLY.
 // Capability fields that need a real run stay TRAIN_BOX_PENDING -- never fabricated.

 include!("../core.rs");

 use std::fs;

 fn jstr(s: &str) -> String { format!("\"{}\"", s) }

 fn main() {
    // --- S-2: reproduce the 493,056 anchor TWO ways ---
    let d = 128u64;
    let l = 2u64;
    let p_closed = params_closed(d, l);
    let p_tensor = params_tensor_sum(d, l);
    if p_closed != ANCHOR_PARAMS || p_tensor != ANCHOR_PARAMS {
        eprintln!("FATAL: param law does not reproduce anchor: closed={} tensor={} expected={}",
            p_closed, p_tensor, ANCHOR_PARAMS);
        std::process::exit(2);
    }
    let p148 = params_closed(64, 2); // hidden=64 config (148K)

    // --- S-3: floor gaps from OUR config (493K params, 72071 tokens) ---
    let mut floor_json = Vec::new();
    let mut all_below = true;
    for f in floors() {
        let pg = gap(f.params, ANCHOR_PARAMS);
        let tg = gap(f.tokens, OUR_CORPUS_TOKENS);
        let below = below_floor_params(f.params, ANCHOR_PARAMS);
        if !below { all_below = false; }
        floor_json.push(format!(
            "    {{\"name\": {}, \"arxiv\": {}, \"floor_params\": {}, \"floor_tokens\": {}, \"reported_pass1_pct\": {:.1}, \"param_gap_x\": {:.1}, \"token_gap_x\": {:.1}, \"we_are_below\": {}}}",
            jstr(f.name), jstr(f.arxiv), f.params, f.tokens, f.pass1_pct, pg, tg, below));
    }

    // --- S-4: Chinchilla deficit ---
    let def493 = chinchilla_deficit(ANCHOR_PARAMS, OUR_CORPUS_TOKENS);
    let def148 = chinchilla_deficit(p148, OUR_CORPUS_TOKENS);

    // --- S-5: eval power ---
    let mut wilson_json = Vec::new();
    for n in [4u64, 16, 32] {
        wilson_json.push(format!(
            "    {{\"n\": {}, \"wilson95_zero_success_upper\": {:.4}}}", n, wilson_zero_success_upper(n)));
    }
    // pass@k illustration at n=16, hypothetical c values (NOT a measured rate)
    let mut passk_json = Vec::new();
    for &(n, c, k) in &[(16u64, 0u64, 1u64), (16, 1, 1), (16, 1, 16), (16, 4, 1), (16, 4, 8), (32, 0, 1)] {
        passk_json.push(format!(
            "    {{\"n\": {}, \"c\": {}, \"k\": {}, \"pass_at_k\": {:.4}}}", n, c, k, pass_at_k(n, c, k)));
    }

    let verdict = if all_below {
        "BELOW_EVERY_PUBLISHED_FLOOR (H0 expected): our 493056 params and 72071 tokens are below every published non-zero-pass@1 code-LM floor; a measured 0/n is consistent with any true rate under the Wilson ceiling for that n. Binding gap is JOINT (params AND tokens)."
    } else {
        "AT_OR_ABOVE_A_FLOOR (H1): a published floor at or below our scale exists -- gap is NOT scale; investigate data-format/architecture."
    };

    let json = format!(
 "{{
  \"loop\": \"2026-06-15\",
  \"canon_head\": \"4bbd5a946bd4fba257d1fa1a2e872b4101b76676\",
  \"our_config\": {{
    \"params_148k_hidden64\": {},
    \"params_493k_hidden128\": {},
    \"anchor_reproduced_two_ways\": true,
    \"corpus_tokens\": {}
  }},
  \"floors\": [
 {}
  ],
  \"chinchilla\": {{
    \"tok_per_param\": {},
    \"deficit_x_at_493k\": {:.1},
    \"deficit_x_at_148k\": {:.1}
  }},
  \"eval_power_wilson95_zero_success\": [
 {}
  ],
  \"pass_at_k_examples\": [
 {}
  ],
  \"capability_compile_at_1\": \"TRAIN_BOX_PENDING\",
  \"capability_pass_at_1\": \"TRAIN_BOX_PENDING\",
  \"verdict\": {}
 }}",
        p148, p_closed, OUR_CORPUS_TOKENS,
        floor_json.join(",\n"),
        CHINCHILLA_TOK_PER_PARAM, def493, def148,
        wilson_json.join(",\n"),
        passk_json.join(",\n"),
        jstr(verdict));

    println!("{}", json);
    let _ = fs::create_dir_all("data");
    fs::write("data/floor_oracle_report.json", &json).expect("write report");
    eprintln!("[ok] floor_oracle report written to data/floor_oracle_report.json");
 }
diff --git a/floor_oracle_report.json b/floor_oracle_report.json
 {
  "loop": "2026-06-15",
  "canon_head": "4bbd5a946bd4fba257d1fa1a2e872b4101b76676",
  "our_config": {
    "params_148k_hidden64": 148224,
    "params_493k_hidden128": 493056,
    "anchor_reproduced_two_ways": true,
    "corpus_tokens": 72071
  },
  "floors": [
    {"name": "TinyCodeLM-150M", "arxiv": "2410.02749", "floor_params": 150000000, "floor_tokens": 72000000000, "reported_pass1_pct": 6.1, "param_gap_x": 304.2, "token_gap_x": 999014.9, "we_are_below": true},
    {"name": "TinyCodeLM-400M", "arxiv": "2410.02749", "floor_params": 400000000, "floor_tokens": 72000000000, "reported_pass1_pct": 6.7, "param_gap_x": 811.3, "token_gap_x": 999014.9, "we_are_below": true},
    {"name": "phi-1-small-350M", "arxiv": "2306.11644", "floor_params": 350000000, "floor_tokens": 7000000000, "reported_pass1_pct": 45.0, "param_gap_x": 709.9, "token_gap_x": 97126.4, "we_are_below": true},
    {"name": "SmolLM-135M", "arxiv": "2502.02737", "floor_params": 135000000, "floor_tokens": 12000000000, "reported_pass1_pct": 16.0, "param_gap_x": 273.8, "token_gap_x": 166502.5, "we_are_below": true}
  ],
  "chinchilla": {
    "tok_per_param": 20,
    "deficit_x_at_493k": 136.8,
    "deficit_x_at_148k": 41.1
  },
  "eval_power_wilson95_zero_success": [
    {"n": 4, "wilson95_zero_success_upper": 0.4899},
    {"n": 16, "wilson95_zero_success_upper": 0.1936},
    {"n": 32, "wilson95_zero_success_upper": 0.1072}
  ],
  "pass_at_k_examples": [
    {"n": 16, "c": 0, "k": 1, "pass_at_k": 0.0000},
    {"n": 16, "c": 1, "k": 1, "pass_at_k": 0.0625},
    {"n": 16, "c": 1, "k": 16, "pass_at_k": 1.0000},
    {"n": 16, "c": 4, "k": 1, "pass_at_k": 0.2500},
    {"n": 16, "c": 4, "k": 8, "pass_at_k": 0.9615},
    {"n": 32, "c": 0, "k": 1, "pass_at_k": 0.0000}
  ],
  "capability_compile_at_1": "TRAIN_BOX_PENDING",
  "capability_pass_at_1": "TRAIN_BOX_PENDING",
  "verdict": "BELOW_EVERY_PUBLISHED_FLOOR (H0 expected): our 493056 params and 72071 tokens are below every published non-zero-pass@1 code-LM floor; a measured 0/n is consistent with any true rate under the Wilson ceiling for that n. Binding gap is JOINT (params AND tokens)."
 }
diff --git a/floor_oracle_selftest.rs b/floor_oracle_selftest.rs
 // floor_oracle_selftest.rs -- FAIL-reachable self-test for the oracle.
 // ASCII-only. Each gate is demonstrated reachable as a FAILURE on a broken input.
 // Exit 0 = all PASS; exit 1 = a gate failed.

 include!("../core.rs");

 use std::process::exit;

 fn check(name: &str, cond: bool, pass: &mut u32, fail: &mut u32) {
    if cond { *pass += 1; println!("PASS {}", name); }
    else { *fail += 1; println!("FAIL {}", name); }
 }

 // A deliberately WRONG param law to prove T1/T2 can fail.
 fn params_wrong(d: u64, l: u64) -> u64 { 999 * d + l * d } // not the real law

 fn main() {
    let mut pass = 0u32;
    let mut fail = 0u32;

    // T1: param law reproduces 493056 two independent ways.
    let pc = params_closed(128, 2);
    let pt = params_tensor_sum(128, 2);
    check("T1a closed law == 493056", pc == ANCHOR_PARAMS, &mut pass, &mut fail);
    check("T1b tensor-sum == 493056", pt == ANCHOR_PARAMS, &mut pass, &mut fail);
    check("T1c two derivations agree", pc == pt, &mut pass, &mut fail);
    // FAIL-reachability: the wrong law must NOT reproduce the anchor.
    check("T1d wrong law is rejected (FAIL-reachable)", params_wrong(128, 2) != ANCHOR_PARAMS, &mut pass, &mut fail);

    // T2: a lying floor (floor params < our params) MUST flip the verdict to at/above.
    let our = ANCHOR_PARAMS;
    let honest_floor = 150_000_000u64; // real TinyCodeLM-150M
    let lying_floor = 1_000u64;        // absurd: smaller than our model
    check("T2a honest floor -> we are below", below_floor_params(honest_floor, our), &mut pass, &mut fail);
    check("T2b lying floor -> NOT below (verdict flips, FAIL-reachable)", !below_floor_params(lying_floor, our), &mut pass, &mut fail);

    // T3: Wilson 0-success ceiling strictly decreasing in n.
    let w4 = wilson_zero_success_upper(4);
    let w16 = wilson_zero_success_upper(16);
    let w32 = wilson_zero_success_upper(32);
    check("T3a w4 > w16", w4 > w16, &mut pass, &mut fail);
    check("T3b w16 > w32", w16 > w32, &mut pass, &mut fail);
    // Sanity vs pre-registered values (~0.49 / ~0.19 / ~0.11).
    check("T3c w4 ~0.49", (w4 - 0.490).abs() < 0.02, &mut pass, &mut fail);
    check("T3d w16 ~0.19", (w16 - 0.194).abs() < 0.02, &mut pass, &mut fail);
    check("T3e w32 ~0.11", (w32 - 0.107).abs() < 0.02, &mut pass, &mut fail);

    // T4: pass@1 identity c/n.
    check("T4a pass@1(16,4) == 0.25", (pass_at_1(16, 4) - 0.25).abs() < 1e-12, &mut pass, &mut fail);
    check("T4b pass@1(32,0) == 0.0", pass_at_1(32, 0) == 0.0, &mut pass, &mut fail);

    // T5: pass@k boundaries + monotone non-decreasing in c.
    check("T5a pass@k c=0 -> 0", pass_at_k(16, 0, 1) == 0.0, &mut pass, &mut fail);
    check("T5b pass@k c=n -> 1", (pass_at_k(16, 16, 4) - 1.0).abs() < 1e-12, &mut pass, &mut fail);
    let mut monotone = true;
    let mut prev = -1.0f64;
    for c in 0..=16u64 {
        let v = pass_at_k(16, c, 4);
        if v + 1e-12 < prev { monotone = false; }
        prev = v;
    }
    check("T5c pass@k monotone non-decreasing in c", monotone, &mut pass, &mut fail);
    // FAIL-reachability: a decreasing-in-c "rate" would trip this; prove the guard works.
    let broken_monotone = {
        let seq = [0.0f64, 0.5, 0.4]; // deliberately decreasing
        let mut ok = true; let mut p = -1.0;
        for &v in &seq { if v + 1e-12 < p { ok = false; } p = v; }
        ok
    };
    check("T5d broken decreasing seq is caught (FAIL-reachable)", !broken_monotone, &mut pass, &mut fail);

    // T6: no-fabrication gate. With no result.json, the oracle MUST keep capability
    // as the literal sentinel and emit NO float rate. We assert the sentinel string
    // is what the oracle writes (read its emitted report if present, else the constant).
    let sentinel = "TRAIN_BOX_PENDING";
    let report = std::fs::read_to_string("data/floor_oracle_report.json").unwrap_or_default();
    if report.is_empty() {
        // oracle not yet run; assert the sentinel is a non-numeric string (cannot be a rate)
        check("T6a sentinel is non-numeric", sentinel.parse::<f64>().is_err(), &mut pass, &mut fail);
    } else {
        let has_sentinel = report.contains("\"capability_compile_at_1\": \"TRAIN_BOX_PENDING\"")
            && report.contains("\"capability_pass_at_1\": \"TRAIN_BOX_PENDING\"");
        check("T6a report keeps TRAIN_BOX_PENDING for both capability fields", has_sentinel, &mut pass, &mut fail);
        // no float capability rate may appear like "capability_pass_at_1": 0.xx
        let fabricated = report.contains("\"capability_pass_at_1\": 0.")
            || report.contains("\"capability_compile_at_1\": 0.");
        check("T6b no fabricated capability rate present (FAIL-reachable)", !fabricated, &mut pass, &mut fail);
    }

    // T7: determinism -- closed-form law is pure; same inputs -> same outputs.
    check("T7 determinism (pure law)", params_closed(128, 2) == params_closed(128, 2)
        && wilson_zero_success_upper(32) == wilson_zero_success_upper(32), &mut pass, &mut fail);

    println!("---");
    println!("PASS={} FAIL={}", pass, fail);
    if fail == 0 { println!("ALL SELF-TESTS PASS"); exit(0); }
    else { println!("SELF-TEST FAILURES PRESENT"); exit(1); }
 }
	[package]
	name = "floor_oracle"
	version = "0.1.0"
	edition = "2021"

	[[bin]]
	name = "floor_oracle"
	path = "src/bin/floor_oracle.rs"

	[[bin]]
	name = "floor_oracle_selftest"
	path = "src/bin/floor_oracle_selftest.rs"

	[profile.release]
	opt-level = 2
	// core.rs -- shared deterministic logic for floor_oracle.
	// ASCII-only. No external crates. Integer-exact where it matters.
	// Included via include!() into both the oracle bin and the self-test bin.

	// ---- IGLA-Coder live constants (from src/bin/igla_coder.rs HEAD 4bbd5a946bd4) ----
	pub const VOCAB: u64 = 263;
	pub const MAXSEQ: u64 = 512;
	// dff = 4*d ; heads do not change the parameter count for this arch.

	// Param law, closed form:
	// params = (VOCAB + MAXSEQ + 1)d + L(12d^2 + 2d)
	// = 776d + L(12d^2 + 2d)
	// The (VOCAB+MAXSEQ+1) term = token embedding (VOCABd) + positional (MAXSEQd)
	// + final norm/proj scale (d). The per-layer term 12*d^2 covers attention
	// (q,k,v,o = 4d^2) + MLP (ddff + dffd = 8d^2) and 2*d the layer biases/norms.
	pub fn params_closed(d: u64, l: u64) -> u64 {
	(VOCAB + MAXSEQ + 1) * d + l * (12 * d * d + 2 * d)
	}

	// Independent re-derivation by explicit per-block tensor-shape sum.
	// If this disagrees with params_closed, the law is wrong -> abort upstream.
	pub fn params_tensor_sum(d: u64, l: u64) -> u64 {
	let embed = VOCAB * d; // token embedding
	let pos = MAXSEQ * d; // positional embedding
	let final_scale = d; // final norm scale
	let per_layer_attn = 4 * d * d; // q,k,v,o projections
	let dff = 4 * d;
	let per_layer_mlp = d * dff + dff * d; // up + down = 8*d^2
	let per_layer_bias = 2 * d; // norm/bias terms
	let per_layer = per_layer_attn + per_layer_mlp + per_layer_bias;
	embed + pos + final_scale + l * per_layer
	}

	pub const ANCHOR_PARAMS: u64 = 493_056; // d=128, L=2, heads=4

	// ---- Published floors (each typed from its paper, carries arXiv id) ----
	pub struct Floor {
	pub name: &'static str,
	pub params: u64,
	pub tokens: u64,
	pub arxiv: &'static str,
	pub pass1_pct: f64, // reported HumanEval pass@1, pretrain
	}

	pub fn floors() -> Vec<Floor> {
	vec![
	Floor { name: "TinyCodeLM-150M", params: 150_000_000, tokens: 72_000_000_000, arxiv: "2410.02749", pass1_pct: 6.1 },
	Floor { name: "TinyCodeLM-400M", params: 400_000_000, tokens: 72_000_000_000, arxiv: "2410.02749", pass1_pct: 6.7 },
	Floor { name: "phi-1-small-350M", params: 350_000_000, tokens: 7_000_000_000, arxiv: "2306.11644", pass1_pct: 45.0 },
	Floor { name: "SmolLM-135M", params: 135_000_000, tokens: 12_000_000_000, arxiv: "2502.02737", pass1_pct: 16.0 },
	]
	}

	// Multiplicative gap (floor / ours). >1 means we are below the floor.
	pub fn gap(floor_val: u64, our_val: u64) -> f64 {
	floor_val as f64 / our_val as f64
	}

	// ---- Chinchilla deficit (Hoffmann 2022, 20 tok/param) ----
	pub const CHINCHILLA_TOK_PER_PARAM: u64 = 20;
	pub fn chinchilla_optimal_tokens(params: u64) -> u64 {
	CHINCHILLA_TOK_PER_PARAM * params
	}
	pub fn chinchilla_deficit(params: u64, corpus_tokens: u64) -> f64 {
	chinchilla_optimal_tokens(params) as f64 / corpus_tokens as f64
	}

	pub const OUR_CORPUS_TOKENS: u64 = 72_071; // real-corpus-grow run 2026-06-14

	// ---- Wilson 95% upper bound for 0 successes in n trials ----
	// For c=0 the Wilson upper bound has a closed form:
	// u = z^2 / (n + z^2) (with p_hat = 0)
	// z = 1.959963985 for 95% two-sided.
	pub const Z95: f64 = 1.959_963_985_0;
	pub fn wilson_zero_success_upper(n: u64) -> f64 {
	let z2 = Z95 * Z95;
	z2 / (n as f64 + z2)
	}

	// ---- pass@k unbiased estimator (Chen 2021): 1 - C(n-c,k)/C(n,k) ----
	// Exact via u128 binomials; pass@1 = c/n.
	pub fn binom_u128(n: u64, k: u64) -> u128 {
	if k > n { return 0; }
	let k = k.min(n - k);
	let mut num: u128 = 1;
	let mut den: u128 = 1;
	for i in 0..k {
	num = num.saturating_mul((n - i) as u128);
	den = den.saturating_mul((i + 1) as u128);
	}
	num / den
	}
	pub fn pass_at_k(n: u64, c: u64, k: u64) -> f64 {
	// c successes among n samples; probability that k random samples include >=1 success.
	if c >= n { return 1.0; } // all succeed -> always
	if c == 0 { return 0.0; } // none succeed -> never
	if k > n { return f64::NAN; }
	let fail = binom_u128(n - c, k) as f64 / binom_u128(n, k) as f64;
	1.0 - fail
	}
	pub fn pass_at_1(n: u64, c: u64) -> f64 {
	c as f64 / n as f64
	}

	// Verdict helper: are we below a floor on params?
	pub fn below_floor_params(floor_params: u64, our_params: u64) -> bool {
	our_params < floor_params
	}
	// floor_oracle.rs -- scaling-floor + eval-power calculator for IGLA-Coder.
	// ASCII-only. Deterministic. Emits auditable JSON. RUST-ONLY.
	// Capability fields that need a real run stay TRAIN_BOX_PENDING -- never fabricated.

	include!("../core.rs");

	use std::fs;

	fn jstr(s: &str) -> String { format!("\"{}\"", s) }

	fn main() {
	// --- S-2: reproduce the 493,056 anchor TWO ways ---
	let d = 128u64;
	let l = 2u64;
	let p_closed = params_closed(d, l);
	let p_tensor = params_tensor_sum(d, l);
	if p_closed != ANCHOR_PARAMS \|\| p_tensor != ANCHOR_PARAMS {
	eprintln!("FATAL: param law does not reproduce anchor: closed={} tensor={} expected={}",
	p_closed, p_tensor, ANCHOR_PARAMS);
	std::process::exit(2);
	}
	let p148 = params_closed(64, 2); // hidden=64 config (148K)

	// --- S-3: floor gaps from OUR config (493K params, 72071 tokens) ---
	let mut floor_json = Vec::new();
	let mut all_below = true;
	for f in floors() {
	let pg = gap(f.params, ANCHOR_PARAMS);
	let tg = gap(f.tokens, OUR_CORPUS_TOKENS);
	let below = below_floor_params(f.params, ANCHOR_PARAMS);
	if !below { all_below = false; }
	floor_json.push(format!(
	" {{\"name\": {}, \"arxiv\": {}, \"floor_params\": {}, \"floor_tokens\": {}, \"reported_pass1_pct\": {:.1}, \"param_gap_x\": {:.1}, \"token_gap_x\": {:.1}, \"we_are_below\": {}}}",
	jstr(f.name), jstr(f.arxiv), f.params, f.tokens, f.pass1_pct, pg, tg, below));
	}

	// --- S-4: Chinchilla deficit ---
	let def493 = chinchilla_deficit(ANCHOR_PARAMS, OUR_CORPUS_TOKENS);
	let def148 = chinchilla_deficit(p148, OUR_CORPUS_TOKENS);

	// --- S-5: eval power ---
	let mut wilson_json = Vec::new();
	for n in [4u64, 16, 32] {
	wilson_json.push(format!(
	" {{\"n\": {}, \"wilson95_zero_success_upper\": {:.4}}}", n, wilson_zero_success_upper(n)));
	}
	// pass@k illustration at n=16, hypothetical c values (NOT a measured rate)
	let mut passk_json = Vec::new();
	for &(n, c, k) in &[(16u64, 0u64, 1u64), (16, 1, 1), (16, 1, 16), (16, 4, 1), (16, 4, 8), (32, 0, 1)] {
	passk_json.push(format!(
	" {{\"n\": {}, \"c\": {}, \"k\": {}, \"pass_at_k\": {:.4}}}", n, c, k, pass_at_k(n, c, k)));
	}

	let verdict = if all_below {
	"BELOW_EVERY_PUBLISHED_FLOOR (H0 expected): our 493056 params and 72071 tokens are below every published non-zero-pass@1 code-LM floor; a measured 0/n is consistent with any true rate under the Wilson ceiling for that n. Binding gap is JOINT (params AND tokens)."
	} else {
	"AT_OR_ABOVE_A_FLOOR (H1): a published floor at or below our scale exists -- gap is NOT scale; investigate data-format/architecture."
	};

	let json = format!(
	"{{
	\"loop\": \"2026-06-15\",
	\"canon_head\": \"4bbd5a946bd4fba257d1fa1a2e872b4101b76676\",
	\"our_config\": {{
	\"params_148k_hidden64\": {},
	\"params_493k_hidden128\": {},
	\"anchor_reproduced_two_ways\": true,
	\"corpus_tokens\": {}
	}},
	\"floors\": [
	{}
	],
	\"chinchilla\": {{
	\"tok_per_param\": {},
	\"deficit_x_at_493k\": {:.1},
	\"deficit_x_at_148k\": {:.1}
	}},
	\"eval_power_wilson95_zero_success\": [
	{}
	],
	\"pass_at_k_examples\": [
	{}
	],
	\"capability_compile_at_1\": \"TRAIN_BOX_PENDING\",
	\"capability_pass_at_1\": \"TRAIN_BOX_PENDING\",
	\"verdict\": {}
	}}",
	p148, p_closed, OUR_CORPUS_TOKENS,
	floor_json.join(",\n"),
	CHINCHILLA_TOK_PER_PARAM, def493, def148,
	wilson_json.join(",\n"),
	passk_json.join(",\n"),
	jstr(verdict));

	println!("{}", json);
	let _ = fs::create_dir_all("data");
	fs::write("data/floor_oracle_report.json", &json).expect("write report");
	eprintln!("[ok] floor_oracle report written to data/floor_oracle_report.json");
	}
	{
	"loop": "2026-06-15",
	"canon_head": "4bbd5a946bd4fba257d1fa1a2e872b4101b76676",
	"our_config": {
	"params_148k_hidden64": 148224,
	"params_493k_hidden128": 493056,
	"anchor_reproduced_two_ways": true,
	"corpus_tokens": 72071
	},
	"floors": [
	{"name": "TinyCodeLM-150M", "arxiv": "2410.02749", "floor_params": 150000000, "floor_tokens": 72000000000, "reported_pass1_pct": 6.1, "param_gap_x": 304.2, "token_gap_x": 999014.9, "we_are_below": true},
	{"name": "TinyCodeLM-400M", "arxiv": "2410.02749", "floor_params": 400000000, "floor_tokens": 72000000000, "reported_pass1_pct": 6.7, "param_gap_x": 811.3, "token_gap_x": 999014.9, "we_are_below": true},
	{"name": "phi-1-small-350M", "arxiv": "2306.11644", "floor_params": 350000000, "floor_tokens": 7000000000, "reported_pass1_pct": 45.0, "param_gap_x": 709.9, "token_gap_x": 97126.4, "we_are_below": true},
	{"name": "SmolLM-135M", "arxiv": "2502.02737", "floor_params": 135000000, "floor_tokens": 12000000000, "reported_pass1_pct": 16.0, "param_gap_x": 273.8, "token_gap_x": 166502.5, "we_are_below": true}
	],
	"chinchilla": {
	"tok_per_param": 20,
	"deficit_x_at_493k": 136.8,
	"deficit_x_at_148k": 41.1
	},
	"eval_power_wilson95_zero_success": [
	{"n": 4, "wilson95_zero_success_upper": 0.4899},
	{"n": 16, "wilson95_zero_success_upper": 0.1936},
	{"n": 32, "wilson95_zero_success_upper": 0.1072}
	],
	"pass_at_k_examples": [
	{"n": 16, "c": 0, "k": 1, "pass_at_k": 0.0000},
	{"n": 16, "c": 1, "k": 1, "pass_at_k": 0.0625},
	{"n": 16, "c": 1, "k": 16, "pass_at_k": 1.0000},
	{"n": 16, "c": 4, "k": 1, "pass_at_k": 0.2500},
	{"n": 16, "c": 4, "k": 8, "pass_at_k": 0.9615},
	{"n": 32, "c": 0, "k": 1, "pass_at_k": 0.0000}
	],
	"capability_compile_at_1": "TRAIN_BOX_PENDING",
	"capability_pass_at_1": "TRAIN_BOX_PENDING",
	"verdict": "BELOW_EVERY_PUBLISHED_FLOOR (H0 expected): our 493056 params and 72071 tokens are below every published non-zero-pass@1 code-LM floor; a measured 0/n is consistent with any true rate under the Wilson ceiling for that n. Binding gap is JOINT (params AND tokens)."
	}
	// floor_oracle_selftest.rs -- FAIL-reachable self-test for the oracle.
	// ASCII-only. Each gate is demonstrated reachable as a FAILURE on a broken input.
	// Exit 0 = all PASS; exit 1 = a gate failed.

	include!("../core.rs");

	use std::process::exit;

	fn check(name: &str, cond: bool, pass: &mut u32, fail: &mut u32) {
	if cond { *pass += 1; println!("PASS {}", name); }
	else { *fail += 1; println!("FAIL {}", name); }
	}

	// A deliberately WRONG param law to prove T1/T2 can fail.
	fn params_wrong(d: u64, l: u64) -> u64 { 999 * d + l * d } // not the real law

	fn main() {
	let mut pass = 0u32;
	let mut fail = 0u32;

	// T1: param law reproduces 493056 two independent ways.
	let pc = params_closed(128, 2);
	let pt = params_tensor_sum(128, 2);
	check("T1a closed law == 493056", pc == ANCHOR_PARAMS, &mut pass, &mut fail);
	check("T1b tensor-sum == 493056", pt == ANCHOR_PARAMS, &mut pass, &mut fail);
	check("T1c two derivations agree", pc == pt, &mut pass, &mut fail);
	// FAIL-reachability: the wrong law must NOT reproduce the anchor.
	check("T1d wrong law is rejected (FAIL-reachable)", params_wrong(128, 2) != ANCHOR_PARAMS, &mut pass, &mut fail);

	// T2: a lying floor (floor params < our params) MUST flip the verdict to at/above.
	let our = ANCHOR_PARAMS;
	let honest_floor = 150_000_000u64; // real TinyCodeLM-150M
	let lying_floor = 1_000u64; // absurd: smaller than our model
	check("T2a honest floor -> we are below", below_floor_params(honest_floor, our), &mut pass, &mut fail);
	check("T2b lying floor -> NOT below (verdict flips, FAIL-reachable)", !below_floor_params(lying_floor, our), &mut pass, &mut fail);

	// T3: Wilson 0-success ceiling strictly decreasing in n.
	let w4 = wilson_zero_success_upper(4);
	let w16 = wilson_zero_success_upper(16);
	let w32 = wilson_zero_success_upper(32);
	check("T3a w4 > w16", w4 > w16, &mut pass, &mut fail);
	check("T3b w16 > w32", w16 > w32, &mut pass, &mut fail);
	// Sanity vs pre-registered values (~0.49 / ~0.19 / ~0.11).
	check("T3c w4 ~0.49", (w4 - 0.490).abs() < 0.02, &mut pass, &mut fail);
	check("T3d w16 ~0.19", (w16 - 0.194).abs() < 0.02, &mut pass, &mut fail);
	check("T3e w32 ~0.11", (w32 - 0.107).abs() < 0.02, &mut pass, &mut fail);

	// T4: pass@1 identity c/n.
	check("T4a pass@1(16,4) == 0.25", (pass_at_1(16, 4) - 0.25).abs() < 1e-12, &mut pass, &mut fail);
	check("T4b pass@1(32,0) == 0.0", pass_at_1(32, 0) == 0.0, &mut pass, &mut fail);

	// T5: pass@k boundaries + monotone non-decreasing in c.
	check("T5a pass@k c=0 -> 0", pass_at_k(16, 0, 1) == 0.0, &mut pass, &mut fail);
	check("T5b pass@k c=n -> 1", (pass_at_k(16, 16, 4) - 1.0).abs() < 1e-12, &mut pass, &mut fail);
	let mut monotone = true;
	let mut prev = -1.0f64;
	for c in 0..=16u64 {
	let v = pass_at_k(16, c, 4);
	if v + 1e-12 < prev { monotone = false; }
	prev = v;
	}
	check("T5c pass@k monotone non-decreasing in c", monotone, &mut pass, &mut fail);
	// FAIL-reachability: a decreasing-in-c "rate" would trip this; prove the guard works.
	let broken_monotone = {
	let seq = [0.0f64, 0.5, 0.4]; // deliberately decreasing
	let mut ok = true; let mut p = -1.0;
	for &v in &seq { if v + 1e-12 < p { ok = false; } p = v; }
	ok
	};
	check("T5d broken decreasing seq is caught (FAIL-reachable)", !broken_monotone, &mut pass, &mut fail);

	// T6: no-fabrication gate. With no result.json, the oracle MUST keep capability
	// as the literal sentinel and emit NO float rate. We assert the sentinel string
	// is what the oracle writes (read its emitted report if present, else the constant).
	let sentinel = "TRAIN_BOX_PENDING";
	let report = std::fs::read_to_string("data/floor_oracle_report.json").unwrap_or_default();
	if report.is_empty() {
	// oracle not yet run; assert the sentinel is a non-numeric string (cannot be a rate)
	check("T6a sentinel is non-numeric", sentinel.parse::<f64>().is_err(), &mut pass, &mut fail);
	} else {
	let has_sentinel = report.contains("\"capability_compile_at_1\": \"TRAIN_BOX_PENDING\"")
	&& report.contains("\"capability_pass_at_1\": \"TRAIN_BOX_PENDING\"");
	check("T6a report keeps TRAIN_BOX_PENDING for both capability fields", has_sentinel, &mut pass, &mut fail);
	// no float capability rate may appear like "capability_pass_at_1": 0.xx
	let fabricated = report.contains("\"capability_pass_at_1\": 0.")
	\|\| report.contains("\"capability_compile_at_1\": 0.");
	check("T6b no fabricated capability rate present (FAIL-reachable)", !fabricated, &mut pass, &mut fail);
	}

	// T7: determinism -- closed-form law is pure; same inputs -> same outputs.
	check("T7 determinism (pure law)", params_closed(128, 2) == params_closed(128, 2)
	&& wilson_zero_success_upper(32) == wilson_zero_success_upper(32), &mut pass, &mut fail);

	println!("---");
	println!("PASS={} FAIL={}", pass, fail);
	if fail == 0 { println!("ALL SELF-TESTS PASS"); exit(0); }
	else { println!("SELF-TEST FAILURES PRESENT"); exit(1); }
	}