refactor(ir): extract ErrorFlow (error_flow.zig) for path-sensitive error-flow diagnostics (A5.2 step 2)

Move the diagnostic-only Pass 1e (ERR E1.7 cleanup-absorption + E1.8 value-slot liveness) out of lower.zig into src/ir/error_flow.zig behind an ErrorFlow *Lowering facade (Principle 5, like ErrorAnalysis/CoercionResolver). Behavior preserved exactly — pure relocation. Moved verbatim (self. -> self.l. for Lowering members; sibling calls stay on the facade; provenHas is a file-local free fn): checkErrorFlow, analyzeFnBody, flowWalk, flowStmt, flowIf, flowMatch, flowExpr, applyRefinement, provenAdd/provenClone/provenIntersect, registerFailableDestructure, checkCleanupBody/checkCleanupNode/cleanupReject, plus the FlowCtx/ProvenSet types. - lowerRoot routes the single call site through self.errorFlow().checkErrorFlow(decls); no Lowering wrapper kept (only the pipeline calls it, no unit-test caller). New errorFlow() accessor. - The pass takes AST decls + ProgramIndex + diagnostics only — independent of IR Builder state (PLAN-ARCH A5.2 success criterion). - New pub: exprIsFailable (only widening; inferExprType/errorChannelOf already pub). lower.zig -389 (->17030); error_flow.zig 407. Barrel-wired in ir.zig. - No .test.zig: diagnostic-pass altitude (functions return only bool + emit diagnostics) — guarded by example anchors 1046-1053 (incl. scaffolding 1051/1052/1053). Phase A5 complete. Gate: zig build, zig build test, bash tests/run_examples.sh -> 361/0 (anchors 1046-1053 all ok, no .ir churn).
2026-06-03 06:54:13 +03:00
parent 2d2bfafa29
commit 1f354f6da0
3 changed files with 419 additions and 391 deletions
--- a/src/ir/lower.zig
+++ b/src/ir/lower.zig
@@ -28,6 +28,7 @@ const GenericResolver = @import("generics.zig").GenericResolver;
 const ProtocolResolver = @import("protocols.zig").ProtocolResolver;
 const CoercionResolver = @import("conversions.zig").CoercionResolver;
 const ErrorAnalysis = @import("error_analysis.zig").ErrorAnalysis;
+const ErrorFlow = @import("error_flow.zig").ErrorFlow;
 const semantic_diagnostics = @import("semantic_diagnostics.zig");

 const TypeId = types.TypeId;
@@ -337,7 +338,7 @@ pub const Lowering = struct {
        // the error-set convergence passes (so failable callees resolve) and
        // before body lowering — purely a diagnostic pass; `core.zig` halts on
        // any error before codegen.
-        self.checkErrorFlow(decls);
+        self.errorFlow().checkErrorFlow(decls);
        // Pass 1f: reject identifiers used in a type position that name no
        // declared type / primitive / in-scope generic param (issue 0064).
        // Runs after scanning (so every real type name is registered) and
@@ -434,395 +435,9 @@ pub const Lowering = struct {
        }
    }

-    // ── ERR E1.7 / E1.8 — error-flow analysis ───────────────────────────────
-    //
-    // One structured, path-sensitive walk over each MAIN-file function body
-    // (imported modules are trusted) drives two checks:
-    //
-    //  • E1.8 (value-slot liveness): a `v, err := failable()` destructure binds
-    //    `v` "live only where `err` is proven absent". A read of `v` is legal
-    //    iff `err` is proven null on the current path — established by
-    //    `if !err { … }` (proven inside) or `if err { return/raise }` (proven on
-    //    the fall-through). Error-set `==`/tag-compares do NOT prove absence.
-    //
-    //  • E1.7 (cleanup absorption): a bare failable call in a `defer`/`onfail`
-    //    body (with no `catch` / `or value`) is rejected — its error has nowhere
-    //    to propagate (the block is already exiting). See `checkCleanupBody`.
-
-    /// Per-function registration state for the flow walk. `bindings` maps each
-    /// failable value-slot variable to its partner error variable; `err_vars`
-    /// is the set of those error variables (so conditions over them refine the
-    /// proven-null set). Both are monotonic — entries are added as destructures
-    /// are encountered, never removed (out-of-scope names simply stop being read).
-    const FlowCtx = struct {
-        bindings: std.StringHashMap([]const u8),
-        err_vars: std.StringHashMap(void),
-    };
-
-    /// The proven-null set: error-variable names known to be absent on the
-    /// current path. Threaded by value-clone across branches; the join after an
-    /// `if` is the intersection of the reachable branches' sets.
-    const ProvenSet = std.ArrayList([]const u8);
-
-    fn provenHas(set: ProvenSet, name: []const u8) bool {
-        for (set.items) |n| if (std.mem.eql(u8, n, name)) return true;
-        return false;
-    }
-
-    fn provenAdd(self: *Lowering, set: *ProvenSet, name: []const u8) void {
-        if (!provenHas(set.*, name)) set.append(self.alloc, name) catch {};
-    }
-
-    fn provenClone(self: *Lowering, set: ProvenSet) ProvenSet {
-        var out = ProvenSet.empty;
-        out.appendSlice(self.alloc, set.items) catch {};
-        return out;
-    }
-
-    fn provenIntersect(self: *Lowering, a: ProvenSet, b: ProvenSet) ProvenSet {
-        var out = ProvenSet.empty;
-        for (a.items) |n| if (provenHas(b, n)) (out.append(self.alloc, n) catch {});
-        return out;
-    }
-
-    /// Pass 1e: run the error-flow checks over every function defined in the
-    /// main file. Library modules are assumed well-formed (and may use patterns
-    /// this conservative check would over-reject), so they are skipped.
-    fn checkErrorFlow(self: *Lowering, decls: []const *const Node) void {
-        if (self.diagnostics == null) return;
-        for (decls) |decl| {
-            if (self.main_file) |mf| {
-                if (decl.source_file) |sf| {
-                    if (!std.mem.eql(u8, sf, mf)) continue;
-                }
-            }
-            switch (decl.data) {
-                .fn_decl => |fd| self.analyzeFnBody(fd.body),
-                .const_decl => |cd| {
-                    if (cd.value.data == .fn_decl) self.analyzeFnBody(cd.value.data.fn_decl.body);
-                },
-                else => {},
-            }
-        }
-    }
-
-    /// Analyze one function (or lambda) body as its own boundary — a fresh
-    /// binding context and an empty proven set.
-    fn analyzeFnBody(self: *Lowering, body: *const Node) void {
-        var ctx = FlowCtx{
-            .bindings = std.StringHashMap([]const u8).init(self.alloc),
-            .err_vars = std.StringHashMap(void).init(self.alloc),
-        };
-        var proven = ProvenSet.empty;
-        _ = self.flowWalk(body, &ctx, &proven);
-    }
-
-    /// Walk a block or single statement. Returns whether control always
-    /// diverges (every path ends in return/raise/break/continue) — used by the
-    /// caller to mark code after a branch unreachable.
-    fn flowWalk(self: *Lowering, node: *const Node, ctx: *FlowCtx, proven: *ProvenSet) bool {
-        switch (node.data) {
-            .block => |b| {
-                for (b.stmts) |s| if (self.flowStmt(s, ctx, proven)) return true;
-                return false;
-            },
-            else => return self.flowStmt(node, ctx, proven),
-        }
-    }
-
-    fn flowStmt(self: *Lowering, node: *const Node, ctx: *FlowCtx, proven: *ProvenSet) bool {
-        switch (node.data) {
-            .destructure_decl => |dd| {
-                self.flowExpr(dd.value, ctx, proven.*);
-                self.registerFailableDestructure(&dd, ctx);
-                return false;
-            },
-            .var_decl => |vd| {
-                if (vd.value) |v| self.flowExpr(v, ctx, proven.*);
-                return false;
-            },
-            .const_decl => |cd| {
-                self.flowExpr(cd.value, ctx, proven.*);
-                return false;
-            },
-            .assignment => |a| {
-                self.flowExpr(a.value, ctx, proven.*);
-                self.flowExpr(a.target, ctx, proven.*);
-                return false;
-            },
-            .multi_assign => |ma| {
-                for (ma.values) |v| self.flowExpr(v, ctx, proven.*);
-                return false;
-            },
-            .return_stmt => |r| {
-                if (r.value) |v| self.flowExpr(v, ctx, proven.*);
-                return true;
-            },
-            .raise_stmt => |rs| {
-                self.flowExpr(rs.tag, ctx, proven.*);
-                return true;
-            },
-            .break_expr, .continue_expr => return true,
-            .if_expr => |ie| return self.flowIf(&ie, ctx, proven),
-            .while_expr => |we| {
-                self.flowExpr(we.condition, ctx, proven.*);
-                var loop_proven = self.provenClone(proven.*);
-                _ = self.flowWalk(we.body, ctx, &loop_proven);
-                return false;
-            },
-            .for_expr => |fe| {
-                self.flowExpr(fe.iterable, ctx, proven.*);
-                if (fe.range_end) |re| self.flowExpr(re, ctx, proven.*);
-                var loop_proven = self.provenClone(proven.*);
-                _ = self.flowWalk(fe.body, ctx, &loop_proven);
-                return false;
-            },
-            .match_expr => |me| return self.flowMatch(&me, ctx, proven),
-            .push_stmt => |ps| {
-                self.flowExpr(ps.context_expr, ctx, proven.*);
-                var inner = self.provenClone(proven.*);
-                _ = self.flowWalk(ps.body, ctx, &inner);
-                return false;
-            },
-            .defer_stmt => |ds| {
-                self.checkCleanupBody(ds.expr, "defer");
-                self.flowExpr(ds.expr, ctx, proven.*);
-                return false;
-            },
-            .onfail_stmt => |os| {
-                self.checkCleanupBody(os.body, "onfail");
-                self.flowExpr(os.body, ctx, proven.*);
-                return false;
-            },
-            else => {
-                self.flowExpr(node, ctx, proven.*);
-                return false;
-            },
-        }
-    }
-
-    /// Path-sensitive `if`: refine the proven set on each branch, recurse, and
-    /// join the reachable fall-through states by intersection.
-    fn flowIf(self: *Lowering, ie: *const ast.IfExpr, ctx: *FlowCtx, proven: *ProvenSet) bool {
-        self.flowExpr(ie.condition, ctx, proven.*);
-        var then_proven = self.provenClone(proven.*);
-        var else_proven = self.provenClone(proven.*);
-        self.applyRefinement(ie.condition, true, ctx, &then_proven);
-        self.applyRefinement(ie.condition, false, ctx, &else_proven);
-
-        const then_div = self.flowWalk(ie.then_branch, ctx, &then_proven);
-        var else_div = false;
-        if (ie.else_branch) |eb| else_div = self.flowWalk(eb, ctx, &else_proven);
-
-        // Reachable fall-through contributors: a branch that doesn't diverge,
-        // plus the implicit (empty) else when there is no `else`.
-        var contributors = std.ArrayList(ProvenSet).empty;
-        if (!then_div) contributors.append(self.alloc, then_proven) catch {};
-        if (ie.else_branch != null) {
-            if (!else_div) contributors.append(self.alloc, else_proven) catch {};
-        } else {
-            contributors.append(self.alloc, else_proven) catch {};
-        }
-        if (contributors.items.len == 0) return true; // both branches diverge
-
-        var result = self.provenClone(contributors.items[0]);
-        for (contributors.items[1..]) |c| result = self.provenIntersect(result, c);
-        proven.* = result;
-        return false;
-    }
-
-    /// Refine the proven-null set for a branch taken when `cond` is `want_true`.
-    /// A bare error-variable is truthy when it HOLDS an error, so its falsy edge
-    /// proves absence; `!`, `&&`, `||` compose. Tag/equality compares prove
-    /// nothing (error-set `==` compares tags, not presence).
-    fn applyRefinement(self: *Lowering, cond: *const Node, want_true: bool, ctx: *FlowCtx, set: *ProvenSet) void {
-        switch (cond.data) {
-            .identifier => |id| {
-                if (ctx.err_vars.contains(id.name) and !want_true) self.provenAdd(set, id.name);
-            },
-            .unary_op => |uop| {
-                if (uop.op == .not) self.applyRefinement(uop.operand, !want_true, ctx, set);
-            },
-            .binary_op => |bop| {
-                if (bop.op == .and_op and want_true) {
-                    self.applyRefinement(bop.lhs, true, ctx, set);
-                    self.applyRefinement(bop.rhs, true, ctx, set);
-                } else if (bop.op == .or_op and !want_true) {
-                    self.applyRefinement(bop.lhs, false, ctx, set);
-                    self.applyRefinement(bop.rhs, false, ctx, set);
-                }
-            },
-            else => {},
-        }
-    }
-
-    fn flowMatch(self: *Lowering, me: *const ast.MatchExpr, ctx: *FlowCtx, proven: *ProvenSet) bool {
-        self.flowExpr(me.subject, ctx, proven.*);
-        for (me.arms) |arm| {
-            var arm_proven = self.provenClone(proven.*);
-            _ = self.flowWalk(arm.body, ctx, &arm_proven);
-        }
-        return false;
-    }
-
-    /// Check an expression for reads of a still-tainted value-slot variable and
-    /// recurse into nested lambdas as their own boundaries. `proven` is by value
-    /// — sub-expressions never publish proven-null facts back to the statement.
-    fn flowExpr(self: *Lowering, node: *const Node, ctx: *FlowCtx, proven: ProvenSet) void {
-        switch (node.data) {
-            .identifier => |id| {
-                if (ctx.bindings.get(id.name)) |err_var| {
-                    if (!provenHas(proven, err_var)) {
-                        if (self.diagnostics) |d| d.addFmt(.err, node.span, "value `{s}` from a failable can be used only where its error `{s}` is proven absent — guard the use with `if !{s} {{ … }}`, or return early with `if {s} {{ return; }}` before reading `{s}`", .{ id.name, err_var, err_var, err_var, id.name });
-                    }
-                }
-            },
-            .lambda => |lam| self.analyzeFnBody(lam.body),
-            .binary_op => |b| {
-                self.flowExpr(b.lhs, ctx, proven);
-                // Short-circuit: the rhs of `&&` runs only when the lhs is true
-                // (and `||`'s rhs only when the lhs is false), so refine the
-                // proven-null set accordingly before checking it. This is what
-                // makes `if !err && use(v)` legal.
-                if (b.op == .and_op or b.op == .or_op) {
-                    var rp = self.provenClone(proven);
-                    self.applyRefinement(b.lhs, b.op == .and_op, ctx, &rp);
-                    self.flowExpr(b.rhs, ctx, rp);
-                } else {
-                    self.flowExpr(b.rhs, ctx, proven);
-                }
-            },
-            .chained_comparison => |cc| {
-                for (cc.operands) |op| self.flowExpr(op, ctx, proven);
-            },
-            .unary_op => |u| self.flowExpr(u.operand, ctx, proven),
-            .call => |c| {
-                self.flowExpr(c.callee, ctx, proven);
-                for (c.args) |a| self.flowExpr(a, ctx, proven);
-            },
-            .field_access => |fa| self.flowExpr(fa.object, ctx, proven),
-            .index_expr => |ix| {
-                self.flowExpr(ix.object, ctx, proven);
-                self.flowExpr(ix.index, ctx, proven);
-            },
-            .slice_expr => |se| {
-                self.flowExpr(se.object, ctx, proven);
-                if (se.start) |s| self.flowExpr(s, ctx, proven);
-                if (se.end) |e| self.flowExpr(e, ctx, proven);
-            },
-            .try_expr => |te| self.flowExpr(te.operand, ctx, proven),
-            .catch_expr => |ce| {
-                self.flowExpr(ce.operand, ctx, proven);
-                self.flowExpr(ce.body, ctx, proven);
-            },
-            .force_unwrap => |fu| self.flowExpr(fu.operand, ctx, proven),
-            .null_coalesce => |nc| {
-                self.flowExpr(nc.lhs, ctx, proven);
-                self.flowExpr(nc.rhs, ctx, proven);
-            },
-            .deref_expr => |de| self.flowExpr(de.operand, ctx, proven),
-            .comptime_expr => |ce| self.flowExpr(ce.expr, ctx, proven),
-            .insert_expr => |ie| self.flowExpr(ie.expr, ctx, proven),
-            .spread_expr => |se| self.flowExpr(se.operand, ctx, proven),
-            .struct_literal => |sl| {
-                for (sl.field_inits) |fi| self.flowExpr(fi.value, ctx, proven);
-            },
-            .array_literal => |al| {
-                for (al.elements) |el| self.flowExpr(el, ctx, proven);
-            },
-            .tuple_literal => |tl| {
-                for (tl.elements) |el| self.flowExpr(el.value, ctx, proven);
-            },
-            .if_expr => |ie| {
-                var tmp = self.provenClone(proven);
-                _ = self.flowIf(&ie, ctx, &tmp);
-            },
-            .match_expr => |me| {
-                var tmp = self.provenClone(proven);
-                _ = self.flowMatch(&me, ctx, &tmp);
-            },
-            .block => |b| {
-                var tmp = self.provenClone(proven);
-                for (b.stmts) |s| if (self.flowStmt(s, ctx, &tmp)) break;
-            },
-            else => {},
-        }
-    }
-
-    /// Register a `v…, err := failable()` destructure. Only a complete bare
-    /// destructure (every slot bound, error slot a real name) creates taint —
-    /// an omitted or `_`-bound error slot is already rejected by the discard
-    /// check in `lowerDestructureDecl`, so it produces no proof obligation here.
-    fn registerFailableDestructure(self: *Lowering, dd: *const ast.DestructureDecl, ctx: *FlowCtx) void {
-        const ty = self.inferExprType(dd.value);
-        if (self.errorChannelOf(ty) == null) return;
-        if (ty.isBuiltin()) return;
-        const ti = self.module.types.get(ty);
-        if (ti != .tuple) return;
-        const fields = ti.tuple.fields;
-        if (dd.names.len != fields.len) return;
-        const err_name = dd.names[fields.len - 1];
-        if (std.mem.eql(u8, err_name, "_")) return;
-        ctx.err_vars.put(err_name, {}) catch {};
-        var i: usize = 0;
-        while (i + 1 < dd.names.len) : (i += 1) {
-            const vn = dd.names[i];
-            if (std.mem.eql(u8, vn, "_")) continue;
-            ctx.bindings.put(vn, err_name) catch {};
-        }
-    }
-
-    /// E1.7: a `defer`/`onfail` body runs while the block is already exiting, so
-    /// a bare failable call has nowhere to send its error. Reject any failable
-    /// expression-statement that isn't absorbed locally by `catch` / `or value`
-    /// / a destructure binding. (Parser already bans `try`/`raise`/`return`/
-    /// `break`/`continue` here, so the only escape route left for a failable is
-    /// local absorption.) The check is transitive through nested blocks, `if`,
-    /// loops, match arms, and `catch` handlers, but stops at a nested closure
-    /// (its own function boundary).
-    fn checkCleanupBody(self: *Lowering, body: *const Node, kind: []const u8) void {
-        self.checkCleanupNode(body, kind);
-    }
-
-    fn checkCleanupNode(self: *Lowering, node: *const Node, kind: []const u8) void {
-        switch (node.data) {
-            .block => |b| for (b.stmts) |s| self.checkCleanupNode(s, kind),
-            .if_expr => |ie| {
-                self.cleanupReject(ie.condition, kind);
-                self.checkCleanupNode(ie.then_branch, kind);
-                if (ie.else_branch) |eb| self.checkCleanupNode(eb, kind);
-            },
-            .while_expr => |we| {
-                self.cleanupReject(we.condition, kind);
-                self.checkCleanupNode(we.body, kind);
-            },
-            .for_expr => |fe| self.checkCleanupNode(fe.body, kind),
-            .match_expr => |me| for (me.arms) |arm| self.checkCleanupNode(arm.body, kind),
-            .push_stmt => |ps| self.checkCleanupNode(ps.body, kind),
-            // A destructure binds the error slot → absorbed (explicit ownership).
-            .destructure_decl => {},
-            .var_decl => |vd| if (vd.value) |v| self.cleanupReject(v, kind),
-            .const_decl => |cd| self.cleanupReject(cd.value, kind),
-            .assignment => |a| self.cleanupReject(a.value, kind),
-            // Closures are their own boundary; the parser-banned control-flow
-            // exits are handled elsewhere; nested cleanup is independent.
-            .lambda, .return_stmt, .raise_stmt, .break_expr, .continue_expr, .defer_stmt, .onfail_stmt => {},
-            else => self.cleanupReject(node, kind),
-        }
-    }
-
-    /// Reject `expr` if it is a bare (un-absorbed) failable in cleanup position.
-    /// `catch` / `or value` strip the error channel (so `exprIsFailable` is
-    /// false for them); only a still-failable expression has an unhandled error.
-    fn cleanupReject(self: *Lowering, expr: *const Node, kind: []const u8) void {
-        if (expr.data == .catch_expr) {
-            // The operand is absorbed; the handler body still runs in cleanup.
-            self.checkCleanupNode(expr.data.catch_expr.body, kind);
-            return;
-        }
-        if (!self.exprIsFailable(expr)) return;
-        if (self.diagnostics) |d| d.addFmt(.err, expr.span, "a bare failable call in a `{s}` body has nowhere to send its error — the block is already exiting; absorb it locally with `catch` or `or <value>`", .{kind});
-    }
+    // ERR E1.7 / E1.8 — path-sensitive error-flow diagnostics (Pass 1e) live in
+    // `error_flow.zig` (`ErrorFlow`, a `*Lowering` facade). `lowerRoot` calls
+    // `self.errorFlow().checkErrorFlow(decls)`.

    /// On Android, the OS loads the .so via a Java-side Activity declared
    /// with `#jni_main #jni_class("...")`. The Java class drives the
@@ -13863,6 +13478,10 @@ pub const Lowering = struct {
        return .{ .l = self };
    }

+    pub fn errorFlow(self: *Lowering) ErrorFlow {
+        return .{ .l = self };
+    }
+
    /// Lower the `xx` operator (type coercion).
    /// Uses self.target_type for context when available. Handles:
    /// - Any → concrete type: unbox_any
@@ -14969,7 +14588,7 @@ pub const Lowering = struct {
    /// operand's success value, but the expression itself routes an error) or
    /// any expression whose type carries an error channel (a bare failable
    /// call). Used to detect failable `or` chains (deferred to E1.4b).
-    fn exprIsFailable(self: *Lowering, node: *const Node) bool {
+    pub fn exprIsFailable(self: *Lowering, node: *const Node) bool {
        if (node.data == .try_expr) return true;
        return self.errorChannelOf(self.inferExprType(node)) != null;
    }