add sx migrate tuple-syntax migration tool

Temporary scaffolding for the tuple-syntax cutover. Parses old-grammar .sx and
rewrites tuple syntax to the new spelling:

- tuple TYPES `(A, B)` -> `Tuple(A, B)` (named keeps `:`)
- tuple VALUES `(a, b)` -> `.(a, b)` (named flips `:` -> `=`)
- 1-tuples / empty / spread -> `.(x)` / `.()` / `.(..xs)`, `Tuple(..Ts)`
- failable returns: the `!` channel stays OUTSIDE Tuple
    `-> (T, !)` -> `-> T !`
    `-> (T1, T2, !)` -> `-> Tuple(T1, T2) !`

AST-walk based: rewrites only `tuple_literal` / `tuple_type_expr` nodes (function types, param lists, match bindings, arrays, struct literals, Closure sigs, groupings are left untouched). Nested tuples rewrite recursively as a single non-overlapping edit per outermost tuple.

Value-vs-type ambiguity (call-arg tuples whose elements could be types, e.g. `size_of((Box, i32))`, empty `()`) is never guessed: such sites go to a worklist. A non-empty worklist exits nonzero and suppresses the "looks-done" stdout output unless `--force` is passed.

`sx migrate <f>` prints migrated source; `--dry-run` prints only the worklist. Built against the old grammar; removed after the cutover.
2026-06-25 15:23:18 +03:00
parent 820cd62fa1
commit c882c6c63e
4 changed files with 918 additions and 0 deletions
--- a/src/main.zig
+++ b/src/main.zig
@@ -23,6 +23,13 @@ pub fn main(init: std.process.Init) !void {
        return;
    }

+    // `migrate` has its own flag (`--dry-run`) the generic flag loop below would
+    // reject, so dispatch it here before that loop runs.
+    if (std.mem.eql(u8, command, "migrate")) {
+        runMigrate(allocator, io, args[2..]);
+        return;
+    }
+
    // Parse flags and positional arguments
    var input_path: ?[]const u8 = null;
    var target_config = sx.target.TargetConfig{};
@@ -407,6 +414,7 @@ fn printUsage() void {
        \\  ir     Print LLVM IR to stdout
        \\  asm    Emit assembly (.s) file
        \\  lsp    Start language server (LSP)
+        \\  migrate  Rewrite old tuple syntax to new (`(a,b)`->`.(a,b)`, type `(A,B)`->`Tuple(A,B)`); `--dry-run` prints only the worklist, `--force` emits output despite unmigrated ambiguous sites
        \\
        \\Options:
        \\  --target <target>   Target triple or shorthand: wasm, macos, linux, windows, ios, ios-sim (default: host)
@@ -517,6 +525,72 @@ fn compilePipeline(allocator: std.mem.Allocator, io: std.Io, input_path: []const
    return comp;
 }

+/// `sx migrate [--dry-run] [--force] <file.sx>` — tuple-syntax migration tool.
+///
+/// Without flags: parse-only, rewrite the old tuple syntax, print the migrated
+/// source to stdout and any ambiguous-site worklist entries to stderr. A
+/// NON-EMPTY worklist is a hard failure (exit 2) — the migration is incomplete,
+/// so we do NOT print the rewritten source (which could be redirected over the
+/// input, silently shipping half-migrated code) unless `--force` is passed.
+///
+/// With `--dry-run`: print ONLY the worklist (to stderr), no rewritten source —
+/// so ambiguous sites can be audited first. A non-empty worklist still exits 2.
+///
+/// With `--force`: print the rewritten source even when the worklist is
+/// non-empty (the ambiguous sites are left in the OLD syntax). Exit is still 2
+/// so a script can detect the partial migration.
+///
+/// Exactly one input file is accepted: a second positional argument is an
+/// error rather than silently replacing the first. Usage errors, read/migrate
+/// failures, and a failed or incomplete write of the migrated source all
+/// exit 1.
+fn runMigrate(allocator: std.mem.Allocator, io: std.Io, sub_args: []const []const u8) void {
+    var dry_run = false;
+    var force = false;
+    var input_path: ?[]const u8 = null;
+    for (sub_args) |a| {
+        if (std.mem.eql(u8, a, "--dry-run")) {
+            dry_run = true;
+        } else if (std.mem.eql(u8, a, "--force")) {
+            force = true;
+        } else if (std.mem.startsWith(u8, a, "-")) {
+            std.debug.print("error: unknown flag '{s}' for migrate\n", .{a});
+            std.process.exit(1);
+        } else if (input_path) |first| {
+            // Only one file is migrated per invocation; refusing here avoids
+            // quietly ignoring every path but the last.
+            std.debug.print(
+                "error: migrate takes exactly one input file (got '{s}' and '{s}')\n",
+                .{ first, a },
+            );
+            std.process.exit(1);
+        } else {
+            input_path = a;
+        }
+    }
+    const path = input_path orelse {
+        std.debug.print("usage: sx migrate [--dry-run] [--force] <file.sx>\n", .{});
+        std.process.exit(1);
+    };
+
+    const source = readSource(allocator, io, path) catch |err| {
+        std.debug.print("error: cannot read '{s}': {}\n", .{ path, err });
+        std.process.exit(1);
+    };
+    const result = sx.migrate.migrateSource(allocator, io, path, source) catch |err| {
+        std.debug.print("error: migrate failed for '{s}': {}\n", .{ path, err });
+        std.process.exit(1);
+    };
+
+    // Worklist (ambiguous sites) always goes to stderr.
+    for (result.worklist) |w| {
+        std.debug.print("{s}:{d}:{d}: {s}: {s}\n", .{ path, w.line, w.col, w.reason, w.text });
+    }
+
+    const has_worklist = result.worklist.len > 0;
+
+    // Emit the rewritten source unless we'd be shipping a half-migrated file: a
+    // non-empty worklist in non-dry-run mode suppresses output unless --force.
+    if (!dry_run and (!has_worklist or force)) {
+        // A single write() may accept fewer bytes than requested (e.g. when
+        // stdout is a pipe), so keep writing until the whole buffer is out.
+        // Any failure is fatal: a truncated file must never look like a
+        // successful migration.
+        var remaining: []const u8 = result.output;
+        while (remaining.len > 0) {
+            const written = std.c.write(1, remaining.ptr, remaining.len);
+            if (written <= 0) {
+                std.debug.print("error: failed to write migrated source to stdout\n", .{});
+                std.process.exit(1);
+            }
+            const advanced: usize = @intCast(written);
+            remaining = remaining[advanced..];
+        }
+    }
+
+    if (has_worklist) {
+        std.debug.print(
+            "{d} ambiguous site(s) unmigrated; resolve by hand or pass --force\n",
+            .{result.worklist.len},
+        );
+        std.process.exit(2);
+    }
+}
+
 fn dumpSxIR(allocator: std.mem.Allocator, io: std.Io, input_path: []const u8, stdlib_paths: []const []const u8) !void {
    const source = try readSource(allocator, io, input_path);
    var comp = sx.core.Compilation.init(allocator, io, input_path, source, .{}, stdlib_paths);
--- a/src/migrate.test.zig
+++ b/src/migrate.test.zig
@@ -0,0 +1,330 @@
+// Tests for migrate.zig — the `sx migrate` tuple-syntax rewriter.
+//
+// Each case parses an in-memory snippet (full decls, so it parses standalone),
+// runs the AST-walk migrator, and asserts the rewritten text and/or worklist.
+// The compiler grammar is UNCHANGED here: the migrator READS the old tuple
+// syntax `(a, b)` / `(A, B)` and EMITS the new `.(a, b)` / `Tuple(A, B)` text.
+
+const std = @import("std");
+const Parser = @import("parser.zig").Parser;
+const migrate = @import("migrate.zig");
+
+/// Migrate `src` (valid old-syntax sx decls) and hand back only the rewritten
+/// text. Fails the test if any site ended up on the worklist; ambiguous cases
+/// should call `runWith` and inspect the worklist themselves.
+fn run(alloc: std.mem.Allocator, src: [:0]const u8) ![]const u8 {
+    const migrated = try runWith(alloc, src);
+    const ambiguous_sites: usize = migrated.worklist.len;
+    try std.testing.expectEqual(@as(usize, 0), ambiguous_sites);
+    return migrated.output;
+}
+
+/// Parse `src` and pass the resulting root to `migrate.migrateRoot`, returning
+/// the full result (rewritten text plus worklist) without asserting on it.
+fn runWith(alloc: std.mem.Allocator, src: [:0]const u8) !migrate.MigrationResult {
+    var old_syntax_parser = Parser.init(alloc, src);
+    const ast_root = try old_syntax_parser.parse();
+    const outcome = migrate.migrateRoot(alloc, src, ast_root);
+    return outcome;
+}
+
+/// Succeed when `needle` occurs somewhere in `haystack`. On a miss, print both
+/// the needle and the full migrated text, then fail with `error.NotFound`.
+fn expectContains(haystack: []const u8, needle: []const u8) !void {
+    // Happy path first: a hit means there is nothing to report.
+    if (std.mem.indexOf(u8, haystack, needle) != null) return;
+
+    std.debug.print("\nexpected to find:\n  {s}\nin migrated output:\n{s}\n", .{ needle, haystack });
+    return error.NotFound;
+}
+
+/// Succeed when `needle` is absent from `haystack`. If it is present, print
+/// both the needle and the full migrated text, then fail with
+/// `error.UnexpectedlyFound`.
+fn expectNotContains(haystack: []const u8, needle: []const u8) !void {
+    // Happy path first: no occurrence means nothing to report.
+    if (std.mem.indexOf(u8, haystack, needle) == null) return;
+
+    std.debug.print("\nexpected NOT to find:\n  {s}\nin migrated output:\n{s}\n", .{ needle, haystack });
+    return error.UnexpectedlyFound;
+}
+
+// ── VALUE tuples → .(...) ────────────────────────────────────────────────
+
+test "migrate value: positional (40,2) -> .(40,2)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { x := (40, 2); }\n");
+    // The dotted spelling is present ...
+    try expectContains(migrated, ".(40, 2)");
+    // ... and the old space-prefixed, un-dotted form is gone.
+    try expectNotContains(migrated, " (40, 2)");
+}
+
+test "migrate value: named (x:1,y:2) -> .(x = 1, y = 2)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Named value tuples flip `:` to ` = `.
+    const migrated = try run(alloc, "f :: () { x := (x: 1, y: 2); }\n");
+    try expectContains(migrated, ".(x = 1, y = 2)");
+}
+
+test "migrate value: 1-tuple (x,) -> .(x)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { y := 9; x := (y,); }\n");
+    // Dotted form without the trailing comma; the old spelling is gone.
+    try expectContains(migrated, ".(y)");
+    try expectNotContains(migrated, "(y,)");
+}
+
+test "migrate value: spread (..xs) -> .(..xs)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // The spread element keeps its `..` prefix inside the dotted tuple.
+    const migrated = try run(alloc, "f :: (xs: i32) { t := (..xs); }\n");
+    try expectContains(migrated, ".(..xs)");
+}
+
+test "migrate value: operator operands (1,2)==(1,2)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { b := (1, 2) == (1, 2); }\n");
+    // Left and right operands are both rewritten.
+    try expectContains(migrated, ".(1, 2) == .(1, 2)");
+}
+
+test "migrate value+type: return body -> Tuple(i64,i64){ .(b,a) }" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const src =
+        \\swap :: (a: i64, b: i64) -> (i64, i64) { (b, a) }
+        \\
+    ;
+    const migrated = try run(alloc, src);
+    // Return TYPE becomes `Tuple(...)`, body VALUE becomes `.(...)`.
+    try expectContains(migrated, "-> Tuple(i64, i64)");
+    try expectContains(migrated, ".(b, a)");
+}
+
+test "migrate value: empty () value -> .()" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // `x := ()` is an empty tuple VALUE (not a call argument).
+    const migrated = try run(alloc, "f :: () { x := (); }\n");
+    try expectContains(migrated, ".()");
+}
+
+// ── TYPE tuples → Tuple(...) ─────────────────────────────────────────────
+
+test "migrate type: annotation a:(i32,string) -> a:Tuple(i32,string)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // A tuple in annotation position is a TYPE.
+    const migrated = try run(alloc, "f :: () { a : (i32, string) = ---; }\n");
+    try expectContains(migrated, "Tuple(i32, string)");
+}
+
+test "migrate type: named (x:i32,y:string) -> Tuple(x: i32, y: string) keeps colon" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Named TYPE tuples keep `:` (unlike named values, which flip to `=`).
+    const migrated = try run(alloc, "f :: () { a : (x: i32, y: string) = ---; }\n");
+    try expectContains(migrated, "Tuple(x: i32, y: string)");
+}
+
+test "migrate type: struct field xs:(i32,i32) -> Tuple(i32,i32)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Struct-field types are a TYPE position too.
+    const migrated = try run(alloc, "S :: struct { xs: (i32, i32); }\n");
+    try expectContains(migrated, "Tuple(i32, i32)");
+}
+
+test "migrate type: pack (..Ts) -> Tuple(..Ts)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // A type pack keeps its `..` prefix inside `Tuple(...)`.
+    const migrated = try run(alloc, "S :: struct { xs: (..Ts); }\n");
+    try expectContains(migrated, "Tuple(..Ts)");
+}
+
+test "migrate type: 1-tuple (T,) -> Tuple(T) drops comma" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "S :: struct { xs: (i32,); }\n");
+    // New spelling present, trailing-comma spelling gone.
+    try expectContains(migrated, "Tuple(i32)");
+    try expectNotContains(migrated, "(i32,)");
+}
+
+// ── Worklist: ambiguous value-vs-type call arg ──────────────────────────
+
+test "migrate worklist: size_of((Box,i32)) is NOT rewritten, records worklist" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const src =
+        \\f :: () { n := size_of((Box, i32)); }
+        \\
+    ;
+    const outcome = try runWith(alloc, src);
+
+    // The ambiguous inner tuple stays in the old spelling: no `.(` rewrite.
+    try expectNotContains(outcome.output, ".(Box, i32)");
+    try expectContains(outcome.output, "(Box, i32)");
+
+    // Exactly one worklist entry, and it quotes the offending tuple.
+    try std.testing.expectEqual(@as(usize, 1), outcome.worklist.len);
+    const entry = outcome.worklist[0];
+    try expectContains(entry.text, "(Box, i32)");
+}
+
+test "migrate value: call arg with literal-only tuple IS rewritten" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // In `take((1, 2))` every element is a concrete value, so the call-arg
+    // tuple is safe to rewrite and nothing lands on the worklist.
+    const outcome = try runWith(alloc, "f :: () { take((1, 2)); }\n");
+    try expectContains(outcome.output, ".(1, 2)");
+    try std.testing.expectEqual(@as(usize, 0), outcome.worklist.len);
+}
+
+// ── Nested tuples (recursive rewrite, ONE edit per outermost tuple) ──────
+
+test "migrate nested value: ((1,2),(3,4)) -> .(.(1, 2), .(3, 4))" {
+    var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena.deinit();
+    const out = try run(arena.allocator(), "f :: () { x := ((1, 2), (3, 4)); }\n");
+    try expectContains(out, ".(.(1, 2), .(3, 4))");
+    // Neither inner tuple may survive in the old, un-dotted spelling ...
+    try expectNotContains(out, "((1, 2)");
+    try expectNotContains(out, ", (3, 4)");
+    // ... and the single outer edit must not leave a trailing junk paren.
+    try expectNotContains(out, "(3, 4)))");
+}
+
+test "migrate nested value: ((1,2),3) -> .(.(1, 2), 3)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { x := ((1, 2), 3); }\n");
+    try expectContains(migrated, ".(.(1, 2), 3)");
+    // Guards against the previously broken output with an extra closing paren.
+    try expectNotContains(migrated, "(1, 2), 3))");
+}
+
+test "migrate nested named value: (a:(p:1,q:2),b:3) -> .(a = .(p = 1, q = 2), b = 3)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Names flip to ` = ` at every nesting level.
+    const migrated = try run(alloc, "f :: () { n := (a: (p: 1, q: 2), b: 3); }\n");
+    try expectContains(migrated, ".(a = .(p = 1, q = 2), b = 3)");
+}
+
+test "migrate nested type: ((i32,i32),i64) -> Tuple(Tuple(i32, i32), i64)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Nested TYPE tuples are wrapped recursively.
+    const migrated = try run(alloc, "f :: () { a : ((i32, i32), i64) = ---; }\n");
+    try expectContains(migrated, "Tuple(Tuple(i32, i32), i64)");
+}
+
+// ── Failable multi-returns: `!` channel stays OUTSIDE Tuple(...) ─────────
+
+test "migrate failable: -> (T, !) -> -> T !" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () -> (i32, !) { }\n");
+    // Single value + error channel: parens dropped, no tuple spelling at all.
+    try expectContains(migrated, "-> i32 !");
+    try expectNotContains(migrated, "Tuple(");
+    try expectNotContains(migrated, ".(");
+}
+
+test "migrate failable: -> (T, !Named) keeps the named set" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const src =
+        \\E :: error { Bad }
+        \\f :: () -> (i32, !E) { }
+        \\
+    ;
+    const migrated = try run(alloc, src);
+    // The named error set travels with the `!` marker, outside any Tuple.
+    try expectContains(migrated, "-> i32 !E");
+    try expectNotContains(migrated, "Tuple(");
+}
+
+test "migrate failable: -> (T1, T2, !) -> -> Tuple(T1, T2) !" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Several values + error channel: values wrapped, `!` stays outside.
+    const migrated = try run(alloc, "f :: () -> (i32, i64, !) { }\n");
+    try expectContains(migrated, "-> Tuple(i32, i64) !");
+}
+
+test "migrate failable: bare -> ! unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () -> ! { }\n");
+    // Nothing to wrap: the bare error return is left alone.
+    try expectContains(migrated, "-> !");
+    try expectNotContains(migrated, "Tuple");
+}
+
+// ── Inverted call-arg classification (conservative) ─────────────────────
+
+test "migrate worklist: empty () call arg is worklisted (unit type ambiguity)" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const outcome = try runWith(alloc, "f :: () { n := size_of(()); }\n");
+    // The empty call-arg tuple is NOT silently turned into `.()` ...
+    try expectNotContains(outcome.output, "size_of(.())");
+    try expectContains(outcome.output, "size_of(())");
+    // ... it is reported instead.
+    try std.testing.expectEqual(@as(usize, 1), outcome.worklist.len);
+}
+
+test "migrate worklist: Vec(3) call-arg element is worklisted" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const outcome = try runWith(alloc, "f :: () { n := size_of((Vec(3), i32)); }\n");
+    // A call-shaped element could be a parameterized type: leave and report.
+    try expectNotContains(outcome.output, ".(Vec(3), i32)");
+    try expectContains(outcome.output, "(Vec(3), i32)");
+    try std.testing.expectEqual(@as(usize, 1), outcome.worklist.len);
+}
+
+test "migrate worklist: pkg.T qualified path call-arg element is worklisted" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const outcome = try runWith(alloc, "f :: () { n := size_of((pkg.T, i32)); }\n");
+    // A qualified path could name a type: leave and report.
+    try expectNotContains(outcome.output, ".(pkg.T, i32)");
+    try expectContains(outcome.output, "(pkg.T, i32)");
+    try std.testing.expectEqual(@as(usize, 1), outcome.worklist.len);
+}
+
+// ── Negatives: distinct AST nodes must NOT be touched ────────────────────
+
+test "migrate negative: function type (i32,i32)->i32 unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { g : (i32, i32) -> i32 = ---; }\n");
+    // A function type's parameter list is not a tuple type.
+    try expectContains(migrated, "(i32, i32) -> i32");
+    try expectNotContains(migrated, "Tuple(i32, i32)");
+}
+
+test "migrate negative: function param list (self:*T,x:i32) unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "S :: struct {}\nm :: (self: *S, x: i32) { }\n");
+    // The declaration's parameter list survives verbatim, in neither new form.
+    try expectContains(migrated, "(self: *S, x: i32)");
+    try expectNotContains(migrated, "Tuple(");
+    try expectNotContains(migrated, ".(self");
+}
+
+test "migrate negative: array literal .[1,2,3] unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Array literals are a different node kind and must pass through as-is.
+    const migrated = try run(alloc, "f :: () { a := .[1, 2, 3]; }\n");
+    try expectContains(migrated, ".[1, 2, 3]");
+}
+
+test "migrate negative: struct literal .{x=1} unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    // Struct literals are a different node kind and must pass through as-is.
+    const migrated = try run(alloc, "f :: () { a := .{ x = 1 }; }\n");
+    try expectContains(migrated, ".{ x = 1 }");
+}
+
+test "migrate negative: Closure(i32)->i32 type unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: () { c : Closure(i32) -> i32 = ---; }\n");
+    // A Closure signature's parens are not a tuple type.
+    try expectContains(migrated, "Closure(i32) -> i32");
+    try expectNotContains(migrated, "Tuple(");
+}
+
+test "migrate negative: grouping (a+b)*c unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const migrated = try run(alloc, "f :: (a: i32, b: i32, c: i32) { x := (a + b) * c; }\n");
+    // Plain grouping parentheses are not a 1-tuple.
+    try expectContains(migrated, "(a + b) * c");
+    try expectNotContains(migrated, ".(a + b)");
+}
+
+test "migrate negative: match capture case .some: (val) unchanged" {
+    var arena_state = std.heap.ArenaAllocator.init(std.testing.allocator);
+    defer arena_state.deinit();
+    const alloc = arena_state.allocator();
+
+    const src =
+        \\check :: (v: ?i32) -> i32 {
+        \\  return if v == {
+        \\    case .some: (val) { val }
+        \\    case .none: { 0 }
+        \\  };
+        \\}
+        \\
+    ;
+    const migrated = try run(alloc, src);
+    // A match-arm capture binding is not a tuple value.
+    try expectContains(migrated, "case .some: (val)");
+    try expectNotContains(migrated, ".(val)");
+}
--- a/src/migrate.zig
+++ b/src/migrate.zig
@@ -0,0 +1,512 @@
+//! Tuple-syntax migration tool (`sx migrate`).
+//!
+//! Reads OLD-syntax `.sx` source (tuple TYPES `(A, B)`, tuple VALUES `(a, b)`)
+//! and emits NEW-syntax text (`Tuple(A, B)` / `.(a, b)`). The compiler grammar
+//! is UNCHANGED — this tool only reads the old syntax and rewrites it as text.
+//!
+//! Strategy: parse-only (read -> Compilation -> parse), then walk the parsed
+//! AST with a comptime-reflection child walker that recurses into every
+//! `*Node`-bearing field of every node variant. Two node kinds drive a rewrite:
+//!
+//!   * `tuple_type_expr` — produced by the parser in grammatically-forced TYPE
+//!     positions (`-> (...)`, `: (...)` annotations, struct-field/param types).
+//!     Rewritten to `Tuple(...)`. SPECIAL CASE: a failable multi-return whose
+//!     last element is the error-channel marker `!` keeps the channel OUTSIDE
+//!     the `Tuple(...)` (see `rewriteTupleType`).
+//!
+//!   * `tuple_literal` — produced in VALUE positions. Rewritten to `.(...)`.
+//!     In CALL-ARG position the value/type distinction is ambiguous, so we only
+//!     auto-rewrite when EVERY element is a concrete value literal; anything
+//!     else (bare identifier, `Vec(3)`, `pkg.T`, empty `()`, ...) is recorded on
+//!     the worklist and left untouched — never guess (CLAUDE.md silent-fallback
+//!     rule).
+//!
+//! Nesting: the rewrite is RECURSIVE but emits exactly ONE edit per OUTERMOST
+//! tuple. The replacement text for a tuple is built by recursively migrating its
+//! nested tuple elements (and any non-tuple subexpressions, e.g. calls) directly
+//! into that text. We never emit a separate, overlapping child edit for anything
+//! inside a tuple's span — `applyEdits` asserts non-overlap as a tripwire.
+//!
+//! Edits are collected against the ORIGINAL source byte offsets and applied
+//! DESCENDING by start offset so earlier offsets stay valid; comments and
+//! formatting outside the edited spans are preserved verbatim.
+
+const std = @import("std");
+const ast = @import("ast.zig");
+const core = @import("core.zig");
+
+const Node = ast.Node;
+
+/// A single text replacement against the original source: `source[start..end]`
+/// becomes `replacement`.
+pub const Edit = struct {
+    /// Byte offset into the ORIGINAL source where the replaced span begins.
+    start: u32,
+    /// Byte offset into the ORIGINAL source just past the replaced span
+    /// (exclusive, matching the `source[start..end]` slice above).
+    end: u32,
+    /// Text substituted for the span.
+    replacement: []const u8,
+};
+
+/// An ambiguous site we refused to rewrite. `line`/`col` are 1-based.
+pub const Worklist = struct {
+    /// 1-based line of the site.
+    line: u32,
+    /// 1-based column of the site.
+    col: u32,
+    /// Text reported for the site. The tests expect it to contain the
+    /// unmigrated tuple as written in the source (e.g. `(Box, i32)`).
+    text: []const u8,
+    /// Label the CLI prints before `text`; presumably a short explanation of
+    /// why the site was left alone — confirm in `recordWorklist`.
+    reason: []const u8,
+};
+
+/// Outcome of one migration run: the rewritten text plus every ambiguous site
+/// that was deliberately left in the old syntax.
+pub const MigrationResult = struct {
+    /// The rewritten source (a fresh allocation owning its bytes).
+    output: []const u8,
+    /// Ambiguous sites left untouched, in source order.
+    worklist: []const Worklist,
+};
+
+/// Walk state: collects edits + worklist entries while recursing the AST.
+const Walker = struct {
+    allocator: std.mem.Allocator,
+    source: []const u8,
+    edits: std.ArrayList(Edit) = .empty,
+    worklist: std.ArrayList(Worklist) = .empty,
+
+    /// Recurse into `node`, collecting edits and worklist entries.
+    ///
+    /// `is_call_arg` is true when a `tuple_literal` at this node would be
+    /// value-vs-type ambiguous: the node is a DIRECT argument of a `call` /
+    /// `ffi_intrinsic_call`, or a DIRECT element of a tuple that was itself
+    /// worklisted as ambiguous (if the outer tuple turns out to be a type, its
+    /// nested tuples are types too). It has no effect on any other node kind.
+    ///
+    /// On hitting an OUTERMOST tuple we compute its full replacement (recursively
+    /// baking any nested tuples / subexprs into the text) and emit a SINGLE edit;
+    /// we do NOT continue the edit-emitting walk into the tuple's span (that would
+    /// produce overlapping edits). Worklist collection for ambiguous nested
+    /// call-args still happens, inside the recursive text builder.
+    fn walk(self: *Walker, node: *const Node, is_call_arg: bool) anyerror!void {
+        switch (node.data) {
+            .tuple_type_expr => |tt| {
+                const replacement = try self.buildTupleTypeText(node, tt);
+                if (replacement) |rep| {
+                    try self.edits.append(self.allocator, .{
+                        .start = node.span.start,
+                        .end = node.span.end,
+                        .replacement = rep,
+                    });
+                }
+                // Do NOT recurse into the tuple's element subtrees here — they
+                // are already baked into `replacement`. (A `null` replacement
+                // means "leave unchanged"; that only happens for `-> !`, which
+                // has no value elements to rewrite anyway.)
+                return;
+            },
+            .tuple_literal => |tl| {
+                if (is_call_arg and !tupleIsAllConcreteValues(tl)) {
+                    // Ambiguous in call-arg position (could be a type argument,
+                    // a parameterized type, a qualified path, the unit type
+                    // `()`, ...). Refuse to guess — record + leave untouched.
+                    try self.recordWorklist(node);
+                    // Keep walking into the elements so tuples nested deeper
+                    // (e.g. inside a call element) are still migrated. A tuple
+                    // that is a DIRECT element inherits the ambiguity: were
+                    // the outer tuple a type, `((i32, i32), i64)`'s inner
+                    // tuple would be a type as well, so rewriting it to
+                    // `.(i32, i32)` would be a guess. Passing `true` makes
+                    // such an element go through the same concrete-values
+                    // check instead of being rewritten unconditionally.
+                    for (tl.elements) |el| try self.walk(el.value, true);
+                } else {
+                    const rep = try self.buildTupleValueText(node, tl);
+                    try self.edits.append(self.allocator, .{
+                        .start = node.span.start,
+                        .end = node.span.end,
+                        .replacement = rep,
+                    });
+                }
+                return;
+            },
+            // A `call`'s direct args get the call-arg flag; the callee does not.
+            .call => |c| {
+                try self.walk(c.callee, false);
+                for (c.args) |a| try self.walk(a, true);
+                return;
+            },
+            .ffi_intrinsic_call => |c| {
+                try self.walk(c.return_type, false);
+                for (c.args) |a| try self.walk(a, true);
+                return;
+            },
+            else => {},
+        }
+        // Generic recursion for every other node: visit each child *Node found
+        // by reflection over the active union payload. Call-arg context does NOT
+        // propagate past a non-call node.
+        try self.walkChildren(node);
+    }
+
+    /// Visit every child of `node`: dispatch on the active variant of
+    /// `node.data` and let `walkValue` find the `*Node`s reachable through that
+    /// payload's fields (directly, through optionals, slices, and nested
+    /// aggregate structs/unions).
+    fn walkChildren(self: *Walker, node: *const Node) anyerror!void {
+        switch (node.data) {
+            // `inline else` gives each variant's payload its concrete type.
+            inline else => |active| {
+                const Payload = @TypeOf(active);
+                try self.walkValue(Payload, active);
+            },
+        }
+    }
+
+    /// Walk every `*Node` reachable from `value`, whose static type is `T`.
+    ///
+    /// Node pointers are walked directly (never as call-args); slices,
+    /// optionals, structs and unions are descended into only when their type
+    /// can contain a node at all, which is decided at comptime.
+    fn walkValue(self: *Walker, comptime T: type, value: T) anyerror!void {
+        // Base case: an actual AST node pointer.
+        if (T == *Node or T == *const Node) return self.walk(value, false);
+
+        switch (@typeInfo(T)) {
+            .pointer => |info| {
+                // Only slices are followed; any other non-Node pointer carries
+                // no AST children we rewrite.
+                if (comptime (info.size == .slice and containsNode(info.child))) {
+                    for (value) |item| try self.walkValue(info.child, item);
+                }
+            },
+            .optional => |info| {
+                if (comptime containsNode(info.child)) {
+                    if (value) |present| try self.walkValue(info.child, present);
+                }
+            },
+            .@"struct" => |info| {
+                inline for (info.fields) |field| {
+                    if (comptime containsNode(field.type)) {
+                        try self.walkValue(field.type, @field(value, field.name));
+                    }
+                }
+            },
+            .@"union" => |info| {
+                if (comptime unionContainsNode(info)) {
+                    switch (value) {
+                        inline else => |active| try self.walkValue(@TypeOf(active), active),
+                    }
+                }
+            },
+            else => {},
+        }
+    }
+
+    /// Produce the replacement text for a `tuple_type_expr`, with nested tuples
+    /// baked in recursively. `null` means "leave this node unchanged".
+    ///
+    /// When the LAST field type is an `error_type_expr` (the failable-return
+    /// error channel), that marker is copied verbatim from source and kept
+    /// OUTSIDE the `Tuple(...)`:
+    ///   * `(!)`              → unchanged (no value tuple).
+    ///   * `(T, !)`           → `T !`            (single value: drop the parens).
+    ///   * `(T1, T2, !)`      → `Tuple(T1, T2) !`.
+    fn buildTupleTypeText(self: *Walker, node: *const Node, tt: ast.TupleTypeExpr) !?[]const u8 {
+        const total = tt.field_types.len;
+        const ends_with_error = total > 0 and tt.field_types[total - 1].data == .error_type_expr;
+
+        // Ordinary type tuple: `Tuple(...)`, names keep `:`.
+        if (!ends_with_error) {
+            const parens = try self.buildTypeInner(node, tt, total);
+            return try std.fmt.allocPrint(self.allocator, "Tuple{s}", .{parens});
+        }
+
+        // Raw text of the error marker, e.g. `!` or `!JsonError`.
+        const marker = tt.field_types[total - 1];
+        const marker_text = self.source[marker.span.start..marker.span.end];
+
+        switch (total - 1) {
+            // `-> !` (no value tuple) — leave unchanged.
+            0 => return null,
+            // `(T, !)` → `T !` — strip the parens, no Tuple wrapper.
+            1 => {
+                const value_text = try self.migratedTypeElement(tt.field_types[0]);
+                return try std.fmt.allocPrint(self.allocator, "{s} {s}", .{ value_text, marker_text });
+            },
+            // `(T1, T2, ..., !)` → `Tuple(T1, T2, ...) !`.
+            else => |value_count| {
+                const parens = try self.buildTypeInner(node, tt, value_count);
+                return try std.fmt.allocPrint(self.allocator, "Tuple{s} {s}", .{ parens, marker_text });
+            },
+        }
+    }
+
+    /// Render the parenthesized `(...)` part of a type tuple from the first
+    /// `count` field types. A failable return passes `count < field_types.len`
+    /// so the trailing `!` is left out. Non-synthetic names are emitted as
+    /// `name: `. Separators go only BETWEEN elements, so a 1-tuple loses its
+    /// trailing comma. `node` is accepted but unused.
+    fn buildTypeInner(self: *Walker, node: *const Node, tt: ast.TupleTypeExpr, count: usize) ![]const u8 {
+        _ = node;
+        const alloc = self.allocator;
+
+        var text = std.ArrayList(u8).empty;
+        try text.append(alloc, '(');
+        for (tt.field_types[0..count], 0..) |field_type, idx| {
+            if (idx > 0) try text.appendSlice(alloc, ", ");
+
+            if (tt.field_names) |names| {
+                const name = names[idx];
+                // Synthetic `_<i>` names mark positional slots — emit nothing.
+                if (!isSyntheticName(name, idx)) {
+                    try text.appendSlice(alloc, name);
+                    try text.appendSlice(alloc, ": ");
+                }
+            }
+
+            const element_text = try self.migratedTypeElement(field_type);
+            try text.appendSlice(alloc, element_text);
+        }
+        try text.append(alloc, ')');
+        return text.toOwnedSlice(alloc);
+    }
+
+    /// Text for one TYPE element of a tuple. A nested tuple type goes through
+    /// `buildTupleTypeText` (falling back to its raw source slice when that
+    /// returns `null`); any other element is delegated to `migratedSubtree`.
+    fn migratedTypeElement(self: *Walker, ft: *const Node) anyerror![]const u8 {
+        switch (ft.data) {
+            .tuple_type_expr => |nested| {
+                if (try self.buildTupleTypeText(ft, nested)) |text| return text;
+                return self.source[ft.span.start..ft.span.end];
+            },
+            else => return self.migratedSubtree(ft, false),
+        }
+    }
+
+    /// Produce the `.(...)` replacement text for a `tuple_literal`, with nested
+    /// tuples baked in recursively. Named elements are emitted as
+    /// `name = value` (the old `:` flips to ` = `). `node` is accepted but
+    /// unused.
+    fn buildTupleValueText(self: *Walker, node: *const Node, tl: ast.TupleLiteral) ![]const u8 {
+        _ = node;
+        const alloc = self.allocator;
+
+        var text = std.ArrayList(u8).empty;
+        try text.appendSlice(alloc, ".(");
+        for (tl.elements, 0..) |element, idx| {
+            if (idx > 0) try text.appendSlice(alloc, ", ");
+
+            if (element.name) |name| {
+                try text.appendSlice(alloc, name);
+                try text.appendSlice(alloc, " = ");
+            }
+
+            // Every element, spread (`..xs`) included, takes the same path:
+            // a nested tuple literal is rebuilt, anything else is handed to
+            // `migratedSubtree` by `migratedValueElement`.
+            const element_text = try self.migratedValueElement(element.value);
+            try text.appendSlice(alloc, element_text);
+        }
+        try text.append(alloc, ')');
+        return text.toOwnedSlice(alloc);
+    }
+
+    /// Render one element of a tuple VALUE as migrated text.
+    ///
+    /// A nested `tuple_literal` is always rewritten via `buildTupleValueText`:
+    /// inside another tuple it is not a direct call argument, so it is treated
+    /// as a value. Any other node goes through `migratedSubtree`, which keeps
+    /// its source text but rewrites tuples found inside it.
+    fn migratedValueElement(self: *Walker, value: *const Node) anyerror![]const u8 {
+        switch (value.data) {
+            .tuple_literal => |nested| return self.buildTupleValueText(value, nested),
+            else => return self.migratedSubtree(value, false),
+        }
+    }
+
+    /// Produce the migrated text of an arbitrary subtree.
+    ///
+    /// The subtree is walked by a temporary `Walker` that starts with this
+    /// walker's worklist but its own edit list. After the walk the (possibly
+    /// grown) worklist is copied back, and the collected edits are spliced into
+    /// the subtree's source text. With no edits the source slice itself is
+    /// returned, so everything outside a rewritten tuple stays verbatim. This is
+    /// how a NON-tuple element (e.g. a `call` with tuple args) gets its inner
+    /// tuples migrated.
+    fn migratedSubtree(self: *Walker, node: *const Node, is_call_arg: bool) ![]const u8 {
+        var scoped = Walker{
+            .allocator = self.allocator,
+            .source = self.source,
+            .worklist = self.worklist,
+        };
+        try scoped.walk(node, is_call_arg);
+        // Adopt the worklist back so entries found in the subtree are kept.
+        self.worklist = scoped.worklist;
+
+        const original_text = self.source[node.span.start..node.span.end];
+        const pending = scoped.edits.items;
+        if (pending.len == 0) {
+            return original_text;
+        }
+        // Edit offsets are absolute; the subtree's start is the rebasing origin.
+        return applyEditsRebased(self.allocator, original_text, node.span.start, pending);
+    }
+
+    /// Append `node` to the worklist as a site that must be resolved by hand.
+    /// The entry carries the node's 1-based line/column (see `lineCol`), its
+    /// exact source text and a fixed explanation.
+    fn recordWorklist(self: *Walker, node: *const Node) !void {
+        const first = node.span.start;
+        const last = node.span.end;
+        const position = lineCol(self.source, first);
+        try self.worklist.append(self.allocator, .{
+            .line = position.line,
+            .col = position.col,
+            .text = self.source[first..last],
+            .reason = "ambiguous value-vs-type call arg; resolve to `Tuple(...)` or `.(...)` by hand",
+        });
+    }
+};
+
+/// Report whether `name` is the synthetic placeholder for slot `i`, i.e. the
+/// text `_` followed by the plain decimal form of `i` (`_0`, `_1`, `_12`, ...).
+/// The parser fills these in for positional slots of an otherwise-named
+/// tuple, so callers treat a match as "no name".
+fn isSyntheticName(name: []const u8, i: usize) bool {
+    // The shortest candidate is an underscore plus one digit.
+    if (name.len < 2) return false;
+    if (name[0] != '_') return false;
+
+    // 24 bytes is ample for the decimal digits of a 64-bit `usize`.
+    var digits_buf: [24]u8 = undefined;
+    const digits = std.fmt.bufPrint(&digits_buf, "{d}", .{i}) catch return false;
+    return std.mem.eql(u8, name[1..], digits);
+}
+
+/// Decide whether a call-arg `tuple_literal` can be rewritten to `.(...)`
+/// without guessing: true only when the tuple is non-empty and every element
+/// satisfies `nodeIsConcreteValue`. An empty `()` in call-arg position is
+/// ambiguous (unit type vs empty value) and is rejected, as is any tuple with
+/// an element that might denote a type; those go to the worklist.
+fn tupleIsAllConcreteValues(tl: ast.TupleLiteral) bool {
+    if (tl.elements.len == 0) return false;
+    return for (tl.elements) |element| {
+        if (!nodeIsConcreteValue(element.value)) break false;
+    } else true;
+}
+
+/// Conservatively decide whether `node` can only denote a runtime value and
+/// never a type.
+///
+/// Accepted outright: int / float / bool / string literals, null / undef, enum
+/// literals, array literals and struct literals. Accepted recursively: unary
+/// ops, binary ops and chained comparisons whose operands are all concrete,
+/// and tuple literals accepted by `tupleIsAllConcreteValues`. Every other node
+/// kind (identifiers, calls, field access, ...) is rejected because it could
+/// be or contain a type.
+fn nodeIsConcreteValue(node: *const Node) bool {
+    switch (node.data) {
+        .int_literal,
+        .float_literal,
+        .bool_literal,
+        .string_literal,
+        .null_literal,
+        .undef_literal,
+        .enum_literal,
+        .array_literal,
+        .struct_literal,
+        => return true,
+
+        .unary_op => |op| return nodeIsConcreteValue(op.operand),
+        .binary_op => |op| return nodeIsConcreteValue(op.lhs) and nodeIsConcreteValue(op.rhs),
+        .chained_comparison => |chain| {
+            for (chain.operands) |operand| {
+                if (!nodeIsConcreteValue(operand)) return false;
+            }
+            return true;
+        },
+        .tuple_literal => |nested| return tupleIsAllConcreteValues(nested),
+
+        else => return false,
+    }
+}
+
+/// Comptime: does type `T` (transitively) contain a `*Node` we'd recurse into?
+/// Prunes the reflection walk so we never descend into pure-scalar payloads.
+///
+/// True for `Node`, `*Node` and `*const Node` themselves, and for slices,
+/// optionals, arrays, structs and unions whose child or field types reach one
+/// of those. Every other type reports false.
+fn containsNode(comptime T: type) bool {
+    if (T == *Node or T == *const Node or T == Node) return true;
+    return switch (@typeInfo(T)) {
+        .pointer => |ptr| switch (ptr.size) {
+            // Slices are followed into their element type.
+            .slice => containsNode(ptr.child),
+            .one => ptr.child == Node, // *Node handled above; other *X: no
+            // Remaining pointer sizes are never followed.
+            else => false,
+        },
+        .optional => |opt| containsNode(opt.child),
+        .array => |arr| containsNode(arr.child),
+        // A struct qualifies as soon as any one field type does.
+        .@"struct" => |st| blk: {
+            inline for (st.fields) |f| {
+                if (containsNode(f.type)) break :blk true;
+            }
+            break :blk false;
+        },
+        .@"union" => |un| unionContainsNode(un),
+        else => false,
+    };
+}
+
+/// Union counterpart of the struct case in `containsNode`: true when at least
+/// one field of the union described by `un` has a type for which
+/// `containsNode` is true.
+fn unionContainsNode(comptime un: std.builtin.Type.Union) bool {
+    inline for (un.fields) |f| {
+        if (containsNode(f.type)) return true;
+    }
+    return false;
+}
+
+/// A 1-based line/column position inside a source buffer.
+const LineCol = struct { line: u32, col: u32 };
+
+/// Compute the 1-based line and column of byte `offset` within `source`.
+///
+/// Columns count bytes; each `\n` before `offset` starts a new line at
+/// column 1. An `offset` beyond the end of `source` is clamped to its length.
+fn lineCol(source: []const u8, offset: u32) LineCol {
+    const limit: usize = @min(@as(usize, offset), source.len);
+    var position: LineCol = .{ .line = 1, .col = 1 };
+    for (source[0..limit]) |byte| {
+        if (byte == '\n') {
+            position.line += 1;
+            position.col = 1;
+        } else {
+            position.col += 1;
+        }
+    }
+    return position;
+}
+
+/// Parse `source` and migrate its tuple syntax in memory.
+///
+/// Only the parse step of a `core.Compilation` is run here. On a parse failure
+/// the collected errors are rendered and `error.ParseFailed` is returned; the
+/// same error is returned when parsing leaves no root node. On success the
+/// result is whatever `migrateRoot` produces: the rewritten text plus the
+/// ambiguous worklist entries.
+///
+/// `file_path` is used only for diagnostics labeling.
+pub fn migrateSource(
+    allocator: std.mem.Allocator,
+    io: std.Io,
+    file_path: []const u8,
+    source: [:0]const u8,
+) !MigrationResult {
+    var compilation = core.Compilation.init(allocator, io, file_path, source, .{}, &.{});
+    defer compilation.deinit();
+
+    compilation.parse() catch {
+        compilation.renderErrors();
+        return error.ParseFailed;
+    };
+
+    if (compilation.root) |root| {
+        return migrateRoot(allocator, source, root);
+    }
+    return error.ParseFailed;
+}
+
+/// Migrate starting from an already-parsed `root` node.
+///
+/// Kept separate from `migrateSource` so unit tests can parse in memory (via
+/// `Parser.init`) without an `std.Io`. Each top-level declaration is walked as
+/// a non-call-arg, the collected edits are applied to `source`, and the
+/// walker's worklist is returned alongside the rewritten text.
+pub fn migrateRoot(
+    allocator: std.mem.Allocator,
+    source: []const u8,
+    root: *const Node,
+) !MigrationResult {
+    var walker = Walker{ .allocator = allocator, .source = source };
+    for (root.data.root.decls) |decl| try walker.walk(decl, false);
+
+    const rewritten = try applyEdits(allocator, source, walker.edits.items);
+    const unresolved = try walker.worklist.toOwnedSlice(allocator);
+    return .{
+        .output = rewritten,
+        .worklist = unresolved,
+    };
+}
+
+/// Apply edits to a COPY of the original source. Edits are sorted DESCENDING by
+/// start so each splice leaves earlier offsets valid. Overlapping edits are a
+/// hard error — the recursive rewrite must emit exactly one edit per outermost
+/// tuple, so two edits sharing any byte is a bug.
+///
+/// `edits_in` is not modified; sorting happens on a scratch copy that is freed
+/// before returning. The caller owns the returned slice. Returns
+/// `error.OverlappingEdits` when two edits overlap, or an allocation error.
+pub fn applyEdits(allocator: std.mem.Allocator, source: []const u8, edits_in: []const Edit) ![]const u8 {
+    const edits = try allocator.dupe(Edit, edits_in);
+    // The sorted copy is scratch only: replacement bytes are copied into the
+    // output buffer, so it can be released on every exit path.
+    defer allocator.free(edits);
+    std.mem.sort(Edit, edits, {}, struct {
+        fn lessThan(_: void, a: Edit, b: Edit) bool {
+            return a.start > b.start; // descending
+        }
+    }.lessThan);
+
+    // Tripwire: after the descending sort, each edit's end must not exceed the
+    // next (lower-start) edit's start. Any overlap means the recursive rewrite
+    // double-emitted — refuse to produce corrupt output.
+    var prev_start: ?u32 = null;
+    for (edits) |e| {
+        if (prev_start) |ps| {
+            if (e.end > ps) return error.OverlappingEdits;
+        }
+        prev_start = e.start;
+    }
+
+    var out = try std.ArrayList(u8).initCapacity(allocator, source.len);
+    // Do not leak the partially built buffer if a later allocation fails.
+    errdefer out.deinit(allocator);
+    try out.appendSlice(allocator, source);
+    for (edits) |e| {
+        // Splice source[e.start..e.end] -> e.replacement.
+        try out.replaceRange(allocator, e.start, e.end - e.start, e.replacement);
+    }
+    return out.toOwnedSlice(allocator);
+}
+
+/// Apply edits whose `start`/`end` are ABSOLUTE source offsets to a `slice` that
+/// begins at absolute offset `base`. Used by `migratedSubtree` to splice a
+/// non-tuple subtree's inner tuple rewrites into its raw slice.
+///
+/// Every edit is expected to start at or after `base`; the offsets are rebased
+/// by plain subtraction. The rebased copies are scratch and are freed before
+/// returning. The caller owns the slice returned by `applyEdits`.
+fn applyEditsRebased(allocator: std.mem.Allocator, slice: []const u8, base: u32, edits_in: []const Edit) ![]const u8 {
+    const rebased = try allocator.alloc(Edit, edits_in.len);
+    // `applyEdits` copies what it needs into its own output, so the rebased
+    // array can be released on every exit path.
+    defer allocator.free(rebased);
+    for (edits_in, rebased) |e, *slot| {
+        slot.* = .{ .start = e.start - base, .end = e.end - base, .replacement = e.replacement };
+    }
+    return applyEdits(allocator, slice, rebased);
+}
--- a/src/root.zig
+++ b/src/root.zig
@@ -20,6 +20,8 @@ pub const core = @import("core.zig");
 pub const c_import = @import("c_import.zig");
 pub const c_import_tests = @import("c_import.test.zig");
 pub const corpus_run_tests = @import("corpus_run.test.zig");
+pub const migrate = @import("migrate.zig");
+pub const migrate_tests = @import("migrate.test.zig");
 pub const ir = @import("ir/ir.zig");

 pub const lsp = struct {