Surface rename of the signed integer family: s1..s64 become i1..i64
(u1..u64, usize, isize unchanged). 'string' keeps the s-prefix arm in
name classification; width parsing moves to the i-prefix arm next to
isize.
Internal TypeId tags follow the surface (.s8/.s16/.s32/.s64 ->
.i8/.i16/.i32/.i64), as do mono-key mangle fragments (ptr_i64,
tu_i64_bool) and all display/diagnostic formatting (i{d}).
Migrated in the same sweep: stdlib + examples + issue repros + FFI C
companions (shared symbol names like ffi_id_i64), expected
stdout/stderr/ir snapshots, specs.md, readme.md, CLAUDE.md/AGENTS.md,
implementation_plan.md, docs/, issue writeups. Vendored stb_image and
historical flow state left untouched.
zig build test: 426/426; examples suite: 595/595.
216 lines
9.0 KiB
Zig
216 lines
9.0 KiB
Zig
// Tests for sema.zig — the editor/LSP type classifier (the SECOND resolver,
|
|
// distinct from the codegen-side `ir/type_resolver.zig`). These pin behavior
|
|
// the example suite can't reach: the example runner exercises the codegen
|
|
// path (`sx run`), never sema's hover/completion/index resolution.
|
|
|
|
const std = @import("std");
|
|
const ast = @import("ast.zig");
|
|
const Node = ast.Node;
|
|
const Parser = @import("parser.zig").Parser;
|
|
const sema = @import("sema.zig");
|
|
const types = @import("types.zig");
|
|
const Type = types.Type;
|
|
|
|
// the backtick raw escape must hold in BOTH classifiers. A raw
|
|
// reserved-name type reference (`` `i2 ``) resolves to the user-declared type,
|
|
// while a BARE `i2` stays the builtin int. Before the fix sema's
|
|
// `resolveTypeNode` ran `Type.fromName` first and ignored `is_raw`, so the
|
|
// editor index would show the builtin for backtick code (the
|
|
// two-resolver divergence applied to raw types).
|
|
test "sema: backtick raw type reference resolves to the user type; bare stays builtin" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`i2 :: struct { x: i64; }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
_ = try analyzer.analyze(root);
|
|
|
|
// The reserved-spelled user type registered under its plain name.
|
|
try std.testing.expect(analyzer.struct_types.contains("i2"));
|
|
|
|
// RAW reference (`` `i2 ``) → the user struct, NOT the 2-bit signed int.
|
|
var raw_node = Node{ .span = .{ .start = 0, .end = 0 }, .data = .{ .type_expr = .{ .name = "i2", .is_raw = true } } };
|
|
const raw_ty = analyzer.resolveTypeNode(&raw_node);
|
|
try std.testing.expect(raw_ty == .struct_type);
|
|
try std.testing.expectEqualStrings("i2", raw_ty.struct_type);
|
|
|
|
// BARE `i2` → the builtin 2-bit signed int.
|
|
var bare_node = Node{ .span = .{ .start = 0, .end = 0 }, .data = .{ .type_expr = .{ .name = "i2", .is_raw = false } } };
|
|
const bare_ty = analyzer.resolveTypeNode(&bare_node);
|
|
try std.testing.expect(bare_ty == .signed);
|
|
try std.testing.expectEqual(@as(u8, 2), bare_ty.signed);
|
|
}
|
|
|
|
// The same divergence guard for the string-keyed entry (`resolveTypeNameStr`,
|
|
// reached via `fieldType` when registering struct field types): a raw field
|
|
// annotation (`` `u8 ``) resolves to the user struct, a bare one (`u8`) to the
|
|
// builtin. Driven through the real analyze pipeline (no private access).
|
|
test "sema: a raw struct-field annotation resolves to the user type; bare stays builtin" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`u8 :: struct { y: i64; }
|
|
\\Holder :: struct { a: `u8; b: u8; }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
_ = try analyzer.analyze(root);
|
|
|
|
const holder = analyzer.struct_types.get("Holder").?;
|
|
var a_ty: ?Type = null;
|
|
var b_ty: ?Type = null;
|
|
for (holder.field_names, holder.field_types) |fname, fty| {
|
|
if (std.mem.eql(u8, fname, "a")) a_ty = fty;
|
|
if (std.mem.eql(u8, fname, "b")) b_ty = fty;
|
|
}
|
|
|
|
// field `a : `u8` → the user struct named "u8".
|
|
try std.testing.expect(a_ty.? == .struct_type);
|
|
try std.testing.expectEqualStrings("u8", a_ty.?.struct_type);
|
|
|
|
// field `b : u8` → the builtin unsigned 8-bit int.
|
|
try std.testing.expect(b_ty.? == .unsigned);
|
|
try std.testing.expectEqual(@as(u8, 8), b_ty.?.unsigned);
|
|
}
|
|
|
|
// ── raw provenance through sema's COMPOUND type metadata ────────
|
|
//
|
|
// The direct-case fix (above) only covered a bare `` `i2 `` reference. A
|
|
// COMPOUND raw type (`*`i2`, `?`i2`, `[N]`i2`, …) stores its inner name as a
|
|
// bare string on the Type's info struct; the resolver re-reads that name via
|
|
// `resolveTypeNameStr`. Before threading `is_raw` ALONGSIDE the stored name,
|
|
// the resolver passed `skip_builtin = false`, so the LSP index reclassified a
|
|
// user type named `i2` as the builtin int — diverging from codegen. These
|
|
// pin every compound form: the raw inner resolves to the user type (FAILS on
|
|
// pre-fix sema), the bare inner stays the builtin (control, preserved).
|
|
|
|
fn symType(res: sema.SemaResult, name: []const u8) ?Type {
|
|
for (res.symbols) |sym| {
|
|
if (std.mem.eql(u8, sym.name, name)) return sym.ty;
|
|
}
|
|
return null;
|
|
}
|
|
|
|
test "sema: field access through a raw `*`i2` pointer resolves the user field; bare `*i2` stays builtin" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`i2 :: struct { x: i64; }
|
|
\\f :: (p: *`i2) { y := p.x; }
|
|
\\g :: (q: *i2) { w := q.*; }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
const res = try analyzer.analyze(root);
|
|
|
|
// RAW: `p: *`i2` → field `x` on the user struct → i64. (Pre-fix: the
|
|
// pointee `i2` reclassified to the 2-bit int, `.x` not found → unresolved.)
|
|
const y = symType(res, "y") orelse return error.MissingSymbol;
|
|
try std.testing.expect(y == .signed);
|
|
try std.testing.expectEqual(@as(u8, 64), y.signed);
|
|
|
|
// CONTROL: `q: *i2` (bare) → deref yields the builtin 2-bit signed int.
|
|
const w = symType(res, "w") orelse return error.MissingSymbol;
|
|
try std.testing.expect(w == .signed);
|
|
try std.testing.expectEqual(@as(u8, 2), w.signed);
|
|
}
|
|
|
|
test "sema: unwrapping a raw `?`i2` optional resolves the user field; bare `?i2` stays builtin" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`i2 :: struct { x: i64; }
|
|
\\f :: (o: ?`i2) { if val := o { y := val.x; } }
|
|
\\g :: (b: ?i2) { if v := b { w := v; } }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
const res = try analyzer.analyze(root);
|
|
|
|
// RAW: `o: ?`i2` → `if val := o` unwraps to the user struct → `val.x` is i64.
|
|
// (Pre-fix: the optional child `i2` reclassified to the 2-bit int.)
|
|
const y = symType(res, "y") orelse return error.MissingSymbol;
|
|
try std.testing.expect(y == .signed);
|
|
try std.testing.expectEqual(@as(u8, 64), y.signed);
|
|
|
|
// CONTROL: `b: ?i2` (bare) unwraps to the builtin 2-bit signed int.
|
|
const w = symType(res, "w") orelse return error.MissingSymbol;
|
|
try std.testing.expect(w == .signed);
|
|
try std.testing.expectEqual(@as(u8, 2), w.signed);
|
|
}
|
|
|
|
test "sema: indexing a raw `[N]`i2` array resolves the user element; bare `[N]i2` stays builtin" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`i2 :: struct { x: i64; }
|
|
\\f :: (a: [4]`i2, b: [4]i2) { y := a[0]; w := b[0]; }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
const res = try analyzer.analyze(root);
|
|
|
|
// RAW: `a: [4]`i2` → element is the user struct. (Pre-fix: reclassified to
|
|
// the 2-bit int.)
|
|
const y = symType(res, "y") orelse return error.MissingSymbol;
|
|
try std.testing.expect(y == .struct_type);
|
|
try std.testing.expectEqualStrings("i2", y.struct_type);
|
|
|
|
// CONTROL: `b: [4]i2` (bare) → element is the builtin 2-bit signed int.
|
|
const w = symType(res, "w") orelse return error.MissingSymbol;
|
|
try std.testing.expect(w == .signed);
|
|
try std.testing.expectEqual(@as(u8, 2), w.signed);
|
|
}
|
|
|
|
// Parameterized raw type (`` `i2(i64) ``). Unlike the shapes above this never
|
|
// had the divergence — instantiation resolves the base name straight against
|
|
// `struct_types` (no builtin classifier in the path), so it passes before AND
|
|
// after. Included as coverage that the universal model holds for the
|
|
// parameterized form too: a `` `i2 ``-declared generic instantiates and its
|
|
// field resolves.
|
|
test "sema: a raw parameterized type `` `i2(i64) `` instantiates the user generic" {
|
|
var arena = std.heap.ArenaAllocator.init(std.testing.allocator);
|
|
defer arena.deinit();
|
|
const alloc = arena.allocator();
|
|
|
|
const src =
|
|
\\`i2 :: struct ($T: Type) { items: [*]T = null; n: i64 = 0; }
|
|
\\f :: (v: `i2(i64)) { y := v.n; }
|
|
\\
|
|
;
|
|
var parser = Parser.init(alloc, src);
|
|
const root = try parser.parse();
|
|
var analyzer = sema.Analyzer.init(alloc);
|
|
const res = try analyzer.analyze(root);
|
|
|
|
// `v: `i2(i64)` instantiates the `` `i2 ``-declared generic; its concrete
|
|
// field `n` resolves to i64 (the raw base name was not misread as a builtin).
|
|
const y = symType(res, "y") orelse return error.MissingSymbol;
|
|
try std.testing.expect(y == .signed);
|
|
try std.testing.expectEqual(@as(u8, 64), y.signed);
|
|
}
|