ziglang
diff --git a/lib/compiler_rt/stack_probe.zig b/lib/compiler_rt/stack_probe.zig
Lines changed: 28 additions & 28 deletions
diff --git a/lib/std/math/float.zig b/lib/std/math/float.zig
Lines changed: 41 additions & 22 deletions
diff --git a/lib/std/math/signbit.zig b/lib/std/math/signbit.zig
Lines changed: 40 additions & 13 deletions
diff --git a/lib/std/posix.zig b/lib/std/posix.zig
Lines changed: 4 additions & 1 deletion
diff --git a/lib/std/start.zig b/lib/std/start.zig
Lines changed: 6 additions & 0 deletions
diff --git a/src/Air/Legalize.zig b/src/Air/Legalize.zig
Lines changed: 14 additions & 2 deletions
diff --git a/src/arch/riscv64/CodeGen.zig b/src/arch/riscv64/CodeGen.zig
Lines changed: 13 additions & 6 deletions
@@ -127,23 +127,23 @@ fn win_probe_stack_only() void {
         },
         .x86_64 => {
             asm volatile (
-                \\         push   %%rcx
-                \\         push   %%rax
-                \\         cmp    $0x1000,%%rax
-                \\         lea    24(%%rsp),%%rcx
+                \\         pushq  %%rcx
+                \\         pushq  %%rax
+                \\         cmpq   $0x1000,%%rax
+                \\         leaq   24(%%rsp),%%rcx
                 \\         jb     1f
                 \\ 2:
-                \\         sub    $0x1000,%%rcx
-                \\         test   %%rcx,(%%rcx)
-                \\         sub    $0x1000,%%rax
-                \\         cmp    $0x1000,%%rax
+                \\         subq   $0x1000,%%rcx
+                \\         testq  %%rcx,(%%rcx)
+                \\         subq   $0x1000,%%rax
+                \\         cmpq   $0x1000,%%rax
                 \\         ja     2b
                 \\ 1:
-                \\         sub    %%rax,%%rcx
-                \\         test   %%rcx,(%%rcx)
-                \\         pop    %%rax
-                \\         pop    %%rcx
-                \\         ret
+                \\         subq   %%rax,%%rcx
+                \\         testq  %%rcx,(%%rcx)
+                \\         popq   %%rax
+                \\         popq   %%rcx
+                \\         retq
             );
         },
         .x86 => {
@@ -179,26 +179,26 @@ fn win_probe_stack_adjust_sp() void {
     switch (arch) {
         .x86_64 => {
             asm volatile (
-                \\         push   %%rcx
-                \\         cmp    $0x1000,%%rax
-                \\         lea    16(%%rsp),%%rcx
+                \\         pushq  %%rcx
+                \\         cmpq   $0x1000,%%rax
+                \\         leaq   16(%%rsp),%%rcx
                 \\         jb     1f
                 \\ 2:
-                \\         sub    $0x1000,%%rcx
-                \\         test   %%rcx,(%%rcx)
-                \\         sub    $0x1000,%%rax
-                \\         cmp    $0x1000,%%rax
+                \\         subq   $0x1000,%%rcx
+                \\         testq  %%rcx,(%%rcx)
+                \\         subq   $0x1000,%%rax
+                \\         cmpq   $0x1000,%%rax
                 \\         ja     2b
                 \\ 1:
-                \\         sub    %%rax,%%rcx
-                \\         test   %%rcx,(%%rcx)
+                \\         subq   %%rax,%%rcx
+                \\         testq  %%rcx,(%%rcx)
                 \\
-                \\         lea    8(%%rsp),%%rax
-                \\         mov    %%rcx,%%rsp
-                \\         mov    -8(%%rax),%%rcx
-                \\         push   (%%rax)
-                \\         sub    %%rsp,%%rax
-                \\         ret
+                \\         leaq   8(%%rsp),%%rax
+                \\         movq   %%rcx,%%rsp
+                \\         movq   -8(%%rax),%%rcx
+                \\         pushq  (%%rax)
+                \\         subq   %%rsp,%%rax
+                \\         retq
             );
         },
         .x86 => {
 
@@ -220,42 +220,61 @@ pub inline fn floatEpsAt(comptime T: type, x: T) T {
     }
 }
 
-/// Returns the value inf for floating point type T.
-pub inline fn inf(comptime T: type) T {
-    return reconstructFloat(T, floatExponentMax(T) + 1, mantissaOne(T));
+/// Returns the inf value for a floating point `Type`.
+pub inline fn inf(comptime Type: type) Type {
+    const RuntimeType = switch (Type) {
+        else => Type,
+        comptime_float => f128, // any float type will do
+    };
+    return reconstructFloat(RuntimeType, floatExponentMax(RuntimeType) + 1, mantissaOne(RuntimeType));
 }
 
-/// Returns the canonical quiet NaN representation for floating point type T.
-pub inline fn nan(comptime T: type) T {
+/// Returns the canonical quiet NaN representation for a floating point `Type`.
+pub inline fn nan(comptime Type: type) Type {
+    const RuntimeType = switch (Type) {
+        else => Type,
+        comptime_float => f128, // any float type will do
+    };
     return reconstructFloat(
-        T,
-        floatExponentMax(T) + 1,
-        mantissaOne(T) | 1 << (floatFractionalBits(T) - 1),
+        RuntimeType,
+        floatExponentMax(RuntimeType) + 1,
+        mantissaOne(RuntimeType) | 1 << (floatFractionalBits(RuntimeType) - 1),
     );
 }
 
-/// Returns a signalling NaN representation for floating point type T.
+/// Returns a signalling NaN representation for a floating point `Type`.
 ///
 /// TODO: LLVM is known to miscompile on some architectures to quiet NaN -
 ///       this is tracked by https://github.com/ziglang/zig/issues/14366
-pub inline fn snan(comptime T: type) T {
+pub inline fn snan(comptime Type: type) Type {
+    const RuntimeType = switch (Type) {
+        else => Type,
+        comptime_float => f128, // any float type will do
+    };
     return reconstructFloat(
-        T,
-        floatExponentMax(T) + 1,
-        mantissaOne(T) | 1 << (floatFractionalBits(T) - 2),
+        RuntimeType,
+        floatExponentMax(RuntimeType) + 1,
+        mantissaOne(RuntimeType) | 1 << (floatFractionalBits(RuntimeType) - 2),
     );
 }
 
-test "float bits" {
-    inline for ([_]type{ f16, f32, f64, f80, f128, c_longdouble }) |T| {
-        // (1 +) for the sign bit, since it is separate from the other bits
-        const size = 1 + floatExponentBits(T) + floatMantissaBits(T);
-        try expect(@bitSizeOf(T) == size);
+fn floatBits(comptime Type: type) !void {
+    // (1 +) for the sign bit, since it is separate from the other bits
+    const size = 1 + floatExponentBits(Type) + floatMantissaBits(Type);
+    try expect(@bitSizeOf(Type) == size);
+    try expect(floatFractionalBits(Type) <= floatMantissaBits(Type));
 
-        // for machine epsilon, assert expmin <= -prec <= expmax
-        try expect(floatExponentMin(T) <= -floatFractionalBits(T));
-        try expect(-floatFractionalBits(T) <= floatExponentMax(T));
-    }
+    // for machine epsilon, assert expmin <= -prec <= expmax
+    try expect(floatExponentMin(Type) <= -floatFractionalBits(Type));
+    try expect(-floatFractionalBits(Type) <= floatExponentMax(Type));
+}
+test floatBits {
+    try floatBits(f16);
+    try floatBits(f32);
+    try floatBits(f64);
+    try floatBits(f80);
+    try floatBits(f128);
+    try floatBits(c_longdouble);
 }
 
 test inf {
 
@@ -4,20 +4,47 @@ const expect = std.testing.expect;
 
 /// Returns whether x is negative or negative 0.
 pub fn signbit(x: anytype) bool {
-    const T = @TypeOf(x);
-    const TBits = std.meta.Int(.unsigned, @typeInfo(T).float.bits);
-    return @as(TBits, @bitCast(x)) >> (@bitSizeOf(T) - 1) != 0;
+    return switch (@typeInfo(@TypeOf(x))) {
+        .int, .comptime_int => x,
+        .float => |float| @as(@Type(.{ .int = .{
+            .signedness = .signed,
+            .bits = float.bits,
+        } }), @bitCast(x)),
+        .comptime_float => @as(i128, @bitCast(@as(f128, x))), // any float type will do
+        else => @compileError("std.math.signbit does not support " ++ @typeName(@TypeOf(x))),
+    } < 0;
 }
 
 test signbit {
-    inline for ([_]type{ f16, f32, f64, f80, f128 }) |T| {
-        try expect(!signbit(@as(T, 0.0)));
-        try expect(!signbit(@as(T, 1.0)));
-        try expect(signbit(@as(T, -2.0)));
-        try expect(signbit(@as(T, -0.0)));
-        try expect(!signbit(math.inf(T)));
-        try expect(signbit(-math.inf(T)));
-        try expect(!signbit(math.nan(T)));
-        try expect(signbit(-math.nan(T)));
-    }
+    try testInts(i0);
+    try testInts(u0);
+    try testInts(i1);
+    try testInts(u1);
+    try testInts(i2);
+    try testInts(u2);
+
+    try testFloats(f16);
+    try testFloats(f32);
+    try testFloats(f64);
+    try testFloats(f80);
+    try testFloats(f128);
+    try testFloats(c_longdouble);
+    try testFloats(comptime_float);
+}
+
+fn testInts(comptime Type: type) !void {
+    try expect((std.math.minInt(Type) < 0) == signbit(@as(Type, std.math.minInt(Type))));
+    try expect(!signbit(@as(Type, 0)));
+    try expect(!signbit(@as(Type, std.math.maxInt(Type))));
+}
+
+fn testFloats(comptime Type: type) !void {
+    try expect(!signbit(@as(Type, 0.0)));
+    try expect(!signbit(@as(Type, 1.0)));
+    try expect(signbit(@as(Type, -2.0)));
+    try expect(signbit(@as(Type, -0.0)));
+    try expect(!signbit(math.inf(Type)));
+    try expect(signbit(-math.inf(Type)));
+    try expect(!signbit(math.nan(Type)));
+    try expect(signbit(-math.nan(Type)));
 }
@@ -7571,7 +7571,10 @@ const lfs64_abi = native_os == .linux and builtin.link_libc and (builtin.abi.isG
 /// If this happens the fix is to add the error code to the corresponding
 /// switch expression, possibly introduce a new error in the error set, and
 /// send a patch to Zig.
-pub const unexpected_error_tracing = builtin.zig_backend == .stage2_llvm and builtin.mode == .Debug;
+pub const unexpected_error_tracing = builtin.mode == .Debug and switch (builtin.zig_backend) {
+    .stage2_llvm, .stage2_x86_64 => true,
+    else => false,
+};
 
 pub const UnexpectedError = error{
     /// The Operating System returned an undocumented error code.
 
@@ -485,6 +485,9 @@ fn _start() callconv(.naked) noreturn {
 }
 
 fn WinStartup() callconv(.withStackAlign(.c, 1)) noreturn {
+    // Switch from the x87 fpu state set by windows to the state expected by the gnu abi.
+    if (builtin.abi == .gnu) asm volatile ("fninit");
+
     if (!builtin.single_threaded and !builtin.link_libc) {
         _ = @import("os/windows/tls.zig");
     }
@@ -495,6 +498,9 @@ fn WinStartup() callconv(.withStackAlign(.c, 1)) noreturn {
 }
 
 fn wWinMainCRTStartup() callconv(.withStackAlign(.c, 1)) noreturn {
+    // Switch from the x87 fpu state set by windows to the state expected by the gnu abi.
+    if (builtin.abi == .gnu) asm volatile ("fninit");
+
     if (!builtin.single_threaded and !builtin.link_libc) {
         _ = @import("os/windows/tls.zig");
     }
 
@@ -122,8 +122,10 @@ pub const Feature = enum {
 
     /// Legalize (shift lhs, (splat rhs)) -> (shift lhs, rhs)
     unsplat_shift_rhs,
-    /// Legalize reduce of a one element vector to a bitcast
+    /// Legalize reduce of a one element vector to a bitcast.
     reduce_one_elem_to_bitcast,
+    /// Legalize splat to a one element vector to a bitcast.
+    splat_one_elem_to_bitcast,
 
     /// Replace `intcast_safe` with an explicit safety check which `call`s the panic function on failure.
     /// Not compatible with `scalarize_intcast_safe`.
@@ -628,7 +630,17 @@ fn legalizeBody(l: *Legalize, body_start: usize, body_len: usize) Error!void {
                     else => {},
                 }
             },
-            .splat => {},
+            .splat => if (l.features.has(.splat_one_elem_to_bitcast)) {
+                const ty_op = l.air_instructions.items(.data)[@intFromEnum(inst)].ty_op;
+                switch (ty_op.ty.toType().vectorLen(zcu)) {
+                    0 => unreachable,
+                    1 => continue :inst l.replaceInst(inst, .bitcast, .{ .ty_op = .{
+                        .ty = ty_op.ty,
+                        .operand = ty_op.operand,
+                    } }),
+                    else => {},
+                }
+            },
             .shuffle_one => if (l.features.has(.scalarize_shuffle_one)) continue :inst try l.scalarize(inst, .shuffle_one),
             .shuffle_two => if (l.features.has(.scalarize_shuffle_two)) continue :inst try l.scalarize(inst, .shuffle_two),
             .select => if (l.features.has(.scalarize_select)) continue :inst try l.scalarize(inst, .select),
 
@@ -5962,10 +5962,14 @@ fn airBr(func: *Func, inst: Air.Inst.Index) !void {
             if (first_br) break :result src_mcv;
 
             try func.getValue(block_tracking.short, br.block_inst);
-            // .long = .none to avoid merging operand and block result stack frames.
-            const current_tracking: InstTracking = .{ .long = .none, .short = src_mcv };
-            try current_tracking.materializeUnsafe(func, br.block_inst, block_tracking.*);
-            for (current_tracking.getRegs()) |src_reg| func.register_manager.freeReg(src_reg);
+            try InstTracking.materializeUnsafe(
+                // .long = .none to avoid merging operand and block result stack frames.
+                .{ .long = .none, .short = src_mcv },
+                func,
+                br.block_inst,
+                block_tracking.*,
+            );
+            try func.freeValue(src_mcv);
             break :result block_tracking.short;
         }
 
@@ -8192,8 +8196,11 @@ fn genTypedValue(func: *Func, val: Value) InnerError!MCValue {
     const lf = func.bin_file;
     const src_loc = func.src_loc;
 
-    const result = if (val.isUndef(pt.zcu))
-        try lf.lowerUav(pt, val.toIntern(), .none, src_loc)
+    const result: codegen.GenResult = if (val.isUndef(pt.zcu))
+        switch (try lf.lowerUav(pt, val.toIntern(), .none, src_loc)) {
+            .sym_index => |sym_index| .{ .mcv = .{ .load_symbol = sym_index } },
+            .fail => |em| .{ .fail = em },
+        }
     else
         try codegen.genTypedValue(lf, pt, src_loc, val, func.target);
     const mcv: MCValue = switch (result) {
Original file line number	Diff line number	Diff line change
`@@ -485,6 +485,9 @@ fn _start() callconv(.naked) noreturn {`
`485`	`485`	`}`
`486`	`486`
`487`	`487`	`fn WinStartup() callconv(.withStackAlign(.c, 1)) noreturn {`
	`488`	`+ // Switch from the x87 fpu state set by windows to the state expected by the gnu abi.`
	`489`	`+ if (builtin.abi == .gnu) asm volatile ("fninit");`
	`490`	`+`
`488`	`491`	`if (!builtin.single_threaded and !builtin.link_libc) {`
`489`	`492`	`_ = @import("os/windows/tls.zig");`
`490`	`493`	`}`
`@@ -495,6 +498,9 @@ fn WinStartup() callconv(.withStackAlign(.c, 1)) noreturn {`
`495`	`498`	`}`
`496`	`499`
`497`	`500`	`fn wWinMainCRTStartup() callconv(.withStackAlign(.c, 1)) noreturn {`
	`501`	`+ // Switch from the x87 fpu state set by windows to the state expected by the gnu abi.`
	`502`	`+ if (builtin.abi == .gnu) asm volatile ("fninit");`
	`503`	`+`
`498`	`504`	`if (!builtin.single_threaded and !builtin.link_libc) {`
`499`	`505`	`_ = @import("os/windows/tls.zig");`
`500`	`506`	`}`