ziglang
diff --git a/lib/std/math.zig b/lib/std/math.zig
+21 -11
diff --git a/lib/std/math/big/int.zig b/lib/std/math/big/int.zig
+4 -4
diff --git a/lib/std/math/big/int_test.zig b/lib/std/math/big/int_test.zig
-4
diff --git a/lib/std/math/log2.zig b/lib/std/math/log2.zig
+11 -10
diff --git a/lib/zig.h b/lib/zig.h
+20 -11
diff --git a/src/Air.zig b/src/Air.zig
+3 -1
diff --git a/src/Sema.zig b/src/Sema.zig
+43 -28
diff --git a/src/Type.zig b/src/Type.zig
+4 -4
@@ -774,18 +774,15 @@ pub fn Log2IntCeil(comptime T: type) type {
 /// Returns the smallest integer type that can hold both from and to.
 pub fn IntFittingRange(comptime from: comptime_int, comptime to: comptime_int) type {
     assert(from <= to);
-    if (from == 0 and to == 0) {
-        return u0;
-    }
     const signedness: std.builtin.Signedness = if (from < 0) .signed else .unsigned;
-    const largest_positive_integer = @max(if (from < 0) (-from) - 1 else from, to); // two's complement
-    const base = log2(largest_positive_integer);
-    const upper = (1 << base) - 1;
-    var magnitude_bits = if (upper >= largest_positive_integer) base else base + 1;
-    if (signedness == .signed) {
-        magnitude_bits += 1;
-    }
-    return std.meta.Int(signedness, magnitude_bits);
+    return @Type(.{ .int = .{
+        .signedness = signedness,
+        .bits = @as(u16, @intFromBool(signedness == .signed)) +
+            switch (if (from < 0) @max(@abs(from) - 1, to) else to) {
+                0 => 0,
+                else => |pos_max| 1 + log2(pos_max),
+            },
+    } });
 }
 
 test IntFittingRange {
@@ -1267,6 +1264,19 @@ pub fn log2_int(comptime T: type, x: T) Log2Int(T) {
     return @as(Log2Int(T), @intCast(@typeInfo(T).int.bits - 1 - @clz(x)));
 }
 
+test log2_int {
+    try testing.expect(log2_int(u32, 1) == 0);
+    try testing.expect(log2_int(u32, 2) == 1);
+    try testing.expect(log2_int(u32, 3) == 1);
+    try testing.expect(log2_int(u32, 4) == 2);
+    try testing.expect(log2_int(u32, 5) == 2);
+    try testing.expect(log2_int(u32, 6) == 2);
+    try testing.expect(log2_int(u32, 7) == 2);
+    try testing.expect(log2_int(u32, 8) == 3);
+    try testing.expect(log2_int(u32, 9) == 3);
+    try testing.expect(log2_int(u32, 10) == 3);
+}
+
 /// Return the log base 2 of integer value x, rounding up to the
 /// nearest integer.
 pub fn log2_int_ceil(comptime T: type, x: T) Log2IntCeil(T) {
 
@@ -415,12 +415,12 @@ pub const Mutable = struct {
         // in the case that scalar happens to be small in magnitude within its type, but it
         // is well worth being able to use the stack and not needing an allocator passed in.
         // Note that Mutable.init still sets len to calcLimbLen(scalar) in any case.
-        const limb_len = comptime switch (@typeInfo(@TypeOf(scalar))) {
+        const limbs_len = comptime switch (@typeInfo(@TypeOf(scalar))) {
             .comptime_int => calcLimbLen(scalar),
             .int => |info| calcTwosCompLimbCount(info.bits),
             else => @compileError("expected scalar to be an int"),
         };
-        var limbs: [limb_len]Limb = undefined;
+        var limbs: [limbs_len]Limb = undefined;
         const operand = init(&limbs, scalar).toConst();
         return add(r, a, operand);
     }
@@ -2454,12 +2454,12 @@ pub const Const = struct {
         // in the case that scalar happens to be small in magnitude within its type, but it
         // is well worth being able to use the stack and not needing an allocator passed in.
         // Note that Mutable.init still sets len to calcLimbLen(scalar) in any case.
-        const limb_len = comptime switch (@typeInfo(@TypeOf(scalar))) {
+        const limbs_len = comptime switch (@typeInfo(@TypeOf(scalar))) {
             .comptime_int => calcLimbLen(scalar),
             .int => |info| calcTwosCompLimbCount(info.bits),
             else => @compileError("expected scalar to be an int"),
         };
-        var limbs: [limb_len]Limb = undefined;
+        var limbs: [limbs_len]Limb = undefined;
         const rhs = Mutable.init(&limbs, scalar);
         return order(lhs, rhs.toConst());
     }
 
@@ -2295,8 +2295,6 @@ test "sat shift-left signed simple positive" {
 }
 
 test "sat shift-left signed multi positive" {
-    if (builtin.zig_backend == .stage2_x86_64) return error.SkipZigTest;
-
     var x: SignedDoubleLimb = 1;
     _ = &x;
 
@@ -2310,8 +2308,6 @@ test "sat shift-left signed multi positive" {
 }
 
 test "sat shift-left signed multi negative" {
-    if (builtin.zig_backend == .stage2_x86_64) return error.SkipZigTest;
-
     var x: SignedDoubleLimb = -1;
     _ = &x;
 
 
@@ -12,12 +12,10 @@ const expect = std.testing.expect;
 ///  - log2(nan)   = nan
 pub fn log2(x: anytype) @TypeOf(x) {
     const T = @TypeOf(x);
-    switch (@typeInfo(T)) {
-        .comptime_float => {
-            return @as(comptime_float, @log2(x));
-        },
-        .float => return @log2(x),
+    return switch (@typeInfo(T)) {
+        .comptime_float, .float => @log2(x),
         .comptime_int => comptime {
+            std.debug.assert(x > 0);
             var x_shifted = x;
             // First, calculate floorPowerOfTwo(x)
             var shift_amt = 1;
@@ -34,12 +32,15 @@ pub fn log2(x: anytype) @TypeOf(x) {
             }
             return result;
         },
-        .int => |IntType| switch (IntType.signedness) {
-            .signed => @compileError("log2 not implemented for signed integers"),
-            .unsigned => return math.log2_int(T, x),
-        },
+        .int => |int_info| math.log2_int(switch (int_info.signedness) {
+            .signed => @Type(.{ .int = .{
+                .signedness = .unsigned,
+                .bits = int_info.bits -| 1,
+            } }),
+            .unsigned => T,
+        }, @intCast(x)),
         else => @compileError("log2 not implemented for " ++ @typeName(T)),
-    }
+    };
 }
 
 test log2 {
 
@@ -1115,14 +1115,15 @@ static inline bool zig_mulo_i16(int16_t *res, int16_t lhs, int16_t rhs, uint8_t
 \
     static inline uint##w##_t zig_shls_u##w(uint##w##_t lhs, uint##w##_t rhs, uint8_t bits) { \
         uint##w##_t res; \
-        if (rhs >= bits) return lhs != UINT##w##_C(0) ? zig_maxInt_u(w, bits) : lhs; \
-        return zig_shlo_u##w(&res, lhs, (uint8_t)rhs, bits) ? zig_maxInt_u(w, bits) : res; \
+        if (rhs < bits && !zig_shlo_u##w(&res, lhs, rhs, bits)) return res; \
+        return lhs == INT##w##_C(0) ? INT##w##_C(0) : zig_maxInt_u(w, bits); \
     } \
 \
-    static inline int##w##_t zig_shls_i##w(int##w##_t lhs, int##w##_t rhs, uint8_t bits) { \
+    static inline int##w##_t zig_shls_i##w(int##w##_t lhs, uint##w##_t rhs, uint8_t bits) { \
         int##w##_t res; \
-        if ((uint##w##_t)rhs < (uint##w##_t)bits && !zig_shlo_i##w(&res, lhs, (uint8_t)rhs, bits)) return res; \
-        return lhs < INT##w##_C(0) ? zig_minInt_i(w, bits) : zig_maxInt_i(w, bits); \
+        if (rhs < bits && !zig_shlo_i##w(&res, lhs, rhs, bits)) return res; \
+        return lhs == INT##w##_C(0) ? INT##w##_C(0) : \
+            lhs < INT##w##_C(0) ? zig_minInt_i(w, bits) : zig_maxInt_i(w, bits); \
     } \
 \
     static inline uint##w##_t zig_adds_u##w(uint##w##_t lhs, uint##w##_t rhs, uint8_t bits) { \
@@ -1851,15 +1852,23 @@ static inline bool zig_shlo_i128(zig_i128 *res, zig_i128 lhs, uint8_t rhs, uint8
 
 static inline zig_u128 zig_shls_u128(zig_u128 lhs, zig_u128 rhs, uint8_t bits) {
     zig_u128 res;
-    if (zig_cmp_u128(rhs, zig_make_u128(0, bits)) >= INT32_C(0))
-        return zig_cmp_u128(lhs, zig_make_u128(0, 0)) != INT32_C(0) ? zig_maxInt_u(128, bits) : lhs;
-    return zig_shlo_u128(&res, lhs, (uint8_t)zig_lo_u128(rhs), bits) ? zig_maxInt_u(128, bits) : res;
+    if (zig_cmp_u128(rhs, zig_make_u128(0, bits)) < INT32_C(0) && !zig_shlo_u128(&res, lhs, (uint8_t)zig_lo_u128(rhs), bits)) return res;
+    switch (zig_cmp_u128(lhs, zig_make_u128(0, 0))) {
+        case 0: return zig_make_i128(0, 0);
+        case 1: return zig_maxInt_u(128, bits);
+        default: zig_unreachable();
+    }
 }
 
-static inline zig_i128 zig_shls_i128(zig_i128 lhs, zig_i128 rhs, uint8_t bits) {
+static inline zig_i128 zig_shls_i128(zig_i128 lhs, zig_u128 rhs, uint8_t bits) {
     zig_i128 res;
-    if (zig_cmp_u128(zig_bitCast_u128(rhs), zig_make_u128(0, bits)) < INT32_C(0) && !zig_shlo_i128(&res, lhs, (uint8_t)zig_lo_i128(rhs), bits)) return res;
-    return zig_cmp_i128(lhs, zig_make_i128(0, 0)) < INT32_C(0) ? zig_minInt_i(128, bits) : zig_maxInt_i(128, bits);
+    if (zig_cmp_u128(rhs, zig_make_u128(0, bits)) < INT32_C(0) && !zig_shlo_i128(&res, lhs, (uint8_t)zig_lo_u128(rhs), bits)) return res;
+    switch (zig_cmp_i128(lhs, zig_make_i128(0, 0))) {
+        case -1: return zig_minInt_i(128, bits);
+        case  0: return zig_make_i128(0, 0);
+        case  1: return zig_maxInt_i(128, bits);
+        default: zig_unreachable();
+    }
 }
 
 static inline zig_u128 zig_adds_u128(zig_u128 lhs, zig_u128 rhs, uint8_t bits) {
 
@@ -257,7 +257,9 @@ pub const Inst = struct {
         /// it shifts out any bits that disagree with the resultant sign bit.
         /// Uses the `bin_op` field.
         shl_exact,
-        /// Saturating integer shift left. `<<|`
+        /// Saturating integer shift left. `<<|`. The result is the same type as the `lhs`.
+        /// The `rhs` must have the same vector shape as the `lhs`, but with any unsigned
+        /// integer as the scalar type.
         /// Uses the `bin_op` field.
         shl_sat,
         /// Bitwise XOR. `^`
 
@@ -14215,14 +14215,15 @@ fn zirShl(
     const rhs_ty = sema.typeOf(rhs);
 
     const src = block.nodeOffset(inst_data.src_node);
-    const lhs_src = switch (air_tag) {
-        .shl, .shl_sat => block.src(.{ .node_offset_bin_lhs = inst_data.src_node }),
-        .shl_exact => block.builtinCallArgSrc(inst_data.src_node, 0),
-        else => unreachable,
-    };
-    const rhs_src = switch (air_tag) {
-        .shl, .shl_sat => block.src(.{ .node_offset_bin_rhs = inst_data.src_node }),
-        .shl_exact => block.builtinCallArgSrc(inst_data.src_node, 1),
+    const lhs_src, const rhs_src = switch (air_tag) {
+        .shl, .shl_sat => .{
+            block.src(.{ .node_offset_bin_lhs = inst_data.src_node }),
+            block.src(.{ .node_offset_bin_rhs = inst_data.src_node }),
+        },
+        .shl_exact => .{
+            block.builtinCallArgSrc(inst_data.src_node, 0),
+            block.builtinCallArgSrc(inst_data.src_node, 1),
+        },
         else => unreachable,
     };
 
@@ -14231,8 +14232,7 @@ fn zirShl(
     const scalar_ty = lhs_ty.scalarType(zcu);
     const scalar_rhs_ty = rhs_ty.scalarType(zcu);
 
-    // TODO coerce rhs if air_tag is not shl_sat
-    const rhs_is_comptime_int = try sema.checkIntType(block, rhs_src, scalar_rhs_ty);
+    _ = try sema.checkIntType(block, rhs_src, scalar_rhs_ty);
 
     const maybe_lhs_val = try sema.resolveValueResolveLazy(lhs);
     const maybe_rhs_val = try sema.resolveValueResolveLazy(rhs);
@@ -14245,7 +14245,7 @@ fn zirShl(
         if (try rhs_val.compareAllWithZeroSema(.eq, pt)) {
             return lhs;
         }
-        if (scalar_ty.zigTypeTag(zcu) != .comptime_int and air_tag != .shl_sat) {
+        if (air_tag != .shl_sat and scalar_ty.zigTypeTag(zcu) != .comptime_int) {
             const bit_value = try pt.intValue(Type.comptime_int, scalar_ty.intInfo(zcu).bits);
             if (rhs_ty.zigTypeTag(zcu) == .vector) {
                 var i: usize = 0;
@@ -14282,6 +14282,8 @@ fn zirShl(
                 rhs_val.fmtValueSema(pt, sema),
             });
         }
+    } else if (scalar_rhs_ty.isSignedInt(zcu)) {
+        return sema.fail(block, rhs_src, "shift by signed type '{}'", .{rhs_ty.fmt(pt)});
     }
 
     const runtime_src = if (maybe_lhs_val) |lhs_val| rs: {
@@ -14309,18 +14311,34 @@ fn zirShl(
         return Air.internedToRef(val.toIntern());
     } else lhs_src;
 
-    const new_rhs = if (air_tag == .shl_sat) rhs: {
-        // Limit the RHS type for saturating shl to be an integer as small as the LHS.
-        if (rhs_is_comptime_int or
-            scalar_rhs_ty.intInfo(zcu).bits > scalar_ty.intInfo(zcu).bits)
-        {
-            const max_int = Air.internedToRef((try lhs_ty.maxInt(pt, lhs_ty)).toIntern());
-            const rhs_limited = try sema.analyzeMinMax(block, rhs_src, .min, &.{ rhs, max_int }, &.{ rhs_src, rhs_src });
-            break :rhs try sema.intCast(block, src, lhs_ty, rhs_src, rhs_limited, rhs_src, false, false);
-        } else {
-            break :rhs rhs;
-        }
-    } else rhs;
+    const rt_rhs = switch (air_tag) {
+        else => unreachable,
+        .shl, .shl_exact => rhs,
+        // The backend can handle a large runtime rhs better than we can, but
+        // we can limit a large comptime rhs better here. This also has the
+        // necessary side effect of preventing rhs from being a `comptime_int`.
+        .shl_sat => if (maybe_rhs_val) |rhs_val| Air.internedToRef(rt_rhs: {
+            const bit_count = scalar_ty.intInfo(zcu).bits;
+            const rt_rhs_scalar_ty = try pt.smallestUnsignedInt(bit_count);
+            if (!rhs_ty.isVector(zcu)) break :rt_rhs (try pt.intValue(
+                rt_rhs_scalar_ty,
+                @min(try rhs_val.getUnsignedIntSema(pt) orelse bit_count, bit_count),
+            )).toIntern();
+            const rhs_len = rhs_ty.vectorLen(zcu);
+            const rhs_elems = try sema.arena.alloc(InternPool.Index, rhs_len);
+            for (rhs_elems, 0..) |*rhs_elem, i| rhs_elem.* = (try pt.intValue(
+                rt_rhs_scalar_ty,
+                @min(try (try rhs_val.elemValue(pt, i)).getUnsignedIntSema(pt) orelse bit_count, bit_count),
+            )).toIntern();
+            break :rt_rhs try pt.intern(.{ .aggregate = .{
+                .ty = (try pt.vectorType(.{
+                    .len = rhs_len,
+                    .child = rt_rhs_scalar_ty.toIntern(),
+                })).toIntern(),
+                .storage = .{ .elems = rhs_elems },
+            } });
+        }) else rhs,
+    };
 
     try sema.requireRuntimeBlock(block, src, runtime_src);
     if (block.wantSafety()) {
@@ -14374,7 +14392,7 @@ fn zirShl(
             return sema.tupleFieldValByIndex(block, op_ov, 0, op_ov_tuple_ty);
         }
     }
-    return block.addBinOp(air_tag, lhs, new_rhs);
+    return block.addBinOp(air_tag, lhs, rt_rhs);
 }
 
 fn zirShr(
@@ -36432,10 +36450,7 @@ fn generateUnionTagTypeSimple(
     const enum_ty = try ip.getGeneratedTagEnumType(gpa, pt.tid, .{
         .name = name,
         .owner_union_ty = union_type,
-        .tag_ty = if (enum_field_names.len == 0)
-            (try pt.intType(.unsigned, 0)).toIntern()
-        else
-            (try pt.smallestUnsignedInt(enum_field_names.len - 1)).toIntern(),
+        .tag_ty = (try pt.smallestUnsignedInt(enum_field_names.len -| 1)).toIntern(),
         .names = enum_field_names,
         .values = &.{},
         .tag_mode = .auto,
 
@@ -4132,10 +4132,10 @@ pub const empty_tuple: Type = .{ .ip_index = .empty_tuple_type };
 pub const generic_poison: Type = .{ .ip_index = .generic_poison_type };
 
 pub fn smallestUnsignedBits(max: u64) u16 {
-    if (max == 0) return 0;
-    const base = std.math.log2(max);
-    const upper = (@as(u64, 1) << @as(u6, @intCast(base))) - 1;
-    return @as(u16, @intCast(base + @intFromBool(upper < max)));
+    return switch (max) {
+        0 => 0,
+        else => 1 + std.math.log2_int(u64, max),
+    };
 }
 
 /// This is only used for comptime asserts. Bump this number when you make a change
Original file line number	Diff line number	Diff line change
`@@ -2295,8 +2295,6 @@ test "sat shift-left signed simple positive" {`
`2295`	`2295`	`}`
`2296`	`2296`
`2297`	`2297`	`test "sat shift-left signed multi positive" {`
`2298`		`- if (builtin.zig_backend == .stage2_x86_64) return error.SkipZigTest;`
`2299`		`-`
`2300`	`2298`	`var x: SignedDoubleLimb = 1;`
`2301`	`2299`	`_ = &x;`
`2302`	`2300`
`@@ -2310,8 +2308,6 @@ test "sat shift-left signed multi positive" {`
`2310`	`2308`	`}`
`2311`	`2309`
`2312`	`2310`	`test "sat shift-left signed multi negative" {`
`2313`		`- if (builtin.zig_backend == .stage2_x86_64) return error.SkipZigTest;`
`2314`		`-`
`2315`	`2311`	`var x: SignedDoubleLimb = -1;`
`2316`	`2312`	`_ = &x;`
`2317`	`2313`