mirror of
https://github.com/ziglang/zig.git
synced 2026-01-10 17:35:12 +00:00
x64: handle signed mul_with_overflow for non-pow-2 ints
This commit is contained in:
parent
ebfc2825ab
commit
0fc1e8b54f
@ -1086,29 +1086,7 @@ fn airTrunc(self: *Self, inst: Air.Inst.Index) !void {
|
||||
// have to be removed. this only happens if the dst if not a power-of-two size.
|
||||
const dst_bit_size = dst_ty.bitSize(self.target.*);
|
||||
if (!math.isPowerOfTwo(dst_bit_size) or dst_bit_size < 8) {
|
||||
const max_reg_bit_width = Register.rax.size();
|
||||
const shift = @intCast(u6, max_reg_bit_width - dst_ty.bitSize(self.target.*));
|
||||
const mask = (~@as(u64, 0)) >> shift;
|
||||
try self.genBinMathOpMir(.@"and", Type.usize, .{ .register = reg }, .{ .immediate = mask });
|
||||
|
||||
if (src_ty.intInfo(self.target.*).signedness == .signed) {
|
||||
_ = try self.addInst(.{
|
||||
.tag = .sal,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = reg,
|
||||
.flags = 0b10,
|
||||
}).encode(),
|
||||
.data = .{ .imm = shift },
|
||||
});
|
||||
_ = try self.addInst(.{
|
||||
.tag = .sar,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = reg,
|
||||
.flags = 0b10,
|
||||
}).encode(),
|
||||
.data = .{ .imm = shift },
|
||||
});
|
||||
}
|
||||
try self.truncateRegister(dst_ty, reg);
|
||||
}
|
||||
|
||||
return self.finishAir(inst, .{ .register = reg }, .{ ty_op.operand, .none, .none });
|
||||
@ -1478,31 +1456,119 @@ fn airMulWithOverflow(self: *Self, inst: Air.Inst.Index) !void {
|
||||
switch (ty.zigTypeTag()) {
|
||||
.Vector => return self.fail("TODO implement mul_with_overflow for Vector type", .{}),
|
||||
.Int => {
|
||||
try self.spillCompareFlagsIfOccupied();
|
||||
self.compare_flags_inst = null;
|
||||
|
||||
const int_info = ty.intInfo(self.target.*);
|
||||
|
||||
if (int_info.bits > 64) {
|
||||
return self.fail("TODO implement mul_with_overflow for Ints larger than 64bits", .{});
|
||||
}
|
||||
|
||||
// Spill .rax and .rdx upfront to ensure we don't spill the operands too late.
|
||||
try self.register_manager.getReg(.rax, inst);
|
||||
try self.register_manager.getReg(.rdx, null);
|
||||
self.register_manager.freezeRegs(&.{ .rax, .rdx });
|
||||
defer self.register_manager.unfreezeRegs(&.{ .rax, .rdx });
|
||||
if (math.isPowerOfTwo(int_info.bits)) {
|
||||
// Spill .rax and .rdx upfront to ensure we don't spill the operands too late.
|
||||
try self.register_manager.getReg(.rax, inst);
|
||||
try self.register_manager.getReg(.rdx, null);
|
||||
self.register_manager.freezeRegs(&.{ .rax, .rdx });
|
||||
defer self.register_manager.unfreezeRegs(&.{ .rax, .rdx });
|
||||
|
||||
const lhs = try self.resolveInst(bin_op.lhs);
|
||||
const rhs = try self.resolveInst(bin_op.rhs);
|
||||
|
||||
try self.genIntMulDivOpMir(switch (int_info.signedness) {
|
||||
.signed => .imul,
|
||||
.unsigned => .mul,
|
||||
}, ty, int_info.signedness, lhs, rhs);
|
||||
|
||||
const result: MCValue = switch (int_info.signedness) {
|
||||
.signed => .{ .register_overflow_signed = .rax },
|
||||
.unsigned => .{ .register_overflow_unsigned = .rax },
|
||||
};
|
||||
break :result result;
|
||||
}
|
||||
|
||||
const lhs = try self.resolveInst(bin_op.lhs);
|
||||
const rhs = try self.resolveInst(bin_op.rhs);
|
||||
|
||||
try self.genIntMulDivOpMir(switch (int_info.signedness) {
|
||||
.signed => .imul,
|
||||
.unsigned => .mul,
|
||||
}, ty, int_info.signedness, lhs, rhs);
|
||||
rhs.freezeIfRegister(&self.register_manager);
|
||||
defer rhs.unfreezeIfRegister(&self.register_manager);
|
||||
|
||||
const result: MCValue = switch (int_info.signedness) {
|
||||
.signed => .{ .register_overflow_signed = .rax },
|
||||
.unsigned => .{ .register_overflow_unsigned = .rax },
|
||||
// TODO check if we could reuse rhs instead, and swap the values out.
|
||||
const dst_mcv = blk: {
|
||||
if (self.reuseOperand(inst, bin_op.lhs, 0, lhs)) {
|
||||
if (lhs.isRegister()) break :blk lhs;
|
||||
}
|
||||
break :blk MCValue{ .register = try self.copyToTmpRegister(ty, lhs) };
|
||||
};
|
||||
break :result result;
|
||||
dst_mcv.freezeIfRegister(&self.register_manager);
|
||||
defer dst_mcv.unfreezeIfRegister(&self.register_manager);
|
||||
|
||||
const rhs_mcv = blk: {
|
||||
if (rhs.isRegister() or rhs.isMemory()) break :blk rhs;
|
||||
break :blk MCValue{ .register = try self.copyToTmpRegister(ty, rhs) };
|
||||
};
|
||||
rhs_mcv.freezeIfRegister(&self.register_manager);
|
||||
defer rhs_mcv.unfreezeIfRegister(&self.register_manager);
|
||||
|
||||
const tuple_ty = self.air.typeOfIndex(inst);
|
||||
const tuple_size = @intCast(u32, tuple_ty.abiSize(self.target.*));
|
||||
const tuple_align = tuple_ty.abiAlignment(self.target.*);
|
||||
const overflow_bit_offset = @intCast(i32, tuple_ty.structFieldOffset(1, self.target.*));
|
||||
|
||||
const stack_offset = @intCast(i32, try self.allocMem(inst, tuple_size, tuple_align));
|
||||
const extended_ty = switch (int_info.signedness) {
|
||||
.signed => Type.isize,
|
||||
.unsigned => ty,
|
||||
};
|
||||
|
||||
try self.genIntMulComplexOpMir(extended_ty, dst_mcv, rhs_mcv);
|
||||
|
||||
const temp_regs = try self.register_manager.allocRegs(3, .{ null, null, null });
|
||||
self.register_manager.freezeRegs(&temp_regs);
|
||||
defer self.register_manager.unfreezeRegs(&temp_regs);
|
||||
|
||||
const overflow_reg = temp_regs[0];
|
||||
const flags: u2 = switch (int_info.signedness) {
|
||||
.signed => 0b00,
|
||||
.unsigned => 0b10,
|
||||
};
|
||||
_ = try self.addInst(.{
|
||||
.tag = .cond_set_byte_overflow,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = overflow_reg.to8(),
|
||||
.flags = flags,
|
||||
}).encode(),
|
||||
.data = undefined,
|
||||
});
|
||||
|
||||
const scratch_reg = temp_regs[1];
|
||||
try self.genSetReg(extended_ty, scratch_reg, dst_mcv);
|
||||
try self.truncateRegister(ty, scratch_reg);
|
||||
try self.genBinMathOpMir(.cmp, extended_ty, dst_mcv, .{ .register = scratch_reg });
|
||||
|
||||
const eq_reg = temp_regs[2];
|
||||
_ = try self.addInst(.{
|
||||
.tag = .cond_set_byte_eq_ne,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = eq_reg.to8(),
|
||||
.flags = 0b00,
|
||||
}).encode(),
|
||||
.data = undefined,
|
||||
});
|
||||
|
||||
try self.genBinMathOpMir(
|
||||
.@"or",
|
||||
Type.u8,
|
||||
.{ .register = overflow_reg },
|
||||
.{ .register = eq_reg },
|
||||
);
|
||||
|
||||
try self.genSetStack(ty, stack_offset, .{ .register = scratch_reg }, .{});
|
||||
try self.genSetStack(Type.initTag(.u1), stack_offset - overflow_bit_offset, .{
|
||||
.register = overflow_reg.to8(),
|
||||
}, .{});
|
||||
|
||||
break :result MCValue{ .stack_offset = stack_offset };
|
||||
},
|
||||
else => unreachable,
|
||||
}
|
||||
@ -1648,7 +1714,7 @@ fn genInlineIntDivFloor(self: *Self, ty: Type, lhs: MCValue, rhs: MCValue) !MCVa
|
||||
}).encode(),
|
||||
.data = undefined,
|
||||
});
|
||||
try self.genBinMathOpMir(.add, Type.isize, .{ .register = divisor.to64() }, .{ .register = .rax });
|
||||
try self.genBinMathOpMir(.add, Type.isize, .{ .register = divisor }, .{ .register = .rax });
|
||||
return MCValue{ .register = divisor };
|
||||
}
|
||||
|
||||
@ -2222,8 +2288,8 @@ fn genSliceElemPtr(self: *Self, lhs: Air.Inst.Ref, rhs: Air.Inst.Ref) !MCValue {
|
||||
}
|
||||
// TODO we could allocate register here, but need to expect addr register and potentially
|
||||
// offset register.
|
||||
try self.genBinMathOpMir(.add, slice_ptr_field_type, .{ .register = addr_reg.to64() }, .{
|
||||
.register = offset_reg.to64(),
|
||||
try self.genBinMathOpMir(.add, slice_ptr_field_type, .{ .register = addr_reg }, .{
|
||||
.register = offset_reg,
|
||||
});
|
||||
return MCValue{ .register = addr_reg.to64() };
|
||||
}
|
||||
@ -2315,7 +2381,7 @@ fn airArrayElemVal(self: *Self, inst: Air.Inst.Index) !void {
|
||||
// TODO we could allocate register here, but need to expect addr register and potentially
|
||||
// offset register.
|
||||
const dst_mcv = try self.allocRegOrMem(inst, false);
|
||||
try self.genBinMathOpMir(.add, array_ty, .{ .register = addr_reg.to64() }, .{ .register = offset_reg.to64() });
|
||||
try self.genBinMathOpMir(.add, Type.usize, .{ .register = addr_reg }, .{ .register = offset_reg });
|
||||
try self.load(dst_mcv, .{ .register = addr_reg.to64() }, array_ty);
|
||||
break :result dst_mcv;
|
||||
};
|
||||
@ -3178,8 +3244,8 @@ fn genBinMathOpMir(self: *Self, mir_tag: Mir.Inst.Tag, dst_ty: Type, dst_mcv: MC
|
||||
_ = try self.addInst(.{
|
||||
.tag = mir_tag,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = registerAlias(dst_reg, @divExact(src_reg.size(), 8)),
|
||||
.reg2 = src_reg,
|
||||
.reg1 = registerAlias(dst_reg, abi_size),
|
||||
.reg2 = registerAlias(src_reg, abi_size),
|
||||
}).encode(),
|
||||
.data = undefined,
|
||||
});
|
||||
@ -6531,3 +6597,36 @@ fn shiftRegister(self: *Self, reg: Register, shift: u8) !void {
|
||||
});
|
||||
}
|
||||
}
|
||||
|
||||
/// Truncates the value in the register in place.
|
||||
/// Clobbers any remaining bits.
|
||||
fn truncateRegister(self: *Self, ty: Type, reg: Register) !void {
|
||||
const int_info = ty.intInfo(self.target.*);
|
||||
const max_reg_bit_width = Register.rax.size();
|
||||
switch (int_info.signedness) {
|
||||
.signed => {
|
||||
const shift = @intCast(u6, max_reg_bit_width - int_info.bits);
|
||||
_ = try self.addInst(.{
|
||||
.tag = .sal,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = reg.to64(),
|
||||
.flags = 0b10,
|
||||
}).encode(),
|
||||
.data = .{ .imm = shift },
|
||||
});
|
||||
_ = try self.addInst(.{
|
||||
.tag = .sar,
|
||||
.ops = (Mir.Ops{
|
||||
.reg1 = reg.to64(),
|
||||
.flags = 0b10,
|
||||
}).encode(),
|
||||
.data = .{ .imm = shift },
|
||||
});
|
||||
},
|
||||
.unsigned => {
|
||||
const shift = @intCast(u6, max_reg_bit_width - int_info.bits);
|
||||
const mask = (~@as(u64, 0)) >> shift;
|
||||
try self.genBinMathOpMir(.@"and", Type.usize, .{ .register = reg }, .{ .immediate = mask });
|
||||
},
|
||||
}
|
||||
}
|
||||
|
||||
@ -1383,7 +1383,7 @@ inline fn getOpCode(tag: Tag, enc: Encoding, is_one_byte: bool) ?OpCode {
|
||||
.sub => OpCode.oneByte(if (is_one_byte) 0x2a else 0x2b),
|
||||
.xor => OpCode.oneByte(if (is_one_byte) 0x32 else 0x33),
|
||||
.@"and" => OpCode.oneByte(if (is_one_byte) 0x22 else 0x23),
|
||||
.@"or" => OpCode.oneByte(if (is_one_byte) 0x0b else 0x0b),
|
||||
.@"or" => OpCode.oneByte(if (is_one_byte) 0x0a else 0x0b),
|
||||
.sbb => OpCode.oneByte(if (is_one_byte) 0x1a else 0x1b),
|
||||
.cmp => OpCode.oneByte(if (is_one_byte) 0x3a else 0x3b),
|
||||
.mov => OpCode.oneByte(if (is_one_byte) 0x8a else 0x8b),
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user