add x86_64 subtraction support for gen_dev

2025-10-01 07:41:12 +00:00 · 2021-01-13 20:56:33 +01:00 · 2021-01-13 20:56:33 +01:00 · dfed317f8e
commit dfed317f8e
parent 05637eb3f8
5 changed files with 87 additions and 2 deletions
--- a/compiler/gen_dev/src/generic64/aarch64.rs
+++ b/compiler/gen_dev/src/generic64/aarch64.rs
@ -307,6 +307,16 @@ impl Assembler<AArch64GPReg> for AArch64Assembler {
        }
    }
    /// Placeholder for three-register 64-bit subtraction on AArch64.
    ///
    /// Not implemented: calling this always panics via `unimplemented!`, and
    /// none of the arguments are used (hence the leading underscores).
    #[inline(always)]
    fn sub_reg64_reg64_reg64(
        _buf: &mut Vec<'_, u8>,
        _dst: AArch64GPReg,
        _src1: AArch64GPReg,
        _src2: AArch64GPReg,
    ) {
        unimplemented!("registers subtractions not implemented yet for AArch64");
    }
    #[inline(always)]
    fn ret(buf: &mut Vec<'_, u8>) {
        ret_reg64(buf, AArch64GPReg::LR)
--- a/compiler/gen_dev/src/generic64/mod.rs
+++ b/compiler/gen_dev/src/generic64/mod.rs
@ -51,6 +51,7 @@ pub trait Assembler<GPReg: GPRegTrait> {
    fn mov_reg64_stack32(buf: &mut Vec<'_, u8>, dst: GPReg, offset: i32);
    fn mov_stack32_reg64(buf: &mut Vec<'_, u8>, offset: i32, src: GPReg);
    fn sub_reg64_reg64_imm32(buf: &mut Vec<'_, u8>, dst: GPReg, src1: GPReg, imm32: i32);
    /// Intended contract: append code to `buf` that leaves `src1 - src2` in `dst`.
    /// Operand order matters (subtraction is not commutative), and `dst` may be
    /// the same register as either source.
    fn sub_reg64_reg64_reg64(buf: &mut Vec<'_, u8>, dst: GPReg, src1: GPReg, src2: GPReg);
    fn ret(buf: &mut Vec<'_, u8>);
 }
@ -194,6 +195,19 @@ impl<'a, GPReg: GPRegTrait, ASM: Assembler<GPReg>, CC: CallConv<GPReg>> Backend<
        Ok(())
    }
    /// Lowers an i64 subtraction: claims a register for `dst`, brings `src1`
    /// and `src2` into registers, then asks the assembler to emit
    /// `dst = src1 - src2`.
    ///
    /// Any error from claiming or loading a register is returned unchanged.
    fn build_num_sub_i64(
        &mut self,
        dst: &Symbol,
        src1: &Symbol,
        src2: &Symbol,
    ) -> Result<(), String> {
        // Order is deliberate: destination first, then minuend, then subtrahend.
        // NOTE(review): these calls presumably mutate register-allocation state,
        // so they must not be reordered.
        let out = self.claim_gp_reg(dst)?;
        let (minuend, subtrahend) = (self.load_to_reg(src1)?, self.load_to_reg(src2)?);
        ASM::sub_reg64_reg64_reg64(&mut self.buf, out, minuend, subtrahend);
        Ok(())
    }
    fn load_literal(&mut self, sym: &Symbol, lit: &Literal<'a>) -> Result<(), String> {
        match lit {
            Literal::Int(x) => {
--- a/compiler/gen_dev/src/generic64/x86_64.rs
+++ b/compiler/gen_dev/src/generic64/x86_64.rs
@ -310,6 +310,22 @@ impl Assembler<X86_64GPReg> for X86_64Assembler {
        }
    }
    #[inline(always)]
    fn sub_reg64_reg64_reg64(
        buf: &mut Vec<'_, u8>,
        dst: X86_64GPReg,
        src1: X86_64GPReg,
        src2: X86_64GPReg,
    ) {
        if dst == src1 {
            sub_reg64_reg64(buf, dst, src2);
        } else if dst == src2 {
            sub_reg64_reg64(buf, dst, src1);
        } else {
            mov_reg64_reg64(buf, dst, src1);
            sub_reg64_reg64(buf, dst, src2);
        }
    }
    /// Trait entry point that forwards to the free function `ret` with the
    /// same buffer.
    #[inline(always)]
    fn ret(buf: &mut Vec<'_, u8>) {
        // An unqualified `ret` resolves to the module-level function, not to
        // this associated function, so this call is not recursive.
        ret(buf);
    }
@ -379,6 +395,16 @@ fn add_reg64_reg64(buf: &mut Vec<'_, u8>, dst: X86_64GPReg, src: X86_64GPReg) {
    buf.extend(&[rex, 0x01, 0xC0 + dst_mod + src_mod]);
 }
 /// `SUB r/m64,r64` -> Subtract r64 from r/m64.
 ///
 /// Appends three bytes to `buf`: the REX prefix (built from `REX_W` plus the
 /// extension bits for `dst` and `src`), the opcode `0x29`, and a
 /// register-direct ModRM byte with `src` in the reg field and `dst` in the
 /// r/m field.
 #[inline(always)]
 fn sub_reg64_reg64(buf: &mut Vec<'_, u8>, dst: X86_64GPReg, src: X86_64GPReg) {
    let prefix = add_reg_extension(src, add_rm_extension(dst, REX_W));
    // Only the low three bits of each register number go into ModRM.
    let rm_bits = dst as u8 % 8;
    let reg_bits = (src as u8 % 8) << 3;
    // 0xC0 selects register-direct addressing; the fields occupy disjoint bits.
    let modrm = 0xC0 | reg_bits | rm_bits;
    buf.extend(&[prefix, 0x29, modrm]);
 }
 /// `CMOVL r64,r/m64` -> Move if less (SF ≠ OF).
 #[inline(always)]
 fn cmovl_reg64_reg64(buf: &mut Vec<'_, u8>, dst: X86_64GPReg, src: X86_64GPReg) {
--- a/compiler/gen_dev/src/lib.rs
+++ b/compiler/gen_dev/src/lib.rs
@ -24,7 +24,7 @@ pub struct Env<'a> {
 }
 // INLINED_SYMBOLS is a set of all of the functions we automatically inline if seen.
-const INLINED_SYMBOLS: [Symbol; 2] = [Symbol::NUM_ABS, Symbol::NUM_ADD];
+const INLINED_SYMBOLS: [Symbol; 3] = [Symbol::NUM_ABS, Symbol::NUM_ADD, Symbol::NUM_SUB];
 // These relocations likely will need a length.
 // They may even need more definition, but this should be at least good enough for how we will use elf.
@ -130,6 +130,10 @@ where
                                // Instead of calling the function, just inline it.
                                self.build_run_low_level(sym, &LowLevel::NumAdd, arguments, layout)
                            }
                            Symbol::NUM_SUB => {
                                // Instead of calling the function, just inline it.
                                self.build_run_low_level(sym, &LowLevel::NumSub, arguments, layout)
                            }
                            x => Err(format!("the function, {:?}, is not yet implemented", x)),
                        }
                    }
@ -172,6 +176,15 @@ where
                    x => Err(format!("layout, {:?}, not implemented yet", x)),
                }
            }
            LowLevel::NumSub => {
                // TODO: when this is expanded to floats, deal with typecasting here, and then call the correct low level method.
                match layout {
                    Layout::Builtin(Builtin::Int64) => {
                        self.build_num_sub_i64(sym, &args[0], &args[1])
                    }
                    x => Err(format!("layout, {:?}, not implemented yet", x)),
                }
            }
            x => Err(format!("low level, {:?}. is not yet implemented", x)),
        }
    }
@ -180,7 +193,7 @@ where
    /// It only deals with inputs and outputs of i64 type.
    fn build_num_abs_i64(&mut self, dst: &Symbol, src: &Symbol) -> Result<(), String>;
-    /// build_num_add_i64 stores the absolute value of src into dst.
+    /// build_num_add_i64 stores the sum of src1 and src2 into dst.
    /// It only deals with inputs and outputs of i64 type.
    fn build_num_add_i64(
        &mut self,
@ -189,6 +202,15 @@ where
        src2: &Symbol,
    ) -> Result<(), String>;
    /// build_num_sub_i64 stores the difference `src1 - src2` into dst.
    /// It only deals with inputs and outputs of i64 type.
    fn build_num_sub_i64(
        &mut self,
        dst: &Symbol,
        src1: &Symbol,
        src2: &Symbol,
    ) -> Result<(), String>;
    /// literal_map gets the map from symbol to literal, used for lazy loading and literal folding.
    fn literal_map(&mut self) -> &mut MutMap<Symbol, Literal<'a>>;
--- a/compiler/gen_dev/tests/gen_num.rs
+++ b/compiler/gen_dev/tests/gen_num.rs
@ -40,6 +40,19 @@ mod gen_num {
        );
    }
    #[test]
    fn gen_sub_i64() {
        // Chained subtraction: the program `1 - 2 - 3` is expected to evaluate
        // to -4 as an i64, i.e. grouped as (1 - 2) - 3.
        assert_evals_to!(
            indoc!(
                r#"
                    1 - 2 - 3
                "#
            ),
            -4,
            i64
        );
    }
    #[test]
    fn i64_force_stack() {
        // This claims 33 registers. One more than Arm and RISC-V, and many more than x86-64.