2022-06-24 21:37:18 +00:00
|
|
|
#pragma once
|
|
|
|
|
|
|
|
asm(".set regnum_x0 , 0");
|
|
|
|
asm(".set regnum_x1 , 1");
|
|
|
|
asm(".set regnum_x2 , 2");
|
|
|
|
asm(".set regnum_x3 , 3");
|
|
|
|
asm(".set regnum_x4 , 4");
|
|
|
|
asm(".set regnum_x5 , 5");
|
|
|
|
asm(".set regnum_x6 , 6");
|
|
|
|
asm(".set regnum_x7 , 7");
|
|
|
|
asm(".set regnum_x8 , 8");
|
|
|
|
asm(".set regnum_x9 , 9");
|
|
|
|
asm(".set regnum_x10 , 10");
|
|
|
|
asm(".set regnum_x11 , 11");
|
|
|
|
asm(".set regnum_x12 , 12");
|
|
|
|
asm(".set regnum_x13 , 13");
|
|
|
|
asm(".set regnum_x14 , 14");
|
|
|
|
asm(".set regnum_x15 , 15");
|
|
|
|
asm(".set regnum_x16 , 16");
|
|
|
|
asm(".set regnum_x17 , 17");
|
|
|
|
asm(".set regnum_x18 , 18");
|
|
|
|
asm(".set regnum_x19 , 19");
|
|
|
|
asm(".set regnum_x20 , 20");
|
|
|
|
asm(".set regnum_x21 , 21");
|
|
|
|
asm(".set regnum_x22 , 22");
|
|
|
|
asm(".set regnum_x23 , 23");
|
|
|
|
asm(".set regnum_x24 , 24");
|
|
|
|
asm(".set regnum_x25 , 25");
|
|
|
|
asm(".set regnum_x26 , 26");
|
|
|
|
asm(".set regnum_x27 , 27");
|
|
|
|
asm(".set regnum_x28 , 28");
|
|
|
|
asm(".set regnum_x29 , 29");
|
|
|
|
asm(".set regnum_x30 , 30");
|
|
|
|
asm(".set regnum_x31 , 31");
|
|
|
|
|
|
|
|
asm(".set regnum_zero, 0");
|
|
|
|
asm(".set regnum_ra , 1");
|
|
|
|
asm(".set regnum_sp , 2");
|
|
|
|
asm(".set regnum_gp , 3");
|
|
|
|
asm(".set regnum_tp , 4");
|
|
|
|
asm(".set regnum_t0 , 5");
|
|
|
|
asm(".set regnum_t1 , 6");
|
|
|
|
asm(".set regnum_t2 , 7");
|
|
|
|
asm(".set regnum_s0 , 8");
|
|
|
|
asm(".set regnum_s1 , 9");
|
|
|
|
asm(".set regnum_a0 , 10");
|
|
|
|
asm(".set regnum_a1 , 11");
|
|
|
|
asm(".set regnum_a2 , 12");
|
|
|
|
asm(".set regnum_a3 , 13");
|
|
|
|
asm(".set regnum_a4 , 14");
|
|
|
|
asm(".set regnum_a5 , 15");
|
|
|
|
asm(".set regnum_a6 , 16");
|
|
|
|
asm(".set regnum_a7 , 17");
|
|
|
|
asm(".set regnum_s2 , 18");
|
|
|
|
asm(".set regnum_s3 , 19");
|
|
|
|
asm(".set regnum_s4 , 20");
|
|
|
|
asm(".set regnum_s5 , 21");
|
|
|
|
asm(".set regnum_s6 , 22");
|
|
|
|
asm(".set regnum_s7 , 23");
|
|
|
|
asm(".set regnum_s8 , 24");
|
|
|
|
asm(".set regnum_s9 , 25");
|
|
|
|
asm(".set regnum_s10 , 26");
|
|
|
|
asm(".set regnum_s11 , 27");
|
|
|
|
asm(".set regnum_t3 , 28");
|
|
|
|
asm(".set regnum_t4 , 29");
|
|
|
|
asm(".set regnum_t5 , 30");
|
|
|
|
asm(".set regnum_t6 , 31");
|
|
|
|
|
|
|
|
#define opcode_ld(opcode, func3, base, imm12, o1, o2) \
|
|
|
|
asm volatile(".word ((" #opcode ") | (regnum_%0 << 7) | (regnum_%2 << 15) | (" #imm12 " << 20) | ((" #func3 ") << 12));" \
|
|
|
|
: "=&r" (o1), "=&r" (o2) \
|
|
|
|
: "r" (base) \
|
|
|
|
); \
|
|
|
|
|
2022-08-20 16:54:30 +00:00
|
|
|
#define _custom_ld(base, imm12, o1, o2) opcode_ld(0x03, 0x03, base, imm12, o1, o2)
|
|
|
|
#define _custom_ldu(base, imm12, o1, o2) opcode_ld(0x03, 0x07, base, imm12, o1, o2)
|
2022-06-24 21:37:18 +00:00
|
|
|
|
|
|
|
#define opcode_sd(opcode, func3, base, imm04, imm511, i1, i2) \
|
|
|
|
asm volatile(".word ((" #opcode ") | (" #imm04 " << 7) | (regnum_%0 << 15) | (regnum_%1 << 20) | (" #imm511 " << 25) | ((" #func3 ") << 12));" \
|
|
|
|
: \
|
|
|
|
: "r" (base), "r" (i1), "r" (i2) \
|
|
|
|
); \
|
|
|
|
|
2022-08-20 16:54:30 +00:00
|
|
|
#define _custom_sd(base, imm04, imm511, i1, i2) opcode_sd(0x23, 0x03, base, imm04, imm511, i1, i2)
|
|
|
|
|
|
|
|
|
|
|
|
#define opcode_p(opcode, func3, func7, rd, rs1, rs2) \
|
|
|
|
asm volatile(".word ((" #opcode ") | (regnum_%0 << 7) | (regnum_%1 << 15) | (regnum_%2 << 20) | ((" #func3 ") << 12) | ((" #func7 ") << 25));" \
|
|
|
|
: "=r" (rd) \
|
|
|
|
: "r" (rs1), "r" (rs2) \
|
|
|
|
);
|
|
|
|
#define opcode_p_ter(opcode, func3, func7, rd, rs1, rs2) \
|
|
|
|
asm volatile(".word ((" #opcode ") | (regnum_%0 << 7) | (regnum_%1 << 15) | (regnum_%2 << 20) | ((" #func3 ") << 12) | ((" #func7 ") << 25));" \
|
|
|
|
: "+r" (rd) \
|
|
|
|
: "r" (rs1), "r" (rs2) \
|
|
|
|
);
|
|
|
|
|
|
|
|
#define _ukadd8(rd, rs1, rs2) opcode_p(0x00000077, 0x00, 0x1c, rd, rs1, rs2)
|
|
|
|
#define _uksub8(rd, rs1, rs2) opcode_p(0x00000077, 0x00, 0x1d, rd, rs1, rs2)
|
|
|
|
#define _ufma8vhv(rd, rs1, rs2) opcode_p_ter(0x00000077, 0x00, 0x64, rd, rs1, rs2)
|
|
|
|
#define _ufma8vlv(rd, rs1, rs2) opcode_p_ter(0x00000077, 0x00, 0x66, rd, rs1, rs2)
|
|
|
|
|
|
|
|
static inline unsigned int ukadd8(const unsigned int a, const unsigned int b) {
|
|
|
|
unsigned int r;
|
|
|
|
_ukadd8(r, a, b);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
static inline unsigned int uksub8(const unsigned int a, const unsigned int b) {
|
|
|
|
unsigned int r;
|
|
|
|
_uksub8(r, a, b);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
|
|
|
|
static inline unsigned int ufma8vhv(const unsigned int a, const unsigned int b, const unsigned int c) {
|
|
|
|
unsigned int r = c;
|
|
|
|
_ufma8vhv(r, a, b);
|
|
|
|
return r;
|
|
|
|
}
|
|
|
|
static inline unsigned int ufma8vlv(const unsigned int a, const unsigned int b, const unsigned int c) {
|
|
|
|
unsigned int r = c;
|
|
|
|
_ufma8vlv(r, a, b);
|
|
|
|
return r;
|
|
|
|
}
|