|
| 1 | +Refs: |
| 2 | + |
| 3 | +- https://arxiv.org/pdf/1607.02318 |
| 4 | + |
| 5 | +- https://en.wikichip.org/wiki/macro-operation_fusion#RISC-V |
| 6 | + |
| 7 | +- https://github.com/llvm/llvm-project/blob/173907b5d77115623f160978a95159e36e05ee6c/llvm/lib/Target/RISCV/RISCVMacroFusion.td |
| 8 | + |
| 9 | +--- |
| 10 | + |
| 11 | +Load immediate |
| 12 | + |
| 13 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 14 | +| Instructions | Fusion condition | Fused instruction | |
| 15 | ++===========================+=================================================+======================================+ |
| 16 | +| auipc rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | addi rd_b, x0, (imm_a + imm_b) | |
| 17 | +| addi rd_b, rs1_b, imm_b | | | |
| 18 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 19 | +| lui rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b && rs1_b != rs2_b | addi rd_a, rs2_b, imm_a | |
| 20 | +| add rd_b, rs1_b, rs2_b | | | |
| 21 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 22 | +| lui rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | addi rd_b, x0, (imm_a + imm_b) | |
| 23 | +| addi rd_b, rs1_b, imm_b | | | |
| 24 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 25 | +| lui rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | addiw rd_b, x0, (imm_a + imm_b) | |
| 26 | +| addiw rd_b, rs1_b, imm_b | | | |
| 27 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 28 | + |
| 29 | +Op |
| 30 | + |
| 31 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 32 | +| Instructions | Fusion condition | Fused instruction | |
| 33 | ++===========================+=================================================+======================================+ |
| 34 | +| sub rd_a, x0, rs2_a | rd_a == rd_b && rd_a == rs1_b | abs rd_b, rs2_a | |
| 35 | +| max rd_b, rs1_b, rs2_b | | | |
| 36 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 37 | + |
| 38 | +Jump |
| 39 | + |
| 40 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 41 | +| Instructions | Fusion condition | Fused instruction | |
| 42 | ++===========================+=================================================+======================================+ |
| 43 | +| auipc rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | jal rd_b, (imm_a + imm_b) | |
| 44 | +| jalr rd_b, imm_b(rs1_b) | | | |
| 45 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 46 | + |
| 47 | +Load |
| 48 | + |
| 49 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 50 | +| Instructions | Fusion condition | Fused instruction | |
| 51 | ++===========================+=================================================+======================================+ |
| 52 | +| auipc rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | ld.pc rd_b, (imm_a + imm_b)pc | |
| 53 | +| ld rd_b, imm_b(rs1_b) | | | |
| 54 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 55 | +| lui rd_a, imm_a | rd_a == rd_b && rd_a == rs1_b | ld rd_b, (imm_a + imm_b)x0 | |
| 56 | +| ld rd_b, imm_b(rs1_b) | | | |
| 57 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 58 | +| add rd_a, rs1_a, rs2_a | rd_a == rd_b && rd_a == rs1_b && imm_b == 0 | ld.add rd_b, (rs1_a)(rs2_a) | |
| 59 | +| ld rd_b, imm_b(rs1_b) | | | |
| 60 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 61 | +| sh1add rd_a, rs1_a, rs2_a | rd_a == rd_b && rd_a == rs1_b && imm_b == 0 | ld.sh1add rd_b, rs1_a, rs2_a | |
| 62 | +| ld rd_b, imm_b(rs1_b) | | | |
| 63 | ++---------------------------+-------------------------------------------------+--------------------------------------+ |
| 64 | + |
| 65 | +--- |
| 66 | + |
| 67 | +Fused instruction length |
| 68 | + |
| 69 | ++------+-------+-------+------+------+------+ |
| 70 | +| fuse | RVC_2 | RVC_1 | len2 | len4 | len8 | |
| 71 | ++======+=======+=======+======+======+======+ |
| 72 | +| 0 | 0 | 0 | 0 | 1 | 0 | |
| 73 | +| 0 | 0 | 1 | 1 | 0 | 0 | |
| 74 | +| 0 | 1 | 0 | 0 | 1 | 0 | |
| 75 | +| 0 | 1 | 1 | 1 | 0 | 0 | |
| 76 | +| 1 | 0 | 0 | 0 | 0 | 1 | |
| 77 | +| 1 | 0 | 1 | 1 | 1 | 0 | |
| 78 | +| 1 | 1 | 0 | 1 | 1 | 0 | |
| 79 | +| 1 | 1 | 1 | 0 | 1 | 0 | |
| 80 | ++------+-------+-------+------+------+------+ |
0 commit comments