1 // See LICENSE for license details.
10 struct : public arg_t
{
11 std::string
to_string(insn_t insn
) const {
12 return std::to_string((int)insn
.i_imm()) + '(' + xpr_name
[insn
.rs1()] + ')';
16 struct : public arg_t
{
17 std::string
to_string(insn_t insn
) const {
18 return std::to_string((int)insn
.s_imm()) + '(' + xpr_name
[insn
.rs1()] + ')';
22 struct : public arg_t
{
23 std::string
to_string(insn_t insn
) const {
24 return std::string("(") + xpr_name
[insn
.rs1()] + ')';
28 struct : public arg_t
{
29 std::string
to_string(insn_t insn
) const {
30 return xpr_name
[insn
.rd()];
34 struct : public arg_t
{
35 std::string
to_string(insn_t insn
) const {
36 return xpr_name
[insn
.rs1()];
40 struct : public arg_t
{
41 std::string
to_string(insn_t insn
) const {
42 return xpr_name
[insn
.rs2()];
46 struct : public arg_t
{
47 std::string
to_string(insn_t insn
) const {
48 return fpr_name
[insn
.rd()];
52 struct : public arg_t
{
53 std::string
to_string(insn_t insn
) const {
54 return fpr_name
[insn
.rs1()];
58 struct : public arg_t
{
59 std::string
to_string(insn_t insn
) const {
60 return fpr_name
[insn
.rs2()];
64 struct : public arg_t
{
65 std::string
to_string(insn_t insn
) const {
66 return fpr_name
[insn
.rs3()];
70 struct : public arg_t
{
71 std::string
to_string(insn_t insn
) const {
74 #define DECLARE_CSR(name, num) case num: return #name;
80 snprintf(buf
, sizeof buf
, "unknown_%03" PRIx64
, insn
.csr());
81 return std::string(buf
);
87 struct : public arg_t
{
88 std::string
to_string(insn_t insn
) const {
89 return std::to_string((int)insn
.i_imm());
93 struct : public arg_t
{
94 std::string
to_string(insn_t insn
) const {
96 s
<< std::hex
<< "0x" << ((uint32_t)insn
.u_imm() >> 12);
101 struct : public arg_t
{
102 std::string
to_string(insn_t insn
) const {
103 return std::to_string(insn
.rs1());
107 struct : public arg_t
{
108 std::string
to_string(insn_t insn
) const {
110 int32_t target
= insn
.sb_imm();
111 char sign
= target
>= 0 ? '+' : '-';
112 s
<< "pc " << sign
<< ' ' << abs(target
);
117 struct : public arg_t
{
118 std::string
to_string(insn_t insn
) const {
120 int32_t target
= insn
.uj_imm();
121 char sign
= target
>= 0 ? '+' : '-';
122 s
<< "pc " << sign
<< std::hex
<< " 0x" << abs(target
);
127 struct : public arg_t
{
128 std::string
to_string(insn_t insn
) const {
129 return xpr_name
[insn
.rvc_rs1()];
133 struct : public arg_t
{
134 std::string
to_string(insn_t insn
) const {
135 return xpr_name
[insn
.rvc_rs2()];
139 struct : public arg_t
{
140 std::string
to_string(insn_t insn
) const {
141 return xpr_name
[insn
.rvc_rs1s()];
145 struct : public arg_t
{
146 std::string
to_string(insn_t insn
) const {
147 return xpr_name
[insn
.rvc_rs2s()];
151 struct : public arg_t
{
152 std::string
to_string(insn_t insn
) const {
153 return xpr_name
[X_SP
];
157 struct : public arg_t
{
158 std::string
to_string(insn_t insn
) const {
159 return std::to_string((int)insn
.rvc_imm());
163 struct : public arg_t
{
164 std::string
to_string(insn_t insn
) const {
165 return std::to_string((int)insn
.rvc_addi4spn_imm());
169 struct : public arg_t
{
170 std::string
to_string(insn_t insn
) const {
171 return std::to_string((int)insn
.rvc_addi16sp_imm());
175 struct : public arg_t
{
176 std::string
to_string(insn_t insn
) const {
177 return std::to_string((int)insn
.rvc_lwsp_imm());
181 struct : public arg_t
{
182 std::string
to_string(insn_t insn
) const {
183 return std::to_string((int)(insn
.rvc_imm() & 0x3f));
187 struct : public arg_t
{
188 std::string
to_string(insn_t insn
) const {
190 s
<< std::hex
<< "0x" << (uint32_t)insn
.rvc_imm();
195 struct : public arg_t
{
196 std::string
to_string(insn_t insn
) const {
197 return std::to_string((int)insn
.rvc_lwsp_imm()) + '(' + xpr_name
[X_SP
] + ')';
201 struct : public arg_t
{
202 std::string
to_string(insn_t insn
) const {
203 return std::to_string((int)insn
.rvc_ldsp_imm()) + '(' + xpr_name
[X_SP
] + ')';
207 struct : public arg_t
{
208 std::string
to_string(insn_t insn
) const {
209 return std::to_string((int)insn
.rvc_swsp_imm()) + '(' + xpr_name
[X_SP
] + ')';
213 struct : public arg_t
{
214 std::string
to_string(insn_t insn
) const {
215 return std::to_string((int)insn
.rvc_sdsp_imm()) + '(' + xpr_name
[X_SP
] + ')';
219 struct : public arg_t
{
220 std::string
to_string(insn_t insn
) const {
221 return std::to_string((int)insn
.rvc_lw_imm()) + '(' + xpr_name
[insn
.rvc_rs1s()] + ')';
225 struct : public arg_t
{
226 std::string
to_string(insn_t insn
) const {
227 return std::to_string((int)insn
.rvc_ld_imm()) + '(' + xpr_name
[insn
.rvc_rs1s()] + ')';
231 struct : public arg_t
{
232 std::string
to_string(insn_t insn
) const {
234 int32_t target
= insn
.rvc_b_imm();
235 char sign
= target
>= 0 ? '+' : '-';
236 s
<< "pc " << sign
<< ' ' << abs(target
);
241 struct : public arg_t
{
242 std::string
to_string(insn_t insn
) const {
244 int32_t target
= insn
.rvc_j_imm();
245 char sign
= target
>= 0 ? '+' : '-';
246 s
<< "pc " << sign
<< ' ' << abs(target
);
251 std::string
disassembler_t::disassemble(insn_t insn
) const
253 const disasm_insn_t
* disasm_insn
= lookup(insn
);
254 return disasm_insn
? disasm_insn
->to_string(insn
) : "unknown";
257 disassembler_t::disassembler_t(int xlen
)
259 const uint32_t mask_rd
= 0x1fUL
<< 7;
260 const uint32_t match_rd_ra
= 1UL << 7;
261 const uint32_t mask_rs1
= 0x1fUL
<< 15;
262 const uint32_t match_rs1_ra
= 1UL << 15;
263 const uint32_t mask_rs2
= 0x1fUL
<< 20;
264 const uint32_t mask_imm
= 0xfffUL
<< 20;
265 const uint32_t match_imm_1
= 1UL << 20;
266 const uint32_t mask_rvc_rs2
= 0x1fUL
<< 2;
267 const uint32_t mask_rvc_imm
= mask_rvc_rs2
| 0x1000UL
;
269 #define DECLARE_INSN(code, match, mask) \
270 const uint32_t match_##code = match; \
271 const uint32_t mask_##code = mask;
272 #include "encoding.h"
275 // explicit per-instruction disassembly
276 #define DISASM_INSN(name, code, extra, ...) \
277 add_insn(new disasm_insn_t(name, match_##code, mask_##code | (extra), __VA_ARGS__));
278 #define DEFINE_NOARG(code) \
279 add_insn(new disasm_insn_t(#code, match_##code, mask_##code, {}));
280 #define DEFINE_RTYPE(code) DISASM_INSN(#code, code, 0, {&xrd, &xrs1, &xrs2})
281 #define DEFINE_ITYPE(code) DISASM_INSN(#code, code, 0, {&xrd, &xrs1, &imm})
282 #define DEFINE_I0TYPE(name, code) DISASM_INSN(name, code, mask_rs1, {&xrd, &imm})
283 #define DEFINE_I1TYPE(name, code) DISASM_INSN(name, code, mask_imm, {&xrd, &xrs1})
284 #define DEFINE_I2TYPE(name, code) DISASM_INSN(name, code, mask_rd | mask_imm, {&xrs1})
285 #define DEFINE_LTYPE(code) DISASM_INSN(#code, code, 0, {&xrd, &bigimm})
286 #define DEFINE_BTYPE(code) DISASM_INSN(#code, code, 0, {&xrs1, &xrs2, &branch_target})
287 #define DEFINE_B0TYPE(name, code) DISASM_INSN(name, code, mask_rs1 | mask_rs2, {&branch_target})
288 #define DEFINE_B1TYPE(name, code) DISASM_INSN(name, code, mask_rs2, {&xrs1, &branch_target})
289 #define DEFINE_XLOAD(code) DISASM_INSN(#code, code, 0, {&xrd, &load_address})
290 #define DEFINE_XSTORE(code) DISASM_INSN(#code, code, 0, {&xrs2, &store_address})
291 #define DEFINE_XAMO(code) DISASM_INSN(#code, code, 0, {&xrd, &xrs2, &amo_address})
292 #define DEFINE_FLOAD(code) DISASM_INSN(#code, code, 0, {&frd, &load_address})
293 #define DEFINE_FSTORE(code) DISASM_INSN(#code, code, 0, {&frs2, &store_address})
294 #define DEFINE_FRTYPE(code) DISASM_INSN(#code, code, 0, {&frd, &frs1, &frs2})
295 #define DEFINE_FR1TYPE(code) DISASM_INSN(#code, code, 0, {&frd, &frs1})
296 #define DEFINE_FR3TYPE(code) DISASM_INSN(#code, code, 0, {&frd, &frs1, &frs2, &frs3})
297 #define DEFINE_FXTYPE(code) DISASM_INSN(#code, code, 0, {&xrd, &frs1})
298 #define DEFINE_XFTYPE(code) DISASM_INSN(#code, code, 0, {&frd, &xrs1})
313 DEFINE_XAMO(amoadd_w
)
314 DEFINE_XAMO(amoswap_w
)
315 DEFINE_XAMO(amoand_w
)
317 DEFINE_XAMO(amoxor_w
)
318 DEFINE_XAMO(amomin_w
)
319 DEFINE_XAMO(amomax_w
)
320 DEFINE_XAMO(amominu_w
)
321 DEFINE_XAMO(amomaxu_w
)
322 DEFINE_XAMO(amoadd_d
)
323 DEFINE_XAMO(amoswap_d
)
324 DEFINE_XAMO(amoand_d
)
326 DEFINE_XAMO(amoxor_d
)
327 DEFINE_XAMO(amomin_d
)
328 DEFINE_XAMO(amomax_d
)
329 DEFINE_XAMO(amominu_d
)
330 DEFINE_XAMO(amomaxu_d
)
343 add_insn(new disasm_insn_t("j", match_jal
, mask_jal
| mask_rd
, {&jump_target
}));
344 add_insn(new disasm_insn_t("jal", match_jal
| match_rd_ra
, mask_jal
| mask_rd
, {&jump_target
}));
345 add_insn(new disasm_insn_t("jal", match_jal
, mask_jal
, {&xrd
, &jump_target
}));
347 DEFINE_B1TYPE("beqz", beq
);
348 DEFINE_B1TYPE("bnez", bne
);
349 DEFINE_B1TYPE("bltz", blt
);
350 DEFINE_B1TYPE("bgez", bge
);
361 add_insn(new disasm_insn_t("ret", match_jalr
| match_rs1_ra
, mask_jalr
| mask_rd
| mask_rs1
| mask_imm
, {}));
362 DEFINE_I2TYPE("jr", jalr
);
363 add_insn(new disasm_insn_t("jalr", match_jalr
| match_rd_ra
, mask_jalr
| mask_rd
| mask_imm
, {&xrs1
}));
366 add_insn(new disasm_insn_t("nop", match_addi
, mask_addi
| mask_rd
| mask_rs1
| mask_imm
, {}));
367 add_insn(new disasm_insn_t(" - ", match_xor
, mask_xor
| mask_rd
| mask_rs1
| mask_rs2
, {})); // for machine-generated bubbles
368 DEFINE_I0TYPE("li", addi
);
369 DEFINE_I1TYPE("mv", addi
);
373 add_insn(new disasm_insn_t("seqz", match_sltiu
| match_imm_1
, mask_sltiu
| mask_imm
, {&xrd
, &xrs1
}));
375 add_insn(new disasm_insn_t("not", match_xori
| mask_imm
, mask_xori
| mask_imm
, {&xrd
, &xrs1
}));
381 DEFINE_I1TYPE("sext.w", addiw
);
391 add_insn(new disasm_insn_t("snez", match_sltu
, mask_sltu
| mask_rs1
, {&xrd
, &xrs2
}));
401 DEFINE_RTYPE(mulhsu
);
418 DEFINE_NOARG(ebreak
);
423 DEFINE_NOARG(fence_i
);
425 add_insn(new disasm_insn_t("csrr", match_csrrs
, mask_csrrs
| mask_rs1
, {&xrd
, &csr
}));
426 add_insn(new disasm_insn_t("csrw", match_csrrw
, mask_csrrw
| mask_rd
, {&csr
, &xrs1
}));
427 add_insn(new disasm_insn_t("csrs", match_csrrs
, mask_csrrs
| mask_rd
, {&csr
, &xrs1
}));
428 add_insn(new disasm_insn_t("csrc", match_csrrc
, mask_csrrc
| mask_rd
, {&csr
, &xrs1
}));
429 add_insn(new disasm_insn_t("csrwi", match_csrrwi
, mask_csrrwi
| mask_rd
, {&csr
, &zimm5
}));
430 add_insn(new disasm_insn_t("csrsi", match_csrrsi
, mask_csrrsi
| mask_rd
, {&csr
, &zimm5
}));
431 add_insn(new disasm_insn_t("csrci", match_csrrci
, mask_csrrci
| mask_rd
, {&csr
, &zimm5
}));
432 add_insn(new disasm_insn_t("csrrw", match_csrrw
, mask_csrrw
, {&xrd
, &csr
, &xrs1
}));
433 add_insn(new disasm_insn_t("csrrs", match_csrrs
, mask_csrrs
, {&xrd
, &csr
, &xrs1
}));
434 add_insn(new disasm_insn_t("csrrc", match_csrrc
, mask_csrrc
, {&xrd
, &csr
, &xrs1
}));
435 add_insn(new disasm_insn_t("csrrwi", match_csrrwi
, mask_csrrwi
, {&xrd
, &csr
, &zimm5
}));
436 add_insn(new disasm_insn_t("csrrsi", match_csrrsi
, mask_csrrsi
, {&xrd
, &csr
, &zimm5
}));
437 add_insn(new disasm_insn_t("csrrci", match_csrrci
, mask_csrrci
, {&xrd
, &csr
, &zimm5
}));
439 DEFINE_FRTYPE(fadd_s
);
440 DEFINE_FRTYPE(fsub_s
);
441 DEFINE_FRTYPE(fmul_s
);
442 DEFINE_FRTYPE(fdiv_s
);
443 DEFINE_FR1TYPE(fsqrt_s
);
444 DEFINE_FRTYPE(fmin_s
);
445 DEFINE_FRTYPE(fmax_s
);
446 DEFINE_FR3TYPE(fmadd_s
);
447 DEFINE_FR3TYPE(fmsub_s
);
448 DEFINE_FR3TYPE(fnmadd_s
);
449 DEFINE_FR3TYPE(fnmsub_s
);
450 DEFINE_FRTYPE(fsgnj_s
);
451 DEFINE_FRTYPE(fsgnjn_s
);
452 DEFINE_FRTYPE(fsgnjx_s
);
453 DEFINE_FR1TYPE(fcvt_s_d
);
454 DEFINE_XFTYPE(fcvt_s_l
);
455 DEFINE_XFTYPE(fcvt_s_lu
);
456 DEFINE_XFTYPE(fcvt_s_w
);
457 DEFINE_XFTYPE(fcvt_s_wu
);
458 DEFINE_XFTYPE(fcvt_s_wu
);
459 DEFINE_XFTYPE(fmv_w_x
);
460 DEFINE_FXTYPE(fcvt_l_s
);
461 DEFINE_FXTYPE(fcvt_lu_s
);
462 DEFINE_FXTYPE(fcvt_w_s
);
463 DEFINE_FXTYPE(fcvt_wu_s
);
464 DEFINE_FXTYPE(fclass_s
);
465 DEFINE_FXTYPE(fmv_x_w
);
466 DEFINE_FXTYPE(feq_s
);
467 DEFINE_FXTYPE(flt_s
);
468 DEFINE_FXTYPE(fle_s
);
470 DEFINE_FRTYPE(fadd_d
);
471 DEFINE_FRTYPE(fsub_d
);
472 DEFINE_FRTYPE(fmul_d
);
473 DEFINE_FRTYPE(fdiv_d
);
474 DEFINE_FR1TYPE(fsqrt_d
);
475 DEFINE_FRTYPE(fmin_d
);
476 DEFINE_FRTYPE(fmax_d
);
477 DEFINE_FR3TYPE(fmadd_d
);
478 DEFINE_FR3TYPE(fmsub_d
);
479 DEFINE_FR3TYPE(fnmadd_d
);
480 DEFINE_FR3TYPE(fnmsub_d
);
481 DEFINE_FRTYPE(fsgnj_d
);
482 DEFINE_FRTYPE(fsgnjn_d
);
483 DEFINE_FRTYPE(fsgnjx_d
);
484 DEFINE_FR1TYPE(fcvt_d_s
);
485 DEFINE_XFTYPE(fcvt_d_l
);
486 DEFINE_XFTYPE(fcvt_d_lu
);
487 DEFINE_XFTYPE(fcvt_d_w
);
488 DEFINE_XFTYPE(fcvt_d_wu
);
489 DEFINE_XFTYPE(fcvt_d_wu
);
490 DEFINE_XFTYPE(fmv_d_x
);
491 DEFINE_FXTYPE(fcvt_l_d
);
492 DEFINE_FXTYPE(fcvt_lu_d
);
493 DEFINE_FXTYPE(fcvt_w_d
);
494 DEFINE_FXTYPE(fcvt_wu_d
);
495 DEFINE_FXTYPE(fclass_d
);
496 DEFINE_FXTYPE(fmv_x_d
);
497 DEFINE_FXTYPE(feq_d
);
498 DEFINE_FXTYPE(flt_d
);
499 DEFINE_FXTYPE(fle_d
);
501 DISASM_INSN("ebreak", c_add
, mask_rd
| mask_rvc_rs2
, {});
502 add_insn(new disasm_insn_t("ret", match_c_li
| match_rd_ra
, mask_c_li
| mask_rd
| mask_rvc_imm
, {}));
503 DISASM_INSN("jr", c_li
, mask_rvc_imm
, {&rvc_rs1
});
504 DISASM_INSN("jalr", c_lui
, mask_rvc_imm
, {&rvc_rs1
});
505 DISASM_INSN("nop", c_addi
, mask_rd
| mask_rvc_imm
, {});
506 DISASM_INSN("addi", c_addi16sp
, mask_rd
, {&rvc_sp
, &rvc_sp
, &rvc_addi16sp_imm
});
507 DISASM_INSN("addi", c_addi4spn
, 0, {&rvc_rs1s
, &rvc_sp
, &rvc_addi4spn_imm
});
508 DISASM_INSN("li", c_li
, 0, {&xrd
, &rvc_imm
});
509 DISASM_INSN("lui", c_lui
, 0, {&xrd
, &rvc_uimm
});
510 DISASM_INSN("addi", c_addi
, 0, {&xrd
, &xrd
, &rvc_imm
});
511 DISASM_INSN("slli", c_slli
, 0, {&xrd
, &rvc_shamt
});
512 DISASM_INSN("mv", c_mv
, 0, {&xrd
, &rvc_rs2
});
513 DISASM_INSN("add", c_add
, 0, {&xrd
, &xrd
, &rvc_rs2
});
514 DISASM_INSN("addw", c_addw
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
515 DISASM_INSN("sub", c_sub
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
516 DISASM_INSN("subw", c_subw
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
517 DISASM_INSN("and", c_and
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
518 DISASM_INSN("or", c_or
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
519 DISASM_INSN("xor", c_xor
, 0, {&rvc_rs1s
, &rvc_rs1s
, &rvc_rs2s
});
520 DISASM_INSN("lw", c_lwsp
, 0, {&xrd
, &rvc_lwsp_address
});
521 DISASM_INSN("fld", c_fld
, 0, {&rvc_rs2s
, &rvc_ld_address
});
522 DISASM_INSN("sw", c_swsp
, 0, {&rvc_rs2
, &rvc_swsp_address
});
523 DISASM_INSN("lw", c_lw
, 0, {&rvc_rs2s
, &rvc_lw_address
});
524 DISASM_INSN("sw", c_sw
, 0, {&rvc_rs2s
, &rvc_lw_address
});
525 DISASM_INSN("beqz", c_beqz
, 0, {&rvc_rs1s
, &rvc_branch_target
});
526 DISASM_INSN("bnez", c_bnez
, 0, {&rvc_rs1s
, &rvc_branch_target
});
527 DISASM_INSN("j", c_j
, 0, {&rvc_jump_target
});
530 DISASM_INSN("flw", c_flw
, 0, {&rvc_rs2s
, &rvc_lw_address
});
531 DISASM_INSN("flw", c_flwsp
, 0, {&xrd
, &rvc_lwsp_address
});
532 DISASM_INSN("fsw", c_fsw
, 0, {&rvc_rs2s
, &rvc_lw_address
});
533 DISASM_INSN("fsw", c_fswsp
, 0, {&rvc_rs2
, &rvc_swsp_address
});
534 DISASM_INSN("jal", c_jal
, 0, {&rvc_jump_target
});
536 DISASM_INSN("ld", c_ld
, 0, {&rvc_rs2s
, &rvc_ld_address
});
537 DISASM_INSN("ld", c_ldsp
, 0, {&xrd
, &rvc_ldsp_address
});
538 DISASM_INSN("sd", c_sd
, 0, {&rvc_rs2s
, &rvc_ld_address
});
539 DISASM_INSN("sd", c_sdsp
, 0, {&rvc_rs2
, &rvc_sdsp_address
});
540 DISASM_INSN("addiw", c_addiw
, 0, {&xrd
, &xrd
, &rvc_imm
});
543 // provide a default disassembly for all instructions as a fallback
544 #define DECLARE_INSN(code, match, mask) \
545 add_insn(new disasm_insn_t(#code " (args unknown)", match, mask, {}));
546 #include "encoding.h"
550 const disasm_insn_t
* disassembler_t::lookup(insn_t insn
) const
552 size_t idx
= insn
.bits() % HASH_SIZE
;
553 for (size_t j
= 0; j
< chain
[idx
].size(); j
++)
554 if(*chain
[idx
][j
] == insn
)
555 return chain
[idx
][j
];
558 for (size_t j
= 0; j
< chain
[idx
].size(); j
++)
559 if(*chain
[idx
][j
] == insn
)
560 return chain
[idx
][j
];
565 void disassembler_t::add_insn(disasm_insn_t
* insn
)
567 size_t idx
= HASH_SIZE
;
568 if (insn
->get_mask() % HASH_SIZE
== HASH_SIZE
- 1)
569 idx
= insn
->get_match() % HASH_SIZE
;
570 chain
[idx
].push_back(insn
);
573 disassembler_t::~disassembler_t()
575 for (size_t i
= 0; i
< HASH_SIZE
+1; i
++)
576 for (size_t j
= 0; j
< chain
[i
].size(); j
++)