/*
 * Tiny Code Generator for QEMU
 *
 * Copyright (c) 2009, 2011 Stefan Weil
 *
 * Permission is hereby granted, free of charge, to any person obtaining a copy
 * of this software and associated documentation files (the "Software"), to deal
 * in the Software without restriction, including without limitation the rights
 * to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
 * copies of the Software, and to permit persons to whom the Software is
 * furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice shall be included in
 * all copies or substantial portions of the Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
 * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN
 * THE SOFTWARE.
 */

/* TODO list:
 * - See TODO comments in code.
 */

/* Marker for missing code. */
#define TODO() \
    do { \
        fprintf(stderr, "TODO %s:%u: %s()\n", \
                __FILE__, __LINE__, __func__); \
        tcg_abort(); \
    } while (0)

/* Bitfield n...m (in 32 bit value). */
#define BITS(n, m) (((0xffffffffU << (31 - (n))) >> (31 - (n) + (m))) << (m))
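
/*
 * Worked example: BITS(15, 8) selects bits 15..8:
 *   0xffffffffU << (31 - 15)     -> 0xffff0000
 *   0xffff0000  >> (31 - 15 + 8) -> 0x000000ff
 *   0x000000ff  << 8             -> 0x0000ff00
 * QEMU_BUILD_BUG_ON (from qemu/osdep.h, included by tcg.c before this
 * file) checks the example at compile time.
 */
QEMU_BUILD_BUG_ON(BITS(15, 8) != 0x0000ff00);
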
static TCGConstraintSetIndex tcg_target_op_def(TCGOpcode op)
{
    switch (op) {
    case INDEX_op_ld8u_i32:
    case INDEX_op_ld8s_i32:
    case INDEX_op_ld16u_i32:
    case INDEX_op_ld16s_i32:
    case INDEX_op_ld_i32:
    case INDEX_op_ld8u_i64:
    case INDEX_op_ld8s_i64:
    case INDEX_op_ld16u_i64:
    case INDEX_op_ld16s_i64:
    case INDEX_op_ld32u_i64:
    case INDEX_op_ld32s_i64:
    case INDEX_op_ld_i64:
    case INDEX_op_not_i32:
    case INDEX_op_not_i64:
    case INDEX_op_neg_i32:
    case INDEX_op_neg_i64:
    case INDEX_op_ext8s_i32:
    case INDEX_op_ext8s_i64:
    case INDEX_op_ext16s_i32:
    case INDEX_op_ext16s_i64:
    case INDEX_op_ext8u_i32:
    case INDEX_op_ext8u_i64:
    case INDEX_op_ext16u_i32:
    case INDEX_op_ext16u_i64:
    case INDEX_op_ext32s_i64:
    case INDEX_op_ext32u_i64:
    case INDEX_op_ext_i32_i64:
    case INDEX_op_extu_i32_i64:
    case INDEX_op_bswap16_i32:
    case INDEX_op_bswap16_i64:
    case INDEX_op_bswap32_i32:
    case INDEX_op_bswap32_i64:
    case INDEX_op_bswap64_i64:
        return C_O1_I1(r, r);

    case INDEX_op_st8_i32:
    case INDEX_op_st16_i32:
    case INDEX_op_st_i32:
    case INDEX_op_st8_i64:
    case INDEX_op_st16_i64:
    case INDEX_op_st32_i64:
    case INDEX_op_st_i64:
        return C_O0_I2(r, r);

    case INDEX_op_div_i32:
    case INDEX_op_div_i64:
    case INDEX_op_divu_i32:
    case INDEX_op_divu_i64:
    case INDEX_op_rem_i32:
    case INDEX_op_rem_i64:
    case INDEX_op_remu_i32:
    case INDEX_op_remu_i64:
    case INDEX_op_add_i32:
    case INDEX_op_add_i64:
    case INDEX_op_sub_i32:
    case INDEX_op_sub_i64:
    case INDEX_op_mul_i32:
    case INDEX_op_mul_i64:
    case INDEX_op_and_i32:
    case INDEX_op_and_i64:
    case INDEX_op_andc_i32:
    case INDEX_op_andc_i64:
    case INDEX_op_eqv_i32:
    case INDEX_op_eqv_i64:
    case INDEX_op_nand_i32:
    case INDEX_op_nand_i64:
    case INDEX_op_nor_i32:
    case INDEX_op_nor_i64:
    case INDEX_op_or_i32:
    case INDEX_op_or_i64:
    case INDEX_op_orc_i32:
    case INDEX_op_orc_i64:
    case INDEX_op_xor_i32:
    case INDEX_op_xor_i64:
    case INDEX_op_shl_i32:
    case INDEX_op_shl_i64:
    case INDEX_op_shr_i32:
    case INDEX_op_shr_i64:
    case INDEX_op_sar_i32:
    case INDEX_op_sar_i64:
    case INDEX_op_rotl_i32:
    case INDEX_op_rotl_i64:
    case INDEX_op_rotr_i32:
    case INDEX_op_rotr_i64:
    case INDEX_op_setcond_i32:
    case INDEX_op_setcond_i64:
    case INDEX_op_deposit_i32:
    case INDEX_op_deposit_i64:
        return C_O1_I2(r, r, r);

    case INDEX_op_brcond_i32:
    case INDEX_op_brcond_i64:
        return C_O0_I2(r, r);

#if TCG_TARGET_REG_BITS == 32
    /* TODO: Support R, R, R, R, RI, RI? Will it be faster? */
    case INDEX_op_add2_i32:
    case INDEX_op_sub2_i32:
        return C_O2_I4(r, r, r, r, r, r);
    case INDEX_op_brcond2_i32:
        return C_O0_I4(r, r, r, r);
    case INDEX_op_mulu2_i32:
        return C_O2_I2(r, r, r, r);
    case INDEX_op_setcond2_i32:
        return C_O1_I4(r, r, r, r, r);
#endif

    case INDEX_op_qemu_ld_i32:
        return (TARGET_LONG_BITS <= TCG_TARGET_REG_BITS
                ? C_O1_I1(r, r)
                : C_O1_I2(r, r, r));
    case INDEX_op_qemu_ld_i64:
        return (TCG_TARGET_REG_BITS == 64 ? C_O1_I1(r, r)
                : TARGET_LONG_BITS <= TCG_TARGET_REG_BITS ? C_O2_I1(r, r, r)
                : C_O2_I2(r, r, r, r));
    case INDEX_op_qemu_st_i32:
        return (TARGET_LONG_BITS <= TCG_TARGET_REG_BITS
                ? C_O0_I2(r, r)
                : C_O0_I3(r, r, r));
    case INDEX_op_qemu_st_i64:
        return (TCG_TARGET_REG_BITS == 64 ? C_O0_I2(r, r)
                : TARGET_LONG_BITS <= TCG_TARGET_REG_BITS ? C_O0_I3(r, r, r)
                : C_O0_I4(r, r, r, r));

    default:
        g_assert_not_reached();
    }
}
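
/*
 * The constraint-set names above encode operand counts: C_On_Im(...)
 * describes n output and m input operands, each constrained here to
 * "r", i.e. any general register.  C_O1_I2(r, r, r), for instance,
 * covers a typical three-register ALU operation such as add_i32.
 */
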
static const int tcg_target_reg_alloc_order[] = {
    TCG_REG_R0,  TCG_REG_R1,  TCG_REG_R2,  TCG_REG_R3,
    TCG_REG_R4,  TCG_REG_R5,  TCG_REG_R6,  TCG_REG_R7,
    TCG_REG_R8,  TCG_REG_R9,  TCG_REG_R10, TCG_REG_R11,
    TCG_REG_R12, TCG_REG_R13, TCG_REG_R14, TCG_REG_R15,
};

#if MAX_OPC_PARAM_IARGS != 6
# error Fix needed, number of supported input arguments changed!
#endif

static const int tcg_target_call_iarg_regs[] = {
    TCG_REG_R0,
    TCG_REG_R1,
    TCG_REG_R2,
    TCG_REG_R3,
    TCG_REG_R4,
    TCG_REG_R5,
#if TCG_TARGET_REG_BITS == 32
    /* 32 bit hosts need 2 * MAX_OPC_PARAM_IARGS registers. */
    TCG_REG_R6,
    TCG_REG_R7,
    TCG_REG_R8,
    TCG_REG_R9,
    TCG_REG_R10,
    TCG_REG_R11,
#endif
};

static const int tcg_target_call_oarg_regs[] = {
    TCG_REG_R0,
#if TCG_TARGET_REG_BITS == 32
    TCG_REG_R1,
#endif
};

#ifdef CONFIG_DEBUG_TCG
static const char *const tcg_target_reg_names[TCG_TARGET_NB_REGS] = {
    "r0",  "r1",  "r2",  "r3",  "r4",  "r5",  "r6",  "r7",
    "r8",  "r9",  "r10", "r11", "r12", "r13", "r14", "r15",
};
#endif

static bool patch_reloc(tcg_insn_unit *code_ptr, int type,
                        intptr_t value, intptr_t addend)
{
    /* tcg_out_reloc always uses the same type, addend. */
    tcg_debug_assert(type == sizeof(tcg_target_long));
    tcg_debug_assert(addend == 0);
    tcg_debug_assert(value != 0);
    if (TCG_TARGET_REG_BITS == 32) {
        tcg_patch32(code_ptr, value);
    } else {
        tcg_patch64(code_ptr, value);
    }
    return true;
}

/* Write value (native size). */
static void tcg_out_i(TCGContext *s, tcg_target_ulong v)
{
    if (TCG_TARGET_REG_BITS == 32) {
        tcg_out32(s, v);
    } else {
        tcg_out64(s, v);
    }
}

/* Write opcode and reserve the byte that will hold the insn length. */
static void tcg_out_op_t(TCGContext *s, TCGOpcode op)
{
    tcg_out8(s, op);
    tcg_out8(s, 0);
}
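
/*
 * Each TCI instruction therefore begins with a two-byte header: byte 0
 * holds the TCGOpcode, byte 1 the total instruction length in bytes.
 * The emitters below write 0 for the length first and patch the final
 * value with "old_code_ptr[1] = s->code_ptr - old_code_ptr" once all
 * operands have been written.
 */
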
/* Write register. */
static void tcg_out_r(TCGContext *s, TCGArg t0)
{
    tcg_debug_assert(t0 < TCG_TARGET_NB_REGS);
    tcg_out8(s, t0);
}

/* Write label. */
static void tci_out_label(TCGContext *s, TCGLabel *label)
{
    if (label->has_value) {
        tcg_out_i(s, label->u.value);
        tcg_debug_assert(label->u.value);
    } else {
        tcg_out_reloc(s, s->code_ptr, sizeof(tcg_target_ulong), label, 0);
        s->code_ptr += sizeof(tcg_target_ulong);
    }
}
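
/*
 * Backward branches are resolved immediately: the label already has a
 * value and the absolute address is written inline.  Forward branches
 * emit a native-pointer-sized placeholder, record a relocation, and
 * rely on patch_reloc() above to store the final address.
 */
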
static void stack_bounds_check(TCGReg base, target_long offset)
{
    if (base == TCG_REG_CALL_STACK) {
        tcg_debug_assert(offset < 0);
        tcg_debug_assert(offset >= -(CPU_TEMP_BUF_NLONGS * sizeof(long)));
    }
}
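
/*
 * Worked example: with the usual CPU_TEMP_BUF_NLONGS of 128 on a
 * 64-bit host, valid stack-pointer offsets are -1024 <= offset < 0;
 * anything outside the temporary buffer indicates a backend bug.
 */
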
static void tcg_out_op_l(TCGContext *s, TCGOpcode op, TCGLabel *l0)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tci_out_label(s, l0);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_p(TCGContext *s, TCGOpcode op, void *p0)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_i(s, (uintptr_t)p0);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_rr(TCGContext *s, TCGOpcode op, TCGReg r0, TCGReg r1)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_rrr(TCGContext *s, TCGOpcode op,
                           TCGReg r0, TCGReg r1, TCGReg r2)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);
    tcg_out_r(s, r2);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_rrs(TCGContext *s, TCGOpcode op,
                           TCGReg r0, TCGReg r1, intptr_t i2)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);
    tcg_debug_assert(i2 == (int32_t)i2);
    tcg_out32(s, i2);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_rrrc(TCGContext *s, TCGOpcode op,
                            TCGReg r0, TCGReg r1, TCGReg r2, TCGCond c3)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);
    tcg_out_r(s, r2);
    tcg_out8(s, c3);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

static void tcg_out_op_rrrbb(TCGContext *s, TCGOpcode op, TCGReg r0,
                             TCGReg r1, TCGReg r2, uint8_t b3, uint8_t b4)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);
    tcg_out_r(s, r2);
    tcg_out8(s, b3);
    tcg_out8(s, b4);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

#if TCG_TARGET_REG_BITS == 32
static void tcg_out_op_rrrrrc(TCGContext *s, TCGOpcode op,
                              TCGReg r0, TCGReg r1, TCGReg r2,
                              TCGReg r3, TCGReg r4, TCGCond c5)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, op);
    tcg_out_r(s, r0);
    tcg_out_r(s, r1);
    tcg_out_r(s, r2);
    tcg_out_r(s, r3);
    tcg_out_r(s, r4);
    tcg_out8(s, c5);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}
#endif

static void tcg_out_ld(TCGContext *s, TCGType type, TCGReg val, TCGReg base,
                       intptr_t offset)
{
    stack_bounds_check(base, offset);
    switch (type) {
    case TCG_TYPE_I32:
        tcg_out_op_rrs(s, INDEX_op_ld_i32, val, base, offset);
        break;
#if TCG_TARGET_REG_BITS == 64
    case TCG_TYPE_I64:
        tcg_out_op_rrs(s, INDEX_op_ld_i64, val, base, offset);
        break;
#endif
    default:
        g_assert_not_reached();
    }
}

static bool tcg_out_mov(TCGContext *s, TCGType type, TCGReg ret, TCGReg arg)
{
    switch (type) {
    case TCG_TYPE_I32:
        tcg_out_op_rr(s, INDEX_op_mov_i32, ret, arg);
        break;
#if TCG_TARGET_REG_BITS == 64
    case TCG_TYPE_I64:
        tcg_out_op_rr(s, INDEX_op_mov_i64, ret, arg);
        break;
#endif
    default:
        g_assert_not_reached();
    }
    return true;
}

static void tcg_out_movi(TCGContext *s, TCGType type,
                         TCGReg t0, tcg_target_long arg)
{
    uint8_t *old_code_ptr = s->code_ptr;
    uint32_t arg32 = arg;

    if (type == TCG_TYPE_I32 || arg == arg32) {
        tcg_out_op_t(s, INDEX_op_tci_movi_i32);
        tcg_out_r(s, t0);
        tcg_out32(s, arg32);
    } else {
        tcg_debug_assert(type == TCG_TYPE_I64);
#if TCG_TARGET_REG_BITS == 64
        tcg_out_op_t(s, INDEX_op_tci_movi_i64);
        tcg_out_r(s, t0);
        tcg_out64(s, arg);
#else
        TODO();
#endif
    }
    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}
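
/*
 * The first branch also catches 64-bit constants that zero-extend from
 * 32 bits: e.g. arg = 0xffffffff gives arg32 = 0xffffffff and
 * arg == arg32, so it is encoded as the shorter tci_movi_i32, while
 * arg = -1 (all 64 bits set) fails the test and needs tci_movi_i64.
 */
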
static inline void tcg_out_call(TCGContext *s, const tcg_insn_unit *arg)
{
    uint8_t *old_code_ptr = s->code_ptr;

    tcg_out_op_t(s, INDEX_op_call);
    tcg_out_i(s, (uintptr_t)arg);

    old_code_ptr[1] = s->code_ptr - old_code_ptr;
}

#if TCG_TARGET_REG_BITS == 64
# define CASE_32_64(x)                       \
        case glue(glue(INDEX_op_, x), _i64): \
        case glue(glue(INDEX_op_, x), _i32):
# define CASE_64(x)                          \
        case glue(glue(INDEX_op_, x), _i64):
#else
# define CASE_32_64(x)                       \
        case glue(glue(INDEX_op_, x), _i32):
# define CASE_64(x)
#endif
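
/*
 * For example, on a 64-bit host CASE_32_64(add) expands to
 *     case INDEX_op_add_i64: case INDEX_op_add_i32:
 * while on a 32-bit host only the _i32 label is generated and
 * CASE_64(x) expands to nothing.
 */
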
static void tcg_out_op(TCGContext *s, TCGOpcode opc, const TCGArg *args,
                       const int *const_args)
{
    uint8_t *old_code_ptr = s->code_ptr;

    switch (opc) {
    case INDEX_op_exit_tb:
        tcg_out_op_p(s, opc, (void *)args[0]);
        break;

    case INDEX_op_goto_tb:
        tcg_debug_assert(s->tb_jmp_insn_offset == 0);
        /* indirect jump method. */
        tcg_out_op_p(s, opc, s->tb_jmp_target_addr + args[0]);
        set_jmp_reset_offset(s, args[0]);
        break;

    case INDEX_op_br:
        tcg_out_op_l(s, opc, arg_label(args[0]));
        break;

    CASE_32_64(setcond)
        tcg_out_op_rrrc(s, opc, args[0], args[1], args[2], args[3]);
        break;

#if TCG_TARGET_REG_BITS == 32
    case INDEX_op_setcond2_i32:
        tcg_out_op_rrrrrc(s, opc, args[0], args[1], args[2],
                          args[3], args[4], args[5]);
        break;
#endif

    CASE_32_64(ld8u)
    CASE_32_64(ld8s)
    CASE_32_64(ld16u)
    CASE_32_64(ld16s)
    case INDEX_op_ld_i32:
    CASE_64(ld32u)
    CASE_64(ld32s)
    CASE_64(ld)
    CASE_32_64(st8)
    CASE_32_64(st16)
    case INDEX_op_st_i32:
    CASE_64(st32)
    CASE_64(st)
        stack_bounds_check(args[1], args[2]);
        tcg_out_op_rrs(s, opc, args[0], args[1], args[2]);
        break;

    CASE_32_64(add)
    CASE_32_64(sub)
    CASE_32_64(mul)
    CASE_32_64(and)
    CASE_32_64(or)
    CASE_32_64(xor)
    CASE_32_64(andc)     /* Optional (TCG_TARGET_HAS_andc_*). */
    CASE_32_64(orc)      /* Optional (TCG_TARGET_HAS_orc_*). */
    CASE_32_64(eqv)      /* Optional (TCG_TARGET_HAS_eqv_*). */
    CASE_32_64(nand)     /* Optional (TCG_TARGET_HAS_nand_*). */
    CASE_32_64(nor)      /* Optional (TCG_TARGET_HAS_nor_*). */
    CASE_32_64(shl)
    CASE_32_64(shr)
    CASE_32_64(sar)
    CASE_32_64(rotl)     /* Optional (TCG_TARGET_HAS_rot_*). */
    CASE_32_64(rotr)     /* Optional (TCG_TARGET_HAS_rot_*). */
    CASE_32_64(div)      /* Optional (TCG_TARGET_HAS_div_*). */
    CASE_32_64(divu)     /* Optional (TCG_TARGET_HAS_div_*). */
    CASE_32_64(rem)      /* Optional (TCG_TARGET_HAS_div_*). */
    CASE_32_64(remu)     /* Optional (TCG_TARGET_HAS_div_*). */
        tcg_out_op_rrr(s, opc, args[0], args[1], args[2]);
        break;

    CASE_32_64(deposit)  /* Optional (TCG_TARGET_HAS_deposit_*). */
        {
            TCGArg pos = args[3], len = args[4];
            TCGArg max = opc == INDEX_op_deposit_i32 ? 32 : 64;

            tcg_debug_assert(pos < max);
            tcg_debug_assert(pos + len <= max);

            tcg_out_op_rrrbb(s, opc, args[0], args[1], args[2], pos, len);
        }
        break;
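
    /*
     * Example: deposit_i32 dest, a, b with pos = 8, len = 4 inserts the
     * low 4 bits of b into bits 11..8 of a.  The asserts above only
     * check that the field lies inside the 32- or 64-bit operand.
     */
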
    CASE_32_64(brcond)
        tcg_out_op_t(s, opc);
        tcg_out_r(s, args[0]);
        tcg_out_r(s, args[1]);
        tcg_out8(s, args[2]);   /* condition */
        tci_out_label(s, arg_label(args[3]));
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;

    CASE_32_64(neg)      /* Optional (TCG_TARGET_HAS_neg_*). */
    CASE_32_64(not)      /* Optional (TCG_TARGET_HAS_not_*). */
    CASE_32_64(ext8s)    /* Optional (TCG_TARGET_HAS_ext8s_*). */
    CASE_32_64(ext8u)    /* Optional (TCG_TARGET_HAS_ext8u_*). */
    CASE_32_64(ext16s)   /* Optional (TCG_TARGET_HAS_ext16s_*). */
    CASE_32_64(ext16u)   /* Optional (TCG_TARGET_HAS_ext16u_*). */
    CASE_64(ext32s)      /* Optional (TCG_TARGET_HAS_ext32s_i64). */
    CASE_64(ext32u)      /* Optional (TCG_TARGET_HAS_ext32u_i64). */
    CASE_64(ext_i32)
    CASE_64(extu_i32)
    CASE_32_64(bswap16)  /* Optional (TCG_TARGET_HAS_bswap16_*). */
    CASE_32_64(bswap32)  /* Optional (TCG_TARGET_HAS_bswap32_*). */
    CASE_64(bswap64)     /* Optional (TCG_TARGET_HAS_bswap64_i64). */
        tcg_out_op_rr(s, opc, args[0], args[1]);
        break;

#if TCG_TARGET_REG_BITS == 32
    case INDEX_op_add2_i32:
    case INDEX_op_sub2_i32:
        tcg_out_op_t(s, opc);
        tcg_out_r(s, args[0]);
        tcg_out_r(s, args[1]);
        tcg_out_r(s, args[2]);
        tcg_out_r(s, args[3]);
        tcg_out_r(s, args[4]);
        tcg_out_r(s, args[5]);
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;

    case INDEX_op_brcond2_i32:
        tcg_out_op_t(s, opc);
        tcg_out_r(s, args[0]);
        tcg_out_r(s, args[1]);
        tcg_out_r(s, args[2]);
        tcg_out_r(s, args[3]);
        tcg_out8(s, args[4]);   /* condition */
        tci_out_label(s, arg_label(args[5]));
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;

    case INDEX_op_mulu2_i32:
        tcg_out_op_t(s, opc);
        tcg_out_r(s, args[0]);
        tcg_out_r(s, args[1]);
        tcg_out_r(s, args[2]);
        tcg_out_r(s, args[3]);
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;
#endif
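
    /*
     * On 32-bit hosts a 64-bit value occupies a register pair, which is
     * why add2/sub2 name six registers (low/high result plus low/high
     * of both inputs, cf. C_O2_I4 above) and mulu2 names four (a 64-bit
     * product in two registers, two 32-bit multiplicands).
     */
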
    case INDEX_op_qemu_ld_i32:
    case INDEX_op_qemu_st_i32:
        tcg_out_op_t(s, opc);
        tcg_out_r(s, *args++);
        tcg_out_r(s, *args++);
        if (TARGET_LONG_BITS > TCG_TARGET_REG_BITS) {
            tcg_out_r(s, *args++);
        }
        tcg_out32(s, *args++);  /* memop + mmu index (TCGMemOpIdx) */
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;

    case INDEX_op_qemu_ld_i64:
    case INDEX_op_qemu_st_i64:
        tcg_out_op_t(s, opc);
        tcg_out_r(s, *args++);
        if (TCG_TARGET_REG_BITS == 32) {
            tcg_out_r(s, *args++);
        }
        tcg_out_r(s, *args++);
        if (TARGET_LONG_BITS > TCG_TARGET_REG_BITS) {
            tcg_out_r(s, *args++);
        }
        tcg_out32(s, *args++);  /* memop + mmu index (TCGMemOpIdx) */
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;
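
    /*
     * The operand count varies with the configuration: a 64-bit guest
     * access on a 32-bit host consumes up to four registers (value pair
     * plus address pair), matching the C_O2_I2/C_O0_I4 constraint sets
     * returned by tcg_target_op_def() above.
     */
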
    case INDEX_op_mb:
        tcg_out_op_t(s, opc);
        old_code_ptr[1] = s->code_ptr - old_code_ptr;
        break;

    case INDEX_op_mov_i32:  /* Always emitted via tcg_out_mov. */
    case INDEX_op_mov_i64:
    case INDEX_op_call:     /* Always emitted via tcg_out_call. */
    default:
        g_assert_not_reached();
    }
}

static void tcg_out_st(TCGContext *s, TCGType type, TCGReg val, TCGReg base,
                       intptr_t offset)
{
    stack_bounds_check(base, offset);
    switch (type) {
    case TCG_TYPE_I32:
        tcg_out_op_rrs(s, INDEX_op_st_i32, val, base, offset);
        break;
#if TCG_TARGET_REG_BITS == 64
    case TCG_TYPE_I64:
        tcg_out_op_rrs(s, INDEX_op_st_i64, val, base, offset);
        break;
#endif
    default:
        g_assert_not_reached();
    }
}

static inline bool tcg_out_sti(TCGContext *s, TCGType type, TCGArg val,
                               TCGReg base, intptr_t ofs)
{
    return false;
}
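
/*
 * Returning false tells the register allocator that TCI cannot store a
 * constant directly; the constant is first loaded into a scratch
 * register via tcg_out_movi() and then stored with tcg_out_st().
 */
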
/* Test if a constant matches the constraint. */
static int tcg_target_const_match(tcg_target_long val, TCGType type,
                                  const TCGArgConstraint *arg_ct)
{
    /* No need to return 0 or 1, 0 or != 0 is good enough. */
    return arg_ct->ct & TCG_CT_CONST;
}

static void tcg_target_init(TCGContext *s)
{
#if defined(CONFIG_DEBUG_TCG_INTERPRETER)
    const char *envval = getenv("DEBUG_TCG");
    if (envval) {
        qemu_set_log(strtol(envval, NULL, 0));
    }
#endif

    /* The current code uses uint8_t for tcg operations. */
    tcg_debug_assert(tcg_op_defs_max <= UINT8_MAX);

    /* Registers available for 32 bit operations. */
    tcg_target_available_regs[TCG_TYPE_I32] = BIT(TCG_TARGET_NB_REGS) - 1;
    /* Registers available for 64 bit operations. */
    tcg_target_available_regs[TCG_TYPE_I64] = BIT(TCG_TARGET_NB_REGS) - 1;
    /* TODO: Which registers should be set here? */
    tcg_target_call_clobber_regs = BIT(TCG_TARGET_NB_REGS) - 1;

    s->reserved_regs = 0;
    tcg_regset_set_reg(s->reserved_regs, TCG_REG_CALL_STACK);

    /*
     * We use negative offsets from "sp" so that we can distinguish
     * stores that might pretend to be call arguments.
     */
    tcg_set_frame(s, TCG_REG_CALL_STACK,
                  -CPU_TEMP_BUF_NLONGS * sizeof(long),
                  CPU_TEMP_BUF_NLONGS * sizeof(long));
}

/* Generate global QEMU prologue and epilogue code. */
static inline void tcg_target_qemu_prologue(TCGContext *s)
{
    /* Nothing to do: the bytecode is run by the TCI interpreter,
       not executed natively, so no prologue is required. */
}