4 #if (JITC_ARCNUM == 0x0001)
9 // F5の場合、decoderが対応するalloc-freeを結びつけるのが簡単で、typやlenを指定必須にしてもフロントエンドコードに影響はない.
10 int jitCompiler(unsigned char *dst, unsigned char *dst1, const unsigned char *src, const unsigned char *src1, const unsigned char *src0, HOSECPU_LabelListTag *label, int maxLabels, int level, int debugInfo1, int flags)
12 // For IA-32 (x86, 32-bit)
13 // 本来ならこのレイヤでは文法チェックしない
16 // dst1 : 書き込みアドレスの最大値
17 // src : 現在の読み込みアドレス(ヘッダ部は飛ばしてある
18 // src1 : 読み込みアドレスの最大値
19 // src0 : 読み込みバイナリのアドレス
21 unsigned char *dst00 = dst, *enter0 = NULL, *tmp_ucp;
23 const unsigned char *oldsrc;
24 int timecount = 0, i, j = 0, lastlabel = -1, debugInfo0 = -1;
25 int reg0, reg1, reg2, cmp0reg = -1, cmp0lev = 0;
29 w.maxLabels = maxLabels;
31 if ((flags & JITC_NOSTARTUP) == 0) {
32 jitCompPutOp_PUSHAD(w.dst);
34 jitCompA000_loadRegCacheAll(&w);
35 jitCompA000_loadPRegCacheAll(&w);
37 if (level <= JITC_LV_SLOWER) {
38 // env.debugInfo0 <- 0;
39 // env.debugInfo1 <- debugInfo1;
40 jitCompPutOp_MOV_EAX_ZERO(w.dst);
41 jitCompPutOp_MOV_EBPDisp_GReg(&w, envOffset_DBGINFO0, IA32_REG0_EAX);
42 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, debugInfo1);
43 jitCompPutOp_MOV_EBPDisp_GReg(&w, envOffset_DBGINFO1, IA32_REG0_EAX);
46 w.prefix = 0; //0x04 CND 命令で変更される
47 if (w.dst + 256 > dst1) {
48 // 書き込み領域が残り256バイト未満ならエラー
49 w.err = JITC_ERR_DST1;
53 if (timecount >= 64) {
55 /* 未完成(timeoutチェックコードを入れる) */
57 if(*src != 0x00 && *src != 0x01 && *src != 0x34){
66 // 「条件付きでNOPを実行」するなんて、矛盾している!
67 w.err = JITC_ERR_PREFIX;
73 // LB : ラベル設置命令。(6byte)
75 // ・timecount++し、timecountのチェックをする。
77 // ・割り込みがある場合、このタイミングで割り込みを発生させる。
82 if (enter0 == NULL && (src[6] == 0x3c /* 多数のレジスタをスタックに退避 */ || (src[6] == 0xfe/* REMARK */ && src[7] == 0x01 && src[9] == 0x3c))) {
84 // LB命令の後に0x3C命令・・・beginFunc()
86 jitCompPutOp_JMPnear(w.dst, 0);
91 // なので、DATA部分をJMPですっとばすコードを生成
92 // DAT_SA0(label, typ32, length) ・・・メモリ確保命令
94 i = jitCompGetImm32(&src[6 + 1]); // type32 を取得
98 i = jitCompA000_convTyp(i);
113 j *= jitCompGetImm32(&src[6 + 5]); // len32
115 w.err = JITC_ERR_BADTYPE;
119 jitCompPutOp_JMPnear(w.dst, j);
121 #if (jitCompA0001_OPTIMIZE_JMP != 0)
122 if (j < 127 - jitCompA0001_OPTIMIZE_ALIGN) {
127 jitCompPutOp_JMPshort(w.dst, j);
131 #if (jitCompA0001_OPTIMIZE_ALIGN != 0)
132 // アラインを jitCompA0001_OPTIMIZE_ALIGNにそろえる
134 i = ((int)w.dst + 1) & (jitCompA0001_OPTIMIZE_ALIGN - 1); /* ALIGNで割ったあまりを計算 */
135 i = jitCompA0001_OPTIMIZE_ALIGN - i;
136 if (i == 1) { jitCompPutByte1(w.dst, 0x90); j += i; } /* NOP(); */
137 if (i == 2) { jitCompPutByte2(w.dst, 0x89, 0xc0); j += i; } /* MOV(EAX, EAX); */
138 if (i == 3) { jitCompPutByte3(w.dst, 0x8d, 0x76, 0x00); j += i; } /* LEA(ESI, [ESI+0]); */
139 if (i == 4) { jitCompPutByte4(w.dst, 0x8d, 0x74, 0x26, 0x00); j += i; } /* LEA(ESI, [ESI*1+0]); */
140 if (i == 5) { jitCompPutByte1(w.dst, 0x0d); jitCompPutImm32(w.dst, 0); j += i; } /* OR(EAX, 0); */
141 if (i == 6) { jitCompPutByte2(w.dst, 0x8d, 0xb6); jitCompPutImm32(w.dst, 0); j += i; } /* LEA(ESI, [ESI+0]); */
142 if (i == 7) { jitCompPutByte3(w.dst, 0x8d, 0xb4, 0x26); jitCompPutImm32(w.dst, 0); j += 7; } /* LEA(ESI, [ESI*1+0]); */
144 if (src[6] == 0x34) {
146 // パディングに合わせて一個前の相対ジャンプを修正
147 tmp_ucp[1] = j & 0xff;
148 if (*tmp_ucp == 0xe9) {
149 // Near jump so imm is DWORD
150 tmp_ucp[2] = (j >> 8) & 0xff;
151 tmp_ucp[3] = (j >> 16) & 0xff;
152 tmp_ucp[4] = (j >> 24) & 0xff;
155 if ((flags & JITC_PHASE1) == 0) {
156 i = jitCompGetLabelNum(&w, src + 2);
157 if (label[i].opt != 0 && w.err == 0) {
158 w.err = JITC_ERR_LABELREDEF;
162 w.err = JITC_ERR_PREFIX;
165 label[i].opt = src[1] + 1;
166 label[i].typ = 0; /* TYP_CODE */
168 label[i].p1 = w.dst + 1;
173 /* 未完成(timeoutチェックコードを入れる) */
177 // LIMM : 定数即値代入命令(6byte)
182 // reg3F は条件比較慣用句指定用&演算命令即値慣用句指定用。よってCND命令の直後では使用できない。
184 if (src[1] == 0x3f && w.prefix != 0){
185 // CND命令の直後でR3Fを書き換えるなんて変だよね
186 w.err = JITC_ERR_PREFIX;
189 #if (jitCompA0001_USE_R3F_IMM32 != 0)
190 if (src[1] == 0x3f) {
191 // R3Fへの代入は例外で、 w.r3f を使用
192 w.r3f = jitCompGetImm32(src + 2);
196 i = jitCompGetImm32(src + 2); // 与えられた即値(第二引数)を取得
197 /* R00-R02 なら EBX, ECX, EDX 、それ以外なら EAX のレジスタIDを reg0 に代入 */
198 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
200 #if (jitCompA0001_OPTIMIZE_MOV != 0)
202 // MOV reg, 0 -> XOR reg, reg
204 jitCompPutOp_XOR_GReg_GReg(w.dst, reg0, reg0);
205 jitCompA0001_movRxxEax(&w, src[1]);
209 /* reg0 のレジスタに対応したMOV命令を発行 */
210 jitCompPutOp_MOV_GReg_Imm32(w.dst, reg0, i);
213 // R03以降の、レジスタの内容をメモリ上に格納してエミュレートする場合
214 jitCompA0001_movRxxEax(&w, src[1]);
219 case 0x03: /* 未完成(plsまで対応) */
220 // PLIMM : ラベル番号代入命令(6byte)
230 i = jitCompGetLabelNum(&w, src + 2); // Pxxに代入するラベルの番号(第二引数)
231 if ((flags & JITC_PHASE1) != 0 && w.err == 0) {
233 if (label[i].opt == 0) {
235 w.err = JITC_ERR_LABELNODEF;
238 if (src[1] != 0x3f && label[i].opt != 2) {
240 w.err = JITC_ERR_LABELTYP;
243 if (src[1] == 0x3f && label[i].typ != 0) {
244 // プログラムカウンタに TYP_CODEでない値は代入できない
245 w.err = JITC_ERR_LABELTYP;
249 if (src[1] == 0x3f) {
252 // CND命令による条件付きでなければ、即座に移動
253 jitCompPutByte1(w.dst, 0xe9); /* JMP(?); */
262 * いま、dstの末端はJZ命令になっている。 0x0F 0x84 cd
267 w.dst[-1] = w.dst[-2] ^ 0xf1; /* 74->85, 75->84 */
273 if ((flags & JITC_PHASE1) != 0 || (((flags & JITC_PHASE1) == 0) && label[i].opt != 0)) // label番号iが確保されていれば (このif文は意味をなさない)
274 j = label[i].p - (w.dst + 4); // j はとび先の相対番地
275 jitCompPutImm32(w.dst, j); // JMP もしくは JZ 命令のアドレス部を記述
276 #if (jitCompA0001_OPTIMIZE_JMP != 0)
277 if (-128 - 3 <= j && j < 0) {
278 if (w.dst[-5] == 0xe9) {
281 jitCompPutByte1(w.dst, 0xeb); /* JMP(?); */
285 jitCompPutByte1(w.dst, w.dst[1] ^ 0xf0);
287 jitCompPutByte1(w.dst, j & 0xff);
290 } else { // プログラムカウンタ以外への代入
291 // 代入先が P01, P02なら ESI, EDI,それ以外ならEAXを指定
292 reg0 = jitCompA000_selectPRegCache(src[1], IA32_REG0_EAX);
294 jitCompPutOp_MOV_GReg_Imm32(w.dst, reg0, (int)label[i].p);
295 // レジスタへの代入をメモリでエミュレーションする場合は、スタックに書き込む。
297 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 0, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
300 if (level < JITC_LV_FASTEST) {
301 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 8, reg0); /* p0 */
302 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, label[i].typ);
303 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 4, IA32_REG0_EAX); /* typ */
304 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, (int)label[i].p1);
305 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 12, IA32_REG0_EAX); /* p1 */
306 jitCompPutOp_MOV_EAX_ZERO(w.dst);
307 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 16, IA32_REG0_EAX); /* liveSign */
308 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, envOffset_PTRCTRL);
309 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 20, IA32_REG0_EAX); /* pls */
316 // 与えられたRxxの最下位ビットが1であれば後続の命令を実行、そうでなければ飛ばす。
319 // R00-R3F 以外のレジスタは比較対象にできない
320 w.err = JITC_ERR_REGNUM;
324 // 比較対象のレジスタがメモリ上にあれば-1, それ以外なら適切なレジスタ番号を返す
325 reg0 = jitCompA000_selectRegCache(src[1], -1 /* mem */);
330 jitCompPutByte1(w.dst, 0xf7); /* TEST = 1111 011w : mod 000 r/m : immediate data */
331 jitCompPutModRM_Disp_BaseEBP(&w, src[1] * 4, 0);
333 // 比較対象はキャッシュレジスタ上にある
334 jitCompPutByte2(w.dst, 0xf7, 0xc0 | reg0); /* TEST = 1111 011w : 11 000 reg : immediate data */
336 jitCompPutImm32(w.dst, 1);
339 jitCompPutByte2(w.dst, 0x74, 0x00); /* JZ($+2) */
345 w.prefix = 1; // プリフィックスをセット
347 goto prefix_continue;
349 case 0x08: /* LMEM */ /* 完成 */
350 i = jitCompGetImm32(src + 2);
352 w.err = JITC_ERR_BADTYPE;
354 if (level < JITC_LV_FASTER) {
355 jitCompA0001_checkType(&w, src[6], i, 0); // read
358 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
359 reg1 = jitCompA000_selectPRegCache(src[6], IA32_REG2_EDX);
360 if (reg0 != IA32_REG0_EAX && reg1 == IA32_REG2_EDX){
361 reg1 = IA32_REG0_EAX;
363 if (reg1 == IA32_REG2_EDX){
364 jitCompA000_storeRegCacheEdx(&w);
366 if (reg1 <= 3 /* EAX, EDX */){
367 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg1, PRegOffset(src[6]));
369 if (level < JITC_LV_FASTER){
370 jitCompA0001_checkLimit(&w, reg1, src[6]);
372 i = jitCompA000_convTyp(jitCompGetImm32(src + 2));
375 jitCompPutByte3(w.dst, 0x0f, 0xbe, reg0 << 3 | reg1); /* MOVSX(reg0,BYTE [reg1]); */
378 jitCompPutByte3(w.dst, 0x0f, 0xb6, reg0 << 3 | reg1); /* MOVZX(reg0,BYTE [reg1]); */
381 jitCompPutByte3(w.dst, 0x0f, 0xbf, reg0 << 3 | reg1); /* MOVSX(reg0,WORD [reg1]); */
384 jitCompPutByte3(w.dst, 0x0f, 0xb7, reg0 << 3 | reg1); /* MOVZX(reg0,WORD [reg1]); */
388 jitCompPutByte2(w.dst, 0x8b, reg0 << 3 | reg1); /* MOV(reg0, [reg1]); */
391 w.err = JITC_ERR_BADTYPE;
393 if (reg0 == IA32_REG0_EAX){
394 jitCompA0001_movRxxEax(&w, src[1]);
396 if (reg1 == IA32_REG2_EDX){
397 jitCompA000_loadRegCacheEdx(&w);
401 case 0x09: /* SMEM */ /* 完成 */
402 i = jitCompGetImm32(src + 2);
404 w.err = JITC_ERR_BADTYPE;
406 if (level < JITC_LV_FASTER) {
407 jitCompA0001_checkType(&w, src[6], i, 1); // write
410 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
411 reg1 = jitCompA000_selectPRegCache(src[6], IA32_REG2_EDX);
412 if (reg0 != IA32_REG0_EAX && reg1 == IA32_REG2_EDX){
413 reg1 = IA32_REG0_EAX;
415 if (reg1 == IA32_REG2_EDX){
416 jitCompA000_storeRegCacheEdx(&w);
418 if (reg1 <= 3 /* EAX, EDX */){
419 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg1, PRegOffset(src[6]) + 0); /* MOV(reg1, [EBP+?]); */
421 if (level < JITC_LV_FASTER){
422 jitCompA0001_checkLimit(&w, reg1, src[6]);
424 if (reg0 == IA32_REG0_EAX){
425 jitCompA0001_movEaxRxx(&w, src[1]);
428 i = jitCompA000_convTyp(jitCompGetImm32(src + 2));
432 jitCompPutByte2(w.dst, 0x88, reg0 << 3 | reg1); /* MOV([reg1], BYTE(reg0)); */
436 jitCompPutByte3(w.dst, 0x66, 0x89, reg0 << 3 | reg1); /* MOV([reg1], WORD(reg0)); */
440 jitCompPutByte2(w.dst, 0x89, reg0 << 3 | reg1); /* MOV([reg1], reg0); */
443 w.err = JITC_ERR_BADTYPE;
445 if (reg1 == IA32_REG2_EDX){
446 jitCompA000_loadRegCacheEdx(&w);
450 case 0x0a: /* PLMEM */ /* 完成 */
451 i = jitCompGetImm32(src + 2);
453 w.err = JITC_ERR_BADTYPE;
455 if (level < JITC_LV_FASTER) {
456 jitCompA0001_checkType(&w, src[6], i, 0); // read
459 reg0 = jitCompA000_selectPRegCache(src[1], IA32_REG0_EAX);
460 reg1 = jitCompA000_selectPRegCache(src[6], IA32_REG2_EDX);
461 // if (reg0 != 0 /* EAX */ && reg1 == 2 /* EDX */) /* これをやってはいけない!(by K, 2013.08.02) */
462 // reg1 = 0; /* EAX */
463 if (reg0 == reg1 && reg0 != 0) {
464 // bugfix: hinted by yao, 2013.09.14. thanks!
465 jitCompA000_storePRegCacheAll(&w);
466 reg1 = IA32_REG2_EDX;
468 if (reg1 == IA32_REG2_EDX){
469 jitCompA000_storeRegCacheEdx(&w);
471 if (reg1 <= 3 /* EAX, EDX */){
472 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg1, PRegOffset(src[6])); /* MOV(reg1, [EBP+?]); */
474 if (level < JITC_LV_FASTER){
475 jitCompA0001_checkLimit(&w, reg1, src[6]);
477 jitCompPutByte2(w.dst, 0x8b, reg0 << 3 | reg1); /* MOV(reg0, [reg1]); */
478 if (reg0 == IA32_REG0_EAX){
479 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]), IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
481 for (i = 4; i < 32; i += 4) {
482 jitCompPutByte3(w.dst, 0x8b, 0x40 | reg1, i); /* MOV(EAX, [reg1+?]); */
483 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + i, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
485 if (reg1 == IA32_REG2_EDX){
486 jitCompA000_loadRegCacheEdx(&w);
490 case 0x0b: /* PSMEM */ /* 完成 */
491 i = jitCompGetImm32(src + 2);
492 if (i != 0x0001) w.err = JITC_ERR_BADTYPE;
493 if (level < JITC_LV_FASTER) {
494 jitCompA0001_checkType(&w, src[6], i, 1); // write
497 reg0 = jitCompA000_selectPRegCache(src[1], IA32_REG0_EAX);
498 reg1 = jitCompA000_selectPRegCache(src[6], IA32_REG2_EDX);
499 /* これをやってはいけない!(by K, 2013.08.02) */
500 // if (reg0 != 0 /* EAX */ && reg1 == 2 /* EDX */)
501 // reg1 = 0; /* EAX */
502 if (reg1 == IA32_REG2_EDX){
503 jitCompA000_storeRegCacheEdx(&w);
505 if (reg1 <= 3 /* EAX, EDX */){
506 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg1, PRegOffset(src[6])); /* MOV(reg1, [EBP+?]); */
508 if (level < JITC_LV_FASTER){
509 jitCompA0001_checkLimit(&w, reg1, src[6]);
511 if (reg0 == IA32_REG0_EAX){
512 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, PRegOffset(src[1])); /* MOV(reg0, [EBP+?]); */
514 jitCompPutByte2(w.dst, 0x89, reg0 << 3 | reg1); /* MOV([reg1], reg0); */
515 for (i = 4; i < 32; i += 4) {
516 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[1]) + i); /* MOV(EAX, [EBP+?]); */
517 jitCompPutByte3(w.dst, 0x89, 0x40 | reg1, i); /* MOV([reg1+?], EAX); */
519 if (reg1 == IA32_REG2_EDX)
520 jitCompA000_loadRegCacheEdx(&w);
523 case 0x0e: /* PADD */ /* 完成 */
524 if (level < JITC_LV_FASTER) {
525 jitCompA0001_checkType0(&w, src[6], jitCompGetImm32(src + 2), 2); // other, aliveテストはとりあえずしない.
528 reg0 = jitCompA000_selectPRegCache(src[1], IA32_REG0_EAX);
529 reg1 = jitCompA000_selectPRegCache(src[6], -1 /* mem */);
530 if (reg1 < 0 /* mem */){
531 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, PRegOffset(src[6])); /* MOV(reg0, [EBP+?]); */
533 if (reg1 >= 0 && reg0 != reg1) {
534 jitCompPutByte2(w.dst, 0x89, 0xc0 | reg1 << 3 | reg0); /* MOV(reg0, reg1); */
536 i = jitCompGetImm32(src + 2);
541 i = jitCompA000_convTyp(i);
542 if (0x0002 <= i && i <= 0x0007){
543 j = (i - 0x0002) >> 1;
547 w.err = JITC_ERR_BADTYPE;
550 #if (jitCompA0001_USE_R3F_IMM32 != 0)
551 if (src[7] == 0x3f) {
553 #if (jitCompA0001_USE_R3F_IMM8 != 0)
554 if (-0x80 <= j && j <= 0x7f) {
555 #if (jitCompA0001_USE_R3F_INCDEC != 0)
558 jitCompPutByte1(w.dst, 0x40 | reg0);
563 jitCompPutByte1(w.dst, 0x48 | reg0);
567 /* ADD(reg0, im8); */
568 jitCompPutByte3(w.dst, 0x83, 0xc0 | reg0, j & 0xff);
573 jitCompPutByte1(w.dst, 0x05); /* ADD(reg0, ?); */
575 jitCompPutByte2(w.dst, 0x81, 0xc0 | reg0); /* ADD(reg0, ?); */
577 jitCompPutImm32(w.dst, j);
582 w.err = JITC_ERR_REGNUM;
585 reg1 = jitCompA000_selectRegCache(src[7], -1 /* mem */);
587 jitCompPutByte2(w.dst, 0x01, 0xc0 | reg1 << 3 | reg0); /* ADD(reg0, reg1); */
589 jitCompPutByte1(w.dst, 0x03); /* ADD(reg0, [EBP+?]); */
590 jitCompPutModRM_Disp_BaseEBP(&w, src[7] * 4, reg0);
594 reg1 = jitCompA000_selectRegCache(src[7], -1 /* mem */);
595 reg2 = IA32_REG2_EDX;
596 jitCompA000_storeRegCacheEdx(&w);
598 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg2, src[7] * 4); /* MOV(reg2, [EBP+?]); */
600 if (reg1 >= 0 && reg1 != reg2) {
601 jitCompPutByte2(w.dst, 0x89, 0xc0 | reg1 << 3 | reg2); /* MOV(reg2, reg1); */
603 jitCompPutByte3(w.dst, 0xc1, 0xe0 | reg2, j); /* SHL(reg2, ?); */
604 jitCompPutByte2(w.dst, 0x01, 0xc0 | reg2 << 3 | reg0); /* ADD(reg0, reg2); */
605 jitCompA000_loadRegCacheEdx(&w);
607 #if (jitCompA0001_USE_R3F_IMM32 != 0)
610 if (reg0 == IA32_REG0_EAX){
611 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]), reg0); /* MOV([EBP+?], reg0); */
613 if (src[1] != src[6]) {
614 for (i = 4; i < 32; i += 4) {
615 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[6]) + i); /* MOV(EAX, [EBP+?]); */
616 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + i, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
622 case 0x0f: /* PDIF */ /* 未完成 */
623 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
624 jitCompA000_storePRegCacheAll(&w); // 手抜き.
625 jitCompA0001_checkCompPtr(&w, src[6], src[7]);
626 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, PRegOffset(src[6])); /* MOV(reg0, [EBP+?]); */
627 jitCompPutByte1(w.dst, 0x2b); /* SUB(EAX, [EBP+?]); */
628 jitCompPutModRM_Disp_BaseEBP(&w, PRegOffset(src[7]) + 0, reg0);
629 i = jitCompA000_convTyp(jitCompGetImm32(src + 2));
631 if (0x0002 <= i && i <= 0x0007){
632 j = (i - 0x0002) >> 1;
635 w.err = JITC_ERR_BADTYPE;
639 jitCompPutByte3(w.dst, 0xc1, 0xf8 | reg0, j); /* SAR(reg0,?); */
641 if (reg0 == IA32_REG0_EAX){
642 jitCompA0001_movRxxEax(&w, src[1]);
655 w.err = JITC_ERR_REGNUM;
657 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
658 reg1 = jitCompA000_selectRegCache(src[2], -1 /* mem */);
659 #if (jitCompA0001_USE_R3F_IMM32 != 0)
660 if (src[2] == 0x3f) { // SUBのみ該当.
662 w.err = JITC_ERR_REGNUM;
664 reg2 = jitCompA000_selectRegCache(src[3], -1 /* mem */);
666 jitCompA000_storeRegCacheAll(&w);
668 jitCompPutByte1(w.dst, 0xb8 | reg0); /* MOV(reg0, ?); */
669 jitCompPutImm32(w.dst, w.r3f);
670 jitCompPutByte1(w.dst, 0x2b);
671 jitCompPutModRM_Disp_BaseEBP(&w, src[3] * 4, reg0);
673 jitCompA0001_movRxxEax(&w, src[1]);
679 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, src[2] * 4); /* MOV(reg0, [EBP+?]); */
681 if (reg1 >= 0 && reg0 != reg1) {
682 jitCompPutByte2(w.dst, 0x89, 0xc0 | reg1 << 3 | reg0); /* MOV(reg0, reg1); */
684 if (!(src[0] == 0x10 && src[3] == 0xff)) {
685 // bugfix: hinted by Iris, 2013.06.26. thanks!
695 if (!(src[0] == 0x10 && src[3] == 0xff)) {
696 #if (jitCompA0001_USE_R3F_IMM32 != 0)
697 if (src[3] == 0x3f) {
698 if (*src == 0x16 && w.r3f == -1) {
699 jitCompPutByte2(w.dst, 0xf7, 0xd8 | reg0); /* NEG(reg0); */
701 jitCompA0001_movRxxEax(&w, src[1]);
705 #if (jitCompA0001_USE_R3F_INCDEC != 0)
706 if ((*src == 0x14 && w.r3f == 1) || (*src == 0x15 && w.r3f == -1)) {
707 jitCompPutByte1(w.dst, 0x40 | reg0); /* INC(reg0); */
709 jitCompA0001_movRxxEax(&w, src[1]);
713 if ((*src == 0x15 && w.r3f == 1) || (*src == 0x14 && w.r3f == -1)) {
714 jitCompPutByte1(w.dst, 0x48 | reg0); /* DEC(reg0); */
716 jitCompA0001_movRxxEax(&w, src[1]);
721 #if (jitCompA0001_USE_R3F_IMM8 != 0)
722 if (-0x80 <= w.r3f && w.r3f <= 0x7f) {
724 static unsigned char basic_op_table_im8[] = { 0xc8, 0xf0, 0xe0, 0, 0xc0, 0xe8 };
725 jitCompPutByte3(w.dst, 0x83, basic_op_table_im8[*src - 0x10] | reg0, w.r3f & 0xff);
727 jitCompPutByte3(w.dst, 0x6b, 0xc0 | reg0 << 3 | reg0, w.r3f & 0xff);
730 jitCompA0001_movRxxEax(&w, src[1]);
735 if (reg0 == IA32_REG0_EAX) {
736 static unsigned char basic_op_table_im32_eax[] = { 0x0d, 0x35, 0x25, 0, 0x05, 0x2d, 0xc0 };
738 jitCompPutByte1(w.dst, 0x69);
740 jitCompPutByte1(w.dst, basic_op_table_im32_eax[*src - 0x10]);
743 static unsigned char basic_op_table_im32_reg[] = { 0xc8, 0xf0, 0xe0, 0, 0xc0, 0xe8 };
744 jitCompPutByte2(w.dst, 0x81, basic_op_table_im32_reg[*src - 0x10] | reg0);
747 jitCompPutByte2(w.dst, 0x69, 0xc0 | reg0 << 3 | reg0);
750 jitCompPutImm32(w.dst, w.r3f);
752 jitCompA0001_movRxxEax(&w, src[1]);
757 reg1 = jitCompA000_selectRegCache(src[3], -1 /* mem */);
759 w.err = JITC_ERR_REGNUM;
763 static unsigned char basic_op_table_rr[] = { 0x09, 0x31, 0x21, 0, 0x01, 0x29 }; /* op(reg,reg); */
764 jitCompPutByte2(w.dst, basic_op_table_rr[*src - 0x10], 0xc0 | reg1 << 3 | reg0);
766 static unsigned char basic_op_table_rm[] = { 0x0b, 0x33, 0x23, 0, 0x03, 0x2b, 0xaf }; /* op(reg,mem); */
767 jitCompPutByte1(w.dst, basic_op_table_rm[*src - 0x10]);
768 jitCompPutModRM_Disp_BaseEBP(&w, src[3] * 4, reg0);
772 jitCompPutByte3(w.dst, 0x0f, 0xaf, 0xc0 | reg0 << 3 | reg1);
774 jitCompPutByte2(w.dst, 0x0f, 0xaf);
775 jitCompPutModRM_Disp_BaseEBP(&w, src[3] * 4, reg0);
780 jitCompA0001_movRxxEax(&w, src[1]);
787 w.err = JITC_ERR_REGNUM;
790 w.err = JITC_ERR_REGNUM;
792 #if (jitCompA0001_USE_R3F_IMM32 != 0)
793 if (src[3] == 0x3f) {
794 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
795 reg1 = jitCompA000_selectRegCache(src[2], -1 /* mem */);
797 w.err = JITC_ERR_REGNUM;
800 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, src[2] * 4); /* MOV(reg1, [EBP+?]); */
803 jitCompPutByte2(w.dst, 0x89, 0xc0 | reg1 << 3 | reg0); /* MOV(reg0, reg1); */
807 /* SHL(reg0, im8); */
808 jitCompPutByte3(w.dst, 0xc1, 0xe0 | reg0, w.r3f);
811 /* SAR(reg0, im8); */
812 jitCompPutByte3(w.dst, 0xc1, 0xf8 | reg0, w.r3f);
814 if (reg0 == IA32_REG0_EAX){
815 jitCompA0001_movRxxEax(&w, src[1]);
822 jitCompA000_storeRegCacheAll(&w); // 手抜き.
823 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG1_ECX, src[3] * 4); /* MOV(ECX, [EBP+?]); */
824 #if (jitCompA0001_USE_R3F_IMM32 != 0)
825 if (src[2] == 0x3f) {
826 jitCompPutByte1(w.dst, 0xb8); /* MOV(EAX, ?); */
827 jitCompPutImm32(w.dst, w.r3f);
829 jitCompA0001_movEaxRxx(&w, src[2]);
832 jitCompA0001_movEaxRxx(&w, src[2]);
836 jitCompPutByte2(w.dst, 0xd3, 0xe0);
840 jitCompPutByte2(w.dst, 0xd3, 0xf8);
842 jitCompA0001_movRxxEax(&w, src[1]);
843 jitCompA000_loadRegCacheAll(&w); // 手抜き.
850 if (src[1] >= 0x3f || src[2] >= 0x40 || src[3] >= 0x40){
851 w.err = JITC_ERR_REGNUM;
853 jitCompA000_storeRegCacheAll(&w); // 手抜き.
854 #if (jitCompA0001_USE_R3F_IMM32 != 0)
855 if (src[3] == 0x3f) {
856 jitCompPutByte1(w.dst, 0xb8 | 1); /* MOV(ECX, ?); */
857 jitCompPutImm32(w.dst, w.r3f);
859 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG1_ECX, src[3] * 4); /* MOV(ECX, [EBP+?]); */
861 if (src[2] == 0x3f) {
862 jitCompPutByte1(w.dst, 0xb8 | 0); /* MOV(EAX, ?); */
863 jitCompPutImm32(w.dst, w.r3f);
865 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, src[2] * 4); /* MOV(EAX, [EBP+?]); */
868 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG1_ECX, src[3] * 4); /* MOV(ECX, [EBP+?]); */
869 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, src[2] * 4); /* MOV(EAX, [EBP+?]); */
871 jitCompPutByte1(w.dst, 0x99); /* CDQ(); */
872 /* ECXがゼロではないことを確認すべき */
873 jitCompPutByte2(w.dst, 0xf7, 0xf9); /* IDIV(ECX); */
875 jitCompPutOp_MOV_EBPDisp_GReg(&w, src[1] * 4, IA32_REG0_EAX);
878 jitCompPutOp_MOV_EBPDisp_GReg(&w, src[1] * 4, IA32_REG2_EDX);
880 jitCompA000_loadRegCacheAll(&w); // 手抜き.
884 case 0x1c: /* PLMT0 */
885 case 0x1d: /* PLMT1 */
886 if (src[1] >= 0x40 || src[2] >= 0x40){
887 w.err = JITC_ERR_PREGNUM;
889 if (level < JITC_LV_FASTEST) {
891 if (level < JITC_LV_FASTER) {
893 // plsとliveSignが一致していることを確認.
895 // preg1はp0 <= p <= p1 を満たしているか?.
896 // 新しいp0/p1は古いp0~p1に適合しているか?.
901 case 0x1e: /* PCP */ /* 未完成(p1まで完成) */
902 if (src[1] >= 0x40 || src[2] >= 0x40){
903 w.err = JITC_ERR_PREGNUM;
906 w.err = JITC_ERR_PREGNUM;
908 if (src[1] != 0x3f) {
909 /* src[2] == 0xff の場合に対応できてない */
910 jitCompA000_storePRegCacheAll(&w); // 手抜き.
911 for (i = 0; i < 32; i += 4) {
912 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[2]) + i); /* MOV(EAX, [EBP+?]); */
913 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + i, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
915 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
917 if (level < JITC_LV_FASTER) {
918 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[2]) + 4); /* MOV(EAX, [EBP+?]); */ /* typ */
919 jitCompPutByte3(w.dst, 0x83, 0xf8, 0); /* CMP(EAX, 0); */
920 jitCompPutByte2(w.dst, 0x0f, 0x85); /* JNE */
921 jitCompPutImm32(w.dst, errfnc - (w.dst + 4));
922 /* セキュリティチェックが足りてない!(aliveとか) */
924 reg0 = IA32_REG0_EAX;
925 jitCompA000_storePRegCacheAll(&w); // 手抜き.
926 jitCompPutOp_MOV_GReg_EBPDisp(&w, reg0, PRegOffset(src[2]) + 0); /* MOV(EAX, [EBP+?]); */
927 if (level < JITC_LV_FASTER) {
928 jitCompPutByte1(w.dst, 0x3b); /* CMP(reg0, [EBP+?]); */
929 jitCompPutModRM_Disp_BaseEBP(&w, PRegOffset(src[2]) + 8, reg0); /* p0 */
930 jitCompPutByte2(w.dst, 0x0f, 0x85); /* JNE */
931 jitCompPutImm32(w.dst, errfnc - (w.dst + 4));
933 jitCompPutByte2(w.dst, 0xff, 0xe0); /* JMP(EAX); */
937 case 0x1f: /* PCST */
938 if (jitCompGetImm32(src + 2) == 0) {
939 if (level < JITC_LV_FASTER){
940 jitCompA0001_checkType0(&w, src[6], jitCompGetImm32(src + 7), 2);
942 jitCompA000_storePRegCacheAll(&w); // 手抜き.
943 for (i = 0; i < 32 - 4; i += 4) {
944 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[6]) + i); /* MOV(EAX, [EBP+?]); */
946 jitCompPutByte1(w.dst, 0x0d); /* OR(EAX, ?); */
947 jitCompPutImm32(w.dst, 0x80000000);
949 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + i, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
951 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, debugInfo1);
952 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 28, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
953 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
957 if (jitCompGetImm32(src + 7) == 0) {
958 jitCompA000_storePRegCacheAll(&w); // 手抜き.
959 for (i = 0; i < 32 - 4; i += 4) {
960 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[6]) + i); /* MOV(EAX, [EBP+?]); */
962 jitCompPutByte1(w.dst, 0x25); /* AND(EAX, ?); */
963 jitCompPutImm32(w.dst, 0x7fffffff);
965 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + i, IA32_REG0_EAX); /* MOV([EBP+?], EAX); */
967 if (level < JITC_LV_FASTER) {
968 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[6]) + 28); /* MOV(EAX, [EBP+?]); */
969 jitCompPutByte1(w.dst, 0x3d); /* CMP(EAX, ?); */
970 jitCompPutImm32(w.dst, debugInfo1);
971 jitCompPutByte2(w.dst, 0x74, 8); /* JE */
972 jitCompPutOp_MOV_EAX_ZERO(w.dst);
973 jitCompPutOp_MOV_EBPDisp_GReg(&w, PRegOffset(src[1]) + 0, IA32_REG0_EAX); /* MOV([EBP+?], EAX); (1+1+4) */
975 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
979 w.err = JITC_ERR_OPECODE;
982 case 0x20: /* CMPE */
983 case 0x21: /* CMPNE */
984 case 0x22: /* CMPL */
985 case 0x23: /* CMPGE */
986 case 0x24: /* CMPLE */
987 case 0x25: /* CMPG */
988 case 0x26: /* TSTZ */
989 case 0x27: /* TSTNZ */
990 reg0 = jitCompA000_selectRegCache(src[2], IA32_REG0_EAX);
991 reg1 = jitCompA000_selectRegCache(src[3], -1 /* mem */);
992 if (src[1] == 0x3f) {
995 w.err = JITC_ERR_PREFIX;
998 if (src[4] != 0x04 || src[5] != 0x3f || src[6] != 0x03 || src[7] != 0x3f) {
999 w.err = JITC_ERR_IDIOM;
1004 jitCompA0001_movEaxRxx(&w, src[2]);
1005 #if (jitCompA0001_USE_R3F_IMM32 != 0)
1006 if (src[3] == 0x3f) {
1007 #if (jitCompA0001_OPTIMIZE_CMP != 0)
1008 if ((*src <= 0x25 && w.r3f == 0) || (*src >= 0x26 && w.r3f == -1)) {
1010 if (cmp0reg == src[2]) {
1011 if (cmp0lev >= 1 && (src[0] == 0x20 || src[0] == 0x21 || src[0] == 0x26 || src[0] == 0x27)){
1014 if (cmp0lev >= 2 && (src[0] == 0x22 || src[0] == 0x23 || src[0] == 0x24 || src[0] == 0x25)){
1019 jitCompPutByte2(w.dst, 0x85, 0xc0 | reg0 << 3 | reg0); /* TEST(reg0, reg0); */
1026 #if (jitCompA0001_USE_R3F_IMM8 != 0)
1027 if (-0x80 <= w.r3f && w.r3f <= 0x7f && *src <= 0x25) {
1028 jitCompPutByte3(w.dst, 0x83, 0xf8 | reg0, w.r3f);
1034 jitCompPutByte1(w.dst, 0x3d);
1037 jitCompPutByte1(w.dst, 0xa9);
1042 jitCompPutByte2(w.dst, 0x81, 0xf8 | reg0);
1045 jitCompPutByte2(w.dst, 0xf7, 0xc0 | reg0);
1048 jitCompPutImm32(w.dst, w.r3f);
1052 if (src[3] >= 0x40){
1053 w.err = JITC_ERR_PREGNUM;
1057 jitCompPutByte2(w.dst, 0x39, 0xc0 | reg1 << 3 | reg0);
1060 jitCompPutByte2(w.dst, 0x85, 0xc0 | reg1 << 3 | reg0);
1064 jitCompPutByte1(w.dst, 0x3b);
1067 jitCompPutByte1(w.dst, 0x85);
1069 jitCompPutModRM_Disp_BaseEBP(&w, src[3] * 4, reg0);
1075 static unsigned char cmpcc_table0[] = {
1076 0x04, 0x05, 0x0c, 0x0d, 0x0e, 0x0f, 0x04, 0x05, /* CMPcc, TSTcc */
1077 0x04, 0x05, 0x02, 0x03, 0x06, 0x07 /* PCMPcc */
1079 #if (jitCompA0001_USE_R3F_CMPJMP != 0)
1080 if (src[1] == 0x3f) {
1082 jitCompPutByte2(w.dst, 0x0f, 0x80 | cmpcc_table0[*src - 0x20]);
1084 i = jitCompGetLabelNum(&w, src + 2);
1085 if ((flags & JITC_PHASE1) != 0 && w.err != 0) {
1086 if (label[i].opt == 0) {
1087 w.err = JITC_ERR_LABELNODEF;
1090 // if (label[i].typ != 1) { w.err = JITC_ERR_LABELTYP; goto err_w; }
1093 if ((flags & JITC_PHASE1) != 0 || (((flags & JITC_PHASE1) == 0) && label[i].opt != 0)){
1094 j = label[i].p - (w.dst + 4);
1096 jitCompPutImm32(w.dst, j);
1097 #if (jitCompA0001_OPTIMIZE_JMP != 0)
1098 if (-128 - 4 <= j && j < 0) {
1101 jitCompPutByte2(w.dst, w.dst[1] ^ 0xf0, j & 0xff);
1112 reg0 = jitCompA000_selectRegCache(src[1], IA32_REG0_EAX);
1113 jitCompPutByte3(w.dst, 0x0f, 0x90 | cmpcc_table0[*src - 0x20], 0xc0 | reg0); /* SETcc(BYTE(reg0)); */
1114 jitCompPutByte3(w.dst, 0x0f, 0xb6, 0xc0 | reg0 << 3 | reg0); /* MOVZX(reg0, BYTE(reg0)); */
1115 jitCompPutByte2(w.dst, 0xf7, 0xd8 | reg0); /* NEG(reg0); */
1117 jitCompA0001_movRxxEax(&w, src[1]);
1123 case 0x28: /* PCMPE */
1124 case 0x29: /* PCMPNE */
1125 case 0x2a: /* PCMPL */
1126 case 0x2b: /* PCMPGE */
1127 case 0x2c: /* PCMPLE */
1128 case 0x2d: /* PCMPG */
1129 if (src[1] == 0x3f) {
1131 if (w.prefix != 0) {
1132 w.err = JITC_ERR_PREFIX;
1135 if (src[4] != 0x04 || src[5] != 0x3f || src[6] != 0x03 || src[7] != 0x3f) {
1136 w.err = JITC_ERR_IDIOM;
1140 if (src[2] >= 0x40) {
1141 w.err = JITC_ERR_PREGNUM;
1143 jitCompA000_storePRegCacheAll(&w); // 手抜き.
1144 if (src[3] != 0xff){
1145 jitCompA0001_checkCompPtr(&w, src[2], src[3]);
1147 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(src[2]) + 0); /* MOV(EAX, [EBP+?]); */
1148 if (src[3] != 0xff) {
1149 jitCompPutByte1(w.dst, 0x3b); /* CMP(EAX, [EBP+?]); */
1150 jitCompPutModRM_Disp_BaseEBP(&w, PRegOffset(src[3]) + 0, 0);
1152 /* ヌルポインタとの比較はこれでいいのか?たぶんよくない */
1153 jitCompPutByte3(w.dst, 0x83, 0xf8, 0x00); /* CMP(EAX, 0); */
1158 case 0x30: /* talloc(old:F4) */
1159 case 0x31: /* tfree(old:F5) */
1160 case 0x32: /* malloc(old:F6) */
1161 case 0x33: /* mfree(old:F7) */
1162 jitCompA000_storeRegCacheAll(&w); // 手抜き.
1163 jitCompA000_storePRegCacheAll(&w); // 手抜き.
1165 jitCompPutOp_PUSH_Imm8(w.dst, src[3]);
1166 jitCompPutOp_PUSH_Imm8(w.dst, src[2]);
1167 jitCompPutOp_PUSH_Imm8(w.dst, src[1]);
1168 jitCompPutOp_PUSH_GReg(w.dst, IA32_REG5_EBP);
1172 j = ((unsigned char *)&funcf4) - (w.dst + 1 + 4);
1175 j = ((unsigned char *)&funcf5) - (w.dst + 1 + 4);
1178 j = ((unsigned char *)&funcf6) - (w.dst + 1 + 4);
1181 j = ((unsigned char *)&funcf7) - (w.dst + 1 + 4);
1184 jitCompPutOp_CALL_Relative(w.dst, j);
1185 jitCompPutOp_ADD_GReg_Imm8(w.dst, IA32_REG4_ESP, 16);
1187 jitCompA000_loadRegCacheAll(&w); // 手抜き.
1188 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
1192 case 0x34: /* data (暫定) */
1194 // 34 typ32 len32 data...
1195 // len32 is NOT byte size!
1198 if (w.prefix != 0) {
1199 w.err = JITC_ERR_PREFIX;
1202 int k, tmpData, bitCount, dataWidth;
1204 k = jitCompGetImm32(&src[1]);
1205 dataWidth = jitCompA000_dataWidth(k);
1206 if (lastlabel >= 0 && label[lastlabel].typ == 0){
1208 label[lastlabel].typ = k;
1211 i = jitCompA000_convTyp(k);
1212 if (i < 2 || i > 7) {
1213 w.err = JITC_ERR_BADTYPE;
1218 j = jitCompGetImm32(&src[5]);
1228 // バイトコードを末端を超えて読もうとした
1229 w.err = JITC_ERR_SRC1;
1233 if (w.dst + 256 > dst1) {
1234 // 書き込み先の残り容量が256Bytesを切った
1235 w.err = JITC_ERR_DST1;
1240 for (k = 0; k < dataWidth; k++) {
1241 // dataWidthビットごとに切り出してtmpDataに入れる
1242 tmpData = tmpData << 1 | ((*src >> bitCount) & 1);
1249 if ((i & 1) == 0 && dataWidth <= 31 && (tmpData >> (dataWidth - 1)) != 0) {
1250 // 符号あり型で、かつtmpDataの符号ビットが1なので、マイナスにする
1251 tmpData -= 1 << dataWidth;
1253 if (i == 2 || i == 3) {
1255 jitCompPutByte1(w.dst, tmpData & 0xff);
1257 if (i == 4 || i == 5) {
1259 jitCompPutByte2(w.dst, tmpData & 0xff, (tmpData >> 8) & 0xff);
1261 if (i == 6 || i == 7) {
1263 jitCompPutByte4(w.dst, tmpData & 0xff, (tmpData >> 8) & 0xff, (tmpData >> 16) & 0xff, (tmpData >> 24) & 0xff);
1271 // バイトコードを末端を超えて読もうとした
1272 w.err = JITC_ERR_SRC1;
1276 if (w.dst + 256 > dst1) {
1277 // 書き込み先の残り容量が256Bytesを切った
1278 w.err = JITC_ERR_DST1;
1282 i = jitCompGetImm32(src);
1284 if ((flags & JITC_PHASE1) != 0 && w.err == 0) {
1286 if (label[i].opt == 0) {
1288 w.err = JITC_ERR_LABELNODEF;
1292 jitCompPutImm32(w.dst, (int)label[i].p);
1293 jitCompPutImm32(w.dst, label[i].typ);
1294 jitCompPutImm32(w.dst, (int)label[i].p);
1295 jitCompPutImm32(w.dst, (int)label[i].p1);
1296 jitCompPutImm32(w.dst, 0); /* liveSign */
1297 jitCompPutImm32(w.dst, envOffset_PTRCTRL); /* pls */
1298 jitCompPutImm32(w.dst, 0);
1299 jitCompPutImm32(w.dst, 0);
1303 if (lastlabel >= 0 && label[lastlabel].p1 < w.dst){
1304 label[lastlabel].p1 = w.dst;
1308 case 0x3c: /* ENTER */
1309 jitCompA000_storeRegCacheAll(&w); // 手抜き.
1310 jitCompA000_storePRegCacheAll(&w); // 手抜き.
1311 jitCompPutOp_PUSH_Imm8(w.dst, src[6]);
1312 jitCompPutOp_PUSH_Imm8(w.dst, src[5]);
1313 jitCompPutOp_PUSH_Imm8(w.dst, src[4] & 0x0f);
1314 jitCompPutOp_PUSH_Imm8(w.dst, (src[4] >> 4) & 0x0f);
1315 jitCompPutOp_PUSH_Imm8(w.dst, src[3]);
1316 jitCompPutOp_PUSH_Imm8(w.dst, src[2]);
1317 jitCompPutOp_PUSH_Imm8(w.dst, src[1]);
1318 jitCompPutOp_PUSH_GReg(w.dst, IA32_REG5_EBP);
1319 j = ((unsigned char *)&func3c) - (w.dst + 1 + 4);
1320 jitCompPutOp_CALL_Relative(w.dst, j)
1321 jitCompPutOp_ADD_GReg_Imm8(w.dst, IA32_REG4_ESP, 32);
1322 jitCompA000_loadRegCacheAll(&w); // 手抜き.
1323 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
1327 case 0x3d: /* LEAVE */
1328 jitCompA000_storeRegCacheAll(&w); // 手抜き.
1329 jitCompA000_storePRegCacheAll(&w); // 手抜き.
1330 jitCompPutOp_PUSH_Imm8(w.dst, src[6]);
1331 jitCompPutOp_PUSH_Imm8(w.dst, src[5]);
1332 jitCompPutOp_PUSH_Imm8(w.dst, src[4] & 0x0f);
1333 jitCompPutOp_PUSH_Imm8(w.dst, (src[4] >> 4) & 0x0f);
1334 jitCompPutOp_PUSH_Imm8(w.dst, src[3]);
1335 jitCompPutOp_PUSH_Imm8(w.dst, src[2]);
1336 jitCompPutOp_PUSH_Imm8(w.dst, src[1]);
1337 jitCompPutOp_PUSH_GReg(w.dst, IA32_REG5_EBP);
1338 j = ((unsigned char *)&func3d) - (w.dst + 1 + 4);
1339 jitCompPutOp_CALL_Relative(w.dst, j)
1340 jitCompPutOp_ADD_GReg_Imm8(w.dst, IA32_REG4_ESP, 32);
1341 jitCompA000_loadRegCacheAll(&w); // 手抜き.
1342 jitCompA000_loadPRegCacheAll(&w); // 手抜き.
1346 case 0xfe: /* remark */
1347 if (src[1] == 0x01 && src[2] == 0x00) {
1349 if (level <= JITC_LV_SLOWER) {
1350 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, debugInfo1);
1351 jitCompPutOp_MOV_EBPDisp_GReg(&w, envOffset_DBGINFO1, IA32_REG0_EAX);
1354 if (src[1] == 0x01 && src[2] == 0x03) {
1356 if (level <= JITC_LV_SLOWER) {
1357 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, -1);
1358 jitCompPutOp_MOV_EBPDisp_GReg(&w, envOffset_DBGINFO1, IA32_REG0_EAX);
1361 if (src[1] == 0x05 && src[2] == 0x00) {
1363 if (level <= JITC_LV_SLOWEST) {
1364 debugInfo0 = jitCompGetImm32(src + 3);
1365 jitCompPutOp_MOV_GReg_Imm32(w.dst, IA32_REG0_EAX, debugInfo0);
1366 jitCompPutOp_MOV_EBPDisp_GReg(&w, envOffset_DBGINFO0, IA32_REG0_EAX);
1372 w.err = JITC_ERR_OPECODE;
1378 jitCompA0001_fixPrefix(&w);
1383 if(*src != 0x00 && *src != 0x01 && *src != 0x34){
1384 DEBUGCode(&w, 315315);
1387 src += jitCompCmdLen(src);
1389 if (enter0 != NULL) {
1390 j = w.dst - (enter0 + 4);
1391 enter0[0] = j & 0xff;
1392 enter0[1] = (j >> 8) & 0xff;
1393 enter0[2] = (j >> 16) & 0xff;
1394 enter0[3] = (j >> 24) & 0xff;
1396 if ((flags & JITC_NOSTARTUP) == 0) {
1397 jitCompA000_storeRegCacheAll(&w);
1398 jitCompA000_storePRegCacheAll(&w);
1399 jitCompPutOp_POPAD(w.dst);
1401 if ((flags & JITC_PHASE1) != 0){
1402 return w.dst - dst00;
1407 if ((w.err & JITC_ERR_PHASE0ONLY) != 0) {
1408 if ((flags & JITC_PHASE1) == 0){
1409 w.err &= ~JITC_ERR_PHASE0ONLY;
1412 if (w.err == (JITC_ERR_MASK & JITC_ERR_REGNUM)) errmsg = "reg-number error";
1413 if (w.err == (JITC_ERR_MASK & JITC_ERR_DST1)) errmsg = "dst1 error";
1414 if (w.err == (JITC_ERR_MASK & JITC_ERR_OPECODE)) errmsg = "opecode error";
1415 if (w.err == (JITC_ERR_MASK & JITC_ERR_LABELNUM)) errmsg = "label number too large";
1416 if (w.err == (JITC_ERR_MASK & JITC_ERR_LABELREDEF)) errmsg = "label redefine";
1417 if (w.err == (JITC_ERR_MASK & JITC_ERR_PREFIX)) { errmsg = "prefix redefine"; w.dst -= 2; }
1418 if (w.err == (JITC_ERR_MASK & JITC_ERR_LABELNODEF)) errmsg = "label not defined";
1419 if (w.err == (JITC_ERR_MASK & JITC_ERR_LABELTYP)) errmsg = "label type error";
1420 if (w.err == (JITC_ERR_MASK & JITC_ERR_IDIOM)) errmsg = "idiom error";
1421 if (w.err == (JITC_ERR_MASK & JITC_ERR_PREGNUM)) errmsg = "preg-number error";
1422 if (w.err == (JITC_ERR_MASK & JITC_ERR_SRC1)) errmsg = "src1 error";
1423 if (w.err == (JITC_ERR_MASK & JITC_ERR_BADTYPE)) errmsg = "bad type code";
1424 if (w.err == (JITC_ERR_MASK & JITC_ERR_PREFIXFAR)) errmsg = "prefix internal error";
1425 if (w.err == (JITC_ERR_MASK & JITC_ERR_INTERNAL)) errmsg = "general internal error";
1426 if (*errmsg != '\0') {
1427 fprintf(stderr, "JITC: %s at %06X (debugInfo0=%d)\n ", errmsg, src - src0, debugInfo0);
1428 for (i = 0; i < 16; i++)
1429 fprintf(stderr, "%02X ", src[i]);
1430 static char *table[0x30] = {
1431 "NOP", "LB", "LIMM", "PLIMM", "CND", "??", "??", "??",
1432 "LMEM", "SMEM", "PLMEM", "PSMEM", "LEA", "??", "PADD", "PDIF",
1433 "CP/OR", "XOR", "AND", "??", "ADD", "SUB", "MUL", "??",
1434 "SHL", "SAR", "DIV", "MOD", "PLMT0", "PLMT1", "PCP", "PCST",
1435 "CMPE", "CMPNE", "CMPL", "CMPGE", "CMPLE", "CMPG", "TSTZ", "TSTNZ",
1436 "PCMPE", "PCMPNE", "PCMPL", "PCMPGE", "PCMPLE", "PCMPG", "??", "EXT" };
1438 if (*src < 0x30) errmsg = table[*src];
1439 fprintf(stderr, "(%s)\n", errmsg);
/*
 * jitCompCallFunc: writes an IA-32 code sequence at dst that calls `func`
 * with the current EBP value as its single stack argument, and then jumps
 * to the address loaded from [EBP + PRegOffset(0x30)].
 *
 * dst  : where the machine code is written.
 * func : address of the C function the emitted code will call.
 *
 * NOTE(review): the initialisation of w.dst and the return statement are
 * not visible in this view; presumably w.dst starts at dst and the updated
 * write position is returned (jitCompInit returns this function's result).
 */
1444 unsigned char *jitCompCallFunc(unsigned char *dst, void *func)
1446 // In the end, only w->dst is referenced inside this function.
1447 struct JitCompWork w;
// Emit the register-cache store sequences before the call
// (presumably writes cached registers back to the environment - confirm).
1449 jitCompA000_storeRegCacheAll(&w);
1450 jitCompA000_storePRegCacheAll(&w);
1451 jitCompPutOp_PUSHAD(w.dst);
1452 jitCompPutOp_PUSH_GReg(w.dst, IA32_REG0_EAX); /* for 16Byte-align(Mac OSX) */
// EBP is pushed last, so it is the argument seen by func.
1453 jitCompPutOp_PUSH_GReg(w.dst, IA32_REG5_EBP);
// Displacement relative to the end of the CALL instruction that is about
// to be emitted (presumably 1 opcode byte + 4 displacement bytes).
1455 int j = ((unsigned char *)func) - (w.dst + 1 + 4);
1456 jitCompPutOp_CALL_Relative(w.dst, j);
// First POP discards the pushed EBP argument; the second removes the pad.
1458 jitCompPutOp_POP_GReg(w.dst, IA32_REG0_EAX);
1459 jitCompPutOp_POP_GReg(w.dst, IA32_REG0_EAX); /* for 16Byte-align (Mac OSX) */
1460 jitCompPutOp_POPAD(w.dst);
1461 jitCompA000_loadRegCacheAll(&w);
1462 jitCompA000_loadPRegCacheAll(&w);
// Load EAX from the slot at PRegOffset(0x30) and jump through it.
1463 jitCompPutOp_MOV_GReg_EBPDisp(&w, IA32_REG0_EAX, PRegOffset(0x30) + 0);
1465 jitCompPutByte2(w.dst, 0xff, 0xe0); /* JMP(EAX); */
/*
 * jitCompInit: emits, at dst, the call sequence produced by
 * jitCompCallFunc() for the errHndl handler and returns that function's
 * result unchanged.
 */
1469 unsigned char *jitCompInit(unsigned char *dst)
1472 return jitCompCallFunc(dst, &errHndl);
/*
 * jitcRunBinary: invokes the code at `bin`, passing the address of `env`
 * advanced by jitCompA0001_EBP128 bytes. The helper functions in this file
 * subtract the same constant to recover the environment pointer.
 */
1475 void jitcRunBinary(void (*bin)(char *), HOSECPU_RuntimeEnvironment *env)
1477 (*bin)(((char *)env) + jitCompA0001_EBP128); /* shift EBP by jitCompA0001_EBP128 bytes in order to save size */
/*
 * func3c: runtime helper called by the code generated for opcode 0x3c
 * (ENTER). It reserves space on the junk stack, saves pointer registers
 * there, records a marker word, and then copies argument registers.
 *
 * ebp  : environment address biased by jitCompA0001_EBP128
 * opt  : stored in the marker word, shifted left by 16
 * r1   : number of integer-register slots reserved (r1 * 4 bytes)
 * p1   : number of pointer registers saved (p1 * 32 bytes)
 * lenR : how many integer registers are copied from ireg[0x30..] to ireg[r0..]
 * lenP : how many pointer registers are copied from preg[0x31..] to preg[p0..]
 * r0   : first destination index in ireg
 * p0   : first destination index in preg
 *
 * NOTE(review): several lines of the body (error handling, the body of the
 * first loop, and some junkStack adjustments) are not visible in this view.
 */
1481 void func3c(char *ebp, int opt, int r1, int p1, int lenR, int lenP, int r0, int p0)
1483 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
1485 HOSECPU_PointerRegisterEntry *pp;
// Require at least 2048 bytes between junkStack and junkStack1
// (the action taken on failure is not visible here).
1487 if (r->junkStack + 2048 > r->junkStack1) {
// Reserve r1 ints; presumably ireg[0..r1-1] are stored into pi[] - confirm.
1490 pi = (void *)r->junkStack;
1491 r->junkStack += r1 * 4;
1492 for (i = 0; i < r1; i++){
// Reserve p1 entries of 32 bytes each and save preg[0..p1-1] into them
// (32 is presumably the size of one pointer-register entry - confirm).
1495 pp = (void *)r->junkStack;
1496 r->junkStack += p1 * 32;
1497 for (i = 0; i < p1; i++){
1498 //pp[i] = r->preg[i];
1499 PRegCopy(&pp[i], &r->preg[i]);
// Save preg[0x30] at the current top of the junk stack.
1502 pp = (void *)r->junkStack;
1504 //*pp = r->preg[0x30];
1505 PRegCopy(pp, &r->preg[0x30]);
// Marker word packing opt, r1 and p1.
1507 pi = (void *)r->junkStack;
1509 *pi = opt << 16 | r1 << 8 | p1;
// Copy lenR integer registers starting at 0x30 down to r0.
1510 for (i = 0; i < lenR; i++){
1511 r->ireg[r0 + i] = r->ireg[0x30 + i];
// Copy lenP pointer registers starting at 0x31 down to p0.
1513 for (i = 0; i < lenP; i++){
1514 r->preg[p0 + i] = r->preg[0x31 + i];
/*
 * func3d: runtime helper called by the code generated for opcode 0x3d
 * (LEAVE). It walks the junk stack downwards, restoring preg[0x30] and
 * preg[0..p1-1] from the saved copies, then steps back over r1 ints.
 *
 * Parameters have the same layout as func3c; only ebp, r1 and p1 are used
 * in the lines visible here.
 *
 * NOTE(review): some junkStack adjustments and the body of the final loop
 * are not visible in this view; presumably the loop restores ireg[i] from
 * pi[i] - confirm.
 */
1519 void func3d(char *ebp, int opt, int r1, int p1, int lenR, int lenP, int r0, int p0)
1521 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
1525 HOSECPU_PointerRegisterEntry *pp = (void *)r->junkStack;
// Restore preg[0x30] from the entry at pp.
1527 //r->preg[0x30] = *pp;
1528 PRegCopy(&r->preg[0x30], pp);
// Step back over p1 entries of 32 bytes and restore preg[0..p1-1].
1530 r->junkStack -= p1 * 32; pp = (void *)r->junkStack;
1531 for (i = 0; i < p1; i++){
1532 //r->preg[i] = pp[i];
1533 PRegCopy(&r->preg[i], &pp[i]);
// Step back over r1 ints.
1536 r->junkStack -= r1 * 4; int *pi = (void *)r->junkStack;
1537 for (i = 0; i < r1; i++){
/*
 * funcf4: runtime helper that carves a block out of the junk stack and
 * describes it in pointer register pxx.
 *
 * ebp : environment address biased by jitCompA0001_EBP128
 * pxx : index of the pointer register that receives the block
 * typ : index of the integer register holding the type code
 * len : index of the integer register holding the element count
 *
 * After the block, one int holding the block's byte size is written to the
 * junk stack (funcf5 reads that int back to release the block).
 *
 * NOTE(review): the bodies of both error checks and of the final loop are
 * not visible in this view.
 */
1543 void funcf4(char *ebp, int pxx, int typ, int len)
1545 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
// Element width; the >> 3 presumably converts bits to bytes - confirm.
1546 int width = jitCompA000_dataWidth(jitCompA000_convTyp(r->ireg[typ])) >> 3;
1547 if (width < 0 || r->ireg[len] < 0){
1550 void *p = r->junkStack;
// Keep 256 bytes of headroom below junkStack1.
1551 if (r->junkStack + width * r->ireg[len] + 256 > r->junkStack1){
1554 r->junkStack += width * r->ireg[len];
// p0 is the start of the block, p1 the first byte past it.
1556 r->preg[pxx].typ = r->ireg[typ];
1557 r->preg[pxx].p0 = p;
1558 r->preg[pxx].p1 = (void *)r->junkStack;
// Record the block size in bytes directly after the block.
1559 int *pi = (int *)r->junkStack;
1560 *pi = width * r->ireg[len];
1561 r->junkStack += sizeof (int);
// Extra pass for type code 1 (named "T_VPTR" in the debugger's type table);
// i1 is the block size divided by 4.
1562 if (r->ireg[typ] == 1) {
1563 int i, i1 = (width * r->ireg[len]) >> 2;
1565 for (i = 0; i < i1; i++){
/*
 * funcf5: runtime helper that releases the most recent junk-stack block.
 * It steps back over the int size record and then over the number of bytes
 * stored in that record (the layout written by funcf4).
 *
 * ebp : environment address biased by jitCompA0001_EBP128
 * pxx, typ, len : register indices, same meaning as in funcf4
 *
 * NOTE(review): the three statements after the first release compute a
 * width WITHOUT jitCompA000_convTyp() or ">> 3" and move junkStack back a
 * second time. Lines are missing from this view, so it cannot be seen
 * whether they are conditionally compiled out - confirm before relying on them.
 */
1572 void funcf5(char *ebp, int pxx, int typ, int len)
1575 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
// Step back to the size record, then release that many bytes.
1576 r->junkStack -= sizeof (int);
1577 int *pi = (int *)r->junkStack;
1578 r->junkStack -= *pi;
1580 int width = jitCompA000_dataWidth(r->ireg[typ]);
1581 void *p = r->junkStack;
1582 r->junkStack -= width * r->ireg[len];
/*
 * funcf6: runtime helper that allocates a block with malloc() and
 * describes it in pointer register pxx.
 *
 * ebp : environment address biased by jitCompA0001_EBP128
 * pxx : index of the pointer register that receives the block
 * typ : index of the integer register holding the type code
 * len : index of the integer register holding the element count
 *
 * NOTE(review): no check of the malloc() result is visible in this view,
 * and the bodies of the error check and of both loops are not shown.
 */
1587 void funcf6(char *ebp, int pxx, int typ, int len)
1589 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
// Element width; the >> 3 presumably converts bits to bytes - confirm.
1590 int width = jitCompA000_dataWidth(jitCompA000_convTyp(r->ireg[typ])) >> 3;
1591 if (width < 0 || r->ireg[len] < 0){
1594 void *p = malloc(width * r->ireg[len]);
// p0 is the start of the block, p1 the first byte past it.
1596 r->preg[pxx].typ = r->ireg[typ];
1597 r->preg[pxx].p0 = p;
1598 r->preg[pxx].p1 = (unsigned char *)p + width * r->ireg[len];
// Extra passes for type code 1 (named "T_VPTR" in the debugger's type table);
// i1 is the block size divided by 4.
1599 if (r->ireg[typ] == 1) {
1600 int i, i1 = (width * r->ireg[len]) >> 2, *pi;
1602 for (i = 0; i < i1; i++){
// Second pass visits every 8th int starting at index 1.
1605 for (i = 1; i < i1; i += 8){
/*
 * funcf7: runtime helper that passes the pointer held in preg[pxx].p to
 * free().
 *
 * ebp : environment address biased by jitCompA0001_EBP128
 * pxx : index of the pointer register whose pointer is freed
 *
 * NOTE(review): funcf6 stores the malloc() result in .p0, while this
 * function frees .p - confirm that .p equals the allocation base here.
 */
1612 void funcf7(char *ebp, int pxx, int typ, int len)
1614 // typ and len are dummies and are not referenced
1615 HOSECPU_RuntimeEnvironment *r = (HOSECPU_RuntimeEnvironment *) (ebp - jitCompA0001_EBP128);
1616 free(r->preg[pxx].p);
/*
 * errHndl: handler whose address jitCompInit() passes to jitCompCallFunc().
 * The incoming pointer is biased by jitCompA0001_EBP128, so the first step
 * is to remove that bias.
 *
 * NOTE(review): the remainder of the body is not visible in this view.
 */
1620 void errHndl(HOSECPU_RuntimeEnvironment *r)
1622 r = (HOSECPU_RuntimeEnvironment *) (((char *)r) - jitCompA0001_EBP128);
1628 * jitcの出力コードをひとまとめにする関数を作成しその中身をjitCompile()で生成
1630 * qq : 出力バイナリの書き込み位置のアドレスへの参照(書き込み位置を呼び出しに反映させるため参照渡しにする)
1631 * q1 : 出力バイナリの書き込み位置のアドレスの最大値
1632 * p0 : (*.ose)バイナリの読み込み位置のアドレス(ヘッダ部除去済)
1633 * p1 : (*.ose)バイナリの読み込み位置の取りうる最大値
1634 * (ただし、「確保したメモリ」の最大値なのでこれより手前にゴミデータが入っているかもしれない)
1636 * ret=2 : jitコンパイルエラー
/*
 * jitc0: wraps the JIT output in a callable function. It emits a prologue
 * (PUSH EBP; MOV EBP,[ESP+8]), runs jitCompiler() over the input with
 * flags 0 and again with JITC_PHASE1, then emits an epilogue (POP EBP; RET).
 *
 * qq    : in/out pointer to the current output write position
 * q1    : upper limit passed to jitCompiler() for the output area
 * p0    : start of the input; its first two bytes must be 0x05 and SIGN1
 * p1    : upper limit passed to jitCompiler() for the input area
 * level : passed through to jitCompiler()
 * label : label table passed through to jitCompiler()
 *
 * NOTE(review): the return statements, the error handling after each
 * jitCompiler() call, the body of the label loop and the write-back to *qq
 * are not visible in this view.
 */
1638 int jitc0(unsigned char **qq, unsigned char *q1, const unsigned char *p0, const unsigned char *p1, int level, HOSECPU_LabelListTag *label)
1640 unsigned char *q = *qq;
1643 if (p0[0] != 0x05 || p0[1] != SIGN1){
1644 // Check the OSECPU header (05E1)
1648 jitCompPutOp_PUSH_GReg(q, IA32_REG5_EBP);
1650 *q++ = 0x8b; *q++ = 0x6c; *q++ = 0x24; *q++ = 0x08; /* MOV(EBP,[ESP+8]); */
// Loop over every label slot (body not visible; presumably resets it).
1652 for (i = 0; i < JITC_MAXLABELS; i++){
1656 // Wouldn't it be better to pass q1-2 as the second argument in the jitCompile() calls below?
// First call: flags = 0. Input starts after the 2-byte header.
1657 i = jitCompiler(q, q1, p0 + 2, p1, p0, label, JITC_MAXLABELS, level, di1_serial, 0);
// Second call: same arguments with JITC_PHASE1 set.
1661 i = jitCompiler(q, q1, p0 + 2, p1, p0, label, JITC_MAXLABELS, level, di1_serial, JITC_PHASE1 + 0);
1667 jitCompPutOp_POP_GReg(q, IA32_REG5_EBP);
1668 *q++ = 0xc3; /* RET(); */
1673 #if (USE_DEBUGGER != 0)
/*
 * dbgrGetRegNum: converts text at p into a register number for the
 * debugger. Two values, i and j, are each validated to lie in 0..15.
 *
 * NOTE(review): most of the body is not visible in this view. Presumably
 * i and j are two hexadecimal digits combined into one number, with an
 * out-of-range value on failure (callers accept 0..0x3f) - confirm.
 */
1675 int dbgrGetRegNum(const char *p)
// Adjustment that turns ('A' - '0') into 10, i.e. letter digits follow 9.
1682 i -= 'A' - '0' - 10;
1685 j -= 'A' - '0' - 10;
1687 if (0 <= i && i <= 15 && 0 <= j && j <= 15){
/*
 * dbgrMain: interactive debugger prompt. Reads a command line of up to 63
 * characters from stdin and handles:
 *   - an empty line,
 *   - "q",
 *   - "p" followed by a register name, which prints either an integer
 *     register (value in hex and decimal) or a pointer register (type,
 *     origin pointer, size and position in elements).
 * Anything else prints "command error".
 *
 * r : runtime environment whose ireg[] / preg[] are displayed.
 *
 * NOTE(review): many lines (loop structure, the actions for the empty line
 * and "q", the tests that choose between integer and pointer registers,
 * and any guard on j before the divisions) are not visible in this view.
 */
1694 void dbgrMain(HOSECPU_RuntimeEnvironment *r)
1704 p = fgets(cmd, 64, stdin);
1708 if (cmd[0] == '\0'){
1711 if (cmd[0] == 'q' && cmd[1] <= ' '){
// "p" must be followed by a whitespace/control character, not end of string.
1714 if (cmd[0] == 'p' && cmd[1] <= ' ' && cmd[1] != '\0') {
// Skip the separator characters before the register name.
1716 while (*p <= ' ' && *p != '\0'){
// Register number is parsed from the text after the first character.
1720 i = dbgrGetRegNum(p + 1);
1721 if (0 <= i && i <= 0x3f) {
1722 printf("R%02X = 0x%08X = %d\n", i, r->ireg[i], r->ireg[i]);
1724 puts("register name error");
1729 i = dbgrGetRegNum(p + 1);
1730 if (0 <= i && i <= 0x3f) {
// Type codes 0..0x15 have a printable name in the table below.
1732 if (0 <= r->preg[i].typ && r->preg[i].typ <= 0x15) {
1733 static char *typName[] = {
1734 "T_CODE", "T_VPTR", "T_SINT8", "T_UINT8",
1735 "T_SINT16", "T_UINT16", "T_SINT32", "T_UINT32",
1736 "T_SINT4", "T_UINT4", "T_SINT2", "T_UINT2",
1737 "T_SINT1", "T_UINT1", "T_SINT12", "T_UINT12",
1738 "T_SINT20", "T_UINT20", "T_SINT24", "T_UINT24",
1739 "T_SINT28", "T_UINT28"
1741 p = typName[r->preg[i].typ];
// NOTE(review): the pointer is cast to unsigned int for %08X, which
// assumes pointers fit in 32 bits.
1743 printf("P%02X:\n type = %s(%04X), (origin-ptr) = 0x%08X\n", i, p, r->preg[i].typ, (unsigned int)(r->preg[i].p0));
1744 if (r->preg[i].p != NULL && r->preg[i].p0 != NULL) {
// j = element width; the >> 3 presumably converts bits to bytes - confirm.
1745 j = jitCompA000_dataWidth(jitCompA000_convTyp(r->preg[i].typ)) >> 3;
// Size and current position, both expressed in elements of width j.
1749 k = (r->preg[i].p1 - r->preg[i].p0) / j;
1750 printf(" size = 0x%08X = %d\n", k, k);
1751 k = (r->preg[i].p - r->preg[i].p0) / j;
1752 printf(" pos = 0x%08X = %d\n", k, k);
1755 puts(" null pointer");
1759 puts("register name error");
1763 puts("command error");