1
Fork 0
mirror of https://git.savannah.gnu.org/git/guile.git synced 2025-05-02 21:10:27 +02:00
guile/lib/jit_x86.c
pcpa 712877a5a4 Correct implementation problems on ix86.
* check/all.tst, check/lightning.c: Only declare or use 64 bit
	interfaces on 64 bit builds.

	* check/fib.tst: Use simpler logic to not need preprocessor
	conditionals for 32 or 64 bit.

	* include/lightning.h: Only declare 64 bit macros on a 64 bit
	build. Code using lightning must know about wordsize and the
	jit generation limitations, also, this way it generates a
	compile time failure, not a runtime assertion.

	* include/lightning/jit_x86.h: Correct typo in macro name.

	* lib/jit_arm.c, lib/jit_arm-cpu.c, lib/jit_mips.c,
	lib/jit_mips-cpu.c, lib/jit_ppc.c, lib/jit_ppc-cpu.c,
	lib/jit_x86.c, lib/jit_x86-cpu.c: Correct wrong code to get
	current jit function pointer.

	* lib/lightning.c: Move call to the simplify() optimization
	to after register liveness is known. Previous code did work
	by accident but now with proper test cases the problem was
	noticed.

	* lib/jit_disasm.c: Always cast bfd_vma to long long when
	passing it as printf argument.
2012-12-03 09:40:08 -02:00

1700 lines
42 KiB
C

/*
* Copyright (C) 2012 Free Software Foundation, Inc.
*
* This is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This software is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* Authors:
* Paulo Cesar Pereira de Andrade
*/
#include <lightning.h>
#include <lightning/jit_private.h>
/* Shorthand for a register class flag: rc(gpr) expands to jit_class_gpr. */
#define rc(value) jit_class_##value
/* Map a JIT register id to the register number recorded in the spec of
 * the matching _rvs[] entry. */
#define rn(reg) (jit_regno(_rvs[jit_regno(reg)].spec))
/* stack_framesize is the initial value of a function's self.size (set in
 * _jit_prolog), i.e. the offset returned for the first stack passed
 * argument.
 * NOTE(review): presumably the return address plus the saved registers
 * pushed by the prolog -- confirm against jit_x86-cpu.c. */
#if __WORDSIZE == 32
# define stack_alignment 4
# define stack_framesize 20
#else
# define stack_alignment 8
# define stack_framesize 56
#endif
/*
* Prototypes
*/
/* Each helper is reached through a macro that supplies the implicit
 * `_jit' state argument, so call sites read as patch(word, node), etc. */
#define patch(instr, node) _patch(_jit, instr, node)
static void _patch(jit_state_t*,jit_word_t,jit_node_t*);
/* Moves between the SSE and x87 register files (float and double). */
#define sse_from_x87_f(r0, r1) _sse_from_x87_f(_jit, r0, r1)
static void _sse_from_x87_f(jit_state_t*,jit_int32_t,jit_int32_t);
#define sse_from_x87_d(r0, r1) _sse_from_x87_d(_jit, r0, r1)
static void _sse_from_x87_d(jit_state_t*,jit_int32_t,jit_int32_t);
#define x87_from_sse_f(r0, r1) _x87_from_sse_f(_jit, r0, r1)
static void _x87_from_sse_f(jit_state_t*,jit_int32_t,jit_int32_t);
#define x87_from_sse_d(r0, r1) _x87_from_sse_d(_jit, r0, r1)
static void _x87_from_sse_d(jit_state_t*,jit_int32_t,jit_int32_t);
/* The code generator sources are included directly with PROTO defined.
 * NOTE(review): presumably PROTO selects the declarations-only part of
 * each file -- confirm in jit_x86-cpu.c. */
#define PROTO 1
# include "jit_x86-cpu.c"
# include "jit_x86-sse.c"
# include "jit_x86-x87.c"
#undef PROTO
/*
* Initialization
*/
/* Host CPU feature flags; the fields are filled in by jit_get_cpu(). */
jit_cpu_t jit_cpu;
/*
 * Register description table.  Each entry pairs a spec (register class
 * flags built with rc(), or'ed with a register number) with the name of
 * the register.  The rn() macro reads the register number back from the
 * spec.
 *
 * The order of the entries matters: on 64 bit the argument handling code
 * in this file computes argument registers as `_RDI - n' and `_XMM0 - n',
 * which relies on the argument registers being listed in reverse argument
 * order, ending at %rdi and %xmm0.
 *
 * The final `_NOREG' entry is a sentinel; _jit_init() sets reglen to the
 * number of entries excluding it.
 */
jit_register_t _rvs[] = {
#if __WORDSIZE == 32
{ rc(gpr) | rc(rg8) | 0, "%eax" },
{ rc(gpr) | rc(rg8) | 1, "%ecx" },
{ rc(gpr) | rc(rg8) | 2, "%edx" },
{ rc(sav) | rc(rg8) | rc(gpr) | 3, "%ebx" },
{ rc(sav) | rc(gpr) | 6, "%esi" },
{ rc(sav) | rc(gpr) | 7, "%edi" },
{ rc(sav) | 4, "%esp" },
{ rc(sav) | 5, "%ebp" },
/* the xpr entries below have their spec cleared by _jit_init() when the
 * cpu lacks sse2 */
{ rc(xpr) | rc(fpr) | 0, "%xmm0" },
{ rc(xpr) | rc(fpr) | 1, "%xmm1" },
{ rc(xpr) | rc(fpr) | 2, "%xmm2" },
{ rc(xpr) | rc(fpr) | 3, "%xmm3" },
{ rc(xpr) | rc(fpr) | 4, "%xmm4" },
{ rc(xpr) | rc(fpr) | 5, "%xmm5" },
{ rc(xpr) | rc(fpr) | 6, "%xmm6" },
{ rc(xpr) | rc(fpr) | 7, "%xmm7" },
{ rc(fpr) | 0, "st(0)" },
{ rc(fpr) | 1, "st(1)" },
{ rc(fpr) | 2, "st(2)" },
{ rc(fpr) | 3, "st(3)" },
{ rc(fpr) | 4, "st(4)" },
{ rc(fpr) | 5, "st(5)" },
{ rc(fpr) | 6, "st(6)" },
{ rc(fpr) | 7, "st(7)" },
#else
/* %rax is a pseudo flag argument for varargs functions */
{ rc(arg) | rc(gpr) | rc(rg8) | 0, "%rax" },
{ rc(gpr) | rc(rg8) | 10, "%r10" },
{ rc(gpr) | rc(rg8) | 11, "%r11" },
{ rc(gpr) | rc(rg8) | 12, "%r12" },
{ rc(sav) | rc(rg8) | rc(gpr) | 3, "%rbx" },
{ rc(sav) | rc(rg8) | rc(gpr) | 13, "%r13" },
{ rc(sav) | rc(rg8) | rc(gpr) | 14, "%r14" },
{ rc(sav) | rc(rg8) | rc(gpr) | 15, "%r15" },
/* integer argument registers, last argument first */
{ rc(arg) | rc(rg8) | rc(gpr) | 9, "%r9" },
{ rc(arg) | rc(rg8) | rc(gpr) | 8, "%r8" },
{ rc(arg) | rc(rg8) | rc(gpr) | 1, "%rcx" },
{ rc(arg) | rc(rg8) | rc(gpr) | 2, "%rdx" },
{ rc(arg) | rc(rg8) | rc(gpr) | 6, "%rsi" },
{ rc(arg) | rc(rg8) | rc(gpr) | 7, "%rdi" },
{ rc(sav) | 4, "%rsp" },
{ rc(sav) | 5, "%rbp" },
{ rc(xpr) | rc(fpr) | 8, "%xmm8" },
{ rc(xpr) | rc(fpr) | 9, "%xmm9" },
{ rc(xpr) | rc(fpr) | 10, "%xmm10" },
{ rc(xpr) | rc(fpr) | 11, "%xmm11" },
{ rc(xpr) | rc(fpr) | 12, "%xmm12" },
{ rc(xpr) | rc(fpr) | 13, "%xmm13" },
{ rc(xpr) | rc(fpr) | 14, "%xmm14" },
{ rc(xpr) | rc(fpr) | 15, "%xmm15" },
/* float argument registers, last argument first */
{ rc(xpr) | rc(arg) | rc(fpr) | 7, "%xmm7" },
{ rc(xpr) | rc(arg) | rc(fpr) | 6, "%xmm6" },
{ rc(xpr) | rc(arg) | rc(fpr) | 5, "%xmm5" },
{ rc(xpr) | rc(arg) | rc(fpr) | 4, "%xmm4" },
{ rc(xpr) | rc(arg) | rc(fpr) | 3, "%xmm3" },
{ rc(xpr) | rc(arg) | rc(fpr) | 2, "%xmm2" },
{ rc(xpr) | rc(arg) | rc(fpr) | 1, "%xmm1" },
{ rc(xpr) | rc(arg) | rc(fpr) | 0, "%xmm0" },
{ rc(fpr) | 0, "st(0)" },
{ rc(fpr) | 1, "st(1)" },
{ rc(fpr) | 2, "st(2)" },
{ rc(fpr) | 3, "st(3)" },
{ rc(fpr) | 4, "st(4)" },
{ rc(fpr) | 5, "st(5)" },
{ rc(fpr) | 6, "st(6)" },
{ rc(fpr) | 7, "st(7)" },
#endif
/* sentinel, not counted in reglen */
{ _NOREG, "<none>" },
};
/*
* Implementation
*/
/*
 * Execute the CPUID instruction for `leaf' and store the four result
 * registers through the given pointers.
 *
 * The %ebx/%rbx register is not named as an output; it is swapped with a
 * compiler chosen scratch register around the instruction and restored
 * afterwards (it can be reserved by the compiler, e.g. as the PIC base on
 * ix86).  On 64 bit builds the swap must be done on the full 64 bit
 * register: a 32 bit `xchgl' zero extends its destinations and would
 * silently clear the upper half of the callee saved %rbx.
 */
static void
jit_cpuid_query(jit_uint32_t leaf, jit_uint32_t *eax, jit_uint32_t *ebx,
                jit_uint32_t *ecx, jit_uint32_t *edx)
{
#if __WORDSIZE == 32
    __asm__ volatile ("xchgl %%ebx, %1; cpuid; xchgl %%ebx, %1"
                      : "=a" (*eax), "=r" (*ebx),
                        "=c" (*ecx), "=d" (*edx)
                      : "0" (leaf));
#else
    __asm__ volatile ("xchgq %%rbx, %q1; cpuid; xchgq %%rbx, %q1"
                      : "=a" (*eax), "=&r" (*ebx),
                        "=c" (*ecx), "=d" (*edx)
                      : "0" (leaf));
#endif
}

/*
 * Probe the host processor and record the supported features in the
 * global `jit_cpu'.
 *
 * On 32 bit builds the availability of CPUID is tested first by trying
 * to toggle bits in the flags register; if bit 21 cannot be toggled the
 * function returns without touching `jit_cpu'.  Otherwise CPUID function
 * 1 is queried and selected %ecx/%edx bits are copied to `jit_cpu'.  On
 * 64 bit builds function 0x80000001 is queried as well and bit 0 of its
 * %ecx result is stored in `jit_cpu.lahf'.
 */
void
jit_get_cpu(void)
{
    /* bit layout of %ecx as returned by CPUID function 1 */
    union {
        struct {
            jit_uint32_t sse3         : 1;
            jit_uint32_t pclmulqdq    : 1;
            jit_uint32_t dtes64       : 1;  /* amd reserved */
            jit_uint32_t monitor      : 1;
            jit_uint32_t ds_cpl       : 1;  /* amd reserved */
            jit_uint32_t vmx          : 1;  /* amd reserved */
            jit_uint32_t smx          : 1;  /* amd reserved */
            jit_uint32_t est          : 1;  /* amd reserved */
            jit_uint32_t tm2          : 1;  /* amd reserved */
            jit_uint32_t ssse3        : 1;
            jit_uint32_t cntx_id      : 1;  /* amd reserved */
            jit_uint32_t __reserved0  : 1;
            jit_uint32_t fma          : 1;
            jit_uint32_t cmpxchg16b   : 1;
            jit_uint32_t xtpr         : 1;  /* amd reserved */
            jit_uint32_t pdcm         : 1;  /* amd reserved */
            jit_uint32_t __reserved1  : 1;
            jit_uint32_t pcid         : 1;  /* amd reserved */
            jit_uint32_t dca          : 1;  /* amd reserved */
            jit_uint32_t sse4_1       : 1;
            jit_uint32_t sse4_2       : 1;
            jit_uint32_t x2apic       : 1;  /* amd reserved */
            jit_uint32_t movbe        : 1;  /* amd reserved */
            jit_uint32_t popcnt       : 1;
            jit_uint32_t tsc          : 1;  /* amd reserved */
            jit_uint32_t aes          : 1;
            jit_uint32_t xsave        : 1;
            jit_uint32_t osxsave      : 1;
            jit_uint32_t avx          : 1;
            jit_uint32_t __reserved2  : 1;  /* amd F16C */
            jit_uint32_t __reserved3  : 1;
            jit_uint32_t __alwayszero : 1;  /* amd RAZ */
        } bits;
        jit_uint32_t cpuid;
    } ecx;
    /* bit layout of %edx as returned by CPUID function 1 */
    union {
        struct {
            jit_uint32_t fpu          : 1;
            jit_uint32_t vme          : 1;
            jit_uint32_t de           : 1;
            jit_uint32_t pse          : 1;
            jit_uint32_t tsc          : 1;
            jit_uint32_t msr          : 1;
            jit_uint32_t pae          : 1;
            jit_uint32_t mce          : 1;
            jit_uint32_t cmpxchg8b    : 1;
            jit_uint32_t apic         : 1;
            jit_uint32_t __reserved0  : 1;
            jit_uint32_t sep          : 1;
            jit_uint32_t mtrr         : 1;
            jit_uint32_t pge          : 1;
            jit_uint32_t mca          : 1;
            jit_uint32_t cmov         : 1;
            jit_uint32_t pat          : 1;
            jit_uint32_t pse36        : 1;
            jit_uint32_t psn          : 1;  /* amd reserved */
            jit_uint32_t clfsh        : 1;
            jit_uint32_t __reserved1  : 1;
            jit_uint32_t ds           : 1;  /* amd reserved */
            jit_uint32_t acpi         : 1;  /* amd reserved */
            jit_uint32_t mmx          : 1;
            jit_uint32_t fxsr         : 1;
            jit_uint32_t sse          : 1;
            jit_uint32_t sse2         : 1;
            jit_uint32_t ss           : 1;  /* amd reserved */
            jit_uint32_t htt          : 1;
            jit_uint32_t tm           : 1;  /* amd reserved */
            jit_uint32_t __reserved2  : 1;
            jit_uint32_t pbe          : 1;  /* amd reserved */
        } bits;
        jit_uint32_t cpuid;
    } edx;
#if __WORDSIZE == 32
    int ac, flags;
#endif
    jit_uint32_t eax, ebx;

#if __WORDSIZE == 32
    /* adapted from glibc __sysconf: flip bits 18 and 21 (0x240000) of the
     * flags register, read the flags back, and leave in `ac' the bits
     * that actually changed; the original flags are restored at the end */
    __asm__ volatile ("pushfl;\n\t"
                      "popl %0;\n\t"
                      "movl $0x240000, %1;\n\t"
                      "xorl %0, %1;\n\t"
                      "pushl %1;\n\t"
                      "popfl;\n\t"
                      "pushfl;\n\t"
                      "popl %1;\n\t"
                      "xorl %0, %1;\n\t"
                      "pushl %0;\n\t"
                      "popfl"
                      : "=r" (flags), "=r" (ac));

    /* i386 or i486 without cpuid */
    if ((ac & (1 << 21)) == 0)
        /* probably without x87 as well */
        return;
#endif

    /* query %eax = 1 function */
    jit_cpuid_query(1, &eax, &ebx, &ecx.cpuid, &edx.cpuid);

    jit_cpu.fpu        = edx.bits.fpu;
    jit_cpu.cmpxchg8b  = edx.bits.cmpxchg8b;
    jit_cpu.cmov       = edx.bits.cmov;
    jit_cpu.mmx        = edx.bits.mmx;
    jit_cpu.sse        = edx.bits.sse;
    jit_cpu.sse2       = edx.bits.sse2;
    jit_cpu.sse3       = ecx.bits.sse3;
    jit_cpu.pclmulqdq  = ecx.bits.pclmulqdq;
    jit_cpu.ssse3      = ecx.bits.ssse3;
    jit_cpu.fma        = ecx.bits.fma;
    jit_cpu.cmpxchg16b = ecx.bits.cmpxchg16b;
    jit_cpu.sse4_1     = ecx.bits.sse4_1;
    jit_cpu.sse4_2     = ecx.bits.sse4_2;
    jit_cpu.movbe      = ecx.bits.movbe;
    jit_cpu.popcnt     = ecx.bits.popcnt;
    jit_cpu.aes        = ecx.bits.aes;
    jit_cpu.avx        = ecx.bits.avx;

#if __WORDSIZE == 64
    /* query %eax = 0x80000001 function */
    jit_cpuid_query(0x80000001, &eax, &ebx, &ecx.cpuid, &edx.cpuid);
    jit_cpu.lahf = ecx.cpuid & 1;
#endif
}
/*
 * Initialize the per state register information.
 *
 * reglen is the number of entries of _rvs[] without the trailing
 * sentinel.  On 32 bit builds, when the cpu has no sse2, the spec of
 * every entry flagged jit_class_xpr is cleared.
 */
void
_jit_init(jit_state_t *_jit)
{
    _jit->reglen = jit_size(_rvs) - 1;
#if __WORDSIZE == 32
    if (!jit_cpu.sse2) {
        jit_int32_t index;

        /* the scan covers index reglen (the sentinel entry) as well */
        for (index = 0; index <= _jit->reglen; index++) {
            if (_rvs[index].spec & jit_class_xpr) {
                _rvs[index].spec = 0;
            }
        }
    }
#endif
}
/*
 * Start the definition of a new function.
 *
 * Any function still open is closed with jit_epilog() first.  A slot in
 * the functions vector is taken (the vector grows 16 entries at a time),
 * its frame bookkeeping is reset, and the prolog node is linked in.  The
 * epilog node is created here but only linked by _jit_epilog().
 */
void
_jit_prolog(jit_state_t *_jit)
{
    jit_int32_t         index;
    jit_function_t     *func;

    if (_jit->function) {
        jit_epilog();
    }
    assert(jit_regset_cmp_ui(_jit->regarg, 0) == 0);
    jit_regset_set_ui(_jit->regsav, 0);

    index = _jit->functions.offset;
    if (index >= _jit->functions.length) {
        /* grow the vector and zero the newly added entries */
        _jit->functions.ptr = realloc(_jit->functions.ptr,
                                      (_jit->functions.length + 16) *
                                      sizeof(jit_function_t));
        memset(_jit->functions.ptr + _jit->functions.length, 0,
               16 * sizeof(jit_function_t));
        _jit->functions.length += 16;
    }

    _jit->function = _jit->functions.ptr + _jit->functions.offset;
    _jit->functions.offset++;
    func = _jit->function;

    func->self.size = stack_framesize;
    func->self.argi = 0;
    func->self.argf = 0;
    func->self.alen = 0;
    /* sse/x87 conversion */
    func->self.aoff = -8;
    func->regoff = calloc(_jit->reglen, sizeof(jit_int32_t));

    func->prolog = jit_new_node_no_link(jit_code_prolog);
    jit_link(func->prolog);
    func->prolog->w.w = index;

    func->epilog = jit_new_node_no_link(jit_code_epilog);
    /* u: label value
     * v: offset in blocks vector
     * w: offset in functions vector
     */
    func->epilog->w.w = index;

    jit_regset_new(func->regset);
}
/*
 * Reserve `length' bytes in the frame of the current function and return
 * the offset of the reserved area (the updated, negative going
 * self.aoff).
 *
 * Before reserving, the current offset is rounded down according to the
 * requested length: 2 bytes for length 2, 4 bytes for lengths 3 and 4,
 * 8 bytes for anything else except lengths 0 and 1, which get no
 * rounding.
 */
jit_int32_t
_jit_allocai(jit_state_t *_jit, jit_int32_t length)
{
    assert(_jit->function);

    if (length == 2) {
        _jit->function->self.aoff &= -2;
    }
    else if (length == 3 || length == 4) {
        _jit->function->self.aoff &= -4;
    }
    else if (length != 0 && length != 1) {
        _jit->function->self.aoff &= -8;
    }

    _jit->function->self.aoff -= length;
    return (_jit->function->self.aoff);
}
/*
 * Return from the current function: emit an unconditional jump that is
 * patched to land on the function's epilog node.
 */
void
_jit_ret(jit_state_t *_jit)
{
    jit_node_t *jump;

    assert(_jit->function);

    /* jump to epilog */
    jump = jit_jmpi();
    jit_patch_at(jump, _jit->function->epilog);
}
/*
 * Return the value held in register `u': copy it to JIT_RET unless it is
 * already there, then return.
 */
void
_jit_retr(jit_state_t *_jit, jit_int32_t u)
{
    if (u != JIT_RET) {
        jit_movr(JIT_RET, u);
    }
    jit_ret();
}
/*
 * Return the immediate value `u': load it in JIT_RET, then return
 * through jit_ret().
 */
void
_jit_reti(jit_state_t *_jit, jit_word_t u)
{
jit_movi(JIT_RET, u);
jit_ret();
}
/*
 * Return the float held in register `u': copy it to JIT_FRET unless it
 * is already there, then return.
 */
void
_jit_retr_f(jit_state_t *_jit, jit_int32_t u)
{
    if (u != JIT_FRET) {
        jit_movr_f(JIT_FRET, u);
    }
    jit_ret();
}
/*
 * Return the immediate float `u': load it in JIT_FRET, then return
 * through jit_ret().
 */
void
_jit_reti_f(jit_state_t *_jit, jit_float32_t u)
{
jit_movi_f(JIT_FRET, u);
jit_ret();
}
/*
 * Return the double held in register `u': copy it to JIT_FRET unless it
 * is already there, then return.
 */
void
_jit_retr_d(jit_state_t *_jit, jit_int32_t u)
{
    if (u != JIT_FRET) {
        jit_movr_d(JIT_FRET, u);
    }
    jit_ret();
}
/*
 * Return the immediate double `u': load it in JIT_FRET, then return
 * through jit_ret().
 */
void
_jit_reti_d(jit_state_t *_jit, jit_float64_t u)
{
jit_movi_d(JIT_FRET, u);
jit_ret();
}
/*
 * Finish the definition of the current function.
 *
 * The stack size is computed from the outgoing argument area (self.alen)
 * plus the local area (-self.aoff), rounded up to a multiple of 16, plus
 * a word size dependent constant (12 on 32 bit, 8 otherwise).  The
 * epilog node created by _jit_prolog() is then linked and the state is
 * left with no current function.
 */
void
_jit_epilog(jit_state_t *_jit)
{
    assert(_jit->function);

    _jit->function->stack = ((_jit->function->self.alen -
                              _jit->function->self.aoff) + 15) & -16;
#if __WORDSIZE == 32
    _jit->function->stack += 12;
#else
    _jit->function->stack += 8;
#endif

    /* the epilog node must not have been linked yet */
    assert(_jit->function->epilog->next == NULL);
    jit_link(_jit->function->epilog);
    _jit->function = NULL;
}
/*
 * Declare the next integer argument of the current function.
 *
 * On 64 bit the first 6 arguments are identified by their index (0..5);
 * every other argument is identified by its offset in the frame, and
 * takes one word.
 */
jit_int32_t
_jit_arg(jit_state_t *_jit)
{
    jit_int32_t slot;

    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->self.argi < 6) {
        slot = _jit->function->self.argi;
        _jit->function->self.argi++;
        return (slot);
    }
#endif
    slot = _jit->function->self.size;
    _jit->function->self.size += sizeof(jit_word_t);
    return (slot);
}
/*
 * Tell whether the value returned by jit_arg() names a register
 * argument.  Never true on 32 bit; otherwise true for values 0..5.
 */
jit_bool_t
_jit_arg_reg_p(jit_state_t *_jit, jit_int32_t offset)
{
#if __WORDSIZE != 32
    if (offset >= 0 && offset < 6) {
        return (1);
    }
#endif
    return (0);
}
/*
 * Declare the next float argument of the current function.
 *
 * On 64 bit the first 8 float arguments are identified by their index
 * (0..7); every other argument is identified by its offset in the frame.
 *
 * Returns the argument index or frame offset, to be given to
 * jit_getarg_f().
 */
jit_int32_t
_jit_arg_f(jit_state_t *_jit)
{
    jit_int32_t offset;

    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->self.argf < 8)
        return (_jit->function->self.argf++);
#endif
    offset = _jit->function->self.size;
    /* A float passed on the stack takes a full word sized slot, the same
     * amount _jit_pushargr_f() advances by when storing one for a call.
     * Advancing by sizeof(jit_float32_t) is only right on 32 bit and
     * would misplace every following stack argument on 64 bit. */
    _jit->function->self.size += sizeof(jit_word_t);
    return (offset);
}
/*
 * Tell whether the value returned by jit_arg_f() names a register
 * argument.  Never true on 32 bit; otherwise true for values 0..7.
 */
jit_bool_t
_jit_arg_f_reg_p(jit_state_t *_jit, jit_int32_t offset)
{
#if __WORDSIZE != 32
    if (offset >= 0 && offset < 8) {
        return (1);
    }
#endif
    return (0);
}
/*
 * Declare the next double argument of the current function.
 *
 * On 64 bit this is the same as declaring a float argument.  Otherwise
 * the argument lives in the frame and takes sizeof(jit_float64_t) bytes.
 */
jit_int32_t
_jit_arg_d(jit_state_t *_jit)
{
#if __WORDSIZE != 64
    jit_int32_t slot;

    assert(_jit->function);
    slot = _jit->function->self.size;
    _jit->function->self.size += sizeof(jit_float64_t);
    return (slot);
#else
    return (jit_arg_f());
#endif
}
/*
 * Tell whether the value returned by jit_arg_d() names a register
 * argument; the answer is the one jit_arg_f_reg_p() gives.
 */
jit_bool_t
_jit_arg_d_reg_p(jit_state_t *_jit, jit_int32_t offset)
{
return (jit_arg_f_reg_p(offset));
}
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_c' variants: jit_extr_c from the argument register on 64 bit
 * when v < 6, jit_ldxi_c from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_c(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_c(u, _RDI - v);
        return;
    }
#endif
    jit_ldxi_c(u, _RBP, v);
}
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_uc' variants: jit_extr_uc from the argument register on 64 bit
 * when v < 6, jit_ldxi_uc from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_uc(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_uc(u, _RDI - v);
        return;
    }
#endif
    jit_ldxi_uc(u, _RBP, v);
}
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_s' variants: jit_extr_s from the argument register on 64 bit
 * when v < 6, jit_ldxi_s from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_s(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_s(u, _RDI - v);
        return;
    }
#endif
    jit_ldxi_s(u, _RBP, v);
}
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_us' variants: jit_extr_us from the argument register on 64 bit
 * when v < 6, jit_ldxi_us from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_us(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_us(u, _RDI - v);
        return;
    }
#endif
    jit_ldxi_us(u, _RBP, v);
}
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_i' variants: jit_extr_i from the argument register on 64 bit
 * when v < 6, jit_ldxi_i from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_i(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_i(u, _RDI - v);
        return;
    }
#endif
    jit_ldxi_i(u, _RBP, v);
}
#if __WORDSIZE == 64
/*
 * Fetch argument `v' (as returned by jit_arg()) into register `u' using
 * the `_ui' variants: jit_extr_ui from the argument register when
 * v < 6, jit_ldxi_ui from the frame (_RBP + v) otherwise.  Only built on
 * 64 bit.
 */
void
_jit_getarg_ui(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_extr_ui(u, _RDI - v);
        return;
    }
    jit_ldxi_ui(u, _RBP, v);
}
/*
 * Fetch word sized argument `v' (as returned by jit_arg()) into register
 * `u': a plain register move when v < 6, jit_ldxi_l from the frame
 * (_RBP + v) otherwise.  Only built on 64 bit.
 */
void
_jit_getarg_l(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
    /* argument index: registers are laid out downwards from _RDI */
    if (v < 6) {
        jit_movr(u, _RDI - v);
        return;
    }
    jit_ldxi_l(u, _RBP, v);
}
#endif
/*
 * Fetch float argument `v' (as returned by jit_arg_f()) into register
 * `u': a register move from the argument register on 64 bit when v < 8,
 * jit_ldxi_f from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_f(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _XMM0 */
    if (v < 8) {
        jit_movr_f(u, _XMM0 - v);
        return;
    }
#endif
    jit_ldxi_f(u, _RBP, v);
}
/*
 * Fetch double argument `v' (as returned by jit_arg_d()) into register
 * `u': a register move from the argument register on 64 bit when v < 8,
 * jit_ldxi_d from the frame (_RBP + v) otherwise.
 */
void
_jit_getarg_d(jit_state_t *_jit, jit_int32_t u, jit_int32_t v)
{
#if __WORDSIZE == 64
    /* argument index: registers are laid out downwards from _XMM0 */
    if (v < 8) {
        jit_movr_d(u, _XMM0 - v);
        return;
    }
#endif
    jit_ldxi_d(u, _RBP, v);
}
/*
 * Pass register `u' as the next integer argument of the call being
 * prepared.  On 64 bit the first 6 arguments go in registers; any other
 * argument is stored at the current offset of the outgoing area
 * (relative to _RSP), which then grows by one word.
 */
void
_jit_pushargr(jit_state_t *_jit, jit_int32_t u)
{
    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argi < 6) {
        jit_movr(_RDI - _jit->function->call.argi, u);
        _jit->function->call.argi++;
        return;
    }
#endif
    jit_stxi(_jit->function->call.size, _RSP, u);
    _jit->function->call.size += sizeof(jit_word_t);
}
/*
 * Pass the immediate `u' as the next integer argument of the call being
 * prepared.  On 64 bit the first 6 arguments are loaded straight in the
 * argument register; any other argument goes through a temporary
 * register and is stored in the outgoing area, which grows by one word.
 */
void
_jit_pushargi(jit_state_t *_jit, jit_word_t u)
{
    jit_int32_t scratch;

    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argi < 6) {
        jit_movi(_RDI - _jit->function->call.argi, u);
        _jit->function->call.argi++;
        return;
    }
#endif
    scratch = jit_get_reg(jit_class_gpr);
    jit_movi(scratch, u);
    jit_stxi(_jit->function->call.size, _RSP, scratch);
    _jit->function->call.size += sizeof(jit_word_t);
    jit_unget_reg(scratch);
}
/*
 * Pass float register `u' as the next float argument of the call being
 * prepared.  On 64 bit the first 8 float arguments go in registers; any
 * other argument is stored in the outgoing area, which grows by one
 * word.
 */
void
_jit_pushargr_f(jit_state_t *_jit, jit_int32_t u)
{
    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argf < 8) {
        jit_movr_f(_XMM0 - _jit->function->call.argf, u);
        _jit->function->call.argf++;
        return;
    }
#endif
    jit_stxi_f(_jit->function->call.size, _RSP, u);
    _jit->function->call.size += sizeof(jit_word_t);
}
/*
 * Pass the immediate float `u' as the next float argument of the call
 * being prepared.  On 64 bit the first 8 float arguments are loaded
 * straight in the argument register; any other argument goes through a
 * temporary float register and is stored in the outgoing area, which
 * grows by one word.
 */
void
_jit_pushargi_f(jit_state_t *_jit, jit_float32_t u)
{
    jit_int32_t scratch;

    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argf < 8) {
        jit_movi_f(_XMM0 - _jit->function->call.argf, u);
        _jit->function->call.argf++;
        return;
    }
#endif
    scratch = jit_get_reg(jit_class_fpr);
    jit_movi_f(scratch, u);
    jit_stxi_f(_jit->function->call.size, _RSP, scratch);
    _jit->function->call.size += sizeof(jit_word_t);
    jit_unget_reg(scratch);
}
/*
 * Pass double register `u' as the next float argument of the call being
 * prepared.  On 64 bit the first 8 float arguments go in registers; any
 * other argument is stored in the outgoing area, which grows by
 * sizeof(jit_float64_t).
 */
void
_jit_pushargr_d(jit_state_t *_jit, jit_int32_t u)
{
    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argf < 8) {
        jit_movr_d(_XMM0 - _jit->function->call.argf, u);
        _jit->function->call.argf++;
        return;
    }
#endif
    jit_stxi_d(_jit->function->call.size, _RSP, u);
    _jit->function->call.size += sizeof(jit_float64_t);
}
/*
 * Pass the immediate double `u' as the next float argument of the call
 * being prepared.  On 64 bit the first 8 float arguments are loaded
 * straight in the argument register; any other argument goes through a
 * temporary float register and is stored in the outgoing area, which
 * grows by sizeof(jit_float64_t).
 */
void
_jit_pushargi_d(jit_state_t *_jit, jit_float64_t u)
{
    jit_int32_t scratch;

    assert(_jit->function);
#if __WORDSIZE == 64
    if (_jit->function->call.argf < 8) {
        jit_movi_d(_XMM0 - _jit->function->call.argf, u);
        _jit->function->call.argf++;
        return;
    }
#endif
    scratch = jit_get_reg(jit_class_fpr);
    jit_movi_d(scratch, u);
    jit_stxi_d(_jit->function->call.size, _RSP, scratch);
    _jit->function->call.size += sizeof(jit_float64_t);
    jit_unget_reg(scratch);
}
/*
 * Tell whether register `regno' carries an argument of the call
 * described by `node'.
 *
 * Always false on 32 bit.  On 64 bit the register must be flagged
 * jit_class_arg; its position counted down from _RDI (integer) or _XMM0
 * (float) is then compared against node->v.w or node->w.w, the counts
 * stored in the call node by _jit_finishr().
 */
jit_bool_t
_jit_regarg_p(jit_state_t *_jit, jit_node_t *node, jit_int32_t regno)
{
#if __WORDSIZE == 64
    jit_int32_t klass;
    jit_int32_t index;

    klass = jit_class(_rvs[regno].spec);
    if (!(klass & jit_class_arg)) {
        return (0);
    }
    if (klass & jit_class_gpr) {
        index = _RDI - regno;
        return (index >= 0 && index < node->v.w);
    }
    if (klass & jit_class_fpr) {
        index = _XMM0 - regno;
        return (index >= 0 && index < node->w.w);
    }
#endif
    return (0);
}
/*
 * Finish the call being prepared by calling the address in register
 * `r0'.
 *
 * The outgoing argument area of the function is widened if this call
 * needs more room.  On 64 bit, for a varargs call, _RAX is loaded with
 * the count of float register arguments; if the target itself is in
 * _RAX it is first moved to a temporary register.  The integer and float
 * register argument counts are stored in the call node, and the call
 * bookkeeping is reset.
 */
void
_jit_finishr(jit_state_t *_jit, jit_int32_t r0)
{
    jit_node_t  *call;
    jit_int32_t  target = r0;

    assert(_jit->function);
    if (_jit->function->call.size > _jit->function->self.alen) {
        _jit->function->self.alen = _jit->function->call.size;
    }
#if __WORDSIZE == 64
    if (_jit->function->call.kind & jit_call_varargs) {
        if (jit_regno(target) == _RAX) {
            /* _RAX is about to be overwritten; call through a copy */
            target = jit_get_reg(jit_class_gpr);
            jit_movr(target, _RAX);
        }
        /* loads 0 when no float register argument was pushed */
        jit_movi(_RAX, _jit->function->call.argf);
        if (target != r0) {
            jit_unget_reg(target);
        }
    }
#endif
    call = jit_callr(target);
    call->v.w = _jit->function->call.argi;
    call->w.w = _jit->function->call.argf;

    _jit->function->call.size = 0;
    _jit->function->call.argf = 0;
    _jit->function->call.argi = 0;
}
/*
 * Finish the call being prepared by calling the address `i0'.
 *
 * On 64 bit the address is loaded in a temporary register and the call
 * is made through jit_finishr(); the returned node is the one that loads
 * the address.  For a varargs call _RAX is flagged in the regarg set
 * while this is done.  On 32 bit a direct call node is created, it
 * receives the register argument counts, and it is the node returned.
 */
jit_node_t *
_jit_finishi(jit_state_t *_jit, jit_pointer_t i0)
{
    jit_node_t  *result;
#if __WORDSIZE == 64
    jit_int32_t  scratch;
#endif

    assert(_jit->function);
    if (_jit->function->call.size > _jit->function->self.alen) {
        _jit->function->self.alen = _jit->function->call.size;
    }
#if __WORDSIZE == 64
    if (_jit->function->call.kind & jit_call_varargs) {
        jit_regset_setbit(_jit->regarg, _RAX);
    }
    scratch = jit_get_reg(jit_class_gpr);
    result = jit_movi(scratch, (jit_word_t)i0);
    jit_finishr(scratch);
    jit_unget_reg(scratch);
    if (_jit->function->call.kind & jit_call_varargs) {
        jit_regset_clrbit(_jit->regarg, _RAX);
    }
#else
    result = jit_calli(i0);
    result->v.w = _jit->function->call.argi;
    result->w.w = _jit->function->call.argf;
#endif
    _jit->function->call.size = 0;
    _jit->function->call.argf = 0;
    _jit->function->call.argi = 0;
    return (result);
}
/*
 * Fetch the result of the last call into register `r0', applying
 * jit_extr_c to the JIT_RET register.
 */
void
_jit_retval_c(jit_state_t *_jit, jit_int32_t r0)
{
jit_extr_c(r0, JIT_RET);
}
/*
 * Fetch the result of the last call into register `r0', applying
 * jit_extr_uc to the JIT_RET register.
 */
void
_jit_retval_uc(jit_state_t *_jit, jit_int32_t r0)
{
jit_extr_uc(r0, JIT_RET);
}
/*
 * Fetch the result of the last call into register `r0', applying
 * jit_extr_s to the JIT_RET register.
 */
void
_jit_retval_s(jit_state_t *_jit, jit_int32_t r0)
{
jit_extr_s(r0, JIT_RET);
}
/*
 * Fetch the result of the last call into register `r0', applying
 * jit_extr_us to the JIT_RET register.
 */
void
_jit_retval_us(jit_state_t *_jit, jit_int32_t r0)
{
jit_extr_us(r0, JIT_RET);
}
/*
 * Fetch the result of the last call into register `r0'.  On 32 bit this
 * is a plain move from JIT_RET, skipped when `r0' is JIT_RET; otherwise
 * jit_extr_i is applied to JIT_RET.
 */
void
_jit_retval_i(jit_state_t *_jit, jit_int32_t r0)
{
#if __WORDSIZE == 32
    if (JIT_RET != r0) {
        jit_movr(r0, JIT_RET);
    }
#else
    jit_extr_i(r0, JIT_RET);
#endif
}
#if __WORDSIZE == 64
/*
 * Fetch the result of the last call into register `r0', applying
 * jit_extr_ui to the JIT_RET register.  Only built on 64 bit.
 */
void
_jit_retval_ui(jit_state_t *_jit, jit_int32_t r0)
{
jit_extr_ui(r0, JIT_RET);
}
/*
 * Fetch the word sized result of the last call into register `r0': a
 * plain move from JIT_RET, skipped when `r0' is JIT_RET.  Only built on
 * 64 bit.
 */
void
_jit_retval_l(jit_state_t *_jit, jit_int32_t r0)
{
    if (JIT_RET != r0) {
        jit_movr(r0, JIT_RET);
    }
}
#endif
/*
 * Fetch the float result of the last call into register `r0'.  On 32 bit
 * a dedicated jit_code_retval_f node is created; otherwise the value is
 * moved from JIT_FRET unless `r0' is JIT_FRET.
 */
void
_jit_retval_f(jit_state_t *_jit, jit_int32_t r0)
{
#if __WORDSIZE != 32
    if (JIT_FRET != r0) {
        jit_movr_f(r0, JIT_FRET);
    }
#else
    jit_new_node_w(jit_code_retval_f, r0);
#endif
}
/*
 * Fetch the double result of the last call into register `r0'.  On 32
 * bit a dedicated jit_code_retval_d node is created; otherwise the value
 * is moved from JIT_FRET unless `r0' is JIT_FRET.
 */
void
_jit_retval_d(jit_state_t *_jit, jit_int32_t r0)
{
#if __WORDSIZE != 32
    if (JIT_FRET != r0) {
        jit_movr_d(r0, JIT_FRET);
    }
#else
    jit_new_node_w(jit_code_retval_d, r0);
#endif
}
jit_pointer_t
_jit_emit(jit_state_t *_jit)
{
jit_node_t *node;
jit_node_t *temp;
jit_word_t word;
jit_int32_t value;
jit_int32_t offset;
struct {
jit_node_t *node;
jit_word_t word;
jit_int32_t patch_offset;
} undo;
if (_jit->function)
jit_epilog();
jit_optimize();
_jit->emit = 1;
_jit->code.length = 16 * 1024 * 1024;
_jit->code.ptr = mmap(NULL, _jit->code.length,
PROT_EXEC | PROT_READ | PROT_WRITE,
MAP_PRIVATE | MAP_ANON, -1, 0);
assert(_jit->code.ptr != MAP_FAILED);
_jit->pc.uc = _jit->code.ptr;
/* clear jit_flag_patch from label nodes if reallocating buffer
* and starting over
*/
_jit->function = NULL;
jit_reglive_setup();
undo.word = 0;
undo.node = NULL;
undo.patch_offset = 0;
#define case_rr(name, type) \
case jit_code_##name##r##type: \
name##r##type(rn(node->u.w), rn(node->v.w)); \
break
#define case_rw(name, type) \
case jit_code_##name##i##type: \
name##i##type(rn(node->u.w), node->v.w); \
break
#define case_rf(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->v.w)) \
x87_##name##r##type(rn(node->u.w), rn(node->v.w)); \
else \
sse_##name##r##type(rn(node->u.w), rn(node->v.w)); \
break
#define case_fr(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->u.w)) \
x87_##name##r##type(rn(node->u.w), rn(node->v.w)); \
else \
sse_##name##r##type(rn(node->u.w), rn(node->v.w)); \
break
#define case_fw(name, type) \
case jit_code_##name##i##type: \
if (jit_x87_reg_p(node->u.w)) \
x87_##name##i##type(rn(node->u.w), node->v.w); \
else \
sse_##name##i##type(rn(node->u.w), node->v.w); \
break
#define case_wr(name, type) \
case jit_code_##name##i##type: \
name##i##type(node->u.w, rn(node->v.w)); \
break
#define case_wf(name, type) \
case jit_code_##name##i##type: \
if (jit_x87_reg_p(node->v.w)) \
x87_##name##i##type(node->u.w, rn(node->v.w)); \
else \
sse_##name##i##type(node->u.w, rn(node->v.w)); \
break
#define case_ff(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->u.w) && \
jit_x87_reg_p(node->v.w)) \
x87_##name##r##type(rn(node->u.w), rn(node->v.w)); \
else \
sse_##name##r##type(rn(node->u.w), rn(node->v.w)); \
break;
#define case_rrr(name, type) \
case jit_code_##name##r##type: \
name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
break
#define case_frr(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->u.w)) \
x87_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
else \
sse_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
break
#define case_rrf(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->u.w)) \
x87_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
else \
sse_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
break
#define case_rrw(name, type) \
case jit_code_##name##i##type: \
name##i##type(rn(node->u.w), rn(node->v.w), node->w.w); \
break
#define case_frw(name, type) \
case jit_code_##name##i##type: \
if (jit_x87_reg_p(node->u.w)) \
x87_##name##i##type(rn(node->u.w), \
rn(node->v.w), node->w.w); \
else \
sse_##name##i##type(rn(node->u.w), \
rn(node->v.w), node->w.w); \
break
#define case_wrr(name, type) \
case jit_code_##name##i##type: \
name##i##type(node->u.w, rn(node->v.w), rn(node->w.w)); \
break
#define case_wrf(name, type) \
case jit_code_##name##i##type: \
if (jit_x87_reg_p(node->w.w)) \
x87_##name##i##type(node->u.w, \
rn(node->v.w), rn(node->w.w)); \
else \
sse_##name##i##type(node->u.w, \
rn(node->v.w), rn(node->w.w)); \
break
#define case_brr(name, type) \
case jit_code_##name##r##type: \
temp = node->u.n; \
assert(temp->code == jit_code_label || \
temp->code == jit_code_epilog); \
if (temp->flag & jit_flag_patch) \
name##r##type(temp->u.w, rn(node->v.w), \
rn(node->w.w)); \
else { \
word = name##r##type(_jit->pc.w, \
rn(node->v.w), rn(node->w.w)); \
patch(word, node); \
} \
break
#define case_brw(name, type) \
case jit_code_##name##i##type: \
temp = node->u.n; \
assert(temp->code == jit_code_label || \
temp->code == jit_code_epilog); \
if (temp->flag & jit_flag_patch) \
name##i##type(temp->u.w, \
rn(node->v.w), node->w.w); \
else { \
word = name##i##type(_jit->pc.w, \
rn(node->v.w), node->w.w); \
patch(word, node); \
} \
break
#define case_rff(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->v.w) && \
jit_x87_reg_p(node->w.w)) \
x87_##name##r##type(rn(node->u.w), rn(node->v.w), \
rn(node->w.w)); \
else \
sse_##name##r##type(rn(node->u.w), rn(node->v.w), \
rn(node->w.w)); \
break;
#define case_rfw(name, type, size) \
case jit_code_##name##i##type: \
assert(node->flag & jit_flag_data); \
if (jit_x87_reg_p(node->v.w)) \
x87_##name##i##type(rn(node->u.w), rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
else \
sse_##name##i##type(rn(node->u.w), rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
break
#define case_fff(name, type) \
case jit_code_##name##r##type: \
if (jit_x87_reg_p(node->u.w) && \
jit_x87_reg_p(node->v.w) && \
jit_x87_reg_p(node->w.w)) \
x87_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
else \
sse_##name##r##type(rn(node->u.w), \
rn(node->v.w), rn(node->w.w)); \
break
#define case_ffw(name, type, size) \
case jit_code_##name##i##type: \
assert(node->flag & jit_flag_data); \
if (jit_x87_reg_p(node->u.w) && \
jit_x87_reg_p(node->v.w)) \
x87_##name##i##type(rn(node->u.w), rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
else \
sse_##name##i##type(rn(node->u.w), rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
break
#define case_bff(name, type) \
case jit_code_b##name##r##type: \
temp = node->u.n; \
assert(temp->code == jit_code_label || \
temp->code == jit_code_epilog); \
if (temp->flag & jit_flag_patch) { \
if (jit_x87_reg_p(node->v.w) && \
jit_x87_reg_p(node->w.w)) \
x87_b##name##r##type(temp->u.w, \
rn(node->v.w), rn(node->w.w)); \
else \
sse_b##name##r##type(temp->u.w, \
rn(node->v.w), rn(node->w.w)); \
} \
else { \
if (jit_x87_reg_p(node->v.w) && \
jit_x87_reg_p(node->w.w)) \
word = x87_b##name##r##type(_jit->pc.w, \
rn(node->v.w), rn(node->w.w)); \
else \
word = sse_b##name##r##type(_jit->pc.w, \
rn(node->v.w), rn(node->w.w)); \
patch(word, node); \
} \
break
#define case_bfw(name, type, size) \
case jit_code_b##name##i##type: \
temp = node->u.n; \
assert(temp->code == jit_code_label || \
temp->code == jit_code_epilog); \
if (temp->flag & jit_flag_patch) { \
if (jit_x87_reg_p(node->v.w)) \
x87_b##name##i##type(temp->u.w, \
rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
else \
sse_b##name##i##type(temp->u.w, \
rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
} \
else { \
if (jit_x87_reg_p(node->v.w)) \
word = x87_b##name##i##type(_jit->pc.w, \
rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
else \
word = sse_b##name##i##type(_jit->pc.w, \
rn(node->v.w), \
(jit_float##size##_t *)node->w.n->u.w); \
patch(word, node); \
} \
break
for (node = _jit->head; node; node = node->next) {
value = jit_classify(node->code);
jit_regarg_set(node, value);
switch (node->code) {
case jit_code_note:
node->u.w = _jit->pc.w;
break;
case jit_code_label:
if (node->link &&
(word = _jit->pc.w & (sizeof(jit_word_t) - 1)))
nop(sizeof(jit_word_t) - word);
/* remember label is defined */
node->flag |= jit_flag_patch;
node->u.w = _jit->pc.w;
break;
case_rrr(add,);
case_rrw(add,);
case_rrr(addx,);
case_rrw(addx,);
case_rrr(addc,);
case_rrw(addc,);
case_rrr(sub,);
case_rrw(sub,);
case_rrr(subx,);
case_rrw(subx,);
case_rrr(subc,);
case_rrw(subc,);
case_rrr(mul,);
case_rrw(mul,);
case_rrr(div,);
case_rrw(div,);
case_rrr(div, _u);
case_rrw(div, _u);
case_rrr(rem,);
case_rrw(rem,);
case_rrr(rem, _u);
case_rrw(rem, _u);
case_rrr(and,);
case_rrw(and,);
case_rrr(or,);
case_rrw(or,);
case_rrr(xor,);
case_rrw(xor,);
case_rrr(lsh,);
case_rrw(lsh,);
case_rrr(rsh,);
case_rrw(rsh,);
case_rrr(rsh, _u);
case_rrw(rsh, _u);
case_rr(neg,);
case_rr(com,);
case_rrr(lt,);
case_rrw(lt,);
case_rrr(lt, _u);
case_rrw(lt, _u);
case_rrr(le,);
case_rrw(le,);
case_rrr(le, _u);
case_rrw(le, _u);
case_rrr(eq,);
case_rrw(eq,);
case_rrr(ge,);
case_rrw(ge,);
case_rrr(ge, _u);
case_rrw(ge, _u);
case_rrr(gt,);
case_rrw(gt,);
case_rrr(gt, _u);
case_rrw(gt, _u);
case_rrr(ne,);
case_rrw(ne,);
case_rr(mov,);
case jit_code_movi:
if (node->flag & jit_flag_node) {
temp = node->v.n;
if (temp->code == jit_code_data ||
(temp->code == jit_code_label &&
(temp->flag & jit_flag_patch)))
movi(rn(node->u.w), temp->u.w);
else {
assert(temp->code == jit_code_label ||
temp->code == jit_code_epilog);
word = movi_p(rn(node->u.w), node->v.w);
patch(word, node);
}
}
else
movi(rn(node->u.w), node->v.w);
break;
case_rr(hton,);
case_rr(ext, _c);
case_rr(ext, _uc);
case_rr(ext, _s);
case_rr(ext, _us);
#if __WORDSIZE == 64
case_rr(ext, _i);
case_rr(ext, _ui);
#endif
case_rf(trunc, _f_i);
case_rf(trunc, _d_i);
#if __WORDSIZE == 64
case_rf(trunc, _f_l);
case_rf(trunc, _d_l);
#endif
case_rr(ld, _c);
case_rw(ld, _c);
case_rr(ld, _uc);
case_rw(ld, _uc);
case_rr(ld, _s);
case_rw(ld, _s);
case_rr(ld, _us);
case_rw(ld, _us);
case_rr(ld, _i);
case_rw(ld, _i);
#if __WORDSIZE == 64
case_rr(ld, _ui);
case_rw(ld, _ui);
case_rr(ld, _l);
case_rw(ld, _l);
#endif
case_rrr(ldx, _c);
case_rrw(ldx, _c);
case_rrr(ldx, _uc);
case_rrw(ldx, _uc);
case_rrr(ldx, _s);
case_rrw(ldx, _s);
case_rrr(ldx, _us);
case_rrw(ldx, _us);
case_rrr(ldx, _i);
case_rrw(ldx, _i);
#if __WORDSIZE == 64
case_rrr(ldx, _ui);
case_rrw(ldx, _ui);
case_rrr(ldx, _l);
case_rrw(ldx, _l);
#endif
case_rr(st, _c);
case_wr(st, _c);
case_rr(st, _s);
case_wr(st, _s);
case_rr(st, _i);
case_wr(st, _i);
#if __WORDSIZE == 64
case_rr(st, _l);
case_wr(st, _l);
#endif
case_rrr(stx, _c);
case_wrr(stx, _c);
case_rrr(stx, _s);
case_wrr(stx, _s);
case_rrr(stx, _i);
case_wrr(stx, _i);
#if __WORDSIZE == 64
case_rrr(stx, _l);
case_wrr(stx, _l);
#endif
case_brr(blt,);
case_brw(blt,);
case_brr(blt, _u);
case_brw(blt, _u);
case_brr(ble,);
case_brw(ble,);
case_brr(ble, _u);
case_brw(ble, _u);
case_brr(beq,);
case_brw(beq,);
case_brr(bge,);
case_brw(bge,);
case_brr(bge, _u);
case_brw(bge, _u);
case_brr(bgt,);
case_brw(bgt,);
case_brr(bgt, _u);
case_brw(bgt, _u);
case_brr(bne,);
case_brw(bne,);
case_brr(bms,);
case_brw(bms,);
case_brr(bmc,);
case_brw(bmc,);
case_brr(boadd,);
case_brw(boadd,);
case_brr(boadd, _u);
case_brw(boadd, _u);
case_brr(bxadd,);
case_brw(bxadd,);
case_brr(bxadd, _u);
case_brw(bxadd, _u);
case_brr(bosub,);
case_brw(bosub,);
case_brr(bosub, _u);
case_brw(bosub, _u);
case_brr(bxsub,);
case_brw(bxsub,);
case_brr(bxsub, _u);
case_brw(bxsub, _u);
case_fff(add, _f);
case_ffw(add, _f, 32);
case_fff(sub, _f);
case_ffw(sub, _f, 32);
case_fff(mul, _f);
case_ffw(mul, _f, 32);
case_fff(div, _f);
case_ffw(div, _f, 32);
case_ff(abs, _f);
case_ff(neg, _f);
case_ff(sqrt, _f);
case_fr(ext, _f);
case_fr(ext, _d_f);
case_rff(lt, _f);
case_rfw(lt, _f, 32);
case_rff(le, _f);
case_rfw(le, _f, 32);
case_rff(eq, _f);
case_rfw(eq, _f, 32);
case_rff(ge, _f);
case_rfw(ge, _f, 32);
case_rff(gt, _f);
case_rfw(gt, _f, 32);
case_rff(ne, _f);
case_rfw(ne, _f, 32);
case_rff(unlt, _f);
case_rfw(unlt, _f, 32);
case_rff(unle, _f);
case_rfw(unle, _f, 32);
case_rff(uneq, _f);
case_rfw(uneq, _f, 32);
case_rff(unge, _f);
case_rfw(unge, _f, 32);
case_rff(ungt, _f);
case_rfw(ungt, _f, 32);
case_rff(ltgt, _f);
case_rfw(ltgt, _f, 32);
case_rff(ord, _f);
case_rfw(ord, _f, 32);
case_rff(unord, _f);
case_rfw(unord, _f, 32);
case jit_code_movr_f:
if (jit_x87_reg_p(node->u.w)) {
if (jit_x87_reg_p(node->v.w))
x87_movr_f(rn(node->u.w), rn(node->v.w));
else
x87_from_sse_f(rn(node->u.w), rn(node->v.w));
}
else {
if (jit_sse_reg_p(node->v.w))
sse_movr_f(rn(node->u.w), rn(node->v.w));
else
sse_from_x87_f(rn(node->u.w), rn(node->v.w));
}
break;
case jit_code_movi_f:
assert(node->flag & jit_flag_data);
if (jit_x87_reg_p(node->u.w))
x87_movi_f(rn(node->u.w), (jit_float32_t *)node->v.n->u.w);
else
sse_movi_f(rn(node->u.w), (jit_float32_t *)node->v.n->u.w);
break;
case_fr(ld, _f);
case_fw(ld, _f);
case_frr(ldx, _f);
case_frw(ldx, _f);
case_rf(st, _f);
case_wf(st, _f);
case_rrf(stx, _f);
case_wrf(stx, _f);
case_bff(lt, _f);
case_bfw(lt, _f, 32);
case_bff(le, _f);
case_bfw(le, _f, 32);
case_bff(eq, _f);
case_bfw(eq, _f, 32);
case_bff(ge, _f);
case_bfw(ge, _f, 32);
case_bff(gt, _f);
case_bfw(gt, _f, 32);
case_bff(ne, _f);
case_bfw(ne, _f, 32);
case_bff(unlt, _f);
case_bfw(unlt, _f, 32);
case_bff(unle, _f);
case_bfw(unle, _f, 32);
case_bff(uneq, _f);
case_bfw(uneq, _f, 32);
case_bff(unge, _f);
case_bfw(unge, _f, 32);
case_bff(ungt, _f);
case_bfw(ungt, _f, 32);
case_bff(ltgt, _f);
case_bfw(ltgt, _f, 32);
case_bff(ord, _f);
case_bfw(ord, _f, 32);
case_bff(unord, _f);
case_bfw(unord, _f, 32);
case_fff(add, _d);
case_ffw(add, _d, 64);
case_fff(sub, _d);
case_ffw(sub, _d, 64);
case_fff(mul, _d);
case_ffw(mul, _d, 64);
case_fff(div, _d);
case_ffw(div, _d, 64);
case_ff(abs, _d);
case_ff(neg, _d);
case_ff(sqrt, _d);
case_fr(ext, _d);
case_fr(ext, _f_d);
case_rff(lt, _d);
case_rfw(lt, _d, 64);
case_rff(le, _d);
case_rfw(le, _d, 64);
case_rff(eq, _d);
case_rfw(eq, _d, 64);
case_rff(ge, _d);
case_rfw(ge, _d, 64);
case_rff(gt, _d);
case_rfw(gt, _d, 64);
case_rff(ne, _d);
case_rfw(ne, _d, 64);
case_rff(unlt, _d);
case_rfw(unlt, _d, 64);
case_rff(unle, _d);
case_rfw(unle, _d, 64);
case_rff(uneq, _d);
case_rfw(uneq, _d, 64);
case_rff(unge, _d);
case_rfw(unge, _d, 64);
case_rff(ungt, _d);
case_rfw(ungt, _d, 64);
case_rff(ltgt, _d);
case_rfw(ltgt, _d, 64);
case_rff(ord, _d);
case_rfw(ord, _d, 64);
case_rff(unord, _d);
case_rfw(unord, _d, 64);
case jit_code_movr_d:
if (jit_x87_reg_p(node->u.w)) {
if (jit_x87_reg_p(node->v.w))
x87_movr_d(rn(node->u.w), rn(node->v.w));
else
x87_from_sse_d(rn(node->u.w), rn(node->v.w));
}
else {
if (jit_sse_reg_p(node->v.w))
sse_movr_d(rn(node->u.w), rn(node->v.w));
else
sse_from_x87_d(rn(node->u.w), rn(node->v.w));
}
break;
case jit_code_movi_d:
assert(node->flag & jit_flag_data);
if (jit_x87_reg_p(node->u.w))
x87_movi_d(rn(node->u.w), (jit_float64_t *)node->v.n->u.w);
else
sse_movi_d(rn(node->u.w), (jit_float64_t *)node->v.n->u.w);
break;
case_fr(ld, _d);
case_fw(ld, _d);
case_frr(ldx, _d);
case_frw(ldx, _d);
case_rf(st, _d);
case_wf(st, _d);
case_rrf(stx, _d);
case_wrf(stx, _d);
case_bff(lt, _d);
case_bfw(lt, _d, 64);
case_bff(le, _d);
case_bfw(le, _d, 64);
case_bff(eq, _d);
case_bfw(eq, _d, 64);
case_bff(ge, _d);
case_bfw(ge, _d, 64);
case_bff(gt, _d);
case_bfw(gt, _d, 64);
case_bff(ne, _d);
case_bfw(ne, _d, 64);
case_bff(unlt, _d);
case_bfw(unlt, _d, 64);
case_bff(unle, _d);
case_bfw(unle, _d, 64);
case_bff(uneq, _d);
case_bfw(uneq, _d, 64);
case_bff(unge, _d);
case_bfw(unge, _d, 64);
case_bff(ungt, _d);
case_bfw(ungt, _d, 64);
case_bff(ltgt, _d);
case_bfw(ltgt, _d, 64);
case_bff(ord, _d);
case_bfw(ord, _d, 64);
case_bff(unord, _d);
case_bfw(unord, _d, 64);
case jit_code_jmpr:
jmpr(rn(node->u.w));
break;
case jit_code_jmpi:
temp = node->u.n;
assert(temp->code == jit_code_label ||
temp->code == jit_code_epilog);
if (temp->flag & jit_flag_patch)
jmpi(temp->u.w);
else {
word = jmpi(_jit->pc.w);
patch(word, node);
}
break;
case jit_code_callr:
callr(rn(node->u.w));
break;
case jit_code_calli:
if (node->flag & jit_flag_node) {
temp = node->u.n;
assert(temp->code == jit_code_label ||
temp->code == jit_code_epilog);
word = calli(temp->u.w);
if (!(temp->flag & jit_flag_patch))
patch(word, node);
}
else
calli(node->u.w);
break;
case jit_code_prolog:
_jit->function = _jit->functions.ptr + node->w.w;
undo.node = node;
undo.word = _jit->pc.w;
undo.patch_offset = _jit->patches.offset;
restart_function:
_jit->again = 0;
prolog(node);
break;
case jit_code_epilog:
assert(_jit->function == _jit->functions.ptr + node->w.w);
if (_jit->again) {
for (temp = undo.node->next;
temp != node; temp = temp->next) {
if (temp->code == jit_code_label ||
temp->code == jit_code_epilog)
temp->flag &= ~jit_flag_patch;
}
node = undo.node;
_jit->pc.w = undo.word;
_jit->patches.offset = undo.patch_offset;
goto restart_function;
}
if (node->link &&
(word = _jit->pc.w & (sizeof(jit_word_t) - 1)))
nop(sizeof(jit_word_t) - word);
/* remember label is defined */
node->flag |= jit_flag_patch;
node->u.w = _jit->pc.w;
epilog(node);
_jit->function = NULL;
break;
#if __WORDSIZE == 32
case jit_code_retval_f:
if (jit_sse_reg_p(node->u.w)) {
fstpr(_ST1_REGNO);
sse_from_x87_f(rn(node->u.w), _ST0_REGNO);
}
else
fstpr(rn(node->u.w) + 1);
break;
case jit_code_retval_d:
if (jit_sse_reg_p(node->u.w)) {
fstpr(_ST1_REGNO);
sse_from_x87_d(rn(node->u.w), _ST0_REGNO);
}
else
fstpr(rn(node->u.w) + 1);
break;
#endif
default:
abort();
}
jit_regarg_clr(node, value);
/* update register live state */
jit_reglive(node);
}
#undef case_bfw
#undef case_bff
#undef case_ffw
#undef case_rfw
#undef case_rff
#undef case_brw
#undef case_brr
#undef case_wrf
#undef case_wrr
#undef case_frw
#undef case_rrf
#undef case_rrw
#undef case_frr
#undef case_rrr
#undef case_wf
#undef case_fw
#undef case_fr
#undef case_rr
for (offset = 0; offset < _jit->patches.offset; offset++) {
node = _jit->patches.ptr[offset].node;
word = node->code == jit_code_movi ? node->v.n->u.w : node->u.n->u.w;
patch_at(node, _jit->patches.ptr[offset].inst, word);
}
return (_jit->code.ptr);
}
/*
 * Textually include the cpu, sse and x87 source files with CODE defined
 * to 1, then remove the definition again.
 * NOTE(review): presumably the included files test CODE to select which
 * of their sections is compiled at this point -- confirm in those files.
 */
#define CODE 1
# include "jit_x86-cpu.c"
# include "jit_x86-sse.c"
# include "jit_x86-x87.c"
#undef CODE
/*
 * Non-static wrapper around the ldxi() emitter.
 *
 * Both register arguments are translated with rn() before being handed
 * to ldxi() together with the immediate i0, which is passed unchanged.
 */
void
_emit_ldxi(jit_state_t *_jit, jit_gpr_t r0, jit_gpr_t r1, jit_word_t i0)
{
    jit_int32_t regno0 = rn(r0);
    jit_int32_t regno1 = rn(r1);

    ldxi(regno0, regno1, i0);
}
/*
 * Non-static wrapper around the stxi() emitter.
 *
 * The immediate i0 is passed unchanged as the first argument; r0 and r1
 * are translated with rn() and follow in that order.
 */
void
_emit_stxi(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_gpr_t r1)
{
    jit_int32_t regno0 = rn(r0);
    jit_int32_t regno1 = rn(r1);

    stxi(i0, regno0, regno1);
}
/*
 * Non-static wrapper that emits a double load through either the x87 or
 * the sse emitter.
 *
 * The choice is made by jit_x87_reg_p(r0): when it is true x87_ldxi_d()
 * is used, otherwise sse_ldxi_d().  In both cases the registers are
 * translated with rn() and i0 is forwarded unchanged.
 */
void
_emit_ldxi_d(jit_state_t *_jit, jit_fpr_t r0, jit_gpr_t r1, jit_word_t i0)
{
    if (!jit_x87_reg_p(r0)) {
        sse_ldxi_d(rn(r0), rn(r1), i0);
        return;
    }
    x87_ldxi_d(rn(r0), rn(r1), i0);
}
/*
 * Non-static wrapper that emits a double store through either the x87 or
 * the sse emitter.
 *
 * The choice is made by jit_x87_reg_p(r1): when it is true x87_stxi_d()
 * is used, otherwise sse_stxi_d().  In both cases i0 is forwarded
 * unchanged and the registers are translated with rn().
 */
void
_emit_stxi_d(jit_state_t *_jit, jit_word_t i0, jit_gpr_t r0, jit_fpr_t r1)
{
    if (!jit_x87_reg_p(r1)) {
        sse_stxi_d(i0, rn(r0), rn(r1));
        return;
    }
    x87_stxi_d(i0, rn(r0), rn(r1));
}
/*
 * Append an (instruction, node) pair to the _jit->patches table.
 *
 * instr is stored in the entry's `inst' field and node in its `node'
 * field; the table offset is then advanced.  The entries are consumed
 * by the loop at the end of the emit function, which calls patch_at()
 * for each of them.
 *
 * Preconditions (asserted):
 *  - node carries jit_flag_node;
 *  - the node it refers to (v.n for jit_code_movi, u.n for any other
 *    code) does not yet carry jit_flag_patch.
 *
 * When the table is full it is grown by a fixed number of entries and
 * the newly added tail is zero filled.  If the reallocation fails the
 * process is aborted instead of writing through a null pointer.
 */
static void
_patch(jit_state_t *_jit, jit_word_t instr, jit_node_t *node)
{
    /* number of entries added every time the table must grow */
    enum { patch_chunk = 1024 };
    jit_int32_t flag;
    void *grown;

    assert(node->flag & jit_flag_node);
    /* movi keeps the referenced node in v.n, other codes in u.n */
    if (node->code == jit_code_movi)
        flag = node->v.n->flag;
    else
        flag = node->u.n->flag;
    assert(!(flag & jit_flag_patch));

    if (_jit->patches.offset >= _jit->patches.length) {
        /* keep the old pointer until the new allocation is known good */
        grown = realloc(_jit->patches.ptr,
                        (_jit->patches.length + patch_chunk) *
                        sizeof(jit_patch_t));
        if (grown == NULL)
            abort();
        _jit->patches.ptr = grown;
        /* only the freshly added tail needs clearing */
        memset(_jit->patches.ptr + _jit->patches.length, 0,
               patch_chunk * sizeof(jit_patch_t));
        _jit->patches.length += patch_chunk;
    }

    _jit->patches.ptr[_jit->patches.offset].inst = instr;
    _jit->patches.ptr[_jit->patches.offset].node = node;
    ++_jit->patches.offset;
}
/*
 * Emit the two-instruction sequence used to get a float from x87
 * register r1 into sse register r0: x87_stxi_f() with offset -8 from
 * _RBP_REGNO, followed by sse_ldxi_f() with the same base and offset.
 * NOTE(review): presumably -8(%rbp) is a scratch slot reserved by the
 * function frame -- confirm against the prolog.
 */
static void
_sse_from_x87_f(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
{
    const jit_word_t slot = -8;

    x87_stxi_f(slot, _RBP_REGNO, r1);
    sse_ldxi_f(r0, _RBP_REGNO, slot);
}
/*
 * Emit the two-instruction sequence used to get a double from x87
 * register r1 into sse register r0: x87_stxi_d() with offset -8 from
 * _RBP_REGNO, followed by sse_ldxi_d() with the same base and offset.
 * NOTE(review): presumably -8(%rbp) is a scratch slot reserved by the
 * function frame -- confirm against the prolog.
 */
static void
_sse_from_x87_d(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
{
    const jit_word_t slot = -8;

    x87_stxi_d(slot, _RBP_REGNO, r1);
    sse_ldxi_d(r0, _RBP_REGNO, slot);
}
/*
 * Emit the two-instruction sequence used to get a float from sse
 * register r1 into x87 register r0: sse_stxi_f() with offset -8 from
 * _RBP_REGNO, followed by x87_ldxi_f() with the same base and offset.
 * NOTE(review): presumably -8(%rbp) is a scratch slot reserved by the
 * function frame -- confirm against the prolog.
 */
static void
_x87_from_sse_f(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
{
    const jit_word_t slot = -8;

    sse_stxi_f(slot, _RBP_REGNO, r1);
    x87_ldxi_f(r0, _RBP_REGNO, slot);
}
/*
 * Emit the two-instruction sequence used to get a double from sse
 * register r1 into x87 register r0: sse_stxi_d() with offset -8 from
 * _RBP_REGNO, followed by x87_ldxi_d() with the same base and offset.
 * NOTE(review): presumably -8(%rbp) is a scratch slot reserved by the
 * function frame -- confirm against the prolog.
 */
static void
_x87_from_sse_d(jit_state_t *_jit, jit_int32_t r0, jit_int32_t r1)
{
    const jit_word_t slot = -8;

    sse_stxi_d(slot, _RBP_REGNO, r1);
    x87_ldxi_d(r0, _RBP_REGNO, slot);
}