1*22dc650dSSadaf Ebrahimi /*
2*22dc650dSSadaf Ebrahimi * Stack-less Just-In-Time compiler
3*22dc650dSSadaf Ebrahimi *
4*22dc650dSSadaf Ebrahimi * Copyright Zoltan Herczeg ([email protected]). All rights reserved.
5*22dc650dSSadaf Ebrahimi *
6*22dc650dSSadaf Ebrahimi * Redistribution and use in source and binary forms, with or without modification, are
7*22dc650dSSadaf Ebrahimi * permitted provided that the following conditions are met:
8*22dc650dSSadaf Ebrahimi *
9*22dc650dSSadaf Ebrahimi * 1. Redistributions of source code must retain the above copyright notice, this list of
10*22dc650dSSadaf Ebrahimi * conditions and the following disclaimer.
11*22dc650dSSadaf Ebrahimi *
12*22dc650dSSadaf Ebrahimi * 2. Redistributions in binary form must reproduce the above copyright notice, this list
13*22dc650dSSadaf Ebrahimi * of conditions and the following disclaimer in the documentation and/or other materials
14*22dc650dSSadaf Ebrahimi * provided with the distribution.
15*22dc650dSSadaf Ebrahimi *
16*22dc650dSSadaf Ebrahimi * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
17*22dc650dSSadaf Ebrahimi * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
18*22dc650dSSadaf Ebrahimi * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
19*22dc650dSSadaf Ebrahimi * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
20*22dc650dSSadaf Ebrahimi * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
21*22dc650dSSadaf Ebrahimi * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
22*22dc650dSSadaf Ebrahimi * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
23*22dc650dSSadaf Ebrahimi * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
24*22dc650dSSadaf Ebrahimi * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
25*22dc650dSSadaf Ebrahimi */
26*22dc650dSSadaf Ebrahimi
/*
 * Emits the instruction(s) that place the constant imm into dst_r.
 *
 * A value within [SIMM_MIN, SIMM_MAX] is produced by a single ADDI from
 * TMP_ZERO. Any other value is built as LUI (upper part) followed, when
 * the low 12 bits are non-zero, by an ADDI of the low part.
 *
 * tmp_r is not used by this implementation.
 *
 * Returns SLJIT_SUCCESS or the result of the failing push_inst call.
 */
static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 dst_r, sljit_sw imm, sljit_s32 tmp_r)
{
	/* The rounding below is done on an unsigned copy: adding 0x1000 to a
	   signed value close to the top of its range (e.g. 0x7fffffff) would
	   overflow, which is undefined behaviour for signed types. Unsigned
	   arithmetic wraps and yields the same bit pattern. */
	sljit_uw bits = (sljit_uw)imm;

	SLJIT_UNUSED_ARG(tmp_r);

	if (imm <= SIMM_MAX && imm >= SIMM_MIN)
		return push_inst(compiler, ADDI | RD(dst_r) | RS1(TMP_ZERO) | IMM_I(imm));

	/* ADDI sign-extends its 12 bit immediate, so when bit 11 is set the
	   upper part is increased by one unit (0x1000) to compensate. */
	if (bits & 0x800)
		bits += 0x1000;

	FAIL_IF(push_inst(compiler, LUI | RD(dst_r) | (sljit_ins)(bits & ~(sljit_uw)0xfff)));

	/* Nothing to add when the low 12 bits are all zero. */
	if ((bits & 0xfff) == 0)
		return SLJIT_SUCCESS;

	return push_inst(compiler, ADDI | RD(dst_r) | RS1(dst_r) | IMM_I((sljit_sw)bits));
}
44*22dc650dSSadaf Ebrahimi
sljit_emit_fset64(struct sljit_compiler * compiler,sljit_s32 freg,sljit_f64 value)45*22dc650dSSadaf Ebrahimi SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fset64(struct sljit_compiler *compiler,
46*22dc650dSSadaf Ebrahimi sljit_s32 freg, sljit_f64 value)
47*22dc650dSSadaf Ebrahimi {
48*22dc650dSSadaf Ebrahimi union {
49*22dc650dSSadaf Ebrahimi sljit_s32 imm[2];
50*22dc650dSSadaf Ebrahimi sljit_f64 value;
51*22dc650dSSadaf Ebrahimi } u;
52*22dc650dSSadaf Ebrahimi
53*22dc650dSSadaf Ebrahimi CHECK_ERROR();
54*22dc650dSSadaf Ebrahimi CHECK(check_sljit_emit_fset64(compiler, freg, value));
55*22dc650dSSadaf Ebrahimi
56*22dc650dSSadaf Ebrahimi u.value = value;
57*22dc650dSSadaf Ebrahimi
58*22dc650dSSadaf Ebrahimi if (u.imm[0] != 0)
59*22dc650dSSadaf Ebrahimi FAIL_IF(load_immediate(compiler, TMP_REG1, u.imm[0], TMP_REG3));
60*22dc650dSSadaf Ebrahimi if (u.imm[1] != 0)
61*22dc650dSSadaf Ebrahimi FAIL_IF(load_immediate(compiler, TMP_REG2, u.imm[1], TMP_REG3));
62*22dc650dSSadaf Ebrahimi
63*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, ADDI | RD(SLJIT_SP) | RS1(SLJIT_SP) | IMM_I(-16)));
64*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, SW | RS1(SLJIT_SP) | RS2(u.imm[0] != 0 ? TMP_REG1 : TMP_ZERO) | (8 << 7)));
65*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, SW | RS1(SLJIT_SP) | RS2(u.imm[1] != 0 ? TMP_REG2 : TMP_ZERO) | (12 << 7)));
66*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, FLD | FRD(freg) | RS1(SLJIT_SP) | IMM_I(8)));
67*22dc650dSSadaf Ebrahimi return push_inst(compiler, ADDI | RD(SLJIT_SP) | RS1(SLJIT_SP) | IMM_I(16));
68*22dc650dSSadaf Ebrahimi }
69*22dc650dSSadaf Ebrahimi
sljit_emit_fcopy(struct sljit_compiler * compiler,sljit_s32 op,sljit_s32 freg,sljit_s32 reg)70*22dc650dSSadaf Ebrahimi SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fcopy(struct sljit_compiler *compiler, sljit_s32 op,
71*22dc650dSSadaf Ebrahimi sljit_s32 freg, sljit_s32 reg)
72*22dc650dSSadaf Ebrahimi {
73*22dc650dSSadaf Ebrahimi sljit_ins inst;
74*22dc650dSSadaf Ebrahimi sljit_s32 reg2 = 0;
75*22dc650dSSadaf Ebrahimi
76*22dc650dSSadaf Ebrahimi CHECK_ERROR();
77*22dc650dSSadaf Ebrahimi CHECK(check_sljit_emit_fcopy(compiler, op, freg, reg));
78*22dc650dSSadaf Ebrahimi
79*22dc650dSSadaf Ebrahimi if (op & SLJIT_32) {
80*22dc650dSSadaf Ebrahimi if (op == SLJIT_COPY32_TO_F32)
81*22dc650dSSadaf Ebrahimi inst = FMV_W_X | RS1(reg) | FRD(freg);
82*22dc650dSSadaf Ebrahimi else
83*22dc650dSSadaf Ebrahimi inst = FMV_X_W | FRS1(freg) | RD(reg);
84*22dc650dSSadaf Ebrahimi
85*22dc650dSSadaf Ebrahimi return push_inst(compiler, inst);
86*22dc650dSSadaf Ebrahimi }
87*22dc650dSSadaf Ebrahimi
88*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, ADDI | RD(SLJIT_SP) | RS1(SLJIT_SP) | IMM_I(-16)));
89*22dc650dSSadaf Ebrahimi
90*22dc650dSSadaf Ebrahimi if (reg & REG_PAIR_MASK) {
91*22dc650dSSadaf Ebrahimi reg2 = REG_PAIR_SECOND(reg);
92*22dc650dSSadaf Ebrahimi reg = REG_PAIR_FIRST(reg);
93*22dc650dSSadaf Ebrahimi }
94*22dc650dSSadaf Ebrahimi
95*22dc650dSSadaf Ebrahimi if (op == SLJIT_COPY_TO_F64) {
96*22dc650dSSadaf Ebrahimi if (reg2 != 0)
97*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, SW | RS1(SLJIT_SP) | RS2(reg2) | (8 << 7)));
98*22dc650dSSadaf Ebrahimi else
99*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, FSW | RS1(SLJIT_SP) | FRS2(freg) | (8 << 7)));
100*22dc650dSSadaf Ebrahimi
101*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, SW | RS1(SLJIT_SP) | RS2(reg) | (12 << 7)));
102*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, FLD | FRD(freg) | RS1(SLJIT_SP) | IMM_I(8)));
103*22dc650dSSadaf Ebrahimi } else {
104*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, FSD | RS1(SLJIT_SP) | FRS2(freg) | (8 << 7)));
105*22dc650dSSadaf Ebrahimi
106*22dc650dSSadaf Ebrahimi if (reg2 != 0)
107*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, FMV_X_W | FRS1(freg) | RD(reg2)));
108*22dc650dSSadaf Ebrahimi
109*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, LW | RD(reg) | RS1(SLJIT_SP) | IMM_I(12)));
110*22dc650dSSadaf Ebrahimi }
111*22dc650dSSadaf Ebrahimi
112*22dc650dSSadaf Ebrahimi return push_inst(compiler, ADDI | RD(SLJIT_SP) | RS1(SLJIT_SP) | IMM_I(16));
113*22dc650dSSadaf Ebrahimi }
114*22dc650dSSadaf Ebrahimi
emit_const(struct sljit_compiler * compiler,sljit_s32 dst,sljit_sw init_value,sljit_ins last_ins)115*22dc650dSSadaf Ebrahimi static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw init_value, sljit_ins last_ins)
116*22dc650dSSadaf Ebrahimi {
117*22dc650dSSadaf Ebrahimi if ((init_value & 0x800) != 0)
118*22dc650dSSadaf Ebrahimi init_value += 0x1000;
119*22dc650dSSadaf Ebrahimi
120*22dc650dSSadaf Ebrahimi FAIL_IF(push_inst(compiler, LUI | RD(dst) | (sljit_ins)(init_value & ~0xfff)));
121*22dc650dSSadaf Ebrahimi return push_inst(compiler, last_ins | RS1(dst) | IMM_I(init_value));
122*22dc650dSSadaf Ebrahimi }
123*22dc650dSSadaf Ebrahimi
sljit_set_jump_addr(sljit_uw addr,sljit_uw new_target,sljit_sw executable_offset)124*22dc650dSSadaf Ebrahimi SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
125*22dc650dSSadaf Ebrahimi {
126*22dc650dSSadaf Ebrahimi sljit_ins *inst = (sljit_ins*)addr;
127*22dc650dSSadaf Ebrahimi SLJIT_UNUSED_ARG(executable_offset);
128*22dc650dSSadaf Ebrahimi
129*22dc650dSSadaf Ebrahimi if ((new_target & 0x800) != 0)
130*22dc650dSSadaf Ebrahimi new_target += 0x1000;
131*22dc650dSSadaf Ebrahimi
132*22dc650dSSadaf Ebrahimi SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);
133*22dc650dSSadaf Ebrahimi
134*22dc650dSSadaf Ebrahimi SLJIT_ASSERT((inst[0] & 0x7f) == LUI);
135*22dc650dSSadaf Ebrahimi inst[0] = (inst[0] & 0xfff) | (sljit_ins)((sljit_sw)new_target & ~0xfff);
136*22dc650dSSadaf Ebrahimi SLJIT_ASSERT((inst[1] & 0x707f) == ADDI || (inst[1] & 0x707f) == JALR);
137*22dc650dSSadaf Ebrahimi inst[1] = (inst[1] & 0xfffff) | IMM_I(new_target);
138*22dc650dSSadaf Ebrahimi
139*22dc650dSSadaf Ebrahimi SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);
140*22dc650dSSadaf Ebrahimi inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
141*22dc650dSSadaf Ebrahimi SLJIT_CACHE_FLUSH(inst, inst + 5);
142*22dc650dSSadaf Ebrahimi }
143