sljitNativePPC_64.c 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502
  1. /*
  2. * Stack-less Just-In-Time compiler
  3. *
  4. * Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
  5. *
  6. * Redistribution and use in source and binary forms, with or without modification, are
  7. * permitted provided that the following conditions are met:
  8. *
  9. * 1. Redistributions of source code must retain the above copyright notice, this list of
  10. * conditions and the following disclaimer.
  11. *
  12. * 2. Redistributions in binary form must reproduce the above copyright notice, this list
  13. * of conditions and the following disclaimer in the documentation and/or other materials
  14. * provided with the distribution.
  15. *
  16. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
  17. * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  18. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
  19. * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  20. * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
  21. * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  22. * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  23. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  24. * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  25. */
  26. /* ppc 64-bit arch dependent functions. */
  27. #if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
  28. #define ASM_SLJIT_CLZ(src, dst) \
  29. __asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )
  30. #elif defined(__xlc__)
  31. #error "Please enable GCC syntax for inline assembly statements"
  32. #else
  33. #error "Must implement count leading zeroes"
  34. #endif
  35. #define RLDI(dst, src, sh, mb, type) \
  36. (HI(30) | S(src) | A(dst) | ((type) << 2) | (((sh) & 0x1f) << 11) | (((sh) & 0x20) >> 4) | (((mb) & 0x1f) << 6) | ((mb) & 0x20))
  37. #define PUSH_RLDICR(reg, shift) \
  38. push_inst(compiler, RLDI(reg, reg, 63 - shift, shift, 1))
  39. static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)
  40. {
  41. sljit_uw tmp;
  42. sljit_uw shift;
  43. sljit_uw tmp2;
  44. sljit_uw shift2;
  45. if (imm <= SIMM_MAX && imm >= SIMM_MIN)
  46. return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));
  47. if (!(imm & ~0xffff))
  48. return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));
  49. if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
  50. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));
  51. return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
  52. }
  53. /* Count leading zeroes. */
  54. tmp = (imm >= 0) ? imm : ~imm;
  55. ASM_SLJIT_CLZ(tmp, shift);
  56. SLJIT_ASSERT(shift > 0);
  57. shift--;
  58. tmp = (imm << shift);
  59. if ((tmp & ~0xffff000000000000ul) == 0) {
  60. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  61. shift += 15;
  62. return PUSH_RLDICR(reg, shift);
  63. }
  64. if ((tmp & ~0xffffffff00000000ul) == 0) {
  65. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(tmp >> 48)));
  66. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));
  67. shift += 31;
  68. return PUSH_RLDICR(reg, shift);
  69. }
  70. /* Cut out the 16 bit from immediate. */
  71. shift += 15;
  72. tmp2 = imm & ((1ul << (63 - shift)) - 1);
  73. if (tmp2 <= 0xffff) {
  74. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  75. FAIL_IF(PUSH_RLDICR(reg, shift));
  76. return push_inst(compiler, ORI | S(reg) | A(reg) | tmp2);
  77. }
  78. if (tmp2 <= 0xffffffff) {
  79. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  80. FAIL_IF(PUSH_RLDICR(reg, shift));
  81. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (tmp2 >> 16)));
  82. return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;
  83. }
  84. ASM_SLJIT_CLZ(tmp2, shift2);
  85. tmp2 <<= shift2;
  86. if ((tmp2 & ~0xffff000000000000ul) == 0) {
  87. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  88. shift2 += 15;
  89. shift += (63 - shift2);
  90. FAIL_IF(PUSH_RLDICR(reg, shift));
  91. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (tmp2 >> 48)));
  92. return PUSH_RLDICR(reg, shift2);
  93. }
  94. /* The general version. */
  95. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 48)));
  96. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));
  97. FAIL_IF(PUSH_RLDICR(reg, 31));
  98. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));
  99. return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));
  100. }
  101. /* Simplified mnemonics: clrldi. */
  102. #define INS_CLEAR_LEFT(dst, src, from) \
  103. (RLDICL | S(src) | A(dst) | ((from) << 6) | (1 << 5))
  104. /* Sign extension for integer operations. */
  105. #define UN_EXTS() \
  106. if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \
  107. FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
  108. src2 = TMP_REG2; \
  109. }
  110. #define BIN_EXTS() \
  111. if (flags & ALT_SIGN_EXT) { \
  112. if (flags & REG1_SOURCE) { \
  113. FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
  114. src1 = TMP_REG1; \
  115. } \
  116. if (flags & REG2_SOURCE) { \
  117. FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
  118. src2 = TMP_REG2; \
  119. } \
  120. }
  121. #define BIN_IMM_EXTS() \
  122. if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \
  123. FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
  124. src1 = TMP_REG1; \
  125. }
  126. static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
  127. sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)
  128. {
  129. switch (op) {
  130. case SLJIT_MOV:
  131. case SLJIT_MOV_P:
  132. SLJIT_ASSERT(src1 == TMP_REG1);
  133. if (dst != src2)
  134. return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));
  135. return SLJIT_SUCCESS;
  136. case SLJIT_MOV_U32:
  137. case SLJIT_MOV_S32:
  138. SLJIT_ASSERT(src1 == TMP_REG1);
  139. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  140. if (op == SLJIT_MOV_S32)
  141. return push_inst(compiler, EXTSW | S(src2) | A(dst));
  142. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 0));
  143. }
  144. else {
  145. SLJIT_ASSERT(dst == src2);
  146. }
  147. return SLJIT_SUCCESS;
  148. case SLJIT_MOV_U8:
  149. case SLJIT_MOV_S8:
  150. SLJIT_ASSERT(src1 == TMP_REG1);
  151. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  152. if (op == SLJIT_MOV_S8)
  153. return push_inst(compiler, EXTSB | S(src2) | A(dst));
  154. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 24));
  155. }
  156. else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)
  157. return push_inst(compiler, EXTSB | S(src2) | A(dst));
  158. else {
  159. SLJIT_ASSERT(dst == src2);
  160. }
  161. return SLJIT_SUCCESS;
  162. case SLJIT_MOV_U16:
  163. case SLJIT_MOV_S16:
  164. SLJIT_ASSERT(src1 == TMP_REG1);
  165. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  166. if (op == SLJIT_MOV_S16)
  167. return push_inst(compiler, EXTSH | S(src2) | A(dst));
  168. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 16));
  169. }
  170. else {
  171. SLJIT_ASSERT(dst == src2);
  172. }
  173. return SLJIT_SUCCESS;
  174. case SLJIT_NOT:
  175. SLJIT_ASSERT(src1 == TMP_REG1);
  176. UN_EXTS();
  177. return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));
  178. case SLJIT_NEG:
  179. SLJIT_ASSERT(src1 == TMP_REG1);
  180. if ((flags & (ALT_FORM1 | ALT_SIGN_EXT)) == (ALT_FORM1 | ALT_SIGN_EXT)) {
  181. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  182. FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(TMP_REG2)));
  183. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  184. }
  185. UN_EXTS();
  186. /* Setting XER SO is not enough, CR SO is also needed. */
  187. return push_inst(compiler, NEG | OE((flags & ALT_FORM1) ? ALT_SET_FLAGS : 0) | RC(flags) | D(dst) | A(src2));
  188. case SLJIT_CLZ:
  189. SLJIT_ASSERT(src1 == TMP_REG1);
  190. if (flags & ALT_FORM1)
  191. return push_inst(compiler, CNTLZW | S(src2) | A(dst));
  192. return push_inst(compiler, CNTLZD | S(src2) | A(dst));
  193. case SLJIT_ADD:
  194. if (flags & ALT_FORM1) {
  195. if (flags & ALT_SIGN_EXT) {
  196. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, src1, 32, 31, 1)));
  197. src1 = TMP_REG1;
  198. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  199. src2 = TMP_REG2;
  200. }
  201. /* Setting XER SO is not enough, CR SO is also needed. */
  202. FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));
  203. if (flags & ALT_SIGN_EXT)
  204. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  205. return SLJIT_SUCCESS;
  206. }
  207. if (flags & ALT_FORM2) {
  208. /* Flags does not set: BIN_IMM_EXTS unnecessary. */
  209. SLJIT_ASSERT(src2 == TMP_REG2);
  210. if (flags & ALT_FORM3)
  211. return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);
  212. if (flags & ALT_FORM4) {
  213. FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((compiler->imm >> 16) & 0xffff) + ((compiler->imm >> 15) & 0x1))));
  214. src1 = dst;
  215. }
  216. return push_inst(compiler, ADDI | D(dst) | A(src1) | (compiler->imm & 0xffff));
  217. }
  218. if (flags & ALT_FORM3) {
  219. SLJIT_ASSERT(src2 == TMP_REG2);
  220. BIN_IMM_EXTS();
  221. return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);
  222. }
  223. if (!(flags & ALT_SET_FLAGS))
  224. return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));
  225. BIN_EXTS();
  226. if (flags & ALT_FORM4)
  227. return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));
  228. return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));
  229. case SLJIT_ADDC:
  230. BIN_EXTS();
  231. return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));
  232. case SLJIT_SUB:
  233. if (flags & ALT_FORM1) {
  234. if (flags & ALT_FORM2) {
  235. FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
  236. if (!(flags & ALT_FORM3))
  237. return SLJIT_SUCCESS;
  238. return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
  239. }
  240. FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
  241. if (!(flags & ALT_FORM3))
  242. return SLJIT_SUCCESS;
  243. return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
  244. }
  245. if (flags & ALT_FORM2) {
  246. if (flags & ALT_SIGN_EXT) {
  247. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, src1, 32, 31, 1)));
  248. src1 = TMP_REG1;
  249. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  250. src2 = TMP_REG2;
  251. }
  252. /* Setting XER SO is not enough, CR SO is also needed. */
  253. FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));
  254. if (flags & ALT_SIGN_EXT)
  255. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  256. return SLJIT_SUCCESS;
  257. }
  258. if (flags & ALT_FORM3) {
  259. /* Flags does not set: BIN_IMM_EXTS unnecessary. */
  260. SLJIT_ASSERT(src2 == TMP_REG2);
  261. return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);
  262. }
  263. if (flags & ALT_FORM4) {
  264. if (flags & ALT_FORM5) {
  265. SLJIT_ASSERT(src2 == TMP_REG2);
  266. return push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm);
  267. }
  268. return push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2));
  269. }
  270. if (!(flags & ALT_SET_FLAGS))
  271. return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
  272. BIN_EXTS();
  273. if (flags & ALT_FORM5)
  274. return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
  275. return push_inst(compiler, SUBF | RC(flags) | D(dst) | A(src2) | B(src1));
  276. case SLJIT_SUBC:
  277. BIN_EXTS();
  278. return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));
  279. case SLJIT_MUL:
  280. if (flags & ALT_FORM1) {
  281. SLJIT_ASSERT(src2 == TMP_REG2);
  282. return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);
  283. }
  284. BIN_EXTS();
  285. if (flags & ALT_FORM2)
  286. return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
  287. return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
  288. case SLJIT_AND:
  289. if (flags & ALT_FORM1) {
  290. SLJIT_ASSERT(src2 == TMP_REG2);
  291. return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);
  292. }
  293. if (flags & ALT_FORM2) {
  294. SLJIT_ASSERT(src2 == TMP_REG2);
  295. return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);
  296. }
  297. return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));
  298. case SLJIT_OR:
  299. if (flags & ALT_FORM1) {
  300. SLJIT_ASSERT(src2 == TMP_REG2);
  301. return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);
  302. }
  303. if (flags & ALT_FORM2) {
  304. SLJIT_ASSERT(src2 == TMP_REG2);
  305. return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);
  306. }
  307. if (flags & ALT_FORM3) {
  308. SLJIT_ASSERT(src2 == TMP_REG2);
  309. FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(compiler->imm)));
  310. return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(compiler->imm >> 16));
  311. }
  312. return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) | B(src2));
  313. case SLJIT_XOR:
  314. if (flags & ALT_FORM1) {
  315. SLJIT_ASSERT(src2 == TMP_REG2);
  316. return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);
  317. }
  318. if (flags & ALT_FORM2) {
  319. SLJIT_ASSERT(src2 == TMP_REG2);
  320. return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);
  321. }
  322. if (flags & ALT_FORM3) {
  323. SLJIT_ASSERT(src2 == TMP_REG2);
  324. FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(compiler->imm)));
  325. return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(compiler->imm >> 16));
  326. }
  327. return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));
  328. case SLJIT_SHL:
  329. if (flags & ALT_FORM1) {
  330. SLJIT_ASSERT(src2 == TMP_REG2);
  331. if (flags & ALT_FORM2) {
  332. compiler->imm &= 0x1f;
  333. return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | (compiler->imm << 11) | ((31 - compiler->imm) << 1));
  334. }
  335. compiler->imm &= 0x3f;
  336. return push_inst(compiler, RLDI(dst, src1, compiler->imm, 63 - compiler->imm, 1) | RC(flags));
  337. }
  338. return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));
  339. case SLJIT_LSHR:
  340. if (flags & ALT_FORM1) {
  341. SLJIT_ASSERT(src2 == TMP_REG2);
  342. if (flags & ALT_FORM2) {
  343. compiler->imm &= 0x1f;
  344. return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | (((32 - compiler->imm) & 0x1f) << 11) | (compiler->imm << 6) | (31 << 1));
  345. }
  346. compiler->imm &= 0x3f;
  347. return push_inst(compiler, RLDI(dst, src1, 64 - compiler->imm, compiler->imm, 0) | RC(flags));
  348. }
  349. return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));
  350. case SLJIT_ASHR:
  351. if (flags & ALT_FORM1) {
  352. SLJIT_ASSERT(src2 == TMP_REG2);
  353. if (flags & ALT_FORM2) {
  354. compiler->imm &= 0x1f;
  355. return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (compiler->imm << 11));
  356. }
  357. compiler->imm &= 0x3f;
  358. return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | ((compiler->imm & 0x1f) << 11) | ((compiler->imm & 0x20) >> 4));
  359. }
  360. return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));
  361. }
  362. SLJIT_UNREACHABLE();
  363. return SLJIT_SUCCESS;
  364. }
  365. static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)
  366. {
  367. sljit_s32 arg_count = 0;
  368. sljit_s32 word_arg_count = 0;
  369. sljit_s32 types = 0;
  370. sljit_s32 reg = 0;
  371. if (src)
  372. reg = *src & REG_MASK;
  373. arg_types >>= SLJIT_DEF_SHIFT;
  374. while (arg_types) {
  375. types = (types << SLJIT_DEF_SHIFT) | (arg_types & SLJIT_DEF_MASK);
  376. switch (arg_types & SLJIT_DEF_MASK) {
  377. case SLJIT_ARG_TYPE_F32:
  378. case SLJIT_ARG_TYPE_F64:
  379. arg_count++;
  380. break;
  381. default:
  382. arg_count++;
  383. word_arg_count++;
  384. if (arg_count != word_arg_count && arg_count == reg) {
  385. FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));
  386. *src = TMP_CALL_REG;
  387. }
  388. break;
  389. }
  390. arg_types >>= SLJIT_DEF_SHIFT;
  391. }
  392. while (types) {
  393. switch (types & SLJIT_DEF_MASK) {
  394. case SLJIT_ARG_TYPE_F32:
  395. case SLJIT_ARG_TYPE_F64:
  396. arg_count--;
  397. break;
  398. default:
  399. if (arg_count != word_arg_count)
  400. FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));
  401. arg_count--;
  402. word_arg_count--;
  403. break;
  404. }
  405. types >>= SLJIT_DEF_SHIFT;
  406. }
  407. return SLJIT_SUCCESS;
  408. }
  409. static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)
  410. {
  411. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));
  412. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));
  413. FAIL_IF(PUSH_RLDICR(reg, 31));
  414. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));
  415. return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));
  416. }
  417. SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
  418. {
  419. sljit_ins *inst = (sljit_ins*)addr;
  420. inst[0] = (inst[0] & 0xffff0000) | ((new_target >> 48) & 0xffff);
  421. inst[1] = (inst[1] & 0xffff0000) | ((new_target >> 32) & 0xffff);
  422. inst[3] = (inst[3] & 0xffff0000) | ((new_target >> 16) & 0xffff);
  423. inst[4] = (inst[4] & 0xffff0000) | (new_target & 0xffff);
  424. inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
  425. SLJIT_CACHE_FLUSH(inst, inst + 5);
  426. }
  427. SLJIT_API_FUNC_ATTRIBUTE void sljit_set_const(sljit_uw addr, sljit_sw new_constant, sljit_sw executable_offset)
  428. {
  429. sljit_ins *inst = (sljit_ins*)addr;
  430. inst[0] = (inst[0] & 0xffff0000) | ((new_constant >> 48) & 0xffff);
  431. inst[1] = (inst[1] & 0xffff0000) | ((new_constant >> 32) & 0xffff);
  432. inst[3] = (inst[3] & 0xffff0000) | ((new_constant >> 16) & 0xffff);
  433. inst[4] = (inst[4] & 0xffff0000) | (new_constant & 0xffff);
  434. inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
  435. SLJIT_CACHE_FLUSH(inst, inst + 5);
  436. }