sljitNativePPC_64.c 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507
  1. /*
  2. * Stack-less Just-In-Time compiler
  3. *
  4. * Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
  5. *
  6. * Redistribution and use in source and binary forms, with or without modification, are
  7. * permitted provided that the following conditions are met:
  8. *
  9. * 1. Redistributions of source code must retain the above copyright notice, this list of
  10. * conditions and the following disclaimer.
  11. *
  12. * 2. Redistributions in binary form must reproduce the above copyright notice, this list
  13. * of conditions and the following disclaimer in the documentation and/or other materials
  14. * provided with the distribution.
  15. *
  16. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
  17. * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  18. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
  19. * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  20. * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
  21. * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  22. * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  23. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  24. * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  25. */
  26. /* ppc 64-bit arch dependent functions. */
  27. #if defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
  28. #define ASM_SLJIT_CLZ(src, dst) \
  29. __asm__ volatile ( "cntlzd %0, %1" : "=r"(dst) : "r"(src) )
  30. #elif defined(__xlc__)
  31. #error "Please enable GCC syntax for inline assembly statements"
  32. #else
  33. #error "Must implement count leading zeroes"
  34. #endif
  35. #define PUSH_RLDICR(reg, shift) \
  36. push_inst(compiler, RLDI(reg, reg, 63 - shift, shift, 1))
  37. static sljit_s32 load_immediate(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw imm)
  38. {
  39. sljit_uw tmp;
  40. sljit_uw shift;
  41. sljit_uw tmp2;
  42. sljit_uw shift2;
  43. if (imm <= SIMM_MAX && imm >= SIMM_MIN)
  44. return push_inst(compiler, ADDI | D(reg) | A(0) | IMM(imm));
  45. if (!(imm & ~0xffff))
  46. return push_inst(compiler, ORI | S(TMP_ZERO) | A(reg) | IMM(imm));
  47. if (imm <= 0x7fffffffl && imm >= -0x80000000l) {
  48. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 16)));
  49. return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm)) : SLJIT_SUCCESS;
  50. }
  51. /* Count leading zeroes. */
  52. tmp = (imm >= 0) ? imm : ~imm;
  53. ASM_SLJIT_CLZ(tmp, shift);
  54. SLJIT_ASSERT(shift > 0);
  55. shift--;
  56. tmp = (imm << shift);
  57. if ((tmp & ~0xffff000000000000ul) == 0) {
  58. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  59. shift += 15;
  60. return PUSH_RLDICR(reg, shift);
  61. }
  62. if ((tmp & ~0xffffffff00000000ul) == 0) {
  63. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(tmp >> 48)));
  64. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp >> 32)));
  65. shift += 31;
  66. return PUSH_RLDICR(reg, shift);
  67. }
  68. /* Cut out the 16 bit from immediate. */
  69. shift += 15;
  70. tmp2 = imm & ((1ul << (63 - shift)) - 1);
  71. if (tmp2 <= 0xffff) {
  72. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  73. FAIL_IF(PUSH_RLDICR(reg, shift));
  74. return push_inst(compiler, ORI | S(reg) | A(reg) | tmp2);
  75. }
  76. if (tmp2 <= 0xffffffff) {
  77. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  78. FAIL_IF(PUSH_RLDICR(reg, shift));
  79. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | (tmp2 >> 16)));
  80. return (imm & 0xffff) ? push_inst(compiler, ORI | S(reg) | A(reg) | IMM(tmp2)) : SLJIT_SUCCESS;
  81. }
  82. ASM_SLJIT_CLZ(tmp2, shift2);
  83. tmp2 <<= shift2;
  84. if ((tmp2 & ~0xffff000000000000ul) == 0) {
  85. FAIL_IF(push_inst(compiler, ADDI | D(reg) | A(0) | IMM(tmp >> 48)));
  86. shift2 += 15;
  87. shift += (63 - shift2);
  88. FAIL_IF(PUSH_RLDICR(reg, shift));
  89. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | (tmp2 >> 48)));
  90. return PUSH_RLDICR(reg, shift2);
  91. }
  92. /* The general version. */
  93. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(imm >> 48)));
  94. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm >> 32)));
  95. FAIL_IF(PUSH_RLDICR(reg, 31));
  96. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(imm >> 16)));
  97. return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(imm));
  98. }
  99. /* Simplified mnemonics: clrldi. */
  100. #define INS_CLEAR_LEFT(dst, src, from) \
  101. (RLDICL | S(src) | A(dst) | ((from) << 6) | (1 << 5))
  102. /* Sign extension for integer operations. */
  103. #define UN_EXTS() \
  104. if ((flags & (ALT_SIGN_EXT | REG2_SOURCE)) == (ALT_SIGN_EXT | REG2_SOURCE)) { \
  105. FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
  106. src2 = TMP_REG2; \
  107. }
  108. #define BIN_EXTS() \
  109. if (flags & ALT_SIGN_EXT) { \
  110. if (flags & REG1_SOURCE) { \
  111. FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
  112. src1 = TMP_REG1; \
  113. } \
  114. if (flags & REG2_SOURCE) { \
  115. FAIL_IF(push_inst(compiler, EXTSW | S(src2) | A(TMP_REG2))); \
  116. src2 = TMP_REG2; \
  117. } \
  118. }
  119. #define BIN_IMM_EXTS() \
  120. if ((flags & (ALT_SIGN_EXT | REG1_SOURCE)) == (ALT_SIGN_EXT | REG1_SOURCE)) { \
  121. FAIL_IF(push_inst(compiler, EXTSW | S(src1) | A(TMP_REG1))); \
  122. src1 = TMP_REG1; \
  123. }
  124. static SLJIT_INLINE sljit_s32 emit_single_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 flags,
  125. sljit_s32 dst, sljit_s32 src1, sljit_s32 src2)
  126. {
  127. switch (op) {
  128. case SLJIT_MOV:
  129. case SLJIT_MOV_P:
  130. SLJIT_ASSERT(src1 == TMP_REG1);
  131. if (dst != src2)
  132. return push_inst(compiler, OR | S(src2) | A(dst) | B(src2));
  133. return SLJIT_SUCCESS;
  134. case SLJIT_MOV_U32:
  135. case SLJIT_MOV_S32:
  136. SLJIT_ASSERT(src1 == TMP_REG1);
  137. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  138. if (op == SLJIT_MOV_S32)
  139. return push_inst(compiler, EXTSW | S(src2) | A(dst));
  140. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 0));
  141. }
  142. else {
  143. SLJIT_ASSERT(dst == src2);
  144. }
  145. return SLJIT_SUCCESS;
  146. case SLJIT_MOV_U8:
  147. case SLJIT_MOV_S8:
  148. SLJIT_ASSERT(src1 == TMP_REG1);
  149. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  150. if (op == SLJIT_MOV_S8)
  151. return push_inst(compiler, EXTSB | S(src2) | A(dst));
  152. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 24));
  153. }
  154. else if ((flags & REG_DEST) && op == SLJIT_MOV_S8)
  155. return push_inst(compiler, EXTSB | S(src2) | A(dst));
  156. else {
  157. SLJIT_ASSERT(dst == src2);
  158. }
  159. return SLJIT_SUCCESS;
  160. case SLJIT_MOV_U16:
  161. case SLJIT_MOV_S16:
  162. SLJIT_ASSERT(src1 == TMP_REG1);
  163. if ((flags & (REG_DEST | REG2_SOURCE)) == (REG_DEST | REG2_SOURCE)) {
  164. if (op == SLJIT_MOV_S16)
  165. return push_inst(compiler, EXTSH | S(src2) | A(dst));
  166. return push_inst(compiler, INS_CLEAR_LEFT(dst, src2, 16));
  167. }
  168. else {
  169. SLJIT_ASSERT(dst == src2);
  170. }
  171. return SLJIT_SUCCESS;
  172. case SLJIT_NOT:
  173. SLJIT_ASSERT(src1 == TMP_REG1);
  174. UN_EXTS();
  175. return push_inst(compiler, NOR | RC(flags) | S(src2) | A(dst) | B(src2));
  176. case SLJIT_NEG:
  177. SLJIT_ASSERT(src1 == TMP_REG1);
  178. if ((flags & (ALT_FORM1 | ALT_SIGN_EXT)) == (ALT_FORM1 | ALT_SIGN_EXT)) {
  179. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  180. FAIL_IF(push_inst(compiler, NEG | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(TMP_REG2)));
  181. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  182. }
  183. UN_EXTS();
  184. /* Setting XER SO is not enough, CR SO is also needed. */
  185. return push_inst(compiler, NEG | OE((flags & ALT_FORM1) ? ALT_SET_FLAGS : 0) | RC(flags) | D(dst) | A(src2));
  186. case SLJIT_CLZ:
  187. SLJIT_ASSERT(src1 == TMP_REG1);
  188. if (flags & ALT_FORM1)
  189. return push_inst(compiler, CNTLZW | S(src2) | A(dst));
  190. return push_inst(compiler, CNTLZD | S(src2) | A(dst));
  191. case SLJIT_ADD:
  192. if (flags & ALT_FORM1) {
  193. if (flags & ALT_SIGN_EXT) {
  194. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, src1, 32, 31, 1)));
  195. src1 = TMP_REG1;
  196. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  197. src2 = TMP_REG2;
  198. }
  199. /* Setting XER SO is not enough, CR SO is also needed. */
  200. FAIL_IF(push_inst(compiler, ADD | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2)));
  201. if (flags & ALT_SIGN_EXT)
  202. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  203. return SLJIT_SUCCESS;
  204. }
  205. if (flags & ALT_FORM2) {
  206. /* Flags does not set: BIN_IMM_EXTS unnecessary. */
  207. SLJIT_ASSERT(src2 == TMP_REG2);
  208. if (flags & ALT_FORM3)
  209. return push_inst(compiler, ADDIS | D(dst) | A(src1) | compiler->imm);
  210. if (flags & ALT_FORM4) {
  211. FAIL_IF(push_inst(compiler, ADDIS | D(dst) | A(src1) | (((compiler->imm >> 16) & 0xffff) + ((compiler->imm >> 15) & 0x1))));
  212. src1 = dst;
  213. }
  214. return push_inst(compiler, ADDI | D(dst) | A(src1) | (compiler->imm & 0xffff));
  215. }
  216. if (flags & ALT_FORM3) {
  217. SLJIT_ASSERT(src2 == TMP_REG2);
  218. BIN_IMM_EXTS();
  219. return push_inst(compiler, ADDIC | D(dst) | A(src1) | compiler->imm);
  220. }
  221. if (flags & ALT_FORM4) {
  222. if (flags & ALT_FORM5)
  223. FAIL_IF(push_inst(compiler, ADDI | D(dst) | A(src1) | compiler->imm));
  224. else
  225. FAIL_IF(push_inst(compiler, ADD | D(dst) | A(src1) | B(src2)));
  226. return push_inst(compiler, CMPI | A(dst) | 0);
  227. }
  228. if (!(flags & ALT_SET_FLAGS))
  229. return push_inst(compiler, ADD | D(dst) | A(src1) | B(src2));
  230. BIN_EXTS();
  231. if (flags & ALT_FORM5)
  232. return push_inst(compiler, ADDC | RC(ALT_SET_FLAGS) | D(dst) | A(src1) | B(src2));
  233. return push_inst(compiler, ADD | RC(flags) | D(dst) | A(src1) | B(src2));
  234. case SLJIT_ADDC:
  235. BIN_EXTS();
  236. return push_inst(compiler, ADDE | D(dst) | A(src1) | B(src2));
  237. case SLJIT_SUB:
  238. if (flags & ALT_FORM1) {
  239. if (flags & ALT_FORM2) {
  240. FAIL_IF(push_inst(compiler, CMPLI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
  241. if (!(flags & ALT_FORM3))
  242. return SLJIT_SUCCESS;
  243. return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
  244. }
  245. FAIL_IF(push_inst(compiler, CMPL | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
  246. if (!(flags & ALT_FORM3))
  247. return SLJIT_SUCCESS;
  248. return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
  249. }
  250. if (flags & ALT_FORM2) {
  251. if (flags & ALT_FORM3) {
  252. FAIL_IF(push_inst(compiler, CMPI | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | compiler->imm));
  253. if (!(flags & ALT_FORM4))
  254. return SLJIT_SUCCESS;
  255. return push_inst(compiler, ADDI | D(dst) | A(src1) | (-compiler->imm & 0xffff));
  256. }
  257. FAIL_IF(push_inst(compiler, CMP | CRD(0 | ((flags & ALT_SIGN_EXT) ? 0 : 1)) | A(src1) | B(src2)));
  258. if (!(flags & ALT_FORM4))
  259. return SLJIT_SUCCESS;
  260. return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
  261. }
  262. if (flags & ALT_FORM3) {
  263. if (flags & ALT_SIGN_EXT) {
  264. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, src1, 32, 31, 1)));
  265. src1 = TMP_REG1;
  266. FAIL_IF(push_inst(compiler, RLDI(TMP_REG2, src2, 32, 31, 1)));
  267. src2 = TMP_REG2;
  268. }
  269. /* Setting XER SO is not enough, CR SO is also needed. */
  270. FAIL_IF(push_inst(compiler, SUBF | OE(ALT_SET_FLAGS) | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1)));
  271. if (flags & ALT_SIGN_EXT)
  272. return push_inst(compiler, RLDI(dst, dst, 32, 32, 0));
  273. return SLJIT_SUCCESS;
  274. }
  275. if (flags & ALT_FORM4) {
  276. /* Flags does not set: BIN_IMM_EXTS unnecessary. */
  277. SLJIT_ASSERT(src2 == TMP_REG2);
  278. return push_inst(compiler, SUBFIC | D(dst) | A(src1) | compiler->imm);
  279. }
  280. if (!(flags & ALT_SET_FLAGS))
  281. return push_inst(compiler, SUBF | D(dst) | A(src2) | B(src1));
  282. BIN_EXTS();
  283. if (flags & ALT_FORM5)
  284. return push_inst(compiler, SUBFC | RC(ALT_SET_FLAGS) | D(dst) | A(src2) | B(src1));
  285. return push_inst(compiler, SUBF | RC(flags) | D(dst) | A(src2) | B(src1));
  286. case SLJIT_SUBC:
  287. BIN_EXTS();
  288. return push_inst(compiler, SUBFE | D(dst) | A(src2) | B(src1));
  289. case SLJIT_MUL:
  290. if (flags & ALT_FORM1) {
  291. SLJIT_ASSERT(src2 == TMP_REG2);
  292. return push_inst(compiler, MULLI | D(dst) | A(src1) | compiler->imm);
  293. }
  294. BIN_EXTS();
  295. if (flags & ALT_FORM2)
  296. return push_inst(compiler, MULLW | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
  297. return push_inst(compiler, MULLD | OE(flags) | RC(flags) | D(dst) | A(src2) | B(src1));
  298. case SLJIT_AND:
  299. if (flags & ALT_FORM1) {
  300. SLJIT_ASSERT(src2 == TMP_REG2);
  301. return push_inst(compiler, ANDI | S(src1) | A(dst) | compiler->imm);
  302. }
  303. if (flags & ALT_FORM2) {
  304. SLJIT_ASSERT(src2 == TMP_REG2);
  305. return push_inst(compiler, ANDIS | S(src1) | A(dst) | compiler->imm);
  306. }
  307. return push_inst(compiler, AND | RC(flags) | S(src1) | A(dst) | B(src2));
  308. case SLJIT_OR:
  309. if (flags & ALT_FORM1) {
  310. SLJIT_ASSERT(src2 == TMP_REG2);
  311. return push_inst(compiler, ORI | S(src1) | A(dst) | compiler->imm);
  312. }
  313. if (flags & ALT_FORM2) {
  314. SLJIT_ASSERT(src2 == TMP_REG2);
  315. return push_inst(compiler, ORIS | S(src1) | A(dst) | compiler->imm);
  316. }
  317. if (flags & ALT_FORM3) {
  318. SLJIT_ASSERT(src2 == TMP_REG2);
  319. FAIL_IF(push_inst(compiler, ORI | S(src1) | A(dst) | IMM(compiler->imm)));
  320. return push_inst(compiler, ORIS | S(dst) | A(dst) | IMM(compiler->imm >> 16));
  321. }
  322. return push_inst(compiler, OR | RC(flags) | S(src1) | A(dst) | B(src2));
  323. case SLJIT_XOR:
  324. if (flags & ALT_FORM1) {
  325. SLJIT_ASSERT(src2 == TMP_REG2);
  326. return push_inst(compiler, XORI | S(src1) | A(dst) | compiler->imm);
  327. }
  328. if (flags & ALT_FORM2) {
  329. SLJIT_ASSERT(src2 == TMP_REG2);
  330. return push_inst(compiler, XORIS | S(src1) | A(dst) | compiler->imm);
  331. }
  332. if (flags & ALT_FORM3) {
  333. SLJIT_ASSERT(src2 == TMP_REG2);
  334. FAIL_IF(push_inst(compiler, XORI | S(src1) | A(dst) | IMM(compiler->imm)));
  335. return push_inst(compiler, XORIS | S(dst) | A(dst) | IMM(compiler->imm >> 16));
  336. }
  337. return push_inst(compiler, XOR | RC(flags) | S(src1) | A(dst) | B(src2));
  338. case SLJIT_SHL:
  339. if (flags & ALT_FORM1) {
  340. SLJIT_ASSERT(src2 == TMP_REG2);
  341. if (flags & ALT_FORM2) {
  342. compiler->imm &= 0x1f;
  343. return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | (compiler->imm << 11) | ((31 - compiler->imm) << 1));
  344. }
  345. compiler->imm &= 0x3f;
  346. return push_inst(compiler, RLDI(dst, src1, compiler->imm, 63 - compiler->imm, 1) | RC(flags));
  347. }
  348. return push_inst(compiler, ((flags & ALT_FORM2) ? SLW : SLD) | RC(flags) | S(src1) | A(dst) | B(src2));
  349. case SLJIT_LSHR:
  350. if (flags & ALT_FORM1) {
  351. SLJIT_ASSERT(src2 == TMP_REG2);
  352. if (flags & ALT_FORM2) {
  353. compiler->imm &= 0x1f;
  354. return push_inst(compiler, RLWINM | RC(flags) | S(src1) | A(dst) | (((32 - compiler->imm) & 0x1f) << 11) | (compiler->imm << 6) | (31 << 1));
  355. }
  356. compiler->imm &= 0x3f;
  357. return push_inst(compiler, RLDI(dst, src1, 64 - compiler->imm, compiler->imm, 0) | RC(flags));
  358. }
  359. return push_inst(compiler, ((flags & ALT_FORM2) ? SRW : SRD) | RC(flags) | S(src1) | A(dst) | B(src2));
  360. case SLJIT_ASHR:
  361. if (flags & ALT_FORM1) {
  362. SLJIT_ASSERT(src2 == TMP_REG2);
  363. if (flags & ALT_FORM2) {
  364. compiler->imm &= 0x1f;
  365. return push_inst(compiler, SRAWI | RC(flags) | S(src1) | A(dst) | (compiler->imm << 11));
  366. }
  367. compiler->imm &= 0x3f;
  368. return push_inst(compiler, SRADI | RC(flags) | S(src1) | A(dst) | ((compiler->imm & 0x1f) << 11) | ((compiler->imm & 0x20) >> 4));
  369. }
  370. return push_inst(compiler, ((flags & ALT_FORM2) ? SRAW : SRAD) | RC(flags) | S(src1) | A(dst) | B(src2));
  371. }
  372. SLJIT_UNREACHABLE();
  373. return SLJIT_SUCCESS;
  374. }
  375. static sljit_s32 call_with_args(struct sljit_compiler *compiler, sljit_s32 arg_types, sljit_s32 *src)
  376. {
  377. sljit_s32 arg_count = 0;
  378. sljit_s32 word_arg_count = 0;
  379. sljit_s32 types = 0;
  380. sljit_s32 reg = 0;
  381. if (src)
  382. reg = *src & REG_MASK;
  383. arg_types >>= SLJIT_DEF_SHIFT;
  384. while (arg_types) {
  385. types = (types << SLJIT_DEF_SHIFT) | (arg_types & SLJIT_DEF_MASK);
  386. switch (arg_types & SLJIT_DEF_MASK) {
  387. case SLJIT_ARG_TYPE_F32:
  388. case SLJIT_ARG_TYPE_F64:
  389. arg_count++;
  390. break;
  391. default:
  392. arg_count++;
  393. word_arg_count++;
  394. if (arg_count != word_arg_count && arg_count == reg) {
  395. FAIL_IF(push_inst(compiler, OR | S(reg) | A(TMP_CALL_REG) | B(reg)));
  396. *src = TMP_CALL_REG;
  397. }
  398. break;
  399. }
  400. arg_types >>= SLJIT_DEF_SHIFT;
  401. }
  402. while (types) {
  403. switch (types & SLJIT_DEF_MASK) {
  404. case SLJIT_ARG_TYPE_F32:
  405. case SLJIT_ARG_TYPE_F64:
  406. arg_count--;
  407. break;
  408. default:
  409. if (arg_count != word_arg_count)
  410. FAIL_IF(push_inst(compiler, OR | S(word_arg_count) | A(arg_count) | B(word_arg_count)));
  411. arg_count--;
  412. word_arg_count--;
  413. break;
  414. }
  415. types >>= SLJIT_DEF_SHIFT;
  416. }
  417. return SLJIT_SUCCESS;
  418. }
  419. static SLJIT_INLINE sljit_s32 emit_const(struct sljit_compiler *compiler, sljit_s32 reg, sljit_sw init_value)
  420. {
  421. FAIL_IF(push_inst(compiler, ADDIS | D(reg) | A(0) | IMM(init_value >> 48)));
  422. FAIL_IF(push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value >> 32)));
  423. FAIL_IF(PUSH_RLDICR(reg, 31));
  424. FAIL_IF(push_inst(compiler, ORIS | S(reg) | A(reg) | IMM(init_value >> 16)));
  425. return push_inst(compiler, ORI | S(reg) | A(reg) | IMM(init_value));
  426. }
  427. SLJIT_API_FUNC_ATTRIBUTE void sljit_set_jump_addr(sljit_uw addr, sljit_uw new_target, sljit_sw executable_offset)
  428. {
  429. sljit_ins *inst = (sljit_ins*)addr;
  430. SLJIT_UNUSED_ARG(executable_offset);
  431. SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 0);
  432. inst[0] = (inst[0] & 0xffff0000) | ((new_target >> 48) & 0xffff);
  433. inst[1] = (inst[1] & 0xffff0000) | ((new_target >> 32) & 0xffff);
  434. inst[3] = (inst[3] & 0xffff0000) | ((new_target >> 16) & 0xffff);
  435. inst[4] = (inst[4] & 0xffff0000) | (new_target & 0xffff);
  436. SLJIT_UPDATE_WX_FLAGS(inst, inst + 5, 1);
  437. inst = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(inst, executable_offset);
  438. SLJIT_CACHE_FLUSH(inst, inst + 5);
  439. }
  440. SLJIT_API_FUNC_ATTRIBUTE void sljit_set_const(sljit_uw addr, sljit_sw new_constant, sljit_sw executable_offset)
  441. {
  442. sljit_set_jump_addr(addr, new_constant, executable_offset);
  443. }