sljitNativePPC_common.c 75 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447
  1. /*
  2. * Stack-less Just-In-Time compiler
  3. *
  4. * Copyright Zoltan Herczeg (hzmester@freemail.hu). All rights reserved.
  5. *
  6. * Redistribution and use in source and binary forms, with or without modification, are
  7. * permitted provided that the following conditions are met:
  8. *
  9. * 1. Redistributions of source code must retain the above copyright notice, this list of
  10. * conditions and the following disclaimer.
  11. *
  12. * 2. Redistributions in binary form must reproduce the above copyright notice, this list
  13. * of conditions and the following disclaimer in the documentation and/or other materials
  14. * provided with the distribution.
  15. *
  16. * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDER(S) AND CONTRIBUTORS ``AS IS'' AND ANY
  17. * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
  18. * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT
  19. * SHALL THE COPYRIGHT HOLDER(S) OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
  20. * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED
  21. * TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR
  22. * BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
  23. * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
  24. * ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  25. */
  26. SLJIT_API_FUNC_ATTRIBUTE const char* sljit_get_platform_name(void)
  27. {
  28. return "PowerPC" SLJIT_CPUINFO;
  29. }
  30. /* Length of an instruction word.
  31. Both for ppc-32 and ppc-64. */
  32. typedef sljit_u32 sljit_ins;
  33. #if ((defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32) && (defined _AIX)) \
  34. || (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  35. #define SLJIT_PPC_STACK_FRAME_V2 1
  36. #endif
  37. #ifdef _AIX
  38. #include <sys/cache.h>
  39. #endif
  40. #if (defined _CALL_ELF && _CALL_ELF == 2)
  41. #define SLJIT_PASS_ENTRY_ADDR_TO_CALL 1
  42. #endif
  43. #if (defined SLJIT_CACHE_FLUSH_OWN_IMPL && SLJIT_CACHE_FLUSH_OWN_IMPL)
  44. static void ppc_cache_flush(sljit_ins *from, sljit_ins *to)
  45. {
  46. #ifdef _AIX
  47. _sync_cache_range((caddr_t)from, (int)((size_t)to - (size_t)from));
  48. #elif defined(__GNUC__) || (defined(__IBM_GCC_ASM) && __IBM_GCC_ASM)
  49. # if defined(_ARCH_PWR) || defined(_ARCH_PWR2)
  50. /* Cache flush for POWER architecture. */
  51. while (from < to) {
  52. __asm__ volatile (
  53. "clf 0, %0\n"
  54. "dcs\n"
  55. : : "r"(from)
  56. );
  57. from++;
  58. }
  59. __asm__ volatile ( "ics" );
  60. # elif defined(_ARCH_COM) && !defined(_ARCH_PPC)
  61. # error "Cache flush is not implemented for PowerPC/POWER common mode."
  62. # else
  63. /* Cache flush for PowerPC architecture. */
  64. while (from < to) {
  65. __asm__ volatile (
  66. "dcbf 0, %0\n"
  67. "sync\n"
  68. "icbi 0, %0\n"
  69. : : "r"(from)
  70. );
  71. from++;
  72. }
  73. __asm__ volatile ( "isync" );
  74. # endif
  75. # ifdef __xlc__
  76. # warning "This file may fail to compile if -qfuncsect is used"
  77. # endif
  78. #elif defined(__xlc__)
  79. #error "Please enable GCC syntax for inline assembly statements with -qasm=gcc"
  80. #else
  81. #error "This platform requires a cache flush implementation."
  82. #endif /* _AIX */
  83. }
  84. #endif /* (defined SLJIT_CACHE_FLUSH_OWN_IMPL && SLJIT_CACHE_FLUSH_OWN_IMPL) */
  85. #define TMP_REG1 (SLJIT_NUMBER_OF_REGISTERS + 2)
  86. #define TMP_REG2 (SLJIT_NUMBER_OF_REGISTERS + 3)
  87. #define TMP_ZERO (SLJIT_NUMBER_OF_REGISTERS + 4)
  88. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL)
  89. #define TMP_CALL_REG (SLJIT_NUMBER_OF_REGISTERS + 5)
  90. #else
  91. #define TMP_CALL_REG TMP_REG2
  92. #endif
  93. #define TMP_FREG1 (SLJIT_NUMBER_OF_FLOAT_REGISTERS + 1)
  94. #define TMP_FREG2 (SLJIT_NUMBER_OF_FLOAT_REGISTERS + 2)
  95. static const sljit_u8 reg_map[SLJIT_NUMBER_OF_REGISTERS + 7] = {
  96. 0, 3, 4, 5, 6, 7, 8, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 1, 9, 10, 31, 12
  97. };
  98. static const sljit_u8 freg_map[SLJIT_NUMBER_OF_FLOAT_REGISTERS + 3] = {
  99. 0, 1, 2, 3, 4, 5, 6, 0, 7
  100. };
  101. /* --------------------------------------------------------------------- */
  102. /* Instrucion forms */
  103. /* --------------------------------------------------------------------- */
  104. #define D(d) (reg_map[d] << 21)
  105. #define S(s) (reg_map[s] << 21)
  106. #define A(a) (reg_map[a] << 16)
  107. #define B(b) (reg_map[b] << 11)
  108. #define C(c) (reg_map[c] << 6)
  109. #define FD(fd) (freg_map[fd] << 21)
  110. #define FS(fs) (freg_map[fs] << 21)
  111. #define FA(fa) (freg_map[fa] << 16)
  112. #define FB(fb) (freg_map[fb] << 11)
  113. #define FC(fc) (freg_map[fc] << 6)
  114. #define IMM(imm) ((imm) & 0xffff)
  115. #define CRD(d) ((d) << 21)
  116. /* Instruction bit sections.
  117. OE and Rc flag (see ALT_SET_FLAGS). */
  118. #define OE(flags) ((flags) & ALT_SET_FLAGS)
  119. /* Rc flag (see ALT_SET_FLAGS). */
  120. #define RC(flags) (((flags) & ALT_SET_FLAGS) >> 10)
  121. #define HI(opcode) ((opcode) << 26)
  122. #define LO(opcode) ((opcode) << 1)
  123. #define ADD (HI(31) | LO(266))
  124. #define ADDC (HI(31) | LO(10))
  125. #define ADDE (HI(31) | LO(138))
  126. #define ADDI (HI(14))
  127. #define ADDIC (HI(13))
  128. #define ADDIS (HI(15))
  129. #define ADDME (HI(31) | LO(234))
  130. #define AND (HI(31) | LO(28))
  131. #define ANDI (HI(28))
  132. #define ANDIS (HI(29))
  133. #define Bx (HI(18))
  134. #define BCx (HI(16))
  135. #define BCCTR (HI(19) | LO(528) | (3 << 11))
  136. #define BLR (HI(19) | LO(16) | (0x14 << 21))
  137. #define CNTLZD (HI(31) | LO(58))
  138. #define CNTLZW (HI(31) | LO(26))
  139. #define CMP (HI(31) | LO(0))
  140. #define CMPI (HI(11))
  141. #define CMPL (HI(31) | LO(32))
  142. #define CMPLI (HI(10))
  143. #define CROR (HI(19) | LO(449))
  144. #define DCBT (HI(31) | LO(278))
  145. #define DIVD (HI(31) | LO(489))
  146. #define DIVDU (HI(31) | LO(457))
  147. #define DIVW (HI(31) | LO(491))
  148. #define DIVWU (HI(31) | LO(459))
  149. #define EXTSB (HI(31) | LO(954))
  150. #define EXTSH (HI(31) | LO(922))
  151. #define EXTSW (HI(31) | LO(986))
  152. #define FABS (HI(63) | LO(264))
  153. #define FADD (HI(63) | LO(21))
  154. #define FADDS (HI(59) | LO(21))
  155. #define FCFID (HI(63) | LO(846))
  156. #define FCMPU (HI(63) | LO(0))
  157. #define FCTIDZ (HI(63) | LO(815))
  158. #define FCTIWZ (HI(63) | LO(15))
  159. #define FDIV (HI(63) | LO(18))
  160. #define FDIVS (HI(59) | LO(18))
  161. #define FMR (HI(63) | LO(72))
  162. #define FMUL (HI(63) | LO(25))
  163. #define FMULS (HI(59) | LO(25))
  164. #define FNEG (HI(63) | LO(40))
  165. #define FRSP (HI(63) | LO(12))
  166. #define FSUB (HI(63) | LO(20))
  167. #define FSUBS (HI(59) | LO(20))
  168. #define LD (HI(58) | 0)
  169. #define LWZ (HI(32))
  170. #define MFCR (HI(31) | LO(19))
  171. #define MFLR (HI(31) | LO(339) | 0x80000)
  172. #define MFXER (HI(31) | LO(339) | 0x10000)
  173. #define MTCTR (HI(31) | LO(467) | 0x90000)
  174. #define MTLR (HI(31) | LO(467) | 0x80000)
  175. #define MTXER (HI(31) | LO(467) | 0x10000)
  176. #define MULHD (HI(31) | LO(73))
  177. #define MULHDU (HI(31) | LO(9))
  178. #define MULHW (HI(31) | LO(75))
  179. #define MULHWU (HI(31) | LO(11))
  180. #define MULLD (HI(31) | LO(233))
  181. #define MULLI (HI(7))
  182. #define MULLW (HI(31) | LO(235))
  183. #define NEG (HI(31) | LO(104))
  184. #define NOP (HI(24))
  185. #define NOR (HI(31) | LO(124))
  186. #define OR (HI(31) | LO(444))
  187. #define ORI (HI(24))
  188. #define ORIS (HI(25))
  189. #define RLDICL (HI(30))
  190. #define RLWINM (HI(21))
  191. #define SLD (HI(31) | LO(27))
  192. #define SLW (HI(31) | LO(24))
  193. #define SRAD (HI(31) | LO(794))
  194. #define SRADI (HI(31) | LO(413 << 1))
  195. #define SRAW (HI(31) | LO(792))
  196. #define SRAWI (HI(31) | LO(824))
  197. #define SRD (HI(31) | LO(539))
  198. #define SRW (HI(31) | LO(536))
  199. #define STD (HI(62) | 0)
  200. #define STDU (HI(62) | 1)
  201. #define STDUX (HI(31) | LO(181))
  202. #define STFIWX (HI(31) | LO(983))
  203. #define STW (HI(36))
  204. #define STWU (HI(37))
  205. #define STWUX (HI(31) | LO(183))
  206. #define SUBF (HI(31) | LO(40))
  207. #define SUBFC (HI(31) | LO(8))
  208. #define SUBFE (HI(31) | LO(136))
  209. #define SUBFIC (HI(8))
  210. #define XOR (HI(31) | LO(316))
  211. #define XORI (HI(26))
  212. #define XORIS (HI(27))
  213. #define SIMM_MAX (0x7fff)
  214. #define SIMM_MIN (-0x8000)
  215. #define UIMM_MAX (0xffff)
  216. #define RLDI(dst, src, sh, mb, type) \
  217. (HI(30) | S(src) | A(dst) | ((type) << 2) | (((sh) & 0x1f) << 11) | (((sh) & 0x20) >> 4) | (((mb) & 0x1f) << 6) | ((mb) & 0x20))
  218. #if (defined SLJIT_INDIRECT_CALL && SLJIT_INDIRECT_CALL)
  219. SLJIT_API_FUNC_ATTRIBUTE void sljit_set_function_context(void** func_ptr, struct sljit_function_context* context, sljit_sw addr, void* func)
  220. {
  221. sljit_sw* ptrs;
  222. if (func_ptr)
  223. *func_ptr = (void*)context;
  224. ptrs = (sljit_sw*)func;
  225. context->addr = addr ? addr : ptrs[0];
  226. context->r2 = ptrs[1];
  227. context->r11 = ptrs[2];
  228. }
  229. #endif
  230. static sljit_s32 push_inst(struct sljit_compiler *compiler, sljit_ins ins)
  231. {
  232. sljit_ins *ptr = (sljit_ins*)ensure_buf(compiler, sizeof(sljit_ins));
  233. FAIL_IF(!ptr);
  234. *ptr = ins;
  235. compiler->size++;
  236. return SLJIT_SUCCESS;
  237. }
  238. static SLJIT_INLINE sljit_s32 detect_jump_type(struct sljit_jump *jump, sljit_ins *code_ptr, sljit_ins *code, sljit_sw executable_offset)
  239. {
  240. sljit_sw diff;
  241. sljit_uw target_addr;
  242. sljit_sw extra_jump_flags;
  243. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL) && (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  244. if (jump->flags & (SLJIT_REWRITABLE_JUMP | IS_CALL))
  245. return 0;
  246. #else
  247. if (jump->flags & SLJIT_REWRITABLE_JUMP)
  248. return 0;
  249. #endif
  250. if (jump->flags & JUMP_ADDR)
  251. target_addr = jump->u.target;
  252. else {
  253. SLJIT_ASSERT(jump->flags & JUMP_LABEL);
  254. target_addr = (sljit_uw)(code + jump->u.label->size) + (sljit_uw)executable_offset;
  255. }
  256. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL) && (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  257. if (jump->flags & IS_CALL)
  258. goto keep_address;
  259. #endif
  260. diff = ((sljit_sw)target_addr - (sljit_sw)(code_ptr) - executable_offset) & ~0x3l;
  261. extra_jump_flags = 0;
  262. if (jump->flags & IS_COND) {
  263. if (diff <= 0x7fff && diff >= -0x8000) {
  264. jump->flags |= PATCH_B;
  265. return 1;
  266. }
  267. if (target_addr <= 0xffff) {
  268. jump->flags |= PATCH_B | PATCH_ABS_B;
  269. return 1;
  270. }
  271. extra_jump_flags = REMOVE_COND;
  272. diff -= sizeof(sljit_ins);
  273. }
  274. if (diff <= 0x01ffffff && diff >= -0x02000000) {
  275. jump->flags |= PATCH_B | extra_jump_flags;
  276. return 1;
  277. }
  278. if (target_addr <= 0x03ffffff) {
  279. jump->flags |= PATCH_B | PATCH_ABS_B | extra_jump_flags;
  280. return 1;
  281. }
  282. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  283. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL)
  284. keep_address:
  285. #endif
  286. if (target_addr <= 0x7fffffff) {
  287. jump->flags |= PATCH_ABS32;
  288. return 1;
  289. }
  290. if (target_addr <= 0x7fffffffffffl) {
  291. jump->flags |= PATCH_ABS48;
  292. return 1;
  293. }
  294. #endif
  295. return 0;
  296. }
  297. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  298. static SLJIT_INLINE sljit_sw put_label_get_length(struct sljit_put_label *put_label, sljit_uw max_label)
  299. {
  300. if (max_label < 0x100000000l) {
  301. put_label->flags = 0;
  302. return 1;
  303. }
  304. if (max_label < 0x1000000000000l) {
  305. put_label->flags = 1;
  306. return 3;
  307. }
  308. put_label->flags = 2;
  309. return 4;
  310. }
  311. static SLJIT_INLINE void put_label_set(struct sljit_put_label *put_label)
  312. {
  313. sljit_uw addr = put_label->label->addr;
  314. sljit_ins *inst = (sljit_ins *)put_label->addr;
  315. sljit_s32 reg = *inst;
  316. if (put_label->flags == 0) {
  317. SLJIT_ASSERT(addr < 0x100000000l);
  318. inst[0] = ORIS | S(TMP_ZERO) | A(reg) | IMM(addr >> 16);
  319. }
  320. else {
  321. if (put_label->flags == 1) {
  322. SLJIT_ASSERT(addr < 0x1000000000000l);
  323. inst[0] = ORI | S(TMP_ZERO) | A(reg) | IMM(addr >> 32);
  324. }
  325. else {
  326. inst[0] = ORIS | S(TMP_ZERO) | A(reg) | IMM(addr >> 48);
  327. inst[1] = ORI | S(reg) | A(reg) | IMM((addr >> 32) & 0xffff);
  328. inst ++;
  329. }
  330. inst[1] = RLDI(reg, reg, 32, 31, 1);
  331. inst[2] = ORIS | S(reg) | A(reg) | IMM((addr >> 16) & 0xffff);
  332. inst += 2;
  333. }
  334. inst[1] = ORI | S(reg) | A(reg) | IMM(addr & 0xffff);
  335. }
  336. #endif
  337. SLJIT_API_FUNC_ATTRIBUTE void* sljit_generate_code(struct sljit_compiler *compiler)
  338. {
  339. struct sljit_memory_fragment *buf;
  340. sljit_ins *code;
  341. sljit_ins *code_ptr;
  342. sljit_ins *buf_ptr;
  343. sljit_ins *buf_end;
  344. sljit_uw word_count;
  345. sljit_uw next_addr;
  346. sljit_sw executable_offset;
  347. sljit_uw addr;
  348. struct sljit_label *label;
  349. struct sljit_jump *jump;
  350. struct sljit_const *const_;
  351. struct sljit_put_label *put_label;
  352. CHECK_ERROR_PTR();
  353. CHECK_PTR(check_sljit_generate_code(compiler));
  354. reverse_buf(compiler);
  355. #if (defined SLJIT_INDIRECT_CALL && SLJIT_INDIRECT_CALL)
  356. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  357. compiler->size += (compiler->size & 0x1) + (sizeof(struct sljit_function_context) / sizeof(sljit_ins));
  358. #else
  359. compiler->size += (sizeof(struct sljit_function_context) / sizeof(sljit_ins));
  360. #endif
  361. #endif
  362. code = (sljit_ins*)SLJIT_MALLOC_EXEC(compiler->size * sizeof(sljit_ins), compiler->exec_allocator_data);
  363. PTR_FAIL_WITH_EXEC_IF(code);
  364. buf = compiler->buf;
  365. code_ptr = code;
  366. word_count = 0;
  367. next_addr = 0;
  368. executable_offset = SLJIT_EXEC_OFFSET(code);
  369. label = compiler->labels;
  370. jump = compiler->jumps;
  371. const_ = compiler->consts;
  372. put_label = compiler->put_labels;
  373. do {
  374. buf_ptr = (sljit_ins*)buf->memory;
  375. buf_end = buf_ptr + (buf->used_size >> 2);
  376. do {
  377. *code_ptr = *buf_ptr++;
  378. if (next_addr == word_count) {
  379. SLJIT_ASSERT(!label || label->size >= word_count);
  380. SLJIT_ASSERT(!jump || jump->addr >= word_count);
  381. SLJIT_ASSERT(!const_ || const_->addr >= word_count);
  382. SLJIT_ASSERT(!put_label || put_label->addr >= word_count);
  383. /* These structures are ordered by their address. */
  384. if (label && label->size == word_count) {
  385. /* Just recording the address. */
  386. label->addr = (sljit_uw)SLJIT_ADD_EXEC_OFFSET(code_ptr, executable_offset);
  387. label->size = code_ptr - code;
  388. label = label->next;
  389. }
  390. if (jump && jump->addr == word_count) {
  391. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  392. jump->addr = (sljit_uw)(code_ptr - 3);
  393. #else
  394. jump->addr = (sljit_uw)(code_ptr - 6);
  395. #endif
  396. if (detect_jump_type(jump, code_ptr, code, executable_offset)) {
  397. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  398. code_ptr[-3] = code_ptr[0];
  399. code_ptr -= 3;
  400. #else
  401. if (jump->flags & PATCH_ABS32) {
  402. code_ptr -= 3;
  403. code_ptr[-1] = code_ptr[2];
  404. code_ptr[0] = code_ptr[3];
  405. }
  406. else if (jump->flags & PATCH_ABS48) {
  407. code_ptr--;
  408. code_ptr[-1] = code_ptr[0];
  409. code_ptr[0] = code_ptr[1];
  410. /* rldicr rX,rX,32,31 -> rX,rX,16,47 */
  411. SLJIT_ASSERT((code_ptr[-3] & 0xfc00ffff) == 0x780007c6);
  412. code_ptr[-3] ^= 0x8422;
  413. /* oris -> ori */
  414. code_ptr[-2] ^= 0x4000000;
  415. }
  416. else {
  417. code_ptr[-6] = code_ptr[0];
  418. code_ptr -= 6;
  419. }
  420. #endif
  421. if (jump->flags & REMOVE_COND) {
  422. code_ptr[0] = BCx | (2 << 2) | ((code_ptr[0] ^ (8 << 21)) & 0x03ff0001);
  423. code_ptr++;
  424. jump->addr += sizeof(sljit_ins);
  425. code_ptr[0] = Bx;
  426. jump->flags -= IS_COND;
  427. }
  428. }
  429. jump = jump->next;
  430. }
  431. if (const_ && const_->addr == word_count) {
  432. const_->addr = (sljit_uw)code_ptr;
  433. const_ = const_->next;
  434. }
  435. if (put_label && put_label->addr == word_count) {
  436. SLJIT_ASSERT(put_label->label);
  437. put_label->addr = (sljit_uw)code_ptr;
  438. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  439. code_ptr += put_label_get_length(put_label, (sljit_uw)(SLJIT_ADD_EXEC_OFFSET(code, executable_offset) + put_label->label->size));
  440. word_count += 4;
  441. #endif
  442. put_label = put_label->next;
  443. }
  444. next_addr = compute_next_addr(label, jump, const_, put_label);
  445. }
  446. code_ptr ++;
  447. word_count ++;
  448. } while (buf_ptr < buf_end);
  449. buf = buf->next;
  450. } while (buf);
  451. if (label && label->size == word_count) {
  452. label->addr = (sljit_uw)SLJIT_ADD_EXEC_OFFSET(code_ptr, executable_offset);
  453. label->size = code_ptr - code;
  454. label = label->next;
  455. }
  456. SLJIT_ASSERT(!label);
  457. SLJIT_ASSERT(!jump);
  458. SLJIT_ASSERT(!const_);
  459. SLJIT_ASSERT(!put_label);
  460. #if (defined SLJIT_INDIRECT_CALL && SLJIT_INDIRECT_CALL)
  461. SLJIT_ASSERT(code_ptr - code <= (sljit_sw)compiler->size - (sizeof(struct sljit_function_context) / sizeof(sljit_ins)));
  462. #else
  463. SLJIT_ASSERT(code_ptr - code <= (sljit_sw)compiler->size);
  464. #endif
  465. jump = compiler->jumps;
  466. while (jump) {
  467. do {
  468. addr = (jump->flags & JUMP_LABEL) ? jump->u.label->addr : jump->u.target;
  469. buf_ptr = (sljit_ins *)jump->addr;
  470. if (jump->flags & PATCH_B) {
  471. if (jump->flags & IS_COND) {
  472. if (!(jump->flags & PATCH_ABS_B)) {
  473. addr -= (sljit_uw)SLJIT_ADD_EXEC_OFFSET(buf_ptr, executable_offset);
  474. SLJIT_ASSERT((sljit_sw)addr <= 0x7fff && (sljit_sw)addr >= -0x8000);
  475. *buf_ptr = BCx | (addr & 0xfffc) | ((*buf_ptr) & 0x03ff0001);
  476. }
  477. else {
  478. SLJIT_ASSERT(addr <= 0xffff);
  479. *buf_ptr = BCx | (addr & 0xfffc) | 0x2 | ((*buf_ptr) & 0x03ff0001);
  480. }
  481. }
  482. else {
  483. if (!(jump->flags & PATCH_ABS_B)) {
  484. addr -= (sljit_uw)SLJIT_ADD_EXEC_OFFSET(buf_ptr, executable_offset);
  485. SLJIT_ASSERT((sljit_sw)addr <= 0x01ffffff && (sljit_sw)addr >= -0x02000000);
  486. *buf_ptr = Bx | (addr & 0x03fffffc) | ((*buf_ptr) & 0x1);
  487. }
  488. else {
  489. SLJIT_ASSERT(addr <= 0x03ffffff);
  490. *buf_ptr = Bx | (addr & 0x03fffffc) | 0x2 | ((*buf_ptr) & 0x1);
  491. }
  492. }
  493. break;
  494. }
  495. /* Set the fields of immediate loads. */
  496. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  497. buf_ptr[0] = (buf_ptr[0] & 0xffff0000) | ((addr >> 16) & 0xffff);
  498. buf_ptr[1] = (buf_ptr[1] & 0xffff0000) | (addr & 0xffff);
  499. #else
  500. if (jump->flags & PATCH_ABS32) {
  501. SLJIT_ASSERT(addr <= 0x7fffffff);
  502. buf_ptr[0] = (buf_ptr[0] & 0xffff0000) | ((addr >> 16) & 0xffff);
  503. buf_ptr[1] = (buf_ptr[1] & 0xffff0000) | (addr & 0xffff);
  504. break;
  505. }
  506. if (jump->flags & PATCH_ABS48) {
  507. SLJIT_ASSERT(addr <= 0x7fffffffffff);
  508. buf_ptr[0] = (buf_ptr[0] & 0xffff0000) | ((addr >> 32) & 0xffff);
  509. buf_ptr[1] = (buf_ptr[1] & 0xffff0000) | ((addr >> 16) & 0xffff);
  510. buf_ptr[3] = (buf_ptr[3] & 0xffff0000) | (addr & 0xffff);
  511. break;
  512. }
  513. buf_ptr[0] = (buf_ptr[0] & 0xffff0000) | ((addr >> 48) & 0xffff);
  514. buf_ptr[1] = (buf_ptr[1] & 0xffff0000) | ((addr >> 32) & 0xffff);
  515. buf_ptr[3] = (buf_ptr[3] & 0xffff0000) | ((addr >> 16) & 0xffff);
  516. buf_ptr[4] = (buf_ptr[4] & 0xffff0000) | (addr & 0xffff);
  517. #endif
  518. } while (0);
  519. jump = jump->next;
  520. }
  521. put_label = compiler->put_labels;
  522. while (put_label) {
  523. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  524. addr = put_label->label->addr;
  525. buf_ptr = (sljit_ins *)put_label->addr;
  526. SLJIT_ASSERT((buf_ptr[0] & 0xfc1f0000) == ADDIS && (buf_ptr[1] & 0xfc000000) == ORI);
  527. buf_ptr[0] |= (addr >> 16) & 0xffff;
  528. buf_ptr[1] |= addr & 0xffff;
  529. #else
  530. put_label_set(put_label);
  531. #endif
  532. put_label = put_label->next;
  533. }
  534. compiler->error = SLJIT_ERR_COMPILED;
  535. compiler->executable_offset = executable_offset;
  536. compiler->executable_size = (code_ptr - code) * sizeof(sljit_ins);
  537. code = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(code, executable_offset);
  538. #if (defined SLJIT_INDIRECT_CALL && SLJIT_INDIRECT_CALL)
  539. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  540. if (((sljit_sw)code_ptr) & 0x4)
  541. code_ptr++;
  542. #endif
  543. sljit_set_function_context(NULL, (struct sljit_function_context*)code_ptr, (sljit_sw)code, (void*)sljit_generate_code);
  544. #endif
  545. code_ptr = (sljit_ins *)SLJIT_ADD_EXEC_OFFSET(code_ptr, executable_offset);
  546. SLJIT_CACHE_FLUSH(code, code_ptr);
  547. SLJIT_UPDATE_WX_FLAGS(code, code_ptr, 1);
  548. #if (defined SLJIT_INDIRECT_CALL && SLJIT_INDIRECT_CALL)
  549. return code_ptr;
  550. #else
  551. return code;
  552. #endif
  553. }
  554. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_has_cpu_feature(sljit_s32 feature_type)
  555. {
  556. switch (feature_type) {
  557. case SLJIT_HAS_FPU:
  558. #ifdef SLJIT_IS_FPU_AVAILABLE
  559. return SLJIT_IS_FPU_AVAILABLE;
  560. #else
  561. /* Available by default. */
  562. return 1;
  563. #endif
  564. /* A saved register is set to a zero value. */
  565. case SLJIT_HAS_ZERO_REGISTER:
  566. case SLJIT_HAS_CLZ:
  567. case SLJIT_HAS_PREFETCH:
  568. return 1;
  569. default:
  570. return 0;
  571. }
  572. }
  573. /* --------------------------------------------------------------------- */
  574. /* Entry, exit */
  575. /* --------------------------------------------------------------------- */
  576. /* inp_flags: */
  577. /* Creates an index in data_transfer_insts array. */
  578. #define LOAD_DATA 0x01
  579. #define INDEXED 0x02
  580. #define SIGNED_DATA 0x04
  581. #define WORD_DATA 0x00
  582. #define BYTE_DATA 0x08
  583. #define HALF_DATA 0x10
  584. #define INT_DATA 0x18
  585. /* Separates integer and floating point registers */
  586. #define GPR_REG 0x1f
  587. #define DOUBLE_DATA 0x20
  588. #define MEM_MASK 0x7f
  589. /* Other inp_flags. */
  590. /* Integer opertion and set flags -> requires exts on 64 bit systems. */
  591. #define ALT_SIGN_EXT 0x000100
  592. /* This flag affects the RC() and OERC() macros. */
  593. #define ALT_SET_FLAGS 0x000400
  594. #define ALT_FORM1 0x001000
  595. #define ALT_FORM2 0x002000
  596. #define ALT_FORM3 0x004000
  597. #define ALT_FORM4 0x008000
  598. #define ALT_FORM5 0x010000
  599. /* Source and destination is register. */
  600. #define REG_DEST 0x000001
  601. #define REG1_SOURCE 0x000002
  602. #define REG2_SOURCE 0x000004
  603. /*
  604. ALT_SIGN_EXT 0x000100
  605. ALT_SET_FLAGS 0x000200
  606. ALT_FORM1 0x001000
  607. ...
  608. ALT_FORM5 0x010000 */
  609. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  610. #include "sljitNativePPC_32.c"
  611. #else
  612. #include "sljitNativePPC_64.c"
  613. #endif
  614. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  615. #define STACK_STORE STW
  616. #define STACK_LOAD LWZ
  617. #else
  618. #define STACK_STORE STD
  619. #define STACK_LOAD LD
  620. #endif
  621. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_enter(struct sljit_compiler *compiler,
  622. sljit_s32 options, sljit_s32 arg_types, sljit_s32 scratches, sljit_s32 saveds,
  623. sljit_s32 fscratches, sljit_s32 fsaveds, sljit_s32 local_size)
  624. {
  625. sljit_s32 args, i, tmp, offs;
  626. CHECK_ERROR();
  627. CHECK(check_sljit_emit_enter(compiler, options, arg_types, scratches, saveds, fscratches, fsaveds, local_size));
  628. set_emit_enter(compiler, options, arg_types, scratches, saveds, fscratches, fsaveds, local_size);
  629. FAIL_IF(push_inst(compiler, MFLR | D(0)));
  630. offs = -(sljit_s32)(sizeof(sljit_sw));
  631. FAIL_IF(push_inst(compiler, STACK_STORE | S(TMP_ZERO) | A(SLJIT_SP) | IMM(offs)));
  632. tmp = saveds < SLJIT_NUMBER_OF_SAVED_REGISTERS ? (SLJIT_S0 + 1 - saveds) : SLJIT_FIRST_SAVED_REG;
  633. for (i = SLJIT_S0; i >= tmp; i--) {
  634. offs -= (sljit_s32)(sizeof(sljit_sw));
  635. FAIL_IF(push_inst(compiler, STACK_STORE | S(i) | A(SLJIT_SP) | IMM(offs)));
  636. }
  637. for (i = scratches; i >= SLJIT_FIRST_SAVED_REG; i--) {
  638. offs -= (sljit_s32)(sizeof(sljit_sw));
  639. FAIL_IF(push_inst(compiler, STACK_STORE | S(i) | A(SLJIT_SP) | IMM(offs)));
  640. }
  641. SLJIT_ASSERT(offs == -(sljit_s32)GET_SAVED_REGISTERS_SIZE(compiler->scratches, compiler->saveds, 1));
  642. #if (defined SLJIT_PPC_STACK_FRAME_V2 && SLJIT_PPC_STACK_FRAME_V2)
  643. FAIL_IF(push_inst(compiler, STACK_STORE | S(0) | A(SLJIT_SP) | IMM(2 * sizeof(sljit_sw))));
  644. #else
  645. FAIL_IF(push_inst(compiler, STACK_STORE | S(0) | A(SLJIT_SP) | IMM(sizeof(sljit_sw))));
  646. #endif
  647. FAIL_IF(push_inst(compiler, ADDI | D(TMP_ZERO) | A(0) | 0));
  648. args = get_arg_count(arg_types);
  649. if (args >= 1)
  650. FAIL_IF(push_inst(compiler, OR | S(SLJIT_R0) | A(SLJIT_S0) | B(SLJIT_R0)));
  651. if (args >= 2)
  652. FAIL_IF(push_inst(compiler, OR | S(SLJIT_R1) | A(SLJIT_S1) | B(SLJIT_R1)));
  653. if (args >= 3)
  654. FAIL_IF(push_inst(compiler, OR | S(SLJIT_R2) | A(SLJIT_S2) | B(SLJIT_R2)));
  655. local_size += GET_SAVED_REGISTERS_SIZE(scratches, saveds, 1) + SLJIT_LOCALS_OFFSET;
  656. local_size = (local_size + 15) & ~0xf;
  657. compiler->local_size = local_size;
  658. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  659. if (local_size <= SIMM_MAX)
  660. FAIL_IF(push_inst(compiler, STWU | S(SLJIT_SP) | A(SLJIT_SP) | IMM(-local_size)));
  661. else {
  662. FAIL_IF(load_immediate(compiler, 0, -local_size));
  663. FAIL_IF(push_inst(compiler, STWUX | S(SLJIT_SP) | A(SLJIT_SP) | B(0)));
  664. }
  665. #else
  666. if (local_size <= SIMM_MAX)
  667. FAIL_IF(push_inst(compiler, STDU | S(SLJIT_SP) | A(SLJIT_SP) | IMM(-local_size)));
  668. else {
  669. FAIL_IF(load_immediate(compiler, 0, -local_size));
  670. FAIL_IF(push_inst(compiler, STDUX | S(SLJIT_SP) | A(SLJIT_SP) | B(0)));
  671. }
  672. #endif
  673. return SLJIT_SUCCESS;
  674. }
  675. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_set_context(struct sljit_compiler *compiler,
  676. sljit_s32 options, sljit_s32 arg_types, sljit_s32 scratches, sljit_s32 saveds,
  677. sljit_s32 fscratches, sljit_s32 fsaveds, sljit_s32 local_size)
  678. {
  679. CHECK_ERROR();
  680. CHECK(check_sljit_set_context(compiler, options, arg_types, scratches, saveds, fscratches, fsaveds, local_size));
  681. set_set_context(compiler, options, arg_types, scratches, saveds, fscratches, fsaveds, local_size);
  682. local_size += GET_SAVED_REGISTERS_SIZE(scratches, saveds, 1) + SLJIT_LOCALS_OFFSET;
  683. compiler->local_size = (local_size + 15) & ~0xf;
  684. return SLJIT_SUCCESS;
  685. }
  686. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_return(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 src, sljit_sw srcw)
  687. {
  688. sljit_s32 i, tmp, offs;
  689. CHECK_ERROR();
  690. CHECK(check_sljit_emit_return(compiler, op, src, srcw));
  691. FAIL_IF(emit_mov_before_return(compiler, op, src, srcw));
  692. if (compiler->local_size <= SIMM_MAX)
  693. FAIL_IF(push_inst(compiler, ADDI | D(SLJIT_SP) | A(SLJIT_SP) | IMM(compiler->local_size)));
  694. else {
  695. FAIL_IF(load_immediate(compiler, 0, compiler->local_size));
  696. FAIL_IF(push_inst(compiler, ADD | D(SLJIT_SP) | A(SLJIT_SP) | B(0)));
  697. }
  698. #if (defined SLJIT_PPC_STACK_FRAME_V2 && SLJIT_PPC_STACK_FRAME_V2)
  699. FAIL_IF(push_inst(compiler, STACK_LOAD | D(0) | A(SLJIT_SP) | IMM(2 * sizeof(sljit_sw))));
  700. #else
  701. FAIL_IF(push_inst(compiler, STACK_LOAD | D(0) | A(SLJIT_SP) | IMM(sizeof(sljit_sw))));
  702. #endif
  703. offs = -(sljit_s32)GET_SAVED_REGISTERS_SIZE(compiler->scratches, compiler->saveds, 1);
  704. tmp = compiler->scratches;
  705. for (i = SLJIT_FIRST_SAVED_REG; i <= tmp; i++) {
  706. FAIL_IF(push_inst(compiler, STACK_LOAD | D(i) | A(SLJIT_SP) | IMM(offs)));
  707. offs += (sljit_s32)(sizeof(sljit_sw));
  708. }
  709. tmp = compiler->saveds < SLJIT_NUMBER_OF_SAVED_REGISTERS ? (SLJIT_S0 + 1 - compiler->saveds) : SLJIT_FIRST_SAVED_REG;
  710. for (i = tmp; i <= SLJIT_S0; i++) {
  711. FAIL_IF(push_inst(compiler, STACK_LOAD | D(i) | A(SLJIT_SP) | IMM(offs)));
  712. offs += (sljit_s32)(sizeof(sljit_sw));
  713. }
  714. FAIL_IF(push_inst(compiler, STACK_LOAD | D(TMP_ZERO) | A(SLJIT_SP) | IMM(offs)));
  715. SLJIT_ASSERT(offs == -(sljit_sw)(sizeof(sljit_sw)));
  716. FAIL_IF(push_inst(compiler, MTLR | S(0)));
  717. FAIL_IF(push_inst(compiler, BLR));
  718. return SLJIT_SUCCESS;
  719. }
  720. #undef STACK_STORE
  721. #undef STACK_LOAD
  722. /* --------------------------------------------------------------------- */
  723. /* Operators */
  724. /* --------------------------------------------------------------------- */
  725. /* s/l - store/load (1 bit)
  726. i/x - immediate/indexed form
  727. u/s - signed/unsigned (1 bit)
  728. w/b/h/i - word/byte/half/int allowed (2 bit)
  729. Some opcodes are repeated (e.g. store signed / unsigned byte is the same instruction). */
  730. /* 64 bit only: [reg+imm] must be aligned to 4 bytes. */
  731. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  732. #define INT_ALIGNED 0x10000
  733. #endif
  734. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  735. #define ARCH_32_64(a, b) a
  736. #define INST_CODE_AND_DST(inst, flags, reg) \
  737. ((inst) | (((flags) & MEM_MASK) <= GPR_REG ? D(reg) : FD(reg)))
  738. #else
  739. #define ARCH_32_64(a, b) b
  740. #define INST_CODE_AND_DST(inst, flags, reg) \
  741. (((inst) & ~INT_ALIGNED) | (((flags) & MEM_MASK) <= GPR_REG ? D(reg) : FD(reg)))
  742. #endif
  743. static const sljit_ins data_transfer_insts[64 + 16] = {
  744. /* -------- Integer -------- */
  745. /* Word. */
  746. /* w u i s */ ARCH_32_64(HI(36) /* stw */, HI(62) | INT_ALIGNED | 0x0 /* std */),
  747. /* w u i l */ ARCH_32_64(HI(32) /* lwz */, HI(58) | INT_ALIGNED | 0x0 /* ld */),
  748. /* w u x s */ ARCH_32_64(HI(31) | LO(151) /* stwx */, HI(31) | LO(149) /* stdx */),
  749. /* w u x l */ ARCH_32_64(HI(31) | LO(23) /* lwzx */, HI(31) | LO(21) /* ldx */),
  750. /* w s i s */ ARCH_32_64(HI(36) /* stw */, HI(62) | INT_ALIGNED | 0x0 /* std */),
  751. /* w s i l */ ARCH_32_64(HI(32) /* lwz */, HI(58) | INT_ALIGNED | 0x0 /* ld */),
  752. /* w s x s */ ARCH_32_64(HI(31) | LO(151) /* stwx */, HI(31) | LO(149) /* stdx */),
  753. /* w s x l */ ARCH_32_64(HI(31) | LO(23) /* lwzx */, HI(31) | LO(21) /* ldx */),
  754. /* Byte. */
  755. /* b u i s */ HI(38) /* stb */,
  756. /* b u i l */ HI(34) /* lbz */,
  757. /* b u x s */ HI(31) | LO(215) /* stbx */,
  758. /* b u x l */ HI(31) | LO(87) /* lbzx */,
  759. /* b s i s */ HI(38) /* stb */,
  760. /* b s i l */ HI(34) /* lbz */ /* EXTS_REQ */,
  761. /* b s x s */ HI(31) | LO(215) /* stbx */,
  762. /* b s x l */ HI(31) | LO(87) /* lbzx */ /* EXTS_REQ */,
  763. /* Half. */
  764. /* h u i s */ HI(44) /* sth */,
  765. /* h u i l */ HI(40) /* lhz */,
  766. /* h u x s */ HI(31) | LO(407) /* sthx */,
  767. /* h u x l */ HI(31) | LO(279) /* lhzx */,
  768. /* h s i s */ HI(44) /* sth */,
  769. /* h s i l */ HI(42) /* lha */,
  770. /* h s x s */ HI(31) | LO(407) /* sthx */,
  771. /* h s x l */ HI(31) | LO(343) /* lhax */,
  772. /* Int. */
  773. /* i u i s */ HI(36) /* stw */,
  774. /* i u i l */ HI(32) /* lwz */,
  775. /* i u x s */ HI(31) | LO(151) /* stwx */,
  776. /* i u x l */ HI(31) | LO(23) /* lwzx */,
  777. /* i s i s */ HI(36) /* stw */,
  778. /* i s i l */ ARCH_32_64(HI(32) /* lwz */, HI(58) | INT_ALIGNED | 0x2 /* lwa */),
  779. /* i s x s */ HI(31) | LO(151) /* stwx */,
  780. /* i s x l */ ARCH_32_64(HI(31) | LO(23) /* lwzx */, HI(31) | LO(341) /* lwax */),
  781. /* -------- Floating point -------- */
  782. /* d i s */ HI(54) /* stfd */,
  783. /* d i l */ HI(50) /* lfd */,
  784. /* d x s */ HI(31) | LO(727) /* stfdx */,
  785. /* d x l */ HI(31) | LO(599) /* lfdx */,
  786. /* s i s */ HI(52) /* stfs */,
  787. /* s i l */ HI(48) /* lfs */,
  788. /* s x s */ HI(31) | LO(663) /* stfsx */,
  789. /* s x l */ HI(31) | LO(535) /* lfsx */,
  790. };
  791. static const sljit_ins updated_data_transfer_insts[64] = {
  792. /* -------- Integer -------- */
  793. /* Word. */
  794. /* w u i s */ ARCH_32_64(HI(37) /* stwu */, HI(62) | INT_ALIGNED | 0x1 /* stdu */),
  795. /* w u i l */ ARCH_32_64(HI(33) /* lwzu */, HI(58) | INT_ALIGNED | 0x1 /* ldu */),
  796. /* w u x s */ ARCH_32_64(HI(31) | LO(183) /* stwux */, HI(31) | LO(181) /* stdux */),
  797. /* w u x l */ ARCH_32_64(HI(31) | LO(55) /* lwzux */, HI(31) | LO(53) /* ldux */),
  798. /* w s i s */ ARCH_32_64(HI(37) /* stwu */, HI(62) | INT_ALIGNED | 0x1 /* stdu */),
  799. /* w s i l */ ARCH_32_64(HI(33) /* lwzu */, HI(58) | INT_ALIGNED | 0x1 /* ldu */),
  800. /* w s x s */ ARCH_32_64(HI(31) | LO(183) /* stwux */, HI(31) | LO(181) /* stdux */),
  801. /* w s x l */ ARCH_32_64(HI(31) | LO(55) /* lwzux */, HI(31) | LO(53) /* ldux */),
  802. /* Byte. */
  803. /* b u i s */ HI(39) /* stbu */,
  804. /* b u i l */ HI(35) /* lbzu */,
  805. /* b u x s */ HI(31) | LO(247) /* stbux */,
  806. /* b u x l */ HI(31) | LO(119) /* lbzux */,
  807. /* b s i s */ HI(39) /* stbu */,
  808. /* b s i l */ 0 /* no such instruction */,
  809. /* b s x s */ HI(31) | LO(247) /* stbux */,
  810. /* b s x l */ 0 /* no such instruction */,
  811. /* Half. */
  812. /* h u i s */ HI(45) /* sthu */,
  813. /* h u i l */ HI(41) /* lhzu */,
  814. /* h u x s */ HI(31) | LO(439) /* sthux */,
  815. /* h u x l */ HI(31) | LO(311) /* lhzux */,
  816. /* h s i s */ HI(45) /* sthu */,
  817. /* h s i l */ HI(43) /* lhau */,
  818. /* h s x s */ HI(31) | LO(439) /* sthux */,
  819. /* h s x l */ HI(31) | LO(375) /* lhaux */,
  820. /* Int. */
  821. /* i u i s */ HI(37) /* stwu */,
  822. /* i u i l */ HI(33) /* lwzu */,
  823. /* i u x s */ HI(31) | LO(183) /* stwux */,
  824. /* i u x l */ HI(31) | LO(55) /* lwzux */,
  825. /* i s i s */ HI(37) /* stwu */,
  826. /* i s i l */ ARCH_32_64(HI(33) /* lwzu */, 0 /* no such instruction */),
  827. /* i s x s */ HI(31) | LO(183) /* stwux */,
  828. /* i s x l */ ARCH_32_64(HI(31) | LO(55) /* lwzux */, HI(31) | LO(373) /* lwaux */),
  829. /* -------- Floating point -------- */
  830. /* d i s */ HI(55) /* stfdu */,
  831. /* d i l */ HI(51) /* lfdu */,
  832. /* d x s */ HI(31) | LO(759) /* stfdux */,
  833. /* d x l */ HI(31) | LO(631) /* lfdux */,
  834. /* s i s */ HI(53) /* stfsu */,
  835. /* s i l */ HI(49) /* lfsu */,
  836. /* s x s */ HI(31) | LO(695) /* stfsux */,
  837. /* s x l */ HI(31) | LO(567) /* lfsux */,
  838. };
  839. #undef ARCH_32_64
  840. /* Simple cases, (no caching is required). */
  841. static sljit_s32 emit_op_mem(struct sljit_compiler *compiler, sljit_s32 inp_flags, sljit_s32 reg,
  842. sljit_s32 arg, sljit_sw argw, sljit_s32 tmp_reg)
  843. {
  844. sljit_ins inst;
  845. sljit_s32 offs_reg;
  846. sljit_sw high_short;
  847. /* Should work when (arg & REG_MASK) == 0. */
  848. SLJIT_ASSERT(A(0) == 0);
  849. SLJIT_ASSERT(arg & SLJIT_MEM);
  850. if (SLJIT_UNLIKELY(arg & OFFS_REG_MASK)) {
  851. argw &= 0x3;
  852. offs_reg = OFFS_REG(arg);
  853. if (argw != 0) {
  854. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  855. FAIL_IF(push_inst(compiler, RLWINM | S(OFFS_REG(arg)) | A(tmp_reg) | (argw << 11) | ((31 - argw) << 1)));
  856. #else
  857. FAIL_IF(push_inst(compiler, RLDI(tmp_reg, OFFS_REG(arg), argw, 63 - argw, 1)));
  858. #endif
  859. offs_reg = tmp_reg;
  860. }
  861. inst = data_transfer_insts[(inp_flags | INDEXED) & MEM_MASK];
  862. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  863. SLJIT_ASSERT(!(inst & INT_ALIGNED));
  864. #endif
  865. return push_inst(compiler, INST_CODE_AND_DST(inst, inp_flags, reg) | A(arg & REG_MASK) | B(offs_reg));
  866. }
  867. inst = data_transfer_insts[inp_flags & MEM_MASK];
  868. arg &= REG_MASK;
  869. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  870. if ((inst & INT_ALIGNED) && (argw & 0x3) != 0) {
  871. FAIL_IF(load_immediate(compiler, tmp_reg, argw));
  872. inst = data_transfer_insts[(inp_flags | INDEXED) & MEM_MASK];
  873. return push_inst(compiler, INST_CODE_AND_DST(inst, inp_flags, reg) | A(arg) | B(tmp_reg));
  874. }
  875. #endif
  876. if (argw <= SIMM_MAX && argw >= SIMM_MIN)
  877. return push_inst(compiler, INST_CODE_AND_DST(inst, inp_flags, reg) | A(arg) | IMM(argw));
  878. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  879. if (argw <= 0x7fff7fffl && argw >= -0x80000000l) {
  880. #endif
  881. high_short = (sljit_s32)(argw + ((argw & 0x8000) << 1)) & ~0xffff;
  882. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  883. SLJIT_ASSERT(high_short && high_short <= 0x7fffffffl && high_short >= -0x80000000l);
  884. #else
  885. SLJIT_ASSERT(high_short);
  886. #endif
  887. FAIL_IF(push_inst(compiler, ADDIS | D(tmp_reg) | A(arg) | IMM(high_short >> 16)));
  888. return push_inst(compiler, INST_CODE_AND_DST(inst, inp_flags, reg) | A(tmp_reg) | IMM(argw));
  889. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  890. }
  891. /* The rest is PPC-64 only. */
  892. FAIL_IF(load_immediate(compiler, tmp_reg, argw));
  893. inst = data_transfer_insts[(inp_flags | INDEXED) & MEM_MASK];
  894. return push_inst(compiler, INST_CODE_AND_DST(inst, inp_flags, reg) | A(arg) | B(tmp_reg));
  895. #endif
  896. }
  897. static sljit_s32 emit_op(struct sljit_compiler *compiler, sljit_s32 op, sljit_s32 input_flags,
  898. sljit_s32 dst, sljit_sw dstw,
  899. sljit_s32 src1, sljit_sw src1w,
  900. sljit_s32 src2, sljit_sw src2w)
  901. {
  902. /* arg1 goes to TMP_REG1 or src reg
  903. arg2 goes to TMP_REG2, imm or src reg
  904. result goes to TMP_REG2, so put result can use TMP_REG1. */
  905. sljit_s32 dst_r = TMP_REG2;
  906. sljit_s32 src1_r;
  907. sljit_s32 src2_r;
  908. sljit_s32 sugg_src2_r = TMP_REG2;
  909. sljit_s32 flags = input_flags & (ALT_FORM1 | ALT_FORM2 | ALT_FORM3 | ALT_FORM4 | ALT_FORM5 | ALT_SIGN_EXT | ALT_SET_FLAGS);
  910. /* Destination check. */
  911. if (SLOW_IS_REG(dst)) {
  912. dst_r = dst;
  913. flags |= REG_DEST;
  914. if (op >= SLJIT_MOV && op <= SLJIT_MOV_P)
  915. sugg_src2_r = dst_r;
  916. }
  917. /* Source 1. */
  918. if (FAST_IS_REG(src1)) {
  919. src1_r = src1;
  920. flags |= REG1_SOURCE;
  921. }
  922. else if (src1 & SLJIT_IMM) {
  923. FAIL_IF(load_immediate(compiler, TMP_REG1, src1w));
  924. src1_r = TMP_REG1;
  925. }
  926. else {
  927. FAIL_IF(emit_op_mem(compiler, input_flags | LOAD_DATA, TMP_REG1, src1, src1w, TMP_REG1));
  928. src1_r = TMP_REG1;
  929. }
  930. /* Source 2. */
  931. if (FAST_IS_REG(src2)) {
  932. src2_r = src2;
  933. flags |= REG2_SOURCE;
  934. if (!(flags & REG_DEST) && op >= SLJIT_MOV && op <= SLJIT_MOV_P)
  935. dst_r = src2_r;
  936. }
  937. else if (src2 & SLJIT_IMM) {
  938. FAIL_IF(load_immediate(compiler, sugg_src2_r, src2w));
  939. src2_r = sugg_src2_r;
  940. }
  941. else {
  942. FAIL_IF(emit_op_mem(compiler, input_flags | LOAD_DATA, sugg_src2_r, src2, src2w, TMP_REG2));
  943. src2_r = sugg_src2_r;
  944. }
  945. FAIL_IF(emit_single_op(compiler, op, flags, dst_r, src1_r, src2_r));
  946. if (!(dst & SLJIT_MEM))
  947. return SLJIT_SUCCESS;
  948. return emit_op_mem(compiler, input_flags, dst_r, dst, dstw, TMP_REG1);
  949. }
  950. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op0(struct sljit_compiler *compiler, sljit_s32 op)
  951. {
  952. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  953. sljit_s32 int_op = op & SLJIT_I32_OP;
  954. #endif
  955. CHECK_ERROR();
  956. CHECK(check_sljit_emit_op0(compiler, op));
  957. op = GET_OPCODE(op);
  958. switch (op) {
  959. case SLJIT_BREAKPOINT:
  960. case SLJIT_NOP:
  961. return push_inst(compiler, NOP);
  962. case SLJIT_LMUL_UW:
  963. case SLJIT_LMUL_SW:
  964. FAIL_IF(push_inst(compiler, OR | S(SLJIT_R0) | A(TMP_REG1) | B(SLJIT_R0)));
  965. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  966. FAIL_IF(push_inst(compiler, MULLD | D(SLJIT_R0) | A(TMP_REG1) | B(SLJIT_R1)));
  967. return push_inst(compiler, (op == SLJIT_LMUL_UW ? MULHDU : MULHD) | D(SLJIT_R1) | A(TMP_REG1) | B(SLJIT_R1));
  968. #else
  969. FAIL_IF(push_inst(compiler, MULLW | D(SLJIT_R0) | A(TMP_REG1) | B(SLJIT_R1)));
  970. return push_inst(compiler, (op == SLJIT_LMUL_UW ? MULHWU : MULHW) | D(SLJIT_R1) | A(TMP_REG1) | B(SLJIT_R1));
  971. #endif
  972. case SLJIT_DIVMOD_UW:
  973. case SLJIT_DIVMOD_SW:
  974. FAIL_IF(push_inst(compiler, OR | S(SLJIT_R0) | A(TMP_REG1) | B(SLJIT_R0)));
  975. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  976. FAIL_IF(push_inst(compiler, (int_op ? (op == SLJIT_DIVMOD_UW ? DIVWU : DIVW) : (op == SLJIT_DIVMOD_UW ? DIVDU : DIVD)) | D(SLJIT_R0) | A(SLJIT_R0) | B(SLJIT_R1)));
  977. FAIL_IF(push_inst(compiler, (int_op ? MULLW : MULLD) | D(SLJIT_R1) | A(SLJIT_R0) | B(SLJIT_R1)));
  978. #else
  979. FAIL_IF(push_inst(compiler, (op == SLJIT_DIVMOD_UW ? DIVWU : DIVW) | D(SLJIT_R0) | A(SLJIT_R0) | B(SLJIT_R1)));
  980. FAIL_IF(push_inst(compiler, MULLW | D(SLJIT_R1) | A(SLJIT_R0) | B(SLJIT_R1)));
  981. #endif
  982. return push_inst(compiler, SUBF | D(SLJIT_R1) | A(SLJIT_R1) | B(TMP_REG1));
  983. case SLJIT_DIV_UW:
  984. case SLJIT_DIV_SW:
  985. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  986. return push_inst(compiler, (int_op ? (op == SLJIT_DIV_UW ? DIVWU : DIVW) : (op == SLJIT_DIV_UW ? DIVDU : DIVD)) | D(SLJIT_R0) | A(SLJIT_R0) | B(SLJIT_R1));
  987. #else
  988. return push_inst(compiler, (op == SLJIT_DIV_UW ? DIVWU : DIVW) | D(SLJIT_R0) | A(SLJIT_R0) | B(SLJIT_R1));
  989. #endif
  990. case SLJIT_ENDBR:
  991. case SLJIT_SKIP_FRAMES_BEFORE_RETURN:
  992. return SLJIT_SUCCESS;
  993. }
  994. return SLJIT_SUCCESS;
  995. }
  996. static sljit_s32 emit_prefetch(struct sljit_compiler *compiler,
  997. sljit_s32 src, sljit_sw srcw)
  998. {
  999. if (!(src & OFFS_REG_MASK)) {
  1000. if (srcw == 0 && (src & REG_MASK) != SLJIT_UNUSED)
  1001. return push_inst(compiler, DCBT | A(0) | B(src & REG_MASK));
  1002. FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));
  1003. /* Works with SLJIT_MEM0() case as well. */
  1004. return push_inst(compiler, DCBT | A(src & REG_MASK) | B(TMP_REG1));
  1005. }
  1006. srcw &= 0x3;
  1007. if (srcw == 0)
  1008. return push_inst(compiler, DCBT | A(src & REG_MASK) | B(OFFS_REG(src)));
  1009. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  1010. FAIL_IF(push_inst(compiler, RLWINM | S(OFFS_REG(src)) | A(TMP_REG1) | (srcw << 11) | ((31 - srcw) << 1)));
  1011. #else
  1012. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, OFFS_REG(src), srcw, 63 - srcw, 1)));
  1013. #endif
  1014. return push_inst(compiler, DCBT | A(src & REG_MASK) | B(TMP_REG1));
  1015. }
  1016. #define EMIT_MOV(type, type_flags, type_cast) \
  1017. emit_op(compiler, (src & SLJIT_IMM) ? SLJIT_MOV : type, flags | (type_flags), dst, dstw, TMP_REG1, 0, src, (src & SLJIT_IMM) ? type_cast srcw : srcw)
  1018. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op1(struct sljit_compiler *compiler, sljit_s32 op,
  1019. sljit_s32 dst, sljit_sw dstw,
  1020. sljit_s32 src, sljit_sw srcw)
  1021. {
  1022. sljit_s32 flags = HAS_FLAGS(op) ? ALT_SET_FLAGS : 0;
  1023. sljit_s32 op_flags = GET_ALL_FLAGS(op);
  1024. CHECK_ERROR();
  1025. CHECK(check_sljit_emit_op1(compiler, op, dst, dstw, src, srcw));
  1026. ADJUST_LOCAL_OFFSET(dst, dstw);
  1027. ADJUST_LOCAL_OFFSET(src, srcw);
  1028. op = GET_OPCODE(op);
  1029. if ((src & SLJIT_IMM) && srcw == 0)
  1030. src = TMP_ZERO;
  1031. if (GET_FLAG_TYPE(op_flags) == SLJIT_OVERFLOW)
  1032. FAIL_IF(push_inst(compiler, MTXER | S(TMP_ZERO)));
  1033. if (op < SLJIT_NOT && FAST_IS_REG(src) && src == dst) {
  1034. if (!TYPE_CAST_NEEDED(op))
  1035. return SLJIT_SUCCESS;
  1036. }
  1037. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1038. if (op_flags & SLJIT_I32_OP) {
  1039. if (op < SLJIT_NOT) {
  1040. if (src & SLJIT_MEM) {
  1041. if (op == SLJIT_MOV_S32)
  1042. op = SLJIT_MOV_U32;
  1043. }
  1044. else if (src & SLJIT_IMM) {
  1045. if (op == SLJIT_MOV_U32)
  1046. op = SLJIT_MOV_S32;
  1047. }
  1048. }
  1049. else {
  1050. /* Most operations expect sign extended arguments. */
  1051. flags |= INT_DATA | SIGNED_DATA;
  1052. if (HAS_FLAGS(op_flags))
  1053. flags |= ALT_SIGN_EXT;
  1054. }
  1055. }
  1056. #endif
  1057. switch (op) {
  1058. case SLJIT_MOV:
  1059. case SLJIT_MOV_P:
  1060. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  1061. case SLJIT_MOV_U32:
  1062. case SLJIT_MOV_S32:
  1063. #endif
  1064. return emit_op(compiler, SLJIT_MOV, flags | WORD_DATA, dst, dstw, TMP_REG1, 0, src, srcw);
  1065. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1066. case SLJIT_MOV_U32:
  1067. return EMIT_MOV(SLJIT_MOV_U32, INT_DATA, (sljit_u32));
  1068. case SLJIT_MOV_S32:
  1069. return EMIT_MOV(SLJIT_MOV_S32, INT_DATA | SIGNED_DATA, (sljit_s32));
  1070. #endif
  1071. case SLJIT_MOV_U8:
  1072. return EMIT_MOV(SLJIT_MOV_U8, BYTE_DATA, (sljit_u8));
  1073. case SLJIT_MOV_S8:
  1074. return EMIT_MOV(SLJIT_MOV_S8, BYTE_DATA | SIGNED_DATA, (sljit_s8));
  1075. case SLJIT_MOV_U16:
  1076. return EMIT_MOV(SLJIT_MOV_U16, HALF_DATA, (sljit_u16));
  1077. case SLJIT_MOV_S16:
  1078. return EMIT_MOV(SLJIT_MOV_S16, HALF_DATA | SIGNED_DATA, (sljit_s16));
  1079. case SLJIT_NOT:
  1080. return emit_op(compiler, SLJIT_NOT, flags, dst, dstw, TMP_REG1, 0, src, srcw);
  1081. case SLJIT_NEG:
  1082. return emit_op(compiler, SLJIT_NEG, flags | (GET_FLAG_TYPE(op_flags) ? ALT_FORM1 : 0), dst, dstw, TMP_REG1, 0, src, srcw);
  1083. case SLJIT_CLZ:
  1084. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1085. return emit_op(compiler, SLJIT_CLZ, flags | (!(op_flags & SLJIT_I32_OP) ? 0 : ALT_FORM1), dst, dstw, TMP_REG1, 0, src, srcw);
  1086. #else
  1087. return emit_op(compiler, SLJIT_CLZ, flags, dst, dstw, TMP_REG1, 0, src, srcw);
  1088. #endif
  1089. }
  1090. return SLJIT_SUCCESS;
  1091. }
  1092. #undef EMIT_MOV
  1093. #define TEST_SL_IMM(src, srcw) \
  1094. (((src) & SLJIT_IMM) && (srcw) <= SIMM_MAX && (srcw) >= SIMM_MIN)
  1095. #define TEST_UL_IMM(src, srcw) \
  1096. (((src) & SLJIT_IMM) && !((srcw) & ~0xffff))
  1097. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1098. #define TEST_SH_IMM(src, srcw) \
  1099. (((src) & SLJIT_IMM) && !((srcw) & 0xffff) && (srcw) <= 0x7fffffffl && (srcw) >= -0x80000000l)
  1100. #else
  1101. #define TEST_SH_IMM(src, srcw) \
  1102. (((src) & SLJIT_IMM) && !((srcw) & 0xffff))
  1103. #endif
  1104. #define TEST_UH_IMM(src, srcw) \
  1105. (((src) & SLJIT_IMM) && !((srcw) & ~0xffff0000))
  1106. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1107. #define TEST_ADD_IMM(src, srcw) \
  1108. (((src) & SLJIT_IMM) && (srcw) <= 0x7fff7fffl && (srcw) >= -0x80000000l)
  1109. #else
  1110. #define TEST_ADD_IMM(src, srcw) \
  1111. ((src) & SLJIT_IMM)
  1112. #endif
  1113. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1114. #define TEST_UI_IMM(src, srcw) \
  1115. (((src) & SLJIT_IMM) && !((srcw) & ~0xffffffff))
  1116. #else
  1117. #define TEST_UI_IMM(src, srcw) \
  1118. ((src) & SLJIT_IMM)
  1119. #endif
  1120. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1121. #define TEST_ADD_FORM1(op) \
  1122. (GET_FLAG_TYPE(op) == SLJIT_OVERFLOW \
  1123. || (op & (SLJIT_I32_OP | SLJIT_SET_Z | VARIABLE_FLAG_MASK)) == (SLJIT_I32_OP | SLJIT_SET_Z | SLJIT_SET_CARRY))
  1124. #define TEST_SUB_FORM2(op) \
  1125. ((GET_FLAG_TYPE(op) >= SLJIT_SIG_LESS && GET_FLAG_TYPE(op) <= SLJIT_SIG_LESS_EQUAL) \
  1126. || (op & (SLJIT_I32_OP | SLJIT_SET_Z | VARIABLE_FLAG_MASK)) == (SLJIT_I32_OP | SLJIT_SET_Z))
  1127. #define TEST_SUB_FORM3(op) \
  1128. (GET_FLAG_TYPE(op) == SLJIT_OVERFLOW \
  1129. || (op & (SLJIT_I32_OP | SLJIT_SET_Z)) == (SLJIT_I32_OP | SLJIT_SET_Z))
  1130. #else
  1131. #define TEST_ADD_FORM1(op) \
  1132. (GET_FLAG_TYPE(op) == SLJIT_OVERFLOW)
  1133. #define TEST_SUB_FORM2(op) \
  1134. (GET_FLAG_TYPE(op) >= SLJIT_SIG_LESS && GET_FLAG_TYPE(op) <= SLJIT_SIG_LESS_EQUAL)
  1135. #define TEST_SUB_FORM3(op) \
  1136. (GET_FLAG_TYPE(op) == SLJIT_OVERFLOW)
  1137. #endif
  1138. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op2(struct sljit_compiler *compiler, sljit_s32 op,
  1139. sljit_s32 dst, sljit_sw dstw,
  1140. sljit_s32 src1, sljit_sw src1w,
  1141. sljit_s32 src2, sljit_sw src2w)
  1142. {
  1143. sljit_s32 flags = HAS_FLAGS(op) ? ALT_SET_FLAGS : 0;
  1144. CHECK_ERROR();
  1145. CHECK(check_sljit_emit_op2(compiler, op, dst, dstw, src1, src1w, src2, src2w));
  1146. ADJUST_LOCAL_OFFSET(dst, dstw);
  1147. ADJUST_LOCAL_OFFSET(src1, src1w);
  1148. ADJUST_LOCAL_OFFSET(src2, src2w);
  1149. if (dst == SLJIT_UNUSED && !HAS_FLAGS(op))
  1150. return SLJIT_SUCCESS;
  1151. if ((src1 & SLJIT_IMM) && src1w == 0)
  1152. src1 = TMP_ZERO;
  1153. if ((src2 & SLJIT_IMM) && src2w == 0)
  1154. src2 = TMP_ZERO;
  1155. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1156. if (op & SLJIT_I32_OP) {
  1157. /* Most operations expect sign extended arguments. */
  1158. flags |= INT_DATA | SIGNED_DATA;
  1159. if (src1 & SLJIT_IMM)
  1160. src1w = (sljit_s32)(src1w);
  1161. if (src2 & SLJIT_IMM)
  1162. src2w = (sljit_s32)(src2w);
  1163. if (HAS_FLAGS(op))
  1164. flags |= ALT_SIGN_EXT;
  1165. }
  1166. #endif
  1167. if (GET_FLAG_TYPE(op) == SLJIT_OVERFLOW)
  1168. FAIL_IF(push_inst(compiler, MTXER | S(TMP_ZERO)));
  1169. switch (GET_OPCODE(op)) {
  1170. case SLJIT_ADD:
  1171. if (TEST_ADD_FORM1(op))
  1172. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM1, dst, dstw, src1, src1w, src2, src2w);
  1173. if (!HAS_FLAGS(op) && ((src1 | src2) & SLJIT_IMM)) {
  1174. if (TEST_SL_IMM(src2, src2w)) {
  1175. compiler->imm = src2w & 0xffff;
  1176. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2, dst, dstw, src1, src1w, TMP_REG2, 0);
  1177. }
  1178. if (TEST_SL_IMM(src1, src1w)) {
  1179. compiler->imm = src1w & 0xffff;
  1180. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2, dst, dstw, src2, src2w, TMP_REG2, 0);
  1181. }
  1182. if (TEST_SH_IMM(src2, src2w)) {
  1183. compiler->imm = (src2w >> 16) & 0xffff;
  1184. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1185. }
  1186. if (TEST_SH_IMM(src1, src1w)) {
  1187. compiler->imm = (src1w >> 16) & 0xffff;
  1188. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM3, dst, dstw, src2, src2w, TMP_REG2, 0);
  1189. }
  1190. /* Range between -1 and -32768 is covered above. */
  1191. if (TEST_ADD_IMM(src2, src2w)) {
  1192. compiler->imm = src2w & 0xffffffff;
  1193. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM4, dst, dstw, src1, src1w, TMP_REG2, 0);
  1194. }
  1195. if (TEST_ADD_IMM(src1, src1w)) {
  1196. compiler->imm = src1w & 0xffffffff;
  1197. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM4, dst, dstw, src2, src2w, TMP_REG2, 0);
  1198. }
  1199. }
  1200. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1201. if ((op & (SLJIT_I32_OP | SLJIT_SET_Z)) == (SLJIT_I32_OP | SLJIT_SET_Z)) {
  1202. if (TEST_SL_IMM(src2, src2w)) {
  1203. compiler->imm = src2w & 0xffff;
  1204. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM4 | ALT_FORM5, dst, dstw, src1, src1w, TMP_REG2, 0);
  1205. }
  1206. if (TEST_SL_IMM(src1, src1w)) {
  1207. compiler->imm = src1w & 0xffff;
  1208. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM4 | ALT_FORM5, dst, dstw, src2, src2w, TMP_REG2, 0);
  1209. }
  1210. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM4, dst, dstw, src1, src1w, src2, src2w);
  1211. }
  1212. #endif
  1213. if (HAS_FLAGS(op)) {
  1214. if (TEST_SL_IMM(src2, src2w)) {
  1215. compiler->imm = src2w & 0xffff;
  1216. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1217. }
  1218. if (TEST_SL_IMM(src1, src1w)) {
  1219. compiler->imm = src1w & 0xffff;
  1220. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM3, dst, dstw, src2, src2w, TMP_REG2, 0);
  1221. }
  1222. }
  1223. return emit_op(compiler, SLJIT_ADD, flags | ((GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY)) ? ALT_FORM5 : 0), dst, dstw, src1, src1w, src2, src2w);
  1224. case SLJIT_ADDC:
  1225. return emit_op(compiler, SLJIT_ADDC, flags, dst, dstw, src1, src1w, src2, src2w);
  1226. case SLJIT_SUB:
  1227. if (GET_FLAG_TYPE(op) >= SLJIT_LESS && GET_FLAG_TYPE(op) <= SLJIT_LESS_EQUAL) {
  1228. if (dst == SLJIT_UNUSED) {
  1229. if (TEST_UL_IMM(src2, src2w)) {
  1230. compiler->imm = src2w & 0xffff;
  1231. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM1 | ALT_FORM2, dst, dstw, src1, src1w, TMP_REG2, 0);
  1232. }
  1233. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM1, dst, dstw, src1, src1w, src2, src2w);
  1234. }
  1235. if ((src2 & SLJIT_IMM) && src2w >= 0 && src2w <= (SIMM_MAX + 1)) {
  1236. compiler->imm = src2w;
  1237. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM1 | ALT_FORM2 | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1238. }
  1239. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM1 | ALT_FORM3, dst, dstw, src1, src1w, src2, src2w);
  1240. }
  1241. if (dst == SLJIT_UNUSED && GET_FLAG_TYPE(op) <= SLJIT_SIG_LESS_EQUAL) {
  1242. if (TEST_SL_IMM(src2, src2w)) {
  1243. compiler->imm = src2w & 0xffff;
  1244. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM2 | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1245. }
  1246. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM2, dst, dstw, src1, src1w, src2, src2w);
  1247. }
  1248. if (TEST_SUB_FORM2(op)) {
  1249. if ((src2 & SLJIT_IMM) && src2w >= -SIMM_MAX && src2w <= SIMM_MAX) {
  1250. compiler->imm = src2w & 0xffff;
  1251. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM2 | ALT_FORM3 | ALT_FORM4, dst, dstw, src1, src1w, TMP_REG2, 0);
  1252. }
  1253. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM2 | ALT_FORM4, dst, dstw, src1, src1w, src2, src2w);
  1254. }
  1255. if (TEST_SUB_FORM3(op))
  1256. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM3, dst, dstw, src1, src1w, src2, src2w);
  1257. if (TEST_SL_IMM(src2, -src2w)) {
  1258. compiler->imm = (-src2w) & 0xffff;
  1259. return emit_op(compiler, SLJIT_ADD, flags | (!HAS_FLAGS(op) ? ALT_FORM2 : ALT_FORM3), dst, dstw, src1, src1w, TMP_REG2, 0);
  1260. }
  1261. if (TEST_SL_IMM(src1, src1w) && !(op & SLJIT_SET_Z)) {
  1262. compiler->imm = src1w & 0xffff;
  1263. return emit_op(compiler, SLJIT_SUB, flags | ALT_FORM4, dst, dstw, src2, src2w, TMP_REG2, 0);
  1264. }
  1265. if (!HAS_FLAGS(op)) {
  1266. if (TEST_SH_IMM(src2, -src2w)) {
  1267. compiler->imm = ((-src2w) >> 16) & 0xffff;
  1268. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1269. }
  1270. /* Range between -1 and -32768 is covered above. */
  1271. if (TEST_ADD_IMM(src2, -src2w)) {
  1272. compiler->imm = -src2w & 0xffffffff;
  1273. return emit_op(compiler, SLJIT_ADD, flags | ALT_FORM2 | ALT_FORM4, dst, dstw, src1, src1w, TMP_REG2, 0);
  1274. }
  1275. }
  1276. /* We know ALT_SIGN_EXT is set if it is an SLJIT_I32_OP on 64 bit systems. */
  1277. return emit_op(compiler, SLJIT_SUB, flags | ((GET_FLAG_TYPE(op) == GET_FLAG_TYPE(SLJIT_SET_CARRY)) ? ALT_FORM5 : 0), dst, dstw, src1, src1w, src2, src2w);
  1278. case SLJIT_SUBC:
  1279. return emit_op(compiler, SLJIT_SUBC, flags, dst, dstw, src1, src1w, src2, src2w);
  1280. case SLJIT_MUL:
  1281. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1282. if (op & SLJIT_I32_OP)
  1283. flags |= ALT_FORM2;
  1284. #endif
  1285. if (!HAS_FLAGS(op)) {
  1286. if (TEST_SL_IMM(src2, src2w)) {
  1287. compiler->imm = src2w & 0xffff;
  1288. return emit_op(compiler, SLJIT_MUL, flags | ALT_FORM1, dst, dstw, src1, src1w, TMP_REG2, 0);
  1289. }
  1290. if (TEST_SL_IMM(src1, src1w)) {
  1291. compiler->imm = src1w & 0xffff;
  1292. return emit_op(compiler, SLJIT_MUL, flags | ALT_FORM1, dst, dstw, src2, src2w, TMP_REG2, 0);
  1293. }
  1294. }
  1295. else
  1296. FAIL_IF(push_inst(compiler, MTXER | S(TMP_ZERO)));
  1297. return emit_op(compiler, SLJIT_MUL, flags, dst, dstw, src1, src1w, src2, src2w);
  1298. case SLJIT_AND:
  1299. case SLJIT_OR:
  1300. case SLJIT_XOR:
  1301. /* Commutative unsigned operations. */
  1302. if (!HAS_FLAGS(op) || GET_OPCODE(op) == SLJIT_AND) {
  1303. if (TEST_UL_IMM(src2, src2w)) {
  1304. compiler->imm = src2w;
  1305. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM1, dst, dstw, src1, src1w, TMP_REG2, 0);
  1306. }
  1307. if (TEST_UL_IMM(src1, src1w)) {
  1308. compiler->imm = src1w;
  1309. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM1, dst, dstw, src2, src2w, TMP_REG2, 0);
  1310. }
  1311. if (TEST_UH_IMM(src2, src2w)) {
  1312. compiler->imm = (src2w >> 16) & 0xffff;
  1313. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM2, dst, dstw, src1, src1w, TMP_REG2, 0);
  1314. }
  1315. if (TEST_UH_IMM(src1, src1w)) {
  1316. compiler->imm = (src1w >> 16) & 0xffff;
  1317. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM2, dst, dstw, src2, src2w, TMP_REG2, 0);
  1318. }
  1319. }
  1320. if (GET_OPCODE(op) != SLJIT_AND && GET_OPCODE(op) != SLJIT_AND) {
  1321. /* Unlike or and xor, and resets unwanted bits as well. */
  1322. if (TEST_UI_IMM(src2, src2w)) {
  1323. compiler->imm = src2w;
  1324. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM3, dst, dstw, src1, src1w, TMP_REG2, 0);
  1325. }
  1326. if (TEST_UI_IMM(src1, src1w)) {
  1327. compiler->imm = src1w;
  1328. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM3, dst, dstw, src2, src2w, TMP_REG2, 0);
  1329. }
  1330. }
  1331. return emit_op(compiler, GET_OPCODE(op), flags, dst, dstw, src1, src1w, src2, src2w);
  1332. case SLJIT_SHL:
  1333. case SLJIT_LSHR:
  1334. case SLJIT_ASHR:
  1335. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1336. if (op & SLJIT_I32_OP)
  1337. flags |= ALT_FORM2;
  1338. #endif
  1339. if (src2 & SLJIT_IMM) {
  1340. compiler->imm = src2w;
  1341. return emit_op(compiler, GET_OPCODE(op), flags | ALT_FORM1, dst, dstw, src1, src1w, TMP_REG2, 0);
  1342. }
  1343. return emit_op(compiler, GET_OPCODE(op), flags, dst, dstw, src1, src1w, src2, src2w);
  1344. }
  1345. return SLJIT_SUCCESS;
  1346. }
  1347. #undef TEST_ADD_FORM1
  1348. #undef TEST_SUB_FORM2
  1349. #undef TEST_SUB_FORM3
  1350. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op_src(struct sljit_compiler *compiler, sljit_s32 op,
  1351. sljit_s32 src, sljit_sw srcw)
  1352. {
  1353. CHECK_ERROR();
  1354. CHECK(check_sljit_emit_op_src(compiler, op, src, srcw));
  1355. ADJUST_LOCAL_OFFSET(src, srcw);
  1356. switch (op) {
  1357. case SLJIT_FAST_RETURN:
  1358. if (FAST_IS_REG(src))
  1359. FAIL_IF(push_inst(compiler, MTLR | S(src)));
  1360. else {
  1361. FAIL_IF(emit_op(compiler, SLJIT_MOV, WORD_DATA, TMP_REG2, 0, TMP_REG1, 0, src, srcw));
  1362. FAIL_IF(push_inst(compiler, MTLR | S(TMP_REG2)));
  1363. }
  1364. return push_inst(compiler, BLR);
  1365. case SLJIT_SKIP_FRAMES_BEFORE_FAST_RETURN:
  1366. return SLJIT_SUCCESS;
  1367. case SLJIT_PREFETCH_L1:
  1368. case SLJIT_PREFETCH_L2:
  1369. case SLJIT_PREFETCH_L3:
  1370. case SLJIT_PREFETCH_ONCE:
  1371. return emit_prefetch(compiler, src, srcw);
  1372. }
  1373. return SLJIT_SUCCESS;
  1374. }
  1375. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_get_register_index(sljit_s32 reg)
  1376. {
  1377. CHECK_REG_INDEX(check_sljit_get_register_index(reg));
  1378. return reg_map[reg];
  1379. }
  1380. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_get_float_register_index(sljit_s32 reg)
  1381. {
  1382. CHECK_REG_INDEX(check_sljit_get_float_register_index(reg));
  1383. return freg_map[reg];
  1384. }
  1385. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op_custom(struct sljit_compiler *compiler,
  1386. void *instruction, sljit_s32 size)
  1387. {
  1388. CHECK_ERROR();
  1389. CHECK(check_sljit_emit_op_custom(compiler, instruction, size));
  1390. return push_inst(compiler, *(sljit_ins*)instruction);
  1391. }
  1392. /* --------------------------------------------------------------------- */
  1393. /* Floating point operators */
  1394. /* --------------------------------------------------------------------- */
  1395. #define FLOAT_DATA(op) (DOUBLE_DATA | ((op & SLJIT_F32_OP) >> 6))
  1396. #define SELECT_FOP(op, single, double) ((op & SLJIT_F32_OP) ? single : double)
  1397. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1398. #define FLOAT_TMP_MEM_OFFSET (6 * sizeof(sljit_sw))
  1399. #else
  1400. #define FLOAT_TMP_MEM_OFFSET (2 * sizeof(sljit_sw))
  1401. #if (defined SLJIT_LITTLE_ENDIAN && SLJIT_LITTLE_ENDIAN)
  1402. #define FLOAT_TMP_MEM_OFFSET_LOW (2 * sizeof(sljit_sw))
  1403. #define FLOAT_TMP_MEM_OFFSET_HI (3 * sizeof(sljit_sw))
  1404. #else
  1405. #define FLOAT_TMP_MEM_OFFSET_LOW (3 * sizeof(sljit_sw))
  1406. #define FLOAT_TMP_MEM_OFFSET_HI (2 * sizeof(sljit_sw))
  1407. #endif
  1408. #endif /* SLJIT_CONFIG_PPC_64 */
  1409. static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_sw_from_f64(struct sljit_compiler *compiler, sljit_s32 op,
  1410. sljit_s32 dst, sljit_sw dstw,
  1411. sljit_s32 src, sljit_sw srcw)
  1412. {
  1413. if (src & SLJIT_MEM) {
  1414. /* We can ignore the temporary data store on the stack from caching point of view. */
  1415. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src, srcw, TMP_REG1));
  1416. src = TMP_FREG1;
  1417. }
  1418. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1419. op = GET_OPCODE(op);
  1420. FAIL_IF(push_inst(compiler, (op == SLJIT_CONV_S32_FROM_F64 ? FCTIWZ : FCTIDZ) | FD(TMP_FREG1) | FB(src)));
  1421. if (op == SLJIT_CONV_SW_FROM_F64) {
  1422. if (FAST_IS_REG(dst)) {
  1423. FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA, TMP_FREG1, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1));
  1424. return emit_op_mem(compiler, WORD_DATA | LOAD_DATA, dst, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1);
  1425. }
  1426. return emit_op_mem(compiler, DOUBLE_DATA, TMP_FREG1, dst, dstw, TMP_REG1);
  1427. }
  1428. #else
  1429. FAIL_IF(push_inst(compiler, FCTIWZ | FD(TMP_FREG1) | FB(src)));
  1430. #endif
  1431. if (FAST_IS_REG(dst)) {
  1432. FAIL_IF(load_immediate(compiler, TMP_REG1, FLOAT_TMP_MEM_OFFSET));
  1433. FAIL_IF(push_inst(compiler, STFIWX | FS(TMP_FREG1) | A(SLJIT_SP) | B(TMP_REG1)));
  1434. return emit_op_mem(compiler, INT_DATA | LOAD_DATA, dst, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1);
  1435. }
  1436. SLJIT_ASSERT(dst & SLJIT_MEM);
  1437. if (dst & OFFS_REG_MASK) {
  1438. dstw &= 0x3;
  1439. if (dstw) {
  1440. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  1441. FAIL_IF(push_inst(compiler, RLWINM | S(OFFS_REG(dst)) | A(TMP_REG1) | (dstw << 11) | ((31 - dstw) << 1)));
  1442. #else
  1443. FAIL_IF(push_inst(compiler, RLDI(TMP_REG1, OFFS_REG(dst), dstw, 63 - dstw, 1)));
  1444. #endif
  1445. dstw = TMP_REG1;
  1446. }
  1447. else
  1448. dstw = OFFS_REG(dst);
  1449. }
  1450. else {
  1451. if ((dst & REG_MASK) && !dstw) {
  1452. dstw = dst & REG_MASK;
  1453. dst = 0;
  1454. }
  1455. else {
  1456. /* This works regardless we have SLJIT_MEM1 or SLJIT_MEM0. */
  1457. FAIL_IF(load_immediate(compiler, TMP_REG1, dstw));
  1458. dstw = TMP_REG1;
  1459. }
  1460. }
  1461. return push_inst(compiler, STFIWX | FS(TMP_FREG1) | A(dst & REG_MASK) | B(dstw));
  1462. }
  1463. static SLJIT_INLINE sljit_s32 sljit_emit_fop1_conv_f64_from_sw(struct sljit_compiler *compiler, sljit_s32 op,
  1464. sljit_s32 dst, sljit_sw dstw,
  1465. sljit_s32 src, sljit_sw srcw)
  1466. {
  1467. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1468. sljit_s32 dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG1;
  1469. if (src & SLJIT_IMM) {
  1470. if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32)
  1471. srcw = (sljit_s32)srcw;
  1472. FAIL_IF(load_immediate(compiler, TMP_REG1, srcw));
  1473. src = TMP_REG1;
  1474. }
  1475. else if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_S32) {
  1476. if (FAST_IS_REG(src))
  1477. FAIL_IF(push_inst(compiler, EXTSW | S(src) | A(TMP_REG1)));
  1478. else
  1479. FAIL_IF(emit_op_mem(compiler, INT_DATA | SIGNED_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));
  1480. src = TMP_REG1;
  1481. }
  1482. if (FAST_IS_REG(src)) {
  1483. FAIL_IF(emit_op_mem(compiler, WORD_DATA, src, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1));
  1484. FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG1, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1));
  1485. }
  1486. else
  1487. FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG1, src, srcw, TMP_REG1));
  1488. FAIL_IF(push_inst(compiler, FCFID | FD(dst_r) | FB(TMP_FREG1)));
  1489. if (dst & SLJIT_MEM)
  1490. return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);
  1491. if (op & SLJIT_F32_OP)
  1492. return push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r));
  1493. return SLJIT_SUCCESS;
  1494. #else
  1495. sljit_s32 dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG1;
  1496. sljit_s32 invert_sign = 1;
  1497. if (src & SLJIT_IMM) {
  1498. FAIL_IF(load_immediate(compiler, TMP_REG1, srcw ^ 0x80000000));
  1499. src = TMP_REG1;
  1500. invert_sign = 0;
  1501. }
  1502. else if (!FAST_IS_REG(src)) {
  1503. FAIL_IF(emit_op_mem(compiler, WORD_DATA | SIGNED_DATA | LOAD_DATA, TMP_REG1, src, srcw, TMP_REG1));
  1504. src = TMP_REG1;
  1505. }
  1506. /* First, a special double floating point value is constructed: (2^53 + (input xor (2^31)))
  1507. The double precision format has exactly 53 bit precision, so the lower 32 bit represents
  1508. the lower 32 bit of such value. The result of xor 2^31 is the same as adding 0x80000000
  1509. to the input, which shifts it into the 0 - 0xffffffff range. To get the converted floating
  1510. point value, we need to substract 2^53 + 2^31 from the constructed value. */
  1511. FAIL_IF(push_inst(compiler, ADDIS | D(TMP_REG2) | A(0) | 0x4330));
  1512. if (invert_sign)
  1513. FAIL_IF(push_inst(compiler, XORIS | S(src) | A(TMP_REG1) | 0x8000));
  1514. FAIL_IF(emit_op_mem(compiler, WORD_DATA, TMP_REG2, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET_HI, TMP_REG1));
  1515. FAIL_IF(emit_op_mem(compiler, WORD_DATA, TMP_REG1, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET_LOW, TMP_REG2));
  1516. FAIL_IF(push_inst(compiler, ADDIS | D(TMP_REG1) | A(0) | 0x8000));
  1517. FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG1, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1));
  1518. FAIL_IF(emit_op_mem(compiler, WORD_DATA, TMP_REG1, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET_LOW, TMP_REG2));
  1519. FAIL_IF(emit_op_mem(compiler, DOUBLE_DATA | LOAD_DATA, TMP_FREG2, SLJIT_MEM1(SLJIT_SP), FLOAT_TMP_MEM_OFFSET, TMP_REG1));
  1520. FAIL_IF(push_inst(compiler, FSUB | FD(dst_r) | FA(TMP_FREG1) | FB(TMP_FREG2)));
  1521. if (dst & SLJIT_MEM)
  1522. return emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG1, dst, dstw, TMP_REG1);
  1523. if (op & SLJIT_F32_OP)
  1524. return push_inst(compiler, FRSP | FD(dst_r) | FB(dst_r));
  1525. return SLJIT_SUCCESS;
  1526. #endif
  1527. }
  1528. static SLJIT_INLINE sljit_s32 sljit_emit_fop1_cmp(struct sljit_compiler *compiler, sljit_s32 op,
  1529. sljit_s32 src1, sljit_sw src1w,
  1530. sljit_s32 src2, sljit_sw src2w)
  1531. {
  1532. if (src1 & SLJIT_MEM) {
  1533. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w, TMP_REG1));
  1534. src1 = TMP_FREG1;
  1535. }
  1536. if (src2 & SLJIT_MEM) {
  1537. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w, TMP_REG2));
  1538. src2 = TMP_FREG2;
  1539. }
  1540. return push_inst(compiler, FCMPU | CRD(4) | FA(src1) | FB(src2));
  1541. }
  1542. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fop1(struct sljit_compiler *compiler, sljit_s32 op,
  1543. sljit_s32 dst, sljit_sw dstw,
  1544. sljit_s32 src, sljit_sw srcw)
  1545. {
  1546. sljit_s32 dst_r;
  1547. CHECK_ERROR();
  1548. SLJIT_COMPILE_ASSERT((SLJIT_F32_OP == 0x100) && !(DOUBLE_DATA & 0x4), float_transfer_bit_error);
  1549. SELECT_FOP1_OPERATION_WITH_CHECKS(compiler, op, dst, dstw, src, srcw);
  1550. if (GET_OPCODE(op) == SLJIT_CONV_F64_FROM_F32)
  1551. op ^= SLJIT_F32_OP;
  1552. dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG1;
  1553. if (src & SLJIT_MEM) {
  1554. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, dst_r, src, srcw, TMP_REG1));
  1555. src = dst_r;
  1556. }
  1557. switch (GET_OPCODE(op)) {
  1558. case SLJIT_CONV_F64_FROM_F32:
  1559. op ^= SLJIT_F32_OP;
  1560. if (op & SLJIT_F32_OP) {
  1561. FAIL_IF(push_inst(compiler, FRSP | FD(dst_r) | FB(src)));
  1562. break;
  1563. }
  1564. /* Fall through. */
  1565. case SLJIT_MOV_F64:
  1566. if (src != dst_r) {
  1567. if (dst_r != TMP_FREG1)
  1568. FAIL_IF(push_inst(compiler, FMR | FD(dst_r) | FB(src)));
  1569. else
  1570. dst_r = src;
  1571. }
  1572. break;
  1573. case SLJIT_NEG_F64:
  1574. FAIL_IF(push_inst(compiler, FNEG | FD(dst_r) | FB(src)));
  1575. break;
  1576. case SLJIT_ABS_F64:
  1577. FAIL_IF(push_inst(compiler, FABS | FD(dst_r) | FB(src)));
  1578. break;
  1579. }
  1580. if (dst & SLJIT_MEM)
  1581. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op), dst_r, dst, dstw, TMP_REG1));
  1582. return SLJIT_SUCCESS;
  1583. }
  1584. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fop2(struct sljit_compiler *compiler, sljit_s32 op,
  1585. sljit_s32 dst, sljit_sw dstw,
  1586. sljit_s32 src1, sljit_sw src1w,
  1587. sljit_s32 src2, sljit_sw src2w)
  1588. {
  1589. sljit_s32 dst_r;
  1590. CHECK_ERROR();
  1591. CHECK(check_sljit_emit_fop2(compiler, op, dst, dstw, src1, src1w, src2, src2w));
  1592. ADJUST_LOCAL_OFFSET(dst, dstw);
  1593. ADJUST_LOCAL_OFFSET(src1, src1w);
  1594. ADJUST_LOCAL_OFFSET(src2, src2w);
  1595. dst_r = FAST_IS_REG(dst) ? dst : TMP_FREG2;
  1596. if (src1 & SLJIT_MEM) {
  1597. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG1, src1, src1w, TMP_REG1));
  1598. src1 = TMP_FREG1;
  1599. }
  1600. if (src2 & SLJIT_MEM) {
  1601. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op) | LOAD_DATA, TMP_FREG2, src2, src2w, TMP_REG2));
  1602. src2 = TMP_FREG2;
  1603. }
  1604. switch (GET_OPCODE(op)) {
  1605. case SLJIT_ADD_F64:
  1606. FAIL_IF(push_inst(compiler, SELECT_FOP(op, FADDS, FADD) | FD(dst_r) | FA(src1) | FB(src2)));
  1607. break;
  1608. case SLJIT_SUB_F64:
  1609. FAIL_IF(push_inst(compiler, SELECT_FOP(op, FSUBS, FSUB) | FD(dst_r) | FA(src1) | FB(src2)));
  1610. break;
  1611. case SLJIT_MUL_F64:
  1612. FAIL_IF(push_inst(compiler, SELECT_FOP(op, FMULS, FMUL) | FD(dst_r) | FA(src1) | FC(src2) /* FMUL use FC as src2 */));
  1613. break;
  1614. case SLJIT_DIV_F64:
  1615. FAIL_IF(push_inst(compiler, SELECT_FOP(op, FDIVS, FDIV) | FD(dst_r) | FA(src1) | FB(src2)));
  1616. break;
  1617. }
  1618. if (dst & SLJIT_MEM)
  1619. FAIL_IF(emit_op_mem(compiler, FLOAT_DATA(op), TMP_FREG2, dst, dstw, TMP_REG1));
  1620. return SLJIT_SUCCESS;
  1621. }
  1622. #undef SELECT_FOP
  1623. /* --------------------------------------------------------------------- */
  1624. /* Other instructions */
  1625. /* --------------------------------------------------------------------- */
  1626. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fast_enter(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw dstw)
  1627. {
  1628. CHECK_ERROR();
  1629. CHECK(check_sljit_emit_fast_enter(compiler, dst, dstw));
  1630. ADJUST_LOCAL_OFFSET(dst, dstw);
  1631. if (FAST_IS_REG(dst))
  1632. return push_inst(compiler, MFLR | D(dst));
  1633. /* Memory. */
  1634. FAIL_IF(push_inst(compiler, MFLR | D(TMP_REG2)));
  1635. return emit_op(compiler, SLJIT_MOV, WORD_DATA, dst, dstw, TMP_REG1, 0, TMP_REG2, 0);
  1636. }
  1637. /* --------------------------------------------------------------------- */
  1638. /* Conditional instructions */
  1639. /* --------------------------------------------------------------------- */
  1640. SLJIT_API_FUNC_ATTRIBUTE struct sljit_label* sljit_emit_label(struct sljit_compiler *compiler)
  1641. {
  1642. struct sljit_label *label;
  1643. CHECK_ERROR_PTR();
  1644. CHECK_PTR(check_sljit_emit_label(compiler));
  1645. if (compiler->last_label && compiler->last_label->size == compiler->size)
  1646. return compiler->last_label;
  1647. label = (struct sljit_label*)ensure_abuf(compiler, sizeof(struct sljit_label));
  1648. PTR_FAIL_IF(!label);
  1649. set_label(label, compiler);
  1650. return label;
  1651. }
  1652. static sljit_ins get_bo_bi_flags(sljit_s32 type)
  1653. {
  1654. switch (type) {
  1655. case SLJIT_EQUAL:
  1656. return (12 << 21) | (2 << 16);
  1657. case SLJIT_NOT_EQUAL:
  1658. return (4 << 21) | (2 << 16);
  1659. case SLJIT_LESS:
  1660. case SLJIT_SIG_LESS:
  1661. return (12 << 21) | (0 << 16);
  1662. case SLJIT_GREATER_EQUAL:
  1663. case SLJIT_SIG_GREATER_EQUAL:
  1664. return (4 << 21) | (0 << 16);
  1665. case SLJIT_GREATER:
  1666. case SLJIT_SIG_GREATER:
  1667. return (12 << 21) | (1 << 16);
  1668. case SLJIT_LESS_EQUAL:
  1669. case SLJIT_SIG_LESS_EQUAL:
  1670. return (4 << 21) | (1 << 16);
  1671. case SLJIT_LESS_F64:
  1672. return (12 << 21) | ((4 + 0) << 16);
  1673. case SLJIT_GREATER_EQUAL_F64:
  1674. return (4 << 21) | ((4 + 0) << 16);
  1675. case SLJIT_GREATER_F64:
  1676. return (12 << 21) | ((4 + 1) << 16);
  1677. case SLJIT_LESS_EQUAL_F64:
  1678. return (4 << 21) | ((4 + 1) << 16);
  1679. case SLJIT_OVERFLOW:
  1680. return (12 << 21) | (3 << 16);
  1681. case SLJIT_NOT_OVERFLOW:
  1682. return (4 << 21) | (3 << 16);
  1683. case SLJIT_EQUAL_F64:
  1684. return (12 << 21) | ((4 + 2) << 16);
  1685. case SLJIT_NOT_EQUAL_F64:
  1686. return (4 << 21) | ((4 + 2) << 16);
  1687. case SLJIT_UNORDERED_F64:
  1688. return (12 << 21) | ((4 + 3) << 16);
  1689. case SLJIT_ORDERED_F64:
  1690. return (4 << 21) | ((4 + 3) << 16);
  1691. default:
  1692. SLJIT_ASSERT(type >= SLJIT_JUMP && type <= SLJIT_CALL_CDECL);
  1693. return (20 << 21);
  1694. }
  1695. }
  1696. SLJIT_API_FUNC_ATTRIBUTE struct sljit_jump* sljit_emit_jump(struct sljit_compiler *compiler, sljit_s32 type)
  1697. {
  1698. struct sljit_jump *jump;
  1699. sljit_ins bo_bi_flags;
  1700. CHECK_ERROR_PTR();
  1701. CHECK_PTR(check_sljit_emit_jump(compiler, type));
  1702. bo_bi_flags = get_bo_bi_flags(type & 0xff);
  1703. if (!bo_bi_flags)
  1704. return NULL;
  1705. jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump));
  1706. PTR_FAIL_IF(!jump);
  1707. set_jump(jump, compiler, type & SLJIT_REWRITABLE_JUMP);
  1708. type &= 0xff;
  1709. /* In PPC, we don't need to touch the arguments. */
  1710. if (type < SLJIT_JUMP)
  1711. jump->flags |= IS_COND;
  1712. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL)
  1713. if (type >= SLJIT_CALL)
  1714. jump->flags |= IS_CALL;
  1715. #endif
  1716. PTR_FAIL_IF(emit_const(compiler, TMP_CALL_REG, 0));
  1717. PTR_FAIL_IF(push_inst(compiler, MTCTR | S(TMP_CALL_REG)));
  1718. jump->addr = compiler->size;
  1719. PTR_FAIL_IF(push_inst(compiler, BCCTR | bo_bi_flags | (type >= SLJIT_FAST_CALL ? 1 : 0)));
  1720. return jump;
  1721. }
  1722. SLJIT_API_FUNC_ATTRIBUTE struct sljit_jump* sljit_emit_call(struct sljit_compiler *compiler, sljit_s32 type,
  1723. sljit_s32 arg_types)
  1724. {
  1725. CHECK_ERROR_PTR();
  1726. CHECK_PTR(check_sljit_emit_call(compiler, type, arg_types));
  1727. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1728. PTR_FAIL_IF(call_with_args(compiler, arg_types, NULL));
  1729. #endif
  1730. #if (defined SLJIT_VERBOSE && SLJIT_VERBOSE) \
  1731. || (defined SLJIT_ARGUMENT_CHECKS && SLJIT_ARGUMENT_CHECKS)
  1732. compiler->skip_checks = 1;
  1733. #endif
  1734. return sljit_emit_jump(compiler, type);
  1735. }
  1736. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_ijump(struct sljit_compiler *compiler, sljit_s32 type, sljit_s32 src, sljit_sw srcw)
  1737. {
  1738. struct sljit_jump *jump = NULL;
  1739. sljit_s32 src_r;
  1740. CHECK_ERROR();
  1741. CHECK(check_sljit_emit_ijump(compiler, type, src, srcw));
  1742. ADJUST_LOCAL_OFFSET(src, srcw);
  1743. if (FAST_IS_REG(src)) {
  1744. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL)
  1745. if (type >= SLJIT_CALL) {
  1746. FAIL_IF(push_inst(compiler, OR | S(src) | A(TMP_CALL_REG) | B(src)));
  1747. src_r = TMP_CALL_REG;
  1748. }
  1749. else
  1750. src_r = src;
  1751. #else
  1752. src_r = src;
  1753. #endif
  1754. } else if (src & SLJIT_IMM) {
  1755. /* These jumps are converted to jump/call instructions when possible. */
  1756. jump = (struct sljit_jump*)ensure_abuf(compiler, sizeof(struct sljit_jump));
  1757. FAIL_IF(!jump);
  1758. set_jump(jump, compiler, JUMP_ADDR);
  1759. jump->u.target = srcw;
  1760. #if (defined SLJIT_PASS_ENTRY_ADDR_TO_CALL && SLJIT_PASS_ENTRY_ADDR_TO_CALL)
  1761. if (type >= SLJIT_CALL)
  1762. jump->flags |= IS_CALL;
  1763. #endif
  1764. FAIL_IF(emit_const(compiler, TMP_CALL_REG, 0));
  1765. src_r = TMP_CALL_REG;
  1766. }
  1767. else {
  1768. FAIL_IF(emit_op(compiler, SLJIT_MOV, WORD_DATA, TMP_CALL_REG, 0, TMP_REG1, 0, src, srcw));
  1769. src_r = TMP_CALL_REG;
  1770. }
  1771. FAIL_IF(push_inst(compiler, MTCTR | S(src_r)));
  1772. if (jump)
  1773. jump->addr = compiler->size;
  1774. return push_inst(compiler, BCCTR | (20 << 21) | (type >= SLJIT_FAST_CALL ? 1 : 0));
  1775. }
  1776. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_icall(struct sljit_compiler *compiler, sljit_s32 type,
  1777. sljit_s32 arg_types,
  1778. sljit_s32 src, sljit_sw srcw)
  1779. {
  1780. CHECK_ERROR();
  1781. CHECK(check_sljit_emit_icall(compiler, type, arg_types, src, srcw));
  1782. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1783. if (src & SLJIT_MEM) {
  1784. ADJUST_LOCAL_OFFSET(src, srcw);
  1785. FAIL_IF(emit_op(compiler, SLJIT_MOV, WORD_DATA, TMP_CALL_REG, 0, TMP_REG1, 0, src, srcw));
  1786. src = TMP_CALL_REG;
  1787. }
  1788. FAIL_IF(call_with_args(compiler, arg_types, &src));
  1789. #endif
  1790. #if (defined SLJIT_VERBOSE && SLJIT_VERBOSE) \
  1791. || (defined SLJIT_ARGUMENT_CHECKS && SLJIT_ARGUMENT_CHECKS)
  1792. compiler->skip_checks = 1;
  1793. #endif
  1794. return sljit_emit_ijump(compiler, type, src, srcw);
  1795. }
  1796. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_op_flags(struct sljit_compiler *compiler, sljit_s32 op,
  1797. sljit_s32 dst, sljit_sw dstw,
  1798. sljit_s32 type)
  1799. {
  1800. sljit_s32 reg, input_flags, cr_bit, invert;
  1801. sljit_s32 saved_op = op;
  1802. sljit_sw saved_dstw = dstw;
  1803. CHECK_ERROR();
  1804. CHECK(check_sljit_emit_op_flags(compiler, op, dst, dstw, type));
  1805. ADJUST_LOCAL_OFFSET(dst, dstw);
  1806. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1807. input_flags = (op & SLJIT_I32_OP) ? INT_DATA : WORD_DATA;
  1808. #else
  1809. input_flags = WORD_DATA;
  1810. #endif
  1811. op = GET_OPCODE(op);
  1812. reg = (op < SLJIT_ADD && FAST_IS_REG(dst)) ? dst : TMP_REG2;
  1813. if (op >= SLJIT_ADD && (dst & SLJIT_MEM))
  1814. FAIL_IF(emit_op_mem(compiler, input_flags | LOAD_DATA, TMP_REG1, dst, dstw, TMP_REG1));
  1815. invert = 0;
  1816. cr_bit = 0;
  1817. switch (type & 0xff) {
  1818. case SLJIT_LESS:
  1819. case SLJIT_SIG_LESS:
  1820. break;
  1821. case SLJIT_GREATER_EQUAL:
  1822. case SLJIT_SIG_GREATER_EQUAL:
  1823. invert = 1;
  1824. break;
  1825. case SLJIT_GREATER:
  1826. case SLJIT_SIG_GREATER:
  1827. cr_bit = 1;
  1828. break;
  1829. case SLJIT_LESS_EQUAL:
  1830. case SLJIT_SIG_LESS_EQUAL:
  1831. cr_bit = 1;
  1832. invert = 1;
  1833. break;
  1834. case SLJIT_EQUAL:
  1835. cr_bit = 2;
  1836. break;
  1837. case SLJIT_NOT_EQUAL:
  1838. cr_bit = 2;
  1839. invert = 1;
  1840. break;
  1841. case SLJIT_OVERFLOW:
  1842. cr_bit = 3;
  1843. break;
  1844. case SLJIT_NOT_OVERFLOW:
  1845. cr_bit = 3;
  1846. invert = 1;
  1847. break;
  1848. case SLJIT_LESS_F64:
  1849. cr_bit = 4 + 0;
  1850. break;
  1851. case SLJIT_GREATER_EQUAL_F64:
  1852. cr_bit = 4 + 0;
  1853. invert = 1;
  1854. break;
  1855. case SLJIT_GREATER_F64:
  1856. cr_bit = 4 + 1;
  1857. break;
  1858. case SLJIT_LESS_EQUAL_F64:
  1859. cr_bit = 4 + 1;
  1860. invert = 1;
  1861. break;
  1862. case SLJIT_EQUAL_F64:
  1863. cr_bit = 4 + 2;
  1864. break;
  1865. case SLJIT_NOT_EQUAL_F64:
  1866. cr_bit = 4 + 2;
  1867. invert = 1;
  1868. break;
  1869. case SLJIT_UNORDERED_F64:
  1870. cr_bit = 4 + 3;
  1871. break;
  1872. case SLJIT_ORDERED_F64:
  1873. cr_bit = 4 + 3;
  1874. invert = 1;
  1875. break;
  1876. default:
  1877. SLJIT_UNREACHABLE();
  1878. break;
  1879. }
  1880. FAIL_IF(push_inst(compiler, MFCR | D(reg)));
  1881. FAIL_IF(push_inst(compiler, RLWINM | S(reg) | A(reg) | ((1 + (cr_bit)) << 11) | (31 << 6) | (31 << 1)));
  1882. if (invert)
  1883. FAIL_IF(push_inst(compiler, XORI | S(reg) | A(reg) | 0x1));
  1884. if (op < SLJIT_ADD) {
  1885. if (!(dst & SLJIT_MEM))
  1886. return SLJIT_SUCCESS;
  1887. return emit_op_mem(compiler, input_flags, reg, dst, dstw, TMP_REG1);
  1888. }
  1889. #if (defined SLJIT_VERBOSE && SLJIT_VERBOSE) \
  1890. || (defined SLJIT_ARGUMENT_CHECKS && SLJIT_ARGUMENT_CHECKS)
  1891. compiler->skip_checks = 1;
  1892. #endif
  1893. if (dst & SLJIT_MEM)
  1894. return sljit_emit_op2(compiler, saved_op, dst, saved_dstw, TMP_REG1, 0, TMP_REG2, 0);
  1895. return sljit_emit_op2(compiler, saved_op, dst, 0, dst, 0, TMP_REG2, 0);
  1896. }
  1897. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_cmov(struct sljit_compiler *compiler, sljit_s32 type,
  1898. sljit_s32 dst_reg,
  1899. sljit_s32 src, sljit_sw srcw)
  1900. {
  1901. CHECK_ERROR();
  1902. CHECK(check_sljit_emit_cmov(compiler, type, dst_reg, src, srcw));
  1903. return sljit_emit_cmov_generic(compiler, type, dst_reg, src, srcw);;
  1904. }
  1905. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_mem(struct sljit_compiler *compiler, sljit_s32 type,
  1906. sljit_s32 reg,
  1907. sljit_s32 mem, sljit_sw memw)
  1908. {
  1909. sljit_s32 mem_flags;
  1910. sljit_ins inst;
  1911. CHECK_ERROR();
  1912. CHECK(check_sljit_emit_mem(compiler, type, reg, mem, memw));
  1913. if (type & SLJIT_MEM_POST)
  1914. return SLJIT_ERR_UNSUPPORTED;
  1915. switch (type & 0xff) {
  1916. case SLJIT_MOV:
  1917. case SLJIT_MOV_P:
  1918. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  1919. case SLJIT_MOV_U32:
  1920. case SLJIT_MOV_S32:
  1921. #endif
  1922. mem_flags = WORD_DATA;
  1923. break;
  1924. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1925. case SLJIT_MOV_U32:
  1926. mem_flags = INT_DATA;
  1927. break;
  1928. case SLJIT_MOV_S32:
  1929. mem_flags = INT_DATA;
  1930. if (!(type & SLJIT_MEM_STORE) && !(type & SLJIT_I32_OP)) {
  1931. if (mem & OFFS_REG_MASK)
  1932. mem_flags |= SIGNED_DATA;
  1933. else
  1934. return SLJIT_ERR_UNSUPPORTED;
  1935. }
  1936. break;
  1937. #endif
  1938. case SLJIT_MOV_U8:
  1939. case SLJIT_MOV_S8:
  1940. mem_flags = BYTE_DATA;
  1941. break;
  1942. case SLJIT_MOV_U16:
  1943. mem_flags = HALF_DATA;
  1944. break;
  1945. case SLJIT_MOV_S16:
  1946. mem_flags = HALF_DATA | SIGNED_DATA;
  1947. break;
  1948. default:
  1949. SLJIT_UNREACHABLE();
  1950. mem_flags = WORD_DATA;
  1951. break;
  1952. }
  1953. if (!(type & SLJIT_MEM_STORE))
  1954. mem_flags |= LOAD_DATA;
  1955. if (SLJIT_UNLIKELY(mem & OFFS_REG_MASK)) {
  1956. if (memw != 0)
  1957. return SLJIT_ERR_UNSUPPORTED;
  1958. if (type & SLJIT_MEM_SUPP)
  1959. return SLJIT_SUCCESS;
  1960. inst = updated_data_transfer_insts[mem_flags | INDEXED];
  1961. FAIL_IF(push_inst(compiler, INST_CODE_AND_DST(inst, 0, reg) | A(mem & REG_MASK) | B(OFFS_REG(mem))));
  1962. }
  1963. else {
  1964. if (memw > SIMM_MAX || memw < SIMM_MIN)
  1965. return SLJIT_ERR_UNSUPPORTED;
  1966. inst = updated_data_transfer_insts[mem_flags];
  1967. #if (defined SLJIT_CONFIG_PPC_64 && SLJIT_CONFIG_PPC_64)
  1968. if ((inst & INT_ALIGNED) && (memw & 0x3) != 0)
  1969. return SLJIT_ERR_UNSUPPORTED;
  1970. #endif
  1971. if (type & SLJIT_MEM_SUPP)
  1972. return SLJIT_SUCCESS;
  1973. FAIL_IF(push_inst(compiler, INST_CODE_AND_DST(inst, 0, reg) | A(mem & REG_MASK) | IMM(memw)));
  1974. }
  1975. if ((mem_flags & LOAD_DATA) && (type & 0xff) == SLJIT_MOV_S8)
  1976. return push_inst(compiler, EXTSB | S(reg) | A(reg));
  1977. return SLJIT_SUCCESS;
  1978. }
  1979. SLJIT_API_FUNC_ATTRIBUTE sljit_s32 sljit_emit_fmem(struct sljit_compiler *compiler, sljit_s32 type,
  1980. sljit_s32 freg,
  1981. sljit_s32 mem, sljit_sw memw)
  1982. {
  1983. sljit_s32 mem_flags;
  1984. sljit_ins inst;
  1985. CHECK_ERROR();
  1986. CHECK(check_sljit_emit_fmem(compiler, type, freg, mem, memw));
  1987. if (type & SLJIT_MEM_POST)
  1988. return SLJIT_ERR_UNSUPPORTED;
  1989. if (SLJIT_UNLIKELY(mem & OFFS_REG_MASK)) {
  1990. if (memw != 0)
  1991. return SLJIT_ERR_UNSUPPORTED;
  1992. }
  1993. else {
  1994. if (memw > SIMM_MAX || memw < SIMM_MIN)
  1995. return SLJIT_ERR_UNSUPPORTED;
  1996. }
  1997. if (type & SLJIT_MEM_SUPP)
  1998. return SLJIT_SUCCESS;
  1999. mem_flags = FLOAT_DATA(type);
  2000. if (!(type & SLJIT_MEM_STORE))
  2001. mem_flags |= LOAD_DATA;
  2002. if (SLJIT_UNLIKELY(mem & OFFS_REG_MASK)) {
  2003. inst = updated_data_transfer_insts[mem_flags | INDEXED];
  2004. return push_inst(compiler, INST_CODE_AND_DST(inst, DOUBLE_DATA, freg) | A(mem & REG_MASK) | B(OFFS_REG(mem)));
  2005. }
  2006. inst = updated_data_transfer_insts[mem_flags];
  2007. return push_inst(compiler, INST_CODE_AND_DST(inst, DOUBLE_DATA, freg) | A(mem & REG_MASK) | IMM(memw));
  2008. }
  2009. SLJIT_API_FUNC_ATTRIBUTE struct sljit_const* sljit_emit_const(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw dstw, sljit_sw init_value)
  2010. {
  2011. struct sljit_const *const_;
  2012. sljit_s32 dst_r;
  2013. CHECK_ERROR_PTR();
  2014. CHECK_PTR(check_sljit_emit_const(compiler, dst, dstw, init_value));
  2015. ADJUST_LOCAL_OFFSET(dst, dstw);
  2016. const_ = (struct sljit_const*)ensure_abuf(compiler, sizeof(struct sljit_const));
  2017. PTR_FAIL_IF(!const_);
  2018. set_const(const_, compiler);
  2019. dst_r = FAST_IS_REG(dst) ? dst : TMP_REG2;
  2020. PTR_FAIL_IF(emit_const(compiler, dst_r, init_value));
  2021. if (dst & SLJIT_MEM)
  2022. PTR_FAIL_IF(emit_op(compiler, SLJIT_MOV, WORD_DATA, dst, dstw, TMP_REG1, 0, TMP_REG2, 0));
  2023. return const_;
  2024. }
  2025. SLJIT_API_FUNC_ATTRIBUTE struct sljit_put_label* sljit_emit_put_label(struct sljit_compiler *compiler, sljit_s32 dst, sljit_sw dstw)
  2026. {
  2027. struct sljit_put_label *put_label;
  2028. sljit_s32 dst_r;
  2029. CHECK_ERROR_PTR();
  2030. CHECK_PTR(check_sljit_emit_put_label(compiler, dst, dstw));
  2031. ADJUST_LOCAL_OFFSET(dst, dstw);
  2032. put_label = (struct sljit_put_label*)ensure_abuf(compiler, sizeof(struct sljit_put_label));
  2033. PTR_FAIL_IF(!put_label);
  2034. set_put_label(put_label, compiler, 0);
  2035. dst_r = FAST_IS_REG(dst) ? dst : TMP_REG2;
  2036. #if (defined SLJIT_CONFIG_PPC_32 && SLJIT_CONFIG_PPC_32)
  2037. PTR_FAIL_IF(emit_const(compiler, dst_r, 0));
  2038. #else
  2039. PTR_FAIL_IF(push_inst(compiler, dst_r));
  2040. compiler->size += 4;
  2041. #endif
  2042. if (dst & SLJIT_MEM)
  2043. PTR_FAIL_IF(emit_op(compiler, SLJIT_MOV, WORD_DATA, dst, dstw, TMP_REG1, 0, TMP_REG2, 0));
  2044. return put_label;
  2045. }