dasm_x86.lua 74 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388
  1. ------------------------------------------------------------------------------
  2. -- DynASM x86/x64 module.
  3. --
  4. -- Copyright (C) 2005-2021 Mike Pall. All rights reserved.
  5. -- See dynasm.lua for full copyright notice.
  6. ------------------------------------------------------------------------------
  7. local x64 = x64
  8. -- Module information:
  9. local _info = {
  10. arch = x64 and "x64" or "x86",
  11. description = "DynASM x86/x64 module",
  12. version = "1.5.0",
  13. vernum = 10500,
  14. release = "2021-05-02",
  15. author = "Mike Pall",
  16. license = "MIT",
  17. }
  18. -- Exported glue functions for the arch-specific module.
  19. local _M = { _info = _info }
  20. -- Cache library functions.
  21. local type, tonumber, pairs, ipairs = type, tonumber, pairs, ipairs
  22. local assert, unpack, setmetatable = assert, unpack or table.unpack, setmetatable
  23. local _s = string
  24. local sub, format, byte, char = _s.sub, _s.format, _s.byte, _s.char
  25. local find, match, gmatch, gsub = _s.find, _s.match, _s.gmatch, _s.gsub
  26. local concat, sort, remove = table.concat, table.sort, table.remove
  27. local bit = bit or require("bit")
  28. local band, bxor, shl, shr = bit.band, bit.bxor, bit.lshift, bit.rshift
  29. -- Inherited tables and callbacks.
  30. local g_opt, g_arch
  31. local wline, werror, wfatal, wwarn
  32. -- Action name list.
  33. -- CHECK: Keep this in sync with the C code!
  34. local action_names = {
  35. -- int arg, 1 buffer pos:
  36. "DISP", "IMM_S", "IMM_B", "IMM_W", "IMM_D", "IMM_WB", "IMM_DB",
  37. -- action arg (1 byte), int arg, 1 buffer pos (reg/num):
  38. "VREG", "SPACE",
  39. -- ptrdiff_t arg, 1 buffer pos (address): !x64
  40. "SETLABEL", "REL_A",
  41. -- action arg (1 byte) or int arg, 2 buffer pos (link, offset):
  42. "REL_LG", "REL_PC",
  43. -- action arg (1 byte) or int arg, 1 buffer pos (link):
  44. "IMM_LG", "IMM_PC",
  45. -- action arg (1 byte) or int arg, 1 buffer pos (offset):
  46. "LABEL_LG", "LABEL_PC",
  47. -- action arg (1 byte), 1 buffer pos (offset):
  48. "ALIGN",
  49. -- action args (2 bytes), no buffer pos.
  50. "EXTERN",
  51. -- action arg (1 byte), no buffer pos.
  52. "ESC",
  53. -- no action arg, no buffer pos.
  54. "MARK",
  55. -- action arg (1 byte), no buffer pos, terminal action:
  56. "SECTION",
  57. -- no args, no buffer pos, terminal action:
  58. "STOP"
  59. }
  60. -- Maximum number of section buffer positions for dasm_put().
  61. -- CHECK: Keep this in sync with the C code!
  62. local maxsecpos = 25 -- Keep this low, to avoid excessively long C lines.
  63. -- Action name -> action number (dynamically generated below).
  64. local map_action = {}
  65. -- First action number. Everything below does not need to be escaped.
  66. local actfirst = 256-#action_names
  67. -- Action list buffer and string (only used to remove dupes).
  68. local actlist = {}
  69. local actstr = ""
  70. -- Argument list for next dasm_put(). Start with offset 0 into action list.
  71. local actargs = { 0 }
  72. -- Current number of section buffer positions for dasm_put().
  73. local secpos = 1
  74. -- VREG kind encodings, pre-shifted by 5 bits.
  75. local map_vreg = {
  76. ["modrm.rm.m"] = 0x00,
  77. ["modrm.rm.r"] = 0x20,
  78. ["opcode"] = 0x20,
  79. ["sib.base"] = 0x20,
  80. ["sib.index"] = 0x40,
  81. ["modrm.reg"] = 0x80,
  82. ["vex.v"] = 0xa0,
  83. ["imm.hi"] = 0xc0,
  84. }
  85. -- Current number of VREG actions contributing to REX/VEX shrinkage.
  86. local vreg_shrink_count = 0
  87. ------------------------------------------------------------------------------
  88. -- Compute action numbers for action names.
  89. for n,name in ipairs(action_names) do
  90. local num = actfirst + n - 1
  91. map_action[name] = num
  92. end
  93. -- Dump action names and numbers.
  94. local function dumpactions(out)
  95. out:write("DynASM encoding engine action codes:\n")
  96. for n,name in ipairs(action_names) do
  97. local num = map_action[name]
  98. out:write(format(" %-10s %02X %d\n", name, num, num))
  99. end
  100. out:write("\n")
  101. end
  102. -- Write action list buffer as a huge static C array.
  103. local function writeactions(out, name)
  104. local nn = #actlist
  105. local last = actlist[nn] or 255
  106. actlist[nn] = nil -- Remove last byte.
  107. if nn == 0 then nn = 1 end
  108. out:write("static const unsigned char ", name, "[", nn, "] = {\n")
  109. local s = " "
  110. for n,b in ipairs(actlist) do
  111. s = s..b..","
  112. if #s >= 75 then
  113. assert(out:write(s, "\n"))
  114. s = " "
  115. end
  116. end
  117. out:write(s, last, "\n};\n\n") -- Add last byte back.
  118. end
  119. ------------------------------------------------------------------------------
  120. -- Add byte to action list.
  121. local function wputxb(n)
  122. assert(n >= 0 and n <= 255 and n % 1 == 0, "byte out of range")
  123. actlist[#actlist+1] = n
  124. end
  125. -- Add action to list with optional arg. Advance buffer pos, too.
  126. local function waction(action, a, num)
  127. wputxb(assert(map_action[action], "bad action name `"..action.."'"))
  128. if a then actargs[#actargs+1] = a end
  129. if a or num then secpos = secpos + (num or 1) end
  130. end
  131. -- Optionally add a VREG action.
  132. local function wvreg(kind, vreg, psz, sk, defer)
  133. if not vreg then return end
  134. waction("VREG", vreg)
  135. local b = assert(map_vreg[kind], "bad vreg kind `"..vreg.."'")
  136. if b < (sk or 0) then
  137. vreg_shrink_count = vreg_shrink_count + 1
  138. end
  139. if not defer then
  140. b = b + vreg_shrink_count * 8
  141. vreg_shrink_count = 0
  142. end
  143. wputxb(b + (psz or 0))
  144. end
  145. -- Add call to embedded DynASM C code.
  146. local function wcall(func, args)
  147. wline(format("dasm_%s(Dst, %s);", func, concat(args, ", ")), true)
  148. end
  149. -- Delete duplicate action list chunks. A tad slow, but so what.
  150. local function dedupechunk(offset)
  151. local al, as = actlist, actstr
  152. local chunk = char(unpack(al, offset+1, #al))
  153. local orig = find(as, chunk, 1, true)
  154. if orig then
  155. actargs[1] = orig-1 -- Replace with original offset.
  156. for i=offset+1,#al do al[i] = nil end -- Kill dupe.
  157. else
  158. actstr = as..chunk
  159. end
  160. end
  161. -- Flush action list (intervening C code or buffer pos overflow).
  162. local function wflush(term)
  163. local offset = actargs[1]
  164. if #actlist == offset then return end -- Nothing to flush.
  165. if not term then waction("STOP") end -- Terminate action list.
  166. dedupechunk(offset)
  167. wcall("put", actargs) -- Add call to dasm_put().
  168. actargs = { #actlist } -- Actionlist offset is 1st arg to next dasm_put().
  169. secpos = 1 -- The actionlist offset occupies a buffer position, too.
  170. end
  171. -- Put escaped byte.
  172. local function wputb(n)
  173. if n >= actfirst then waction("ESC") end -- Need to escape byte.
  174. wputxb(n)
  175. end
  176. ------------------------------------------------------------------------------
  177. -- Global label name -> global label number. With auto assignment on 1st use.
  178. local next_global = 10
  179. local map_global = setmetatable({}, { __index = function(t, name)
  180. if not match(name, "^[%a_][%w_@]*$") then werror("bad global label") end
  181. local n = next_global
  182. if n > 246 then werror("too many global labels") end
  183. next_global = n + 1
  184. t[name] = n
  185. return n
  186. end})
  187. -- Dump global labels.
  188. local function dumpglobals(out, lvl)
  189. local t = {}
  190. for name, n in pairs(map_global) do t[n] = name end
  191. out:write("Global labels:\n")
  192. for i=10,next_global-1 do
  193. out:write(format(" %s\n", t[i]))
  194. end
  195. out:write("\n")
  196. end
  197. -- Write global label enum.
  198. local function writeglobals(out, prefix)
  199. local t = {}
  200. for name, n in pairs(map_global) do t[n] = name end
  201. out:write("enum {\n")
  202. for i=10,next_global-1 do
  203. out:write(" ", prefix, gsub(t[i], "@.*", ""), ",\n")
  204. end
  205. out:write(" ", prefix, "_MAX\n};\n")
  206. end
  207. -- Write global label names.
  208. local function writeglobalnames(out, name)
  209. local t = {}
  210. for name, n in pairs(map_global) do t[n] = name end
  211. out:write("static const char *const ", name, "[] = {\n")
  212. for i=10,next_global-1 do
  213. out:write(" \"", t[i], "\",\n")
  214. end
  215. out:write(" (const char *)0\n};\n")
  216. end
  217. ------------------------------------------------------------------------------
  218. -- Extern label name -> extern label number. With auto assignment on 1st use.
  219. local next_extern = -1
  220. local map_extern = setmetatable({}, { __index = function(t, name)
  221. -- No restrictions on the name for now.
  222. local n = next_extern
  223. if n < -256 then werror("too many extern labels") end
  224. next_extern = n - 1
  225. t[name] = n
  226. return n
  227. end})
  228. -- Dump extern labels.
  229. local function dumpexterns(out, lvl)
  230. local t = {}
  231. for name, n in pairs(map_extern) do t[-n] = name end
  232. out:write("Extern labels:\n")
  233. for i=1,-next_extern-1 do
  234. out:write(format(" %s\n", t[i]))
  235. end
  236. out:write("\n")
  237. end
  238. -- Write extern label names.
  239. local function writeexternnames(out, name)
  240. local t = {}
  241. for name, n in pairs(map_extern) do t[-n] = name end
  242. out:write("static const char *const ", name, "[] = {\n")
  243. for i=1,-next_extern-1 do
  244. out:write(" \"", t[i], "\",\n")
  245. end
  246. out:write(" (const char *)0\n};\n")
  247. end
  248. ------------------------------------------------------------------------------
  249. -- Arch-specific maps.
  250. local map_archdef = {} -- Ext. register name -> int. name.
  251. local map_reg_rev = {} -- Int. register name -> ext. name.
  252. local map_reg_num = {} -- Int. register name -> register number.
  253. local map_reg_opsize = {} -- Int. register name -> operand size.
  254. local map_reg_valid_base = {} -- Int. register name -> valid base register?
  255. local map_reg_valid_index = {} -- Int. register name -> valid index register?
  256. local map_reg_needrex = {} -- Int. register name -> need rex vs. no rex.
  257. local reg_list = {} -- Canonical list of int. register names.
  258. local map_type = {} -- Type name -> { ctype, reg }
  259. local ctypenum = 0 -- Type number (for _PTx macros).
  260. local addrsize = x64 and "q" or "d" -- Size for address operands.
  261. -- Helper functions to fill register maps.
  262. local function mkrmap(sz, cl, names)
  263. local cname = format("@%s", sz)
  264. reg_list[#reg_list+1] = cname
  265. map_archdef[cl] = cname
  266. map_reg_rev[cname] = cl
  267. map_reg_num[cname] = -1
  268. map_reg_opsize[cname] = sz
  269. if sz == addrsize or sz == "d" then
  270. map_reg_valid_base[cname] = true
  271. map_reg_valid_index[cname] = true
  272. end
  273. if names then
  274. for n,name in ipairs(names) do
  275. local iname = format("@%s%x", sz, n-1)
  276. reg_list[#reg_list+1] = iname
  277. map_archdef[name] = iname
  278. map_reg_rev[iname] = name
  279. map_reg_num[iname] = n-1
  280. map_reg_opsize[iname] = sz
  281. if sz == "b" and n > 4 then map_reg_needrex[iname] = false end
  282. if sz == addrsize or sz == "d" then
  283. map_reg_valid_base[iname] = true
  284. map_reg_valid_index[iname] = true
  285. end
  286. end
  287. end
  288. for i=0,(x64 and sz ~= "f") and 15 or 7 do
  289. local needrex = sz == "b" and i > 3
  290. local iname = format("@%s%x%s", sz, i, needrex and "R" or "")
  291. if needrex then map_reg_needrex[iname] = true end
  292. local name
  293. if sz == "o" or sz == "y" then name = format("%s%d", cl, i)
  294. elseif sz == "f" then name = format("st%d", i)
  295. else name = format("r%d%s", i, sz == addrsize and "" or sz) end
  296. map_archdef[name] = iname
  297. if not map_reg_rev[iname] then
  298. reg_list[#reg_list+1] = iname
  299. map_reg_rev[iname] = name
  300. map_reg_num[iname] = i
  301. map_reg_opsize[iname] = sz
  302. if sz == addrsize or sz == "d" then
  303. map_reg_valid_base[iname] = true
  304. map_reg_valid_index[iname] = true
  305. end
  306. end
  307. end
  308. reg_list[#reg_list+1] = ""
  309. end
  310. -- Integer registers (qword, dword, word and byte sized).
  311. if x64 then
  312. mkrmap("q", "Rq", {"rax", "rcx", "rdx", "rbx", "rsp", "rbp", "rsi", "rdi"})
  313. end
  314. mkrmap("d", "Rd", {"eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"})
  315. mkrmap("w", "Rw", {"ax", "cx", "dx", "bx", "sp", "bp", "si", "di"})
  316. mkrmap("b", "Rb", {"al", "cl", "dl", "bl", "ah", "ch", "dh", "bh"})
  317. map_reg_valid_index[map_archdef.esp] = false
  318. if x64 then map_reg_valid_index[map_archdef.rsp] = false end
  319. if x64 then map_reg_needrex[map_archdef.Rb] = true end
  320. map_archdef["Ra"] = "@"..addrsize
  321. -- FP registers (internally tword sized, but use "f" as operand size).
  322. mkrmap("f", "Rf")
  323. -- SSE registers (oword sized, but qword and dword accessible).
  324. mkrmap("o", "xmm")
  325. -- AVX registers (yword sized, but oword, qword and dword accessible).
  326. mkrmap("y", "ymm")
  327. -- Operand size prefixes to codes.
  328. local map_opsize = {
  329. byte = "b", word = "w", dword = "d", qword = "q", oword = "o", yword = "y",
  330. tword = "t", aword = addrsize,
  331. }
  332. -- Operand size code to number.
  333. local map_opsizenum = {
  334. b = 1, w = 2, d = 4, q = 8, o = 16, y = 32, t = 10,
  335. }
  336. -- Operand size code to name.
  337. local map_opsizename = {
  338. b = "byte", w = "word", d = "dword", q = "qword", o = "oword", y = "yword",
  339. t = "tword", f = "fpword",
  340. }
  341. -- Valid index register scale factors.
  342. local map_xsc = {
  343. ["1"] = 0, ["2"] = 1, ["4"] = 2, ["8"] = 3,
  344. }
  345. -- Condition codes.
  346. local map_cc = {
  347. o = 0, no = 1, b = 2, nb = 3, e = 4, ne = 5, be = 6, nbe = 7,
  348. s = 8, ns = 9, p = 10, np = 11, l = 12, nl = 13, le = 14, nle = 15,
  349. c = 2, nae = 2, nc = 3, ae = 3, z = 4, nz = 5, na = 6, a = 7,
  350. pe = 10, po = 11, nge = 12, ge = 13, ng = 14, g = 15,
  351. }
  352. -- Reverse defines for registers.
  353. function _M.revdef(s)
  354. return gsub(s, "@%w+", map_reg_rev)
  355. end
  356. -- Dump register names and numbers
  357. local function dumpregs(out)
  358. out:write("Register names, sizes and internal numbers:\n")
  359. for _,reg in ipairs(reg_list) do
  360. if reg == "" then
  361. out:write("\n")
  362. else
  363. local name = map_reg_rev[reg]
  364. local num = map_reg_num[reg]
  365. local opsize = map_opsizename[map_reg_opsize[reg]]
  366. out:write(format(" %-5s %-8s %s\n", name, opsize,
  367. num < 0 and "(variable)" or num))
  368. end
  369. end
  370. end
  371. ------------------------------------------------------------------------------
  372. -- Put action for label arg (IMM_LG, IMM_PC, REL_LG, REL_PC).
  373. local function wputlabel(aprefix, imm, num)
  374. if type(imm) == "number" then
  375. if imm < 0 then
  376. waction("EXTERN")
  377. wputxb(aprefix == "IMM_" and 0 or 1)
  378. imm = -imm-1
  379. else
  380. waction(aprefix.."LG", nil, num);
  381. end
  382. wputxb(imm)
  383. else
  384. waction(aprefix.."PC", imm, num)
  385. end
  386. end
  387. -- Put signed byte or arg.
  388. local function wputsbarg(n)
  389. if type(n) == "number" then
  390. if n < -128 or n > 127 then
  391. werror("signed immediate byte out of range")
  392. end
  393. if n < 0 then n = n + 256 end
  394. wputb(n)
  395. else waction("IMM_S", n) end
  396. end
  397. -- Put unsigned byte or arg.
  398. local function wputbarg(n)
  399. if type(n) == "number" then
  400. if n < 0 or n > 255 then
  401. werror("unsigned immediate byte out of range")
  402. end
  403. wputb(n)
  404. else waction("IMM_B", n) end
  405. end
  406. -- Put unsigned word or arg.
  407. local function wputwarg(n)
  408. if type(n) == "number" then
  409. if shr(n, 16) ~= 0 then
  410. werror("unsigned immediate word out of range")
  411. end
  412. wputb(band(n, 255)); wputb(shr(n, 8));
  413. else waction("IMM_W", n) end
  414. end
  415. -- Put signed or unsigned dword or arg.
  416. local function wputdarg(n)
  417. local tn = type(n)
  418. if tn == "number" then
  419. wputb(band(n, 255))
  420. wputb(band(shr(n, 8), 255))
  421. wputb(band(shr(n, 16), 255))
  422. wputb(shr(n, 24))
  423. elseif tn == "table" then
  424. wputlabel("IMM_", n[1], 1)
  425. else
  426. waction("IMM_D", n)
  427. end
  428. end
  429. -- Put signed or unsigned qword or arg.
  430. local function wputqarg(n)
  431. local tn = type(n)
  432. if tn == "number" then -- This is only used for numbers from -2^31..2^32-1.
  433. wputb(band(n, 255))
  434. wputb(band(shr(n, 8), 255))
  435. wputb(band(shr(n, 16), 255))
  436. wputb(shr(n, 24))
  437. local sign = n < 0 and 255 or 0
  438. wputb(sign); wputb(sign); wputb(sign); wputb(sign)
  439. else
  440. waction("IMM_D", format("(unsigned int)(%s)", n))
  441. waction("IMM_D", format("(unsigned int)((unsigned long long)(%s)>>32)", n))
  442. end
  443. end
  444. -- Put operand-size dependent number or arg (defaults to dword).
  445. local function wputszarg(sz, n)
  446. if not sz or sz == "d" or sz == "q" then wputdarg(n)
  447. elseif sz == "w" then wputwarg(n)
  448. elseif sz == "b" then wputbarg(n)
  449. elseif sz == "s" then wputsbarg(n)
  450. else werror("bad operand size") end
  451. end
  452. -- Put multi-byte opcode with operand-size dependent modifications.
  453. local function wputop(sz, op, rex, vex, vregr, vregxb)
  454. local psz, sk = 0, nil
  455. if vex then
  456. local tail
  457. if vex.m == 1 and band(rex, 11) == 0 then
  458. if x64 and vregxb then
  459. sk = map_vreg["modrm.reg"]
  460. else
  461. wputb(0xc5)
  462. tail = shl(bxor(band(rex, 4), 4), 5)
  463. psz = 3
  464. end
  465. end
  466. if not tail then
  467. wputb(0xc4)
  468. wputb(shl(bxor(band(rex, 7), 7), 5) + vex.m)
  469. tail = shl(band(rex, 8), 4)
  470. psz = 4
  471. end
  472. local reg, vreg = 0, nil
  473. if vex.v then
  474. reg = vex.v.reg
  475. if not reg then werror("bad vex operand") end
  476. if reg < 0 then reg = 0; vreg = vex.v.vreg end
  477. end
  478. if sz == "y" or vex.l then tail = tail + 4 end
  479. wputb(tail + shl(bxor(reg, 15), 3) + vex.p)
  480. wvreg("vex.v", vreg)
  481. rex = 0
  482. if op >= 256 then werror("bad vex opcode") end
  483. else
  484. if rex ~= 0 then
  485. if not x64 then werror("bad operand size") end
  486. elseif (vregr or vregxb) and x64 then
  487. rex = 0x10
  488. sk = map_vreg["vex.v"]
  489. end
  490. end
  491. local r
  492. if sz == "w" then wputb(102) end
  493. -- Needs >32 bit numbers, but only for crc32 eax, word [ebx]
  494. if op >= 4294967296 then r = op%4294967296 wputb((op-r)/4294967296) op = r end
  495. if op >= 16777216 then wputb(shr(op, 24)); op = band(op, 0xffffff) end
  496. if op >= 65536 then
  497. if rex ~= 0 then
  498. local opc3 = band(op, 0xffff00)
  499. if opc3 == 0x0f3a00 or opc3 == 0x0f3800 then
  500. wputb(64 + band(rex, 15)); rex = 0; psz = 2
  501. end
  502. end
  503. wputb(shr(op, 16)); op = band(op, 0xffff); psz = psz + 1
  504. end
  505. if op >= 256 then
  506. local b = shr(op, 8)
  507. if b == 15 and rex ~= 0 then wputb(64 + band(rex, 15)); rex = 0; psz = 2 end
  508. wputb(b); op = band(op, 255); psz = psz + 1
  509. end
  510. if rex ~= 0 then wputb(64 + band(rex, 15)); psz = 2 end
  511. if sz == "b" then op = op - 1 end
  512. wputb(op)
  513. return psz, sk
  514. end
  515. -- Put ModRM or SIB formatted byte.
  516. local function wputmodrm(m, s, rm, vs, vrm)
  517. assert(m < 4 and s < 16 and rm < 16, "bad modrm operands")
  518. wputb(shl(m, 6) + shl(band(s, 7), 3) + band(rm, 7))
  519. end
  520. -- Put ModRM/SIB plus optional displacement.
  521. local function wputmrmsib(t, imark, s, vsreg, psz, sk)
  522. local vreg, vxreg
  523. local reg, xreg = t.reg, t.xreg
  524. if reg and reg < 0 then reg = 0; vreg = t.vreg end
  525. if xreg and xreg < 0 then xreg = 0; vxreg = t.vxreg end
  526. if s < 0 then s = 0 end
  527. -- Register mode.
  528. if sub(t.mode, 1, 1) == "r" then
  529. wputmodrm(3, s, reg)
  530. wvreg("modrm.reg", vsreg, psz+1, sk, vreg)
  531. wvreg("modrm.rm.r", vreg, psz+1, sk)
  532. return
  533. end
  534. local disp = t.disp
  535. local tdisp = type(disp)
  536. -- No base register?
  537. if not reg then
  538. local riprel = false
  539. if xreg then
  540. -- Indexed mode with index register only.
  541. -- [xreg*xsc+disp] -> (0, s, esp) (xsc, xreg, ebp)
  542. wputmodrm(0, s, 4)
  543. if imark == "I" then waction("MARK") end
  544. wvreg("modrm.reg", vsreg, psz+1, sk, vxreg)
  545. wputmodrm(t.xsc, xreg, 5)
  546. wvreg("sib.index", vxreg, psz+2, sk)
  547. else
  548. -- Pure 32 bit displacement.
  549. if x64 and tdisp ~= "table" then
  550. wputmodrm(0, s, 4) -- [disp] -> (0, s, esp) (0, esp, ebp)
  551. wvreg("modrm.reg", vsreg, psz+1, sk)
  552. if imark == "I" then waction("MARK") end
  553. wputmodrm(0, 4, 5)
  554. else
  555. riprel = x64
  556. wputmodrm(0, s, 5) -- [disp|rip-label] -> (0, s, ebp)
  557. wvreg("modrm.reg", vsreg, psz+1, sk)
  558. if imark == "I" then waction("MARK") end
  559. end
  560. end
  561. if riprel then -- Emit rip-relative displacement.
  562. if match("UWSiI", imark) then
  563. werror("NYI: rip-relative displacement followed by immediate")
  564. end
  565. -- The previous byte in the action buffer cannot be 0xe9 or 0x80-0x8f.
  566. wputlabel("REL_", disp[1], 2)
  567. else
  568. wputdarg(disp)
  569. end
  570. return
  571. end
  572. local m
  573. if tdisp == "number" then -- Check displacement size at assembly time.
  574. if disp == 0 and band(reg, 7) ~= 5 then -- [ebp] -> [ebp+0] (in SIB, too)
  575. if not vreg then m = 0 end -- Force DISP to allow [Rd(5)] -> [ebp+0]
  576. elseif disp >= -128 and disp <= 127 then m = 1
  577. else m = 2 end
  578. elseif tdisp == "table" then
  579. m = 2
  580. end
  581. -- Index register present or esp as base register: need SIB encoding.
  582. if xreg or band(reg, 7) == 4 then
  583. wputmodrm(m or 2, s, 4) -- ModRM.
  584. if m == nil or imark == "I" then waction("MARK") end
  585. wvreg("modrm.reg", vsreg, psz+1, sk, vxreg or vreg)
  586. wputmodrm(t.xsc or 0, xreg or 4, reg) -- SIB.
  587. wvreg("sib.index", vxreg, psz+2, sk, vreg)
  588. wvreg("sib.base", vreg, psz+2, sk)
  589. else
  590. wputmodrm(m or 2, s, reg) -- ModRM.
  591. if (imark == "I" and (m == 1 or m == 2)) or
  592. (m == nil and (vsreg or vreg)) then waction("MARK") end
  593. wvreg("modrm.reg", vsreg, psz+1, sk, vreg)
  594. wvreg("modrm.rm.m", vreg, psz+1, sk)
  595. end
  596. -- Put displacement.
  597. if m == 1 then wputsbarg(disp)
  598. elseif m == 2 then wputdarg(disp)
  599. elseif m == nil then waction("DISP", disp) end
  600. end
  601. ------------------------------------------------------------------------------
  602. -- Return human-readable operand mode string.
  603. local function opmodestr(op, args)
  604. local m = {}
  605. for i=1,#args do
  606. local a = args[i]
  607. m[#m+1] = sub(a.mode, 1, 1)..(a.opsize or "?")
  608. end
  609. return op.." "..concat(m, ",")
  610. end
  611. -- Convert number to valid integer or nil.
  612. local function toint(expr, isqword)
  613. local n = tonumber(expr)
  614. if n then
  615. if n % 1 ~= 0 then
  616. werror("not an integer number `"..expr.."'")
  617. elseif isqword then
  618. if n < -2147483648 or n > 2147483647 then
  619. n = nil -- Handle it as an expression to avoid precision loss.
  620. end
  621. elseif n < -2147483648 or n > 4294967295 then
  622. werror("bad integer number `"..expr.."'")
  623. end
  624. return n
  625. end
  626. end
  627. -- Parse immediate expression.
  628. local function immexpr(expr)
  629. -- &expr (pointer)
  630. if sub(expr, 1, 1) == "&" then
  631. return "iPJ", format("(ptrdiff_t)(%s)", sub(expr,2))
  632. end
  633. local prefix = sub(expr, 1, 2)
  634. -- =>expr (pc label reference)
  635. if prefix == "=>" then
  636. return "iJ", sub(expr, 3)
  637. end
  638. -- ->name (global label reference)
  639. if prefix == "->" then
  640. return "iJ", map_global[sub(expr, 3)]
  641. end
  642. -- [<>][1-9] (local label reference)
  643. local dir, lnum = match(expr, "^([<>])([1-9])$")
  644. if dir then -- Fwd: 247-255, Bkwd: 1-9.
  645. return "iJ", lnum + (dir == ">" and 246 or 0)
  646. end
  647. local extname = match(expr, "^extern%s+(%S+)$")
  648. if extname then
  649. return "iJ", map_extern[extname]
  650. end
  651. -- expr (interpreted as immediate)
  652. return "iI", expr
  653. end
  654. -- Parse displacement expression: +-num, +-expr, +-opsize*num
  655. local function dispexpr(expr)
  656. local disp = expr == "" and 0 or toint(expr)
  657. if disp then return disp end
  658. local c, dispt = match(expr, "^([+-])%s*(.+)$")
  659. if c == "+" then
  660. expr = dispt
  661. elseif not c then
  662. werror("bad displacement expression `"..expr.."'")
  663. end
  664. local opsize, tailops = match(dispt, "^(%w+)%s*%*%s*(.+)$")
  665. local ops, imm = map_opsize[opsize], toint(tailops)
  666. if ops and imm then
  667. if c == "-" then imm = -imm end
  668. return imm*map_opsizenum[ops]
  669. end
  670. local mode, iexpr = immexpr(dispt)
  671. if mode == "iJ" then
  672. if c == "-" then werror("cannot invert label reference") end
  673. return { iexpr }
  674. end
  675. return expr -- Need to return original signed expression.
  676. end
  677. -- Parse register or type expression.
  678. local function rtexpr(expr)
  679. if not expr then return end
  680. local tname, ovreg = match(expr, "^([%w_]+):(@[%w_]+)$")
  681. local tp = map_type[tname or expr]
  682. if tp then
  683. local reg = ovreg or tp.reg
  684. local rnum = map_reg_num[reg]
  685. if not rnum then
  686. werror("type `"..(tname or expr).."' needs a register override")
  687. end
  688. if not map_reg_valid_base[reg] then
  689. werror("bad base register override `"..(map_reg_rev[reg] or reg).."'")
  690. end
  691. return reg, rnum, tp
  692. end
  693. return expr, map_reg_num[expr]
  694. end
  695. -- Parse operand and return { mode, opsize, reg, xreg, xsc, disp, imm }.
  696. local function parseoperand(param, isqword)
  697. local t = {}
  698. local expr = param
  699. local opsize, tailops = match(param, "^(%w+)%s*(.+)$")
  700. if opsize then
  701. t.opsize = map_opsize[opsize]
  702. if t.opsize then expr = tailops end
  703. end
  704. local br = match(expr, "^%[%s*(.-)%s*%]$")
  705. repeat
  706. if br then
  707. t.mode = "xm"
  708. -- [disp]
  709. t.disp = toint(br)
  710. if t.disp then
  711. t.mode = x64 and "xm" or "xmO"
  712. break
  713. end
  714. -- [reg...]
  715. local tp
  716. local reg, tailr = match(br, "^([@%w_:]+)%s*(.*)$")
  717. reg, t.reg, tp = rtexpr(reg)
  718. if not t.reg then
  719. -- [expr]
  720. t.mode = x64 and "xm" or "xmO"
  721. t.disp = dispexpr("+"..br)
  722. break
  723. end
  724. if t.reg == -1 then
  725. t.vreg, tailr = match(tailr, "^(%b())(.*)$")
  726. if not t.vreg then werror("bad variable register expression") end
  727. end
  728. -- [xreg*xsc] or [xreg*xsc+-disp] or [xreg*xsc+-expr]
  729. local xsc, tailsc = match(tailr, "^%*%s*([1248])%s*(.*)$")
  730. if xsc then
  731. if not map_reg_valid_index[reg] then
  732. werror("bad index register `"..map_reg_rev[reg].."'")
  733. end
  734. t.xsc = map_xsc[xsc]
  735. t.xreg = t.reg
  736. t.vxreg = t.vreg
  737. t.reg = nil
  738. t.vreg = nil
  739. t.disp = dispexpr(tailsc)
  740. break
  741. end
  742. if not map_reg_valid_base[reg] then
  743. werror("bad base register `"..map_reg_rev[reg].."'")
  744. end
  745. -- [reg] or [reg+-disp]
  746. t.disp = toint(tailr) or (tailr == "" and 0)
  747. if t.disp then break end
  748. -- [reg+xreg...]
  749. local xreg, tailx = match(tailr, "^%+%s*([@%w_:]+)%s*(.*)$")
  750. xreg, t.xreg, tp = rtexpr(xreg)
  751. if not t.xreg then
  752. -- [reg+-expr]
  753. t.disp = dispexpr(tailr)
  754. break
  755. end
  756. if not map_reg_valid_index[xreg] then
  757. werror("bad index register `"..map_reg_rev[xreg].."'")
  758. end
  759. if t.xreg == -1 then
  760. t.vxreg, tailx = match(tailx, "^(%b())(.*)$")
  761. if not t.vxreg then werror("bad variable register expression") end
  762. end
  763. -- [reg+xreg*xsc...]
  764. local xsc, tailsc = match(tailx, "^%*%s*([1248])%s*(.*)$")
  765. if xsc then
  766. t.xsc = map_xsc[xsc]
  767. tailx = tailsc
  768. end
  769. -- [...] or [...+-disp] or [...+-expr]
  770. t.disp = dispexpr(tailx)
  771. else
  772. -- imm or opsize*imm
  773. local imm = toint(expr, isqword)
  774. if not imm and sub(expr, 1, 1) == "*" and t.opsize then
  775. imm = toint(sub(expr, 2))
  776. if imm then
  777. imm = imm * map_opsizenum[t.opsize]
  778. t.opsize = nil
  779. end
  780. end
  781. if imm then
  782. if t.opsize then werror("bad operand size override") end
  783. local m = "i"
  784. if imm == 1 then m = m.."1" end
  785. if imm >= 4294967168 and imm <= 4294967295 then imm = imm-4294967296 end
  786. if imm >= -128 and imm <= 127 then m = m.."S" end
  787. t.imm = imm
  788. t.mode = m
  789. break
  790. end
  791. local tp
  792. local reg, tailr = match(expr, "^([@%w_:]+)%s*(.*)$")
  793. reg, t.reg, tp = rtexpr(reg)
  794. if t.reg then
  795. if t.reg == -1 then
  796. t.vreg, tailr = match(tailr, "^(%b())(.*)$")
  797. if not t.vreg then werror("bad variable register expression") end
  798. end
  799. -- reg
  800. if tailr == "" then
  801. if t.opsize then werror("bad operand size override") end
  802. t.opsize = map_reg_opsize[reg]
  803. if t.opsize == "f" then
  804. t.mode = t.reg == 0 and "fF" or "f"
  805. else
  806. if reg == "@w4" or (x64 and reg == "@d4") then
  807. wwarn("bad idea, try again with `"..(x64 and "rsp'" or "esp'"))
  808. end
  809. t.mode = t.reg == 0 and "rmR" or (reg == "@b1" and "rmC" or "rm")
  810. end
  811. t.needrex = map_reg_needrex[reg]
  812. break
  813. end
  814. -- type[idx], type[idx].field, type->field -> [reg+offset_expr]
  815. if not tp then werror("bad operand `"..param.."'") end
  816. t.mode = "xm"
  817. t.disp = format(tp.ctypefmt, tailr)
  818. else
  819. t.mode, t.imm = immexpr(expr)
  820. if sub(t.mode, -1) == "J" then
  821. if t.opsize and t.opsize ~= addrsize then
  822. werror("bad operand size override")
  823. end
  824. t.opsize = addrsize
  825. end
  826. end
  827. end
  828. until true
  829. return t
  830. end
  831. ------------------------------------------------------------------------------
  832. -- x86 Template String Description
  833. -- ===============================
  834. --
  835. -- Each template string is a list of [match:]pattern pairs,
  836. -- separated by "|". The first match wins. No match means a
  837. -- bad or unsupported combination of operand modes or sizes.
  838. --
  839. -- The match part and the ":" is omitted if the operation has
  840. -- no operands. Otherwise the first N characters are matched
  841. -- against the mode strings of each of the N operands.
  842. --
  843. -- The mode string for each operand type is (see parseoperand()):
  844. -- Integer register: "rm", +"R" for eax, ax, al, +"C" for cl
  845. -- FP register: "f", +"F" for st0
  846. -- Index operand: "xm", +"O" for [disp] (pure offset)
  847. -- Immediate: "i", +"S" for signed 8 bit, +"1" for 1,
  848. -- +"I" for arg, +"P" for pointer
  849. -- Any: +"J" for valid jump targets
  850. --
  851. -- So a match character "m" (mixed) matches both an integer register
  852. -- and an index operand (to be encoded with the ModRM/SIB scheme).
  853. -- But "r" matches only a register and "x" only an index operand
  854. -- (e.g. for FP memory access operations).
  855. --
  856. -- The operand size match string starts right after the mode match
  857. -- characters and ends before the ":". "dwb" or "qdwb" is assumed, if empty.
  858. -- The effective data size of the operation is matched against this list.
  859. --
  860. -- If only the regular "b", "w", "d", "q", "t" operand sizes are
  861. -- present, then all operands must be the same size. Unspecified sizes
  862. -- are ignored, but at least one operand must have a size or the pattern
  863. -- won't match (use the "byte", "word", "dword", "qword", "tword"
  864. -- operand size overrides. E.g.: mov dword [eax], 1).
  865. --
  866. -- If the list has a "1" or "2" prefix, the operand size is taken
  867. -- from the respective operand and any other operand sizes are ignored.
  868. -- If the list contains only ".", all operand sizes are ignored.
  869. -- If the list has a "/" prefix, the concatenated (mixed) operand sizes
  870. -- are compared to the match.
  871. --
  872. -- E.g. "rrdw" matches for either two dword registers or two word
  873. -- registers. "Fx2dq" matches an st0 operand plus an index operand
  874. -- pointing to a dword (float) or qword (double).
  875. --
  876. -- Every character after the ":" is part of the pattern string:
  877. -- Hex chars are accumulated to form the opcode (left to right).
  878. -- "n" disables the standard opcode mods
  879. -- (otherwise: -1 for "b", o16 prefix for "w", rex.w for "q")
  880. -- "X" Force REX.W.
  881. -- "r"/"R" adds the reg. number from the 1st/2nd operand to the opcode.
  882. -- "m"/"M" generates ModRM/SIB from the 1st/2nd operand.
  883. -- The spare 3 bits are either filled with the last hex digit or
  884. -- the result from a previous "r"/"R". The opcode is restored.
  885. -- "u" Use VEX encoding, vvvv unused.
  886. -- "v"/"V" Use VEX encoding, vvvv from 1st/2nd operand (the operand is
  887. -- removed from the list used by future characters).
  888. -- "w" Use VEX encoding, vvvv from 3rd operand.
  889. -- "L" Force VEX.L
  890. --
  891. -- All of the following characters force a flush of the opcode:
  892. -- "o"/"O" stores a pure 32 bit disp (offset) from the 1st/2nd operand.
  893. -- "s" stores a 4 bit immediate from the last register operand,
  894. -- followed by 4 zero bits.
  895. -- "S" stores a signed 8 bit immediate from the last operand.
  896. -- "U" stores an unsigned 8 bit immediate from the last operand.
  897. -- "W" stores an unsigned 16 bit immediate from the last operand.
  898. -- "i" stores an operand sized immediate from the last operand.
  899. -- "I" dito, but generates an action code to optionally modify
  900. -- the opcode (+2) for a signed 8 bit immediate.
  901. -- "J" generates one of the REL action codes from the last operand.
  902. --
  903. ------------------------------------------------------------------------------
  904. -- Template strings for x86 instructions. Ordered by first opcode byte.
  905. -- Unimplemented opcodes (deliberate omissions) are marked with *.
  906. local map_op = {
  907. -- 00-05: add...
  908. -- 06: *push es
  909. -- 07: *pop es
  910. -- 08-0D: or...
  911. -- 0E: *push cs
  912. -- 0F: two byte opcode prefix
  913. -- 10-15: adc...
  914. -- 16: *push ss
  915. -- 17: *pop ss
  916. -- 18-1D: sbb...
  917. -- 1E: *push ds
  918. -- 1F: *pop ds
  919. -- 20-25: and...
  920. es_0 = "26",
  921. -- 27: *daa
  922. -- 28-2D: sub...
  923. cs_0 = "2E",
  924. -- 2F: *das
  925. -- 30-35: xor...
  926. ss_0 = "36",
  927. -- 37: *aaa
  928. -- 38-3D: cmp...
  929. ds_0 = "3E",
  930. -- 3F: *aas
  931. inc_1 = x64 and "m:FF0m" or "rdw:40r|m:FF0m",
  932. dec_1 = x64 and "m:FF1m" or "rdw:48r|m:FF1m",
  933. push_1 = (x64 and "rq:n50r|rw:50r|mq:nFF6m|mw:FF6m" or
  934. "rdw:50r|mdw:FF6m").."|S.:6AS|ib:n6Ai|i.:68i",
  935. pop_1 = x64 and "rq:n58r|rw:58r|mq:n8F0m|mw:8F0m" or "rdw:58r|mdw:8F0m",
  936. -- 60: *pusha, *pushad, *pushaw
  937. -- 61: *popa, *popad, *popaw
  938. -- 62: *bound rdw,x
  939. -- 63: x86: *arpl mw,rw
  940. movsxd_2 = x64 and "rm/qd:63rM",
  941. fs_0 = "64",
  942. gs_0 = "65",
  943. o16_0 = "66",
  944. a16_0 = not x64 and "67" or nil,
  945. a32_0 = x64 and "67",
  946. -- 68: push idw
  947. -- 69: imul rdw,mdw,idw
  948. -- 6A: push ib
  949. -- 6B: imul rdw,mdw,S
  950. -- 6C: *insb
  951. -- 6D: *insd, *insw
  952. -- 6E: *outsb
  953. -- 6F: *outsd, *outsw
  954. -- 70-7F: jcc lb
  955. -- 80: add... mb,i
  956. -- 81: add... mdw,i
  957. -- 82: *undefined
  958. -- 83: add... mdw,S
  959. test_2 = "mr:85Rm|rm:85rM|Ri:A9ri|mi:F70mi",
  960. -- 86: xchg rb,mb
  961. -- 87: xchg rdw,mdw
  962. -- 88: mov mb,r
  963. -- 89: mov mdw,r
  964. -- 8A: mov r,mb
  965. -- 8B: mov r,mdw
  966. -- 8C: *mov mdw,seg
  967. lea_2 = "rx1dq:8DrM",
  968. -- 8E: *mov seg,mdw
  969. -- 8F: pop mdw
  970. nop_0 = "90",
  971. xchg_2 = "Rrqdw:90R|rRqdw:90r|rm:87rM|mr:87Rm",
  972. cbw_0 = "6698",
  973. cwde_0 = "98",
  974. cdqe_0 = "4898",
  975. cwd_0 = "6699",
  976. cdq_0 = "99",
  977. cqo_0 = "4899",
  978. -- 9A: *call iw:idw
  979. wait_0 = "9B",
  980. fwait_0 = "9B",
  981. pushf_0 = "9C",
  982. pushfd_0 = not x64 and "9C",
  983. pushfq_0 = x64 and "9C",
  984. popf_0 = "9D",
  985. popfd_0 = not x64 and "9D",
  986. popfq_0 = x64 and "9D",
  987. sahf_0 = "9E",
  988. lahf_0 = "9F",
  989. mov_2 = "OR:A3o|RO:A1O|mr:89Rm|rm:8BrM|rib:nB0ri|ridw:B8ri|mi:C70mi",
  990. movsb_0 = "A4",
  991. movsw_0 = "66A5",
  992. movsd_0 = "A5",
  993. cmpsb_0 = "A6",
  994. cmpsw_0 = "66A7",
  995. cmpsd_0 = "A7",
  996. -- A8: test Rb,i
  997. -- A9: test Rdw,i
  998. stosb_0 = "AA",
  999. stosw_0 = "66AB",
  1000. stosd_0 = "AB",
  1001. lodsb_0 = "AC",
  1002. lodsw_0 = "66AD",
  1003. lodsd_0 = "AD",
  1004. scasb_0 = "AE",
  1005. scasw_0 = "66AF",
  1006. scasd_0 = "AF",
  1007. -- B0-B7: mov rb,i
  1008. -- B8-BF: mov rdw,i
  1009. -- C0: rol... mb,i
  1010. -- C1: rol... mdw,i
  1011. ret_1 = "i.:nC2W",
  1012. ret_0 = "C3",
  1013. -- C4: *les rdw,mq
  1014. -- C5: *lds rdw,mq
  1015. -- C6: mov mb,i
  1016. -- C7: mov mdw,i
  1017. -- C8: *enter iw,ib
  1018. leave_0 = "C9",
  1019. -- CA: *retf iw
  1020. -- CB: *retf
  1021. int3_0 = "CC",
  1022. int_1 = "i.:nCDU",
  1023. into_0 = "CE",
  1024. -- CF: *iret
  1025. -- D0: rol... mb,1
  1026. -- D1: rol... mdw,1
  1027. -- D2: rol... mb,cl
  1028. -- D3: rol... mb,cl
  1029. -- D4: *aam ib
  1030. -- D5: *aad ib
  1031. -- D6: *salc
  1032. -- D7: *xlat
  1033. -- D8-DF: floating point ops
  1034. -- E0: *loopne
  1035. -- E1: *loope
  1036. -- E2: *loop
  1037. -- E3: *jcxz, *jecxz
  1038. -- E4: *in Rb,ib
  1039. -- E5: *in Rdw,ib
  1040. -- E6: *out ib,Rb
  1041. -- E7: *out ib,Rdw
  1042. call_1 = x64 and "mq:nFF2m|J.:E8nJ" or "md:FF2m|J.:E8J",
  1043. jmp_1 = x64 and "mq:nFF4m|J.:E9nJ" or "md:FF4m|J.:E9J", -- short: EB
  1044. -- EA: *jmp iw:idw
  1045. -- EB: jmp ib
  1046. -- EC: *in Rb,dx
  1047. -- ED: *in Rdw,dx
  1048. -- EE: *out dx,Rb
  1049. -- EF: *out dx,Rdw
  1050. lock_0 = "F0",
  1051. int1_0 = "F1",
  1052. repne_0 = "F2",
  1053. repnz_0 = "F2",
  1054. rep_0 = "F3",
  1055. repe_0 = "F3",
  1056. repz_0 = "F3",
  1057. -- F4: *hlt
  1058. cmc_0 = "F5",
  1059. -- F6: test... mb,i; div... mb
  1060. -- F7: test... mdw,i; div... mdw
  1061. clc_0 = "F8",
  1062. stc_0 = "F9",
  1063. -- FA: *cli
  1064. cld_0 = "FC",
  1065. std_0 = "FD",
  1066. -- FE: inc... mb
  1067. -- FF: inc... mdw
  1068. -- misc ops
  1069. not_1 = "m:F72m",
  1070. neg_1 = "m:F73m",
  1071. mul_1 = "m:F74m",
  1072. imul_1 = "m:F75m",
  1073. div_1 = "m:F76m",
  1074. idiv_1 = "m:F77m",
  1075. imul_2 = "rmqdw:0FAFrM|rIqdw:69rmI|rSqdw:6BrmS|riqdw:69rmi",
  1076. imul_3 = "rmIqdw:69rMI|rmSqdw:6BrMS|rmiqdw:69rMi",
  1077. movzx_2 = "rm/db:0FB6rM|rm/qb:|rm/wb:0FB6rM|rm/dw:0FB7rM|rm/qw:",
  1078. movsx_2 = "rm/db:0FBErM|rm/qb:|rm/wb:0FBErM|rm/dw:0FBFrM|rm/qw:",
  1079. bswap_1 = "rqd:0FC8r",
  1080. bsf_2 = "rmqdw:0FBCrM",
  1081. bsr_2 = "rmqdw:0FBDrM",
  1082. bt_2 = "mrqdw:0FA3Rm|miqdw:0FBA4mU",
  1083. btc_2 = "mrqdw:0FBBRm|miqdw:0FBA7mU",
  1084. btr_2 = "mrqdw:0FB3Rm|miqdw:0FBA6mU",
  1085. bts_2 = "mrqdw:0FABRm|miqdw:0FBA5mU",
  1086. shld_3 = "mriqdw:0FA4RmU|mrC/qq:0FA5Rm|mrC/dd:|mrC/ww:",
  1087. shrd_3 = "mriqdw:0FACRmU|mrC/qq:0FADRm|mrC/dd:|mrC/ww:",
  1088. rdtsc_0 = "0F31", -- P1+
  1089. rdpmc_0 = "0F33", -- P6+
  1090. cpuid_0 = "0FA2", -- P1+
  1091. -- floating point ops
  1092. fst_1 = "ff:DDD0r|xd:D92m|xq:nDD2m",
  1093. fstp_1 = "ff:DDD8r|xd:D93m|xq:nDD3m|xt:DB7m",
  1094. fld_1 = "ff:D9C0r|xd:D90m|xq:nDD0m|xt:DB5m",
  1095. fpop_0 = "DDD8", -- Alias for fstp st0.
  1096. fist_1 = "xw:nDF2m|xd:DB2m",
  1097. fistp_1 = "xw:nDF3m|xd:DB3m|xq:nDF7m",
  1098. fild_1 = "xw:nDF0m|xd:DB0m|xq:nDF5m",
  1099. fxch_0 = "D9C9",
  1100. fxch_1 = "ff:D9C8r",
  1101. fxch_2 = "fFf:D9C8r|Fff:D9C8R",
  1102. fucom_1 = "ff:DDE0r",
  1103. fucom_2 = "Fff:DDE0R",
  1104. fucomp_1 = "ff:DDE8r",
  1105. fucomp_2 = "Fff:DDE8R",
  1106. fucomi_1 = "ff:DBE8r", -- P6+
  1107. fucomi_2 = "Fff:DBE8R", -- P6+
  1108. fucomip_1 = "ff:DFE8r", -- P6+
  1109. fucomip_2 = "Fff:DFE8R", -- P6+
  1110. fcomi_1 = "ff:DBF0r", -- P6+
  1111. fcomi_2 = "Fff:DBF0R", -- P6+
  1112. fcomip_1 = "ff:DFF0r", -- P6+
  1113. fcomip_2 = "Fff:DFF0R", -- P6+
  1114. fucompp_0 = "DAE9",
  1115. fcompp_0 = "DED9",
  1116. fldenv_1 = "x.:D94m",
  1117. fnstenv_1 = "x.:D96m",
  1118. fstenv_1 = "x.:9BD96m",
  1119. fldcw_1 = "xw:nD95m",
  1120. fstcw_1 = "xw:n9BD97m",
  1121. fnstcw_1 = "xw:nD97m",
  1122. fstsw_1 = "Rw:n9BDFE0|xw:n9BDD7m",
  1123. fnstsw_1 = "Rw:nDFE0|xw:nDD7m",
  1124. fclex_0 = "9BDBE2",
  1125. fnclex_0 = "DBE2",
  1126. fnop_0 = "D9D0",
  1127. -- D9D1-D9DF: unassigned
  1128. fchs_0 = "D9E0",
  1129. fabs_0 = "D9E1",
  1130. -- D9E2: unassigned
  1131. -- D9E3: unassigned
  1132. ftst_0 = "D9E4",
  1133. fxam_0 = "D9E5",
  1134. -- D9E6: unassigned
  1135. -- D9E7: unassigned
  1136. fld1_0 = "D9E8",
  1137. fldl2t_0 = "D9E9",
  1138. fldl2e_0 = "D9EA",
  1139. fldpi_0 = "D9EB",
  1140. fldlg2_0 = "D9EC",
  1141. fldln2_0 = "D9ED",
  1142. fldz_0 = "D9EE",
  1143. -- D9EF: unassigned
  1144. f2xm1_0 = "D9F0",
  1145. fyl2x_0 = "D9F1",
  1146. fptan_0 = "D9F2",
  1147. fpatan_0 = "D9F3",
  1148. fxtract_0 = "D9F4",
  1149. fprem1_0 = "D9F5",
  1150. fdecstp_0 = "D9F6",
  1151. fincstp_0 = "D9F7",
  1152. fprem_0 = "D9F8",
  1153. fyl2xp1_0 = "D9F9",
  1154. fsqrt_0 = "D9FA",
  1155. fsincos_0 = "D9FB",
  1156. frndint_0 = "D9FC",
  1157. fscale_0 = "D9FD",
  1158. fsin_0 = "D9FE",
  1159. fcos_0 = "D9FF",
  1160. -- SSE, SSE2
  1161. andnpd_2 = "rmo:660F55rM",
  1162. andnps_2 = "rmo:0F55rM",
  1163. andpd_2 = "rmo:660F54rM",
  1164. andps_2 = "rmo:0F54rM",
  1165. clflush_1 = "x.:0FAE7m",
  1166. cmppd_3 = "rmio:660FC2rMU",
  1167. cmpps_3 = "rmio:0FC2rMU",
  1168. cmpsd_3 = "rrio:F20FC2rMU|rxi/oq:",
  1169. cmpss_3 = "rrio:F30FC2rMU|rxi/od:",
  1170. comisd_2 = "rro:660F2FrM|rx/oq:",
  1171. comiss_2 = "rro:0F2FrM|rx/od:",
  1172. cvtdq2pd_2 = "rro:F30FE6rM|rx/oq:",
  1173. cvtdq2ps_2 = "rmo:0F5BrM",
  1174. cvtpd2dq_2 = "rmo:F20FE6rM",
  1175. cvtpd2ps_2 = "rmo:660F5ArM",
  1176. cvtpi2pd_2 = "rx/oq:660F2ArM",
  1177. cvtpi2ps_2 = "rx/oq:0F2ArM",
  1178. cvtps2dq_2 = "rmo:660F5BrM",
  1179. cvtps2pd_2 = "rro:0F5ArM|rx/oq:",
  1180. cvtsd2si_2 = "rr/do:F20F2DrM|rr/qo:|rx/dq:|rxq:",
  1181. cvtsd2ss_2 = "rro:F20F5ArM|rx/oq:",
  1182. cvtsi2sd_2 = "rm/od:F20F2ArM|rm/oq:F20F2ArXM",
  1183. cvtsi2ss_2 = "rm/od:F30F2ArM|rm/oq:F30F2ArXM",
  1184. cvtss2sd_2 = "rro:F30F5ArM|rx/od:",
  1185. cvtss2si_2 = "rr/do:F30F2DrM|rr/qo:|rxd:|rx/qd:",
  1186. cvttpd2dq_2 = "rmo:660FE6rM",
  1187. cvttps2dq_2 = "rmo:F30F5BrM",
  1188. cvttsd2si_2 = "rr/do:F20F2CrM|rr/qo:|rx/dq:|rxq:",
  1189. cvttss2si_2 = "rr/do:F30F2CrM|rr/qo:|rxd:|rx/qd:",
  1190. fxsave_1 = "x.:0FAE0m",
  1191. fxrstor_1 = "x.:0FAE1m",
  1192. ldmxcsr_1 = "xd:0FAE2m",
  1193. lfence_0 = "0FAEE8",
  1194. maskmovdqu_2 = "rro:660FF7rM",
  1195. mfence_0 = "0FAEF0",
  1196. movapd_2 = "rmo:660F28rM|mro:660F29Rm",
  1197. movaps_2 = "rmo:0F28rM|mro:0F29Rm",
  1198. movd_2 = "rm/od:660F6ErM|rm/oq:660F6ErXM|mr/do:660F7ERm|mr/qo:",
  1199. movdqa_2 = "rmo:660F6FrM|mro:660F7FRm",
  1200. movdqu_2 = "rmo:F30F6FrM|mro:F30F7FRm",
  1201. movhlps_2 = "rro:0F12rM",
  1202. movhpd_2 = "rx/oq:660F16rM|xr/qo:n660F17Rm",
  1203. movhps_2 = "rx/oq:0F16rM|xr/qo:n0F17Rm",
  1204. movlhps_2 = "rro:0F16rM",
  1205. movlpd_2 = "rx/oq:660F12rM|xr/qo:n660F13Rm",
  1206. movlps_2 = "rx/oq:0F12rM|xr/qo:n0F13Rm",
  1207. movmskpd_2 = "rr/do:660F50rM",
  1208. movmskps_2 = "rr/do:0F50rM",
  1209. movntdq_2 = "xro:660FE7Rm",
  1210. movnti_2 = "xrqd:0FC3Rm",
  1211. movntpd_2 = "xro:660F2BRm",
  1212. movntps_2 = "xro:0F2BRm",
  1213. movq_2 = "rro:F30F7ErM|rx/oq:|xr/qo:n660FD6Rm",
  1214. movsd_2 = "rro:F20F10rM|rx/oq:|xr/qo:nF20F11Rm",
  1215. movss_2 = "rro:F30F10rM|rx/od:|xr/do:F30F11Rm",
  1216. movupd_2 = "rmo:660F10rM|mro:660F11Rm",
  1217. movups_2 = "rmo:0F10rM|mro:0F11Rm",
  1218. orpd_2 = "rmo:660F56rM",
  1219. orps_2 = "rmo:0F56rM",
  1220. pause_0 = "F390",
  1221. pextrw_3 = "rri/do:660FC5rMU|xri/wo:660F3A15nRmU", -- Mem op: SSE4.1 only.
  1222. pinsrw_3 = "rri/od:660FC4rMU|rxi/ow:",
  1223. pmovmskb_2 = "rr/do:660FD7rM",
  1224. prefetchnta_1 = "xb:n0F180m",
  1225. prefetcht0_1 = "xb:n0F181m",
  1226. prefetcht1_1 = "xb:n0F182m",
  1227. prefetcht2_1 = "xb:n0F183m",
  1228. pshufd_3 = "rmio:660F70rMU",
  1229. pshufhw_3 = "rmio:F30F70rMU",
  1230. pshuflw_3 = "rmio:F20F70rMU",
  1231. pslld_2 = "rmo:660FF2rM|rio:660F726mU",
  1232. pslldq_2 = "rio:660F737mU",
  1233. psllq_2 = "rmo:660FF3rM|rio:660F736mU",
  1234. psllw_2 = "rmo:660FF1rM|rio:660F716mU",
  1235. psrad_2 = "rmo:660FE2rM|rio:660F724mU",
  1236. psraw_2 = "rmo:660FE1rM|rio:660F714mU",
  1237. psrld_2 = "rmo:660FD2rM|rio:660F722mU",
  1238. psrldq_2 = "rio:660F733mU",
  1239. psrlq_2 = "rmo:660FD3rM|rio:660F732mU",
  1240. psrlw_2 = "rmo:660FD1rM|rio:660F712mU",
  1241. rcpps_2 = "rmo:0F53rM",
  1242. rcpss_2 = "rro:F30F53rM|rx/od:",
  1243. rsqrtps_2 = "rmo:0F52rM",
  1244. rsqrtss_2 = "rmo:F30F52rM",
  1245. sfence_0 = "0FAEF8",
  1246. shufpd_3 = "rmio:660FC6rMU",
  1247. shufps_3 = "rmio:0FC6rMU",
  1248. stmxcsr_1 = "xd:0FAE3m",
  1249. ucomisd_2 = "rro:660F2ErM|rx/oq:",
  1250. ucomiss_2 = "rro:0F2ErM|rx/od:",
  1251. unpckhpd_2 = "rmo:660F15rM",
  1252. unpckhps_2 = "rmo:0F15rM",
  1253. unpcklpd_2 = "rmo:660F14rM",
  1254. unpcklps_2 = "rmo:0F14rM",
  1255. xorpd_2 = "rmo:660F57rM",
  1256. xorps_2 = "rmo:0F57rM",
  1257. -- SSE3 ops
  1258. fisttp_1 = "xw:nDF1m|xd:DB1m|xq:nDD1m",
  1259. addsubpd_2 = "rmo:660FD0rM",
  1260. addsubps_2 = "rmo:F20FD0rM",
  1261. haddpd_2 = "rmo:660F7CrM",
  1262. haddps_2 = "rmo:F20F7CrM",
  1263. hsubpd_2 = "rmo:660F7DrM",
  1264. hsubps_2 = "rmo:F20F7DrM",
  1265. lddqu_2 = "rxo:F20FF0rM",
  1266. movddup_2 = "rmo:F20F12rM",
  1267. movshdup_2 = "rmo:F30F16rM",
  1268. movsldup_2 = "rmo:F30F12rM",
  1269. -- SSSE3 ops
  1270. pabsb_2 = "rmo:660F381CrM",
  1271. pabsd_2 = "rmo:660F381ErM",
  1272. pabsw_2 = "rmo:660F381DrM",
  1273. palignr_3 = "rmio:660F3A0FrMU",
  1274. phaddd_2 = "rmo:660F3802rM",
  1275. phaddsw_2 = "rmo:660F3803rM",
  1276. phaddw_2 = "rmo:660F3801rM",
  1277. phsubd_2 = "rmo:660F3806rM",
  1278. phsubsw_2 = "rmo:660F3807rM",
  1279. phsubw_2 = "rmo:660F3805rM",
  1280. pmaddubsw_2 = "rmo:660F3804rM",
  1281. pmulhrsw_2 = "rmo:660F380BrM",
  1282. pshufb_2 = "rmo:660F3800rM",
  1283. psignb_2 = "rmo:660F3808rM",
  1284. psignd_2 = "rmo:660F380ArM",
  1285. psignw_2 = "rmo:660F3809rM",
  1286. -- SSE4.1 ops
  1287. blendpd_3 = "rmio:660F3A0DrMU",
  1288. blendps_3 = "rmio:660F3A0CrMU",
  1289. blendvpd_3 = "rmRo:660F3815rM",
  1290. blendvps_3 = "rmRo:660F3814rM",
  1291. dppd_3 = "rmio:660F3A41rMU",
  1292. dpps_3 = "rmio:660F3A40rMU",
  1293. extractps_3 = "mri/do:660F3A17RmU|rri/qo:660F3A17RXmU",
  1294. insertps_3 = "rrio:660F3A41rMU|rxi/od:",
  1295. movntdqa_2 = "rxo:660F382ArM",
  1296. mpsadbw_3 = "rmio:660F3A42rMU",
  1297. packusdw_2 = "rmo:660F382BrM",
  1298. pblendvb_3 = "rmRo:660F3810rM",
  1299. pblendw_3 = "rmio:660F3A0ErMU",
  1300. pcmpeqq_2 = "rmo:660F3829rM",
  1301. pextrb_3 = "rri/do:660F3A14nRmU|rri/qo:|xri/bo:",
  1302. pextrd_3 = "mri/do:660F3A16RmU",
  1303. pextrq_3 = "mri/qo:660F3A16RmU",
  1304. -- pextrw is SSE2, mem operand is SSE4.1 only
  1305. phminposuw_2 = "rmo:660F3841rM",
  1306. pinsrb_3 = "rri/od:660F3A20nrMU|rxi/ob:",
  1307. pinsrd_3 = "rmi/od:660F3A22rMU",
  1308. pinsrq_3 = "rmi/oq:660F3A22rXMU",
  1309. pmaxsb_2 = "rmo:660F383CrM",
  1310. pmaxsd_2 = "rmo:660F383DrM",
  1311. pmaxud_2 = "rmo:660F383FrM",
  1312. pmaxuw_2 = "rmo:660F383ErM",
  1313. pminsb_2 = "rmo:660F3838rM",
  1314. pminsd_2 = "rmo:660F3839rM",
  1315. pminud_2 = "rmo:660F383BrM",
  1316. pminuw_2 = "rmo:660F383ArM",
  1317. pmovsxbd_2 = "rro:660F3821rM|rx/od:",
  1318. pmovsxbq_2 = "rro:660F3822rM|rx/ow:",
  1319. pmovsxbw_2 = "rro:660F3820rM|rx/oq:",
  1320. pmovsxdq_2 = "rro:660F3825rM|rx/oq:",
  1321. pmovsxwd_2 = "rro:660F3823rM|rx/oq:",
  1322. pmovsxwq_2 = "rro:660F3824rM|rx/od:",
  1323. pmovzxbd_2 = "rro:660F3831rM|rx/od:",
  1324. pmovzxbq_2 = "rro:660F3832rM|rx/ow:",
  1325. pmovzxbw_2 = "rro:660F3830rM|rx/oq:",
  1326. pmovzxdq_2 = "rro:660F3835rM|rx/oq:",
  1327. pmovzxwd_2 = "rro:660F3833rM|rx/oq:",
  1328. pmovzxwq_2 = "rro:660F3834rM|rx/od:",
  1329. pmuldq_2 = "rmo:660F3828rM",
  1330. pmulld_2 = "rmo:660F3840rM",
  1331. ptest_2 = "rmo:660F3817rM",
  1332. roundpd_3 = "rmio:660F3A09rMU",
  1333. roundps_3 = "rmio:660F3A08rMU",
  1334. roundsd_3 = "rrio:660F3A0BrMU|rxi/oq:",
  1335. roundss_3 = "rrio:660F3A0ArMU|rxi/od:",
  1336. -- SSE4.2 ops
  1337. crc32_2 = "rmqd:F20F38F1rM|rm/dw:66F20F38F1rM|rm/db:F20F38F0rM|rm/qb:",
  1338. pcmpestri_3 = "rmio:660F3A61rMU",
  1339. pcmpestrm_3 = "rmio:660F3A60rMU",
  1340. pcmpgtq_2 = "rmo:660F3837rM",
  1341. pcmpistri_3 = "rmio:660F3A63rMU",
  1342. pcmpistrm_3 = "rmio:660F3A62rMU",
  1343. popcnt_2 = "rmqdw:F30FB8rM",
  1344. -- SSE4a
  1345. extrq_2 = "rro:660F79rM",
  1346. extrq_3 = "riio:660F780mUU",
  1347. insertq_2 = "rro:F20F79rM",
  1348. insertq_4 = "rriio:F20F78rMUU",
  1349. lzcnt_2 = "rmqdw:F30FBDrM",
  1350. movntsd_2 = "xr/qo:nF20F2BRm",
  1351. movntss_2 = "xr/do:F30F2BRm",
  1352. -- popcnt is also in SSE4.2
  1353. -- AES-NI
  1354. aesdec_2 = "rmo:660F38DErM",
  1355. aesdeclast_2 = "rmo:660F38DFrM",
  1356. aesenc_2 = "rmo:660F38DCrM",
  1357. aesenclast_2 = "rmo:660F38DDrM",
  1358. aesimc_2 = "rmo:660F38DBrM",
  1359. aeskeygenassist_3 = "rmio:660F3ADFrMU",
  1360. pclmulqdq_3 = "rmio:660F3A44rMU",
  1361. -- AVX FP ops
  1362. vaddsubpd_3 = "rrmoy:660FVD0rM",
  1363. vaddsubps_3 = "rrmoy:F20FVD0rM",
  1364. vandpd_3 = "rrmoy:660FV54rM",
  1365. vandps_3 = "rrmoy:0FV54rM",
  1366. vandnpd_3 = "rrmoy:660FV55rM",
  1367. vandnps_3 = "rrmoy:0FV55rM",
  1368. vblendpd_4 = "rrmioy:660F3AV0DrMU",
  1369. vblendps_4 = "rrmioy:660F3AV0CrMU",
  1370. vblendvpd_4 = "rrmroy:660F3AV4BrMs",
  1371. vblendvps_4 = "rrmroy:660F3AV4ArMs",
  1372. vbroadcastf128_2 = "rx/yo:660F38u1ArM",
  1373. vcmppd_4 = "rrmioy:660FVC2rMU",
  1374. vcmpps_4 = "rrmioy:0FVC2rMU",
  1375. vcmpsd_4 = "rrrio:F20FVC2rMU|rrxi/ooq:",
  1376. vcmpss_4 = "rrrio:F30FVC2rMU|rrxi/ood:",
  1377. vcomisd_2 = "rro:660Fu2FrM|rx/oq:",
  1378. vcomiss_2 = "rro:0Fu2FrM|rx/od:",
  1379. vcvtdq2pd_2 = "rro:F30FuE6rM|rx/oq:|rm/yo:",
  1380. vcvtdq2ps_2 = "rmoy:0Fu5BrM",
  1381. vcvtpd2dq_2 = "rmoy:F20FuE6rM",
  1382. vcvtpd2ps_2 = "rmoy:660Fu5ArM",
  1383. vcvtps2dq_2 = "rmoy:660Fu5BrM",
  1384. vcvtps2pd_2 = "rro:0Fu5ArM|rx/oq:|rm/yo:",
  1385. vcvtsd2si_2 = "rr/do:F20Fu2DrM|rx/dq:|rr/qo:|rxq:",
  1386. vcvtsd2ss_3 = "rrro:F20FV5ArM|rrx/ooq:",
  1387. vcvtsi2sd_3 = "rrm/ood:F20FV2ArM|rrm/ooq:F20FVX2ArM",
  1388. vcvtsi2ss_3 = "rrm/ood:F30FV2ArM|rrm/ooq:F30FVX2ArM",
  1389. vcvtss2sd_3 = "rrro:F30FV5ArM|rrx/ood:",
  1390. vcvtss2si_2 = "rr/do:F30Fu2DrM|rxd:|rr/qo:|rx/qd:",
  1391. vcvttpd2dq_2 = "rmo:660FuE6rM|rm/oy:660FuLE6rM",
  1392. vcvttps2dq_2 = "rmoy:F30Fu5BrM",
  1393. vcvttsd2si_2 = "rr/do:F20Fu2CrM|rx/dq:|rr/qo:|rxq:",
  1394. vcvttss2si_2 = "rr/do:F30Fu2CrM|rxd:|rr/qo:|rx/qd:",
  1395. vdppd_4 = "rrmio:660F3AV41rMU",
  1396. vdpps_4 = "rrmioy:660F3AV40rMU",
  1397. vextractf128_3 = "mri/oy:660F3AuL19RmU",
  1398. vextractps_3 = "mri/do:660F3Au17RmU",
  1399. vhaddpd_3 = "rrmoy:660FV7CrM",
  1400. vhaddps_3 = "rrmoy:F20FV7CrM",
  1401. vhsubpd_3 = "rrmoy:660FV7DrM",
  1402. vhsubps_3 = "rrmoy:F20FV7DrM",
  1403. vinsertf128_4 = "rrmi/yyo:660F3AV18rMU",
  1404. vinsertps_4 = "rrrio:660F3AV21rMU|rrxi/ood:",
  1405. vldmxcsr_1 = "xd:0FuAE2m",
  1406. vmaskmovps_3 = "rrxoy:660F38V2CrM|xrroy:660F38V2ERm",
  1407. vmaskmovpd_3 = "rrxoy:660F38V2DrM|xrroy:660F38V2FRm",
  1408. vmovapd_2 = "rmoy:660Fu28rM|mroy:660Fu29Rm",
  1409. vmovaps_2 = "rmoy:0Fu28rM|mroy:0Fu29Rm",
  1410. vmovd_2 = "rm/od:660Fu6ErM|rm/oq:660FuX6ErM|mr/do:660Fu7ERm|mr/qo:",
  1411. vmovq_2 = "rro:F30Fu7ErM|rx/oq:|xr/qo:660FuD6Rm",
  1412. vmovddup_2 = "rmy:F20Fu12rM|rro:|rx/oq:",
  1413. vmovhlps_3 = "rrro:0FV12rM",
  1414. vmovhpd_2 = "xr/qo:660Fu17Rm",
  1415. vmovhpd_3 = "rrx/ooq:660FV16rM",
  1416. vmovhps_2 = "xr/qo:0Fu17Rm",
  1417. vmovhps_3 = "rrx/ooq:0FV16rM",
  1418. vmovlhps_3 = "rrro:0FV16rM",
  1419. vmovlpd_2 = "xr/qo:660Fu13Rm",
  1420. vmovlpd_3 = "rrx/ooq:660FV12rM",
  1421. vmovlps_2 = "xr/qo:0Fu13Rm",
  1422. vmovlps_3 = "rrx/ooq:0FV12rM",
  1423. vmovmskpd_2 = "rr/do:660Fu50rM|rr/dy:660FuL50rM",
  1424. vmovmskps_2 = "rr/do:0Fu50rM|rr/dy:0FuL50rM",
  1425. vmovntpd_2 = "xroy:660Fu2BRm",
  1426. vmovntps_2 = "xroy:0Fu2BRm",
  1427. vmovsd_2 = "rx/oq:F20Fu10rM|xr/qo:F20Fu11Rm",
  1428. vmovsd_3 = "rrro:F20FV10rM",
  1429. vmovshdup_2 = "rmoy:F30Fu16rM",
  1430. vmovsldup_2 = "rmoy:F30Fu12rM",
  1431. vmovss_2 = "rx/od:F30Fu10rM|xr/do:F30Fu11Rm",
  1432. vmovss_3 = "rrro:F30FV10rM",
  1433. vmovupd_2 = "rmoy:660Fu10rM|mroy:660Fu11Rm",
  1434. vmovups_2 = "rmoy:0Fu10rM|mroy:0Fu11Rm",
  1435. vorpd_3 = "rrmoy:660FV56rM",
  1436. vorps_3 = "rrmoy:0FV56rM",
  1437. vpermilpd_3 = "rrmoy:660F38V0DrM|rmioy:660F3Au05rMU",
  1438. vpermilps_3 = "rrmoy:660F38V0CrM|rmioy:660F3Au04rMU",
  1439. vperm2f128_4 = "rrmiy:660F3AV06rMU",
  1440. vptestpd_2 = "rmoy:660F38u0FrM",
  1441. vptestps_2 = "rmoy:660F38u0ErM",
  1442. vrcpps_2 = "rmoy:0Fu53rM",
  1443. vrcpss_3 = "rrro:F30FV53rM|rrx/ood:",
  1444. vrsqrtps_2 = "rmoy:0Fu52rM",
  1445. vrsqrtss_3 = "rrro:F30FV52rM|rrx/ood:",
  1446. vroundpd_3 = "rmioy:660F3Au09rMU",
  1447. vroundps_3 = "rmioy:660F3Au08rMU",
  1448. vroundsd_4 = "rrrio:660F3AV0BrMU|rrxi/ooq:",
  1449. vroundss_4 = "rrrio:660F3AV0ArMU|rrxi/ood:",
  1450. vshufpd_4 = "rrmioy:660FVC6rMU",
  1451. vshufps_4 = "rrmioy:0FVC6rMU",
  1452. vsqrtps_2 = "rmoy:0Fu51rM",
  1453. vsqrtss_2 = "rro:F30Fu51rM|rx/od:",
  1454. vsqrtpd_2 = "rmoy:660Fu51rM",
  1455. vsqrtsd_2 = "rro:F20Fu51rM|rx/oq:",
  1456. vstmxcsr_1 = "xd:0FuAE3m",
  1457. vucomisd_2 = "rro:660Fu2ErM|rx/oq:",
  1458. vucomiss_2 = "rro:0Fu2ErM|rx/od:",
  1459. vunpckhpd_3 = "rrmoy:660FV15rM",
  1460. vunpckhps_3 = "rrmoy:0FV15rM",
  1461. vunpcklpd_3 = "rrmoy:660FV14rM",
  1462. vunpcklps_3 = "rrmoy:0FV14rM",
  1463. vxorpd_3 = "rrmoy:660FV57rM",
  1464. vxorps_3 = "rrmoy:0FV57rM",
  1465. vzeroall_0 = "0FuL77",
  1466. vzeroupper_0 = "0Fu77",
  1467. -- AVX2 FP ops
  1468. vbroadcastss_2 = "rx/od:660F38u18rM|rx/yd:|rro:|rr/yo:",
  1469. vbroadcastsd_2 = "rx/yq:660F38u19rM|rr/yo:",
  1470. -- *vgather* (!vsib)
  1471. vpermpd_3 = "rmiy:660F3AuX01rMU",
  1472. vpermps_3 = "rrmy:660F38V16rM",
  1473. -- AVX, AVX2 integer ops
  1474. -- In general, xmm requires AVX, ymm requires AVX2.
  1475. vaesdec_3 = "rrmo:660F38VDErM",
  1476. vaesdeclast_3 = "rrmo:660F38VDFrM",
  1477. vaesenc_3 = "rrmo:660F38VDCrM",
  1478. vaesenclast_3 = "rrmo:660F38VDDrM",
  1479. vaesimc_2 = "rmo:660F38uDBrM",
  1480. vaeskeygenassist_3 = "rmio:660F3AuDFrMU",
  1481. vlddqu_2 = "rxoy:F20FuF0rM",
  1482. vmaskmovdqu_2 = "rro:660FuF7rM",
  1483. vmovdqa_2 = "rmoy:660Fu6FrM|mroy:660Fu7FRm",
  1484. vmovdqu_2 = "rmoy:F30Fu6FrM|mroy:F30Fu7FRm",
  1485. vmovntdq_2 = "xroy:660FuE7Rm",
  1486. vmovntdqa_2 = "rxoy:660F38u2ArM",
  1487. vmpsadbw_4 = "rrmioy:660F3AV42rMU",
  1488. vpabsb_2 = "rmoy:660F38u1CrM",
  1489. vpabsd_2 = "rmoy:660F38u1ErM",
  1490. vpabsw_2 = "rmoy:660F38u1DrM",
  1491. vpackusdw_3 = "rrmoy:660F38V2BrM",
  1492. vpalignr_4 = "rrmioy:660F3AV0FrMU",
  1493. vpblendvb_4 = "rrmroy:660F3AV4CrMs",
  1494. vpblendw_4 = "rrmioy:660F3AV0ErMU",
  1495. vpclmulqdq_4 = "rrmio:660F3AV44rMU",
  1496. vpcmpeqq_3 = "rrmoy:660F38V29rM",
  1497. vpcmpestri_3 = "rmio:660F3Au61rMU",
  1498. vpcmpestrm_3 = "rmio:660F3Au60rMU",
  1499. vpcmpgtq_3 = "rrmoy:660F38V37rM",
  1500. vpcmpistri_3 = "rmio:660F3Au63rMU",
  1501. vpcmpistrm_3 = "rmio:660F3Au62rMU",
  1502. vpextrb_3 = "rri/do:660F3Au14nRmU|rri/qo:|xri/bo:",
  1503. vpextrw_3 = "rri/do:660FuC5rMU|xri/wo:660F3Au15nRmU",
  1504. vpextrd_3 = "mri/do:660F3Au16RmU",
  1505. vpextrq_3 = "mri/qo:660F3Au16RmU",
  1506. vphaddw_3 = "rrmoy:660F38V01rM",
  1507. vphaddd_3 = "rrmoy:660F38V02rM",
  1508. vphaddsw_3 = "rrmoy:660F38V03rM",
  1509. vphminposuw_2 = "rmo:660F38u41rM",
  1510. vphsubw_3 = "rrmoy:660F38V05rM",
  1511. vphsubd_3 = "rrmoy:660F38V06rM",
  1512. vphsubsw_3 = "rrmoy:660F38V07rM",
  1513. vpinsrb_4 = "rrri/ood:660F3AV20rMU|rrxi/oob:",
  1514. vpinsrw_4 = "rrri/ood:660FVC4rMU|rrxi/oow:",
  1515. vpinsrd_4 = "rrmi/ood:660F3AV22rMU",
  1516. vpinsrq_4 = "rrmi/ooq:660F3AVX22rMU",
  1517. vpmaddubsw_3 = "rrmoy:660F38V04rM",
  1518. vpmaxsb_3 = "rrmoy:660F38V3CrM",
  1519. vpmaxsd_3 = "rrmoy:660F38V3DrM",
  1520. vpmaxuw_3 = "rrmoy:660F38V3ErM",
  1521. vpmaxud_3 = "rrmoy:660F38V3FrM",
  1522. vpminsb_3 = "rrmoy:660F38V38rM",
  1523. vpminsd_3 = "rrmoy:660F38V39rM",
  1524. vpminuw_3 = "rrmoy:660F38V3ArM",
  1525. vpminud_3 = "rrmoy:660F38V3BrM",
  1526. vpmovmskb_2 = "rr/do:660FuD7rM|rr/dy:660FuLD7rM",
  1527. vpmovsxbw_2 = "rroy:660F38u20rM|rx/oq:|rx/yo:",
  1528. vpmovsxbd_2 = "rroy:660F38u21rM|rx/od:|rx/yq:",
  1529. vpmovsxbq_2 = "rroy:660F38u22rM|rx/ow:|rx/yd:",
  1530. vpmovsxwd_2 = "rroy:660F38u23rM|rx/oq:|rx/yo:",
  1531. vpmovsxwq_2 = "rroy:660F38u24rM|rx/od:|rx/yq:",
  1532. vpmovsxdq_2 = "rroy:660F38u25rM|rx/oq:|rx/yo:",
  1533. vpmovzxbw_2 = "rroy:660F38u30rM|rx/oq:|rx/yo:",
  1534. vpmovzxbd_2 = "rroy:660F38u31rM|rx/od:|rx/yq:",
  1535. vpmovzxbq_2 = "rroy:660F38u32rM|rx/ow:|rx/yd:",
  1536. vpmovzxwd_2 = "rroy:660F38u33rM|rx/oq:|rx/yo:",
  1537. vpmovzxwq_2 = "rroy:660F38u34rM|rx/od:|rx/yq:",
  1538. vpmovzxdq_2 = "rroy:660F38u35rM|rx/oq:|rx/yo:",
  1539. vpmuldq_3 = "rrmoy:660F38V28rM",
  1540. vpmulhrsw_3 = "rrmoy:660F38V0BrM",
  1541. vpmulld_3 = "rrmoy:660F38V40rM",
  1542. vpshufb_3 = "rrmoy:660F38V00rM",
  1543. vpshufd_3 = "rmioy:660Fu70rMU",
  1544. vpshufhw_3 = "rmioy:F30Fu70rMU",
  1545. vpshuflw_3 = "rmioy:F20Fu70rMU",
  1546. vpsignb_3 = "rrmoy:660F38V08rM",
  1547. vpsignw_3 = "rrmoy:660F38V09rM",
  1548. vpsignd_3 = "rrmoy:660F38V0ArM",
  1549. vpslldq_3 = "rrioy:660Fv737mU",
  1550. vpsllw_3 = "rrmoy:660FVF1rM|rrioy:660Fv716mU",
  1551. vpslld_3 = "rrmoy:660FVF2rM|rrioy:660Fv726mU",
  1552. vpsllq_3 = "rrmoy:660FVF3rM|rrioy:660Fv736mU",
  1553. vpsraw_3 = "rrmoy:660FVE1rM|rrioy:660Fv714mU",
  1554. vpsrad_3 = "rrmoy:660FVE2rM|rrioy:660Fv724mU",
  1555. vpsrldq_3 = "rrioy:660Fv733mU",
  1556. vpsrlw_3 = "rrmoy:660FVD1rM|rrioy:660Fv712mU",
  1557. vpsrld_3 = "rrmoy:660FVD2rM|rrioy:660Fv722mU",
  1558. vpsrlq_3 = "rrmoy:660FVD3rM|rrioy:660Fv732mU",
  1559. vptest_2 = "rmoy:660F38u17rM",
  1560. -- AVX2 integer ops
  1561. vbroadcasti128_2 = "rx/yo:660F38u5ArM",
  1562. vinserti128_4 = "rrmi/yyo:660F3AV38rMU",
  1563. vextracti128_3 = "mri/oy:660F3AuL39RmU",
  1564. vpblendd_4 = "rrmioy:660F3AV02rMU",
  1565. vpbroadcastb_2 = "rro:660F38u78rM|rx/ob:|rr/yo:|rx/yb:",
  1566. vpbroadcastw_2 = "rro:660F38u79rM|rx/ow:|rr/yo:|rx/yw:",
  1567. vpbroadcastd_2 = "rro:660F38u58rM|rx/od:|rr/yo:|rx/yd:",
  1568. vpbroadcastq_2 = "rro:660F38u59rM|rx/oq:|rr/yo:|rx/yq:",
  1569. vpermd_3 = "rrmy:660F38V36rM",
  1570. vpermq_3 = "rmiy:660F3AuX00rMU",
  1571. -- *vpgather* (!vsib)
  1572. vperm2i128_4 = "rrmiy:660F3AV46rMU",
  1573. vpmaskmovd_3 = "rrxoy:660F38V8CrM|xrroy:660F38V8ERm",
  1574. vpmaskmovq_3 = "rrxoy:660F38VX8CrM|xrroy:660F38VX8ERm",
  1575. vpsllvd_3 = "rrmoy:660F38V47rM",
  1576. vpsllvq_3 = "rrmoy:660F38VX47rM",
  1577. vpsravd_3 = "rrmoy:660F38V46rM",
  1578. vpsrlvd_3 = "rrmoy:660F38V45rM",
  1579. vpsrlvq_3 = "rrmoy:660F38VX45rM",
  1580. -- Intel ADX
  1581. adcx_2 = "rmqd:660F38F6rM",
  1582. adox_2 = "rmqd:F30F38F6rM",
  1583. -- BMI1
  1584. andn_3 = "rrmqd:0F38VF2rM",
  1585. bextr_3 = "rmrqd:0F38wF7rM",
  1586. blsi_2 = "rmqd:0F38vF33m",
  1587. blsmsk_2 = "rmqd:0F38vF32m",
  1588. blsr_2 = "rmqd:0F38vF31m",
  1589. tzcnt_2 = "rmqdw:F30FBCrM",
  1590. -- BMI2
  1591. bzhi_3 = "rmrqd:0F38wF5rM",
  1592. mulx_3 = "rrmqd:F20F38VF6rM",
  1593. pdep_3 = "rrmqd:F20F38VF5rM",
  1594. pext_3 = "rrmqd:F30F38VF5rM",
  1595. rorx_3 = "rmSqd:F20F3AuF0rMS",
  1596. sarx_3 = "rmrqd:F30F38wF7rM",
  1597. shrx_3 = "rmrqd:F20F38wF7rM",
  1598. shlx_3 = "rmrqd:660F38wF7rM",
  1599. -- FMA3
  1600. vfmaddsub132pd_3 = "rrmoy:660F38VX96rM",
  1601. vfmaddsub132ps_3 = "rrmoy:660F38V96rM",
  1602. vfmaddsub213pd_3 = "rrmoy:660F38VXA6rM",
  1603. vfmaddsub213ps_3 = "rrmoy:660F38VA6rM",
  1604. vfmaddsub231pd_3 = "rrmoy:660F38VXB6rM",
  1605. vfmaddsub231ps_3 = "rrmoy:660F38VB6rM",
  1606. vfmsubadd132pd_3 = "rrmoy:660F38VX97rM",
  1607. vfmsubadd132ps_3 = "rrmoy:660F38V97rM",
  1608. vfmsubadd213pd_3 = "rrmoy:660F38VXA7rM",
  1609. vfmsubadd213ps_3 = "rrmoy:660F38VA7rM",
  1610. vfmsubadd231pd_3 = "rrmoy:660F38VXB7rM",
  1611. vfmsubadd231ps_3 = "rrmoy:660F38VB7rM",
  1612. vfmadd132pd_3 = "rrmoy:660F38VX98rM",
  1613. vfmadd132ps_3 = "rrmoy:660F38V98rM",
  1614. vfmadd132sd_3 = "rrro:660F38VX99rM|rrx/ooq:",
  1615. vfmadd132ss_3 = "rrro:660F38V99rM|rrx/ood:",
  1616. vfmadd213pd_3 = "rrmoy:660F38VXA8rM",
  1617. vfmadd213ps_3 = "rrmoy:660F38VA8rM",
  1618. vfmadd213sd_3 = "rrro:660F38VXA9rM|rrx/ooq:",
  1619. vfmadd213ss_3 = "rrro:660F38VA9rM|rrx/ood:",
  1620. vfmadd231pd_3 = "rrmoy:660F38VXB8rM",
  1621. vfmadd231ps_3 = "rrmoy:660F38VB8rM",
  1622. vfmadd231sd_3 = "rrro:660F38VXB9rM|rrx/ooq:",
  1623. vfmadd231ss_3 = "rrro:660F38VB9rM|rrx/ood:",
  1624. vfmsub132pd_3 = "rrmoy:660F38VX9ArM",
  1625. vfmsub132ps_3 = "rrmoy:660F38V9ArM",
  1626. vfmsub132sd_3 = "rrro:660F38VX9BrM|rrx/ooq:",
  1627. vfmsub132ss_3 = "rrro:660F38V9BrM|rrx/ood:",
  1628. vfmsub213pd_3 = "rrmoy:660F38VXAArM",
  1629. vfmsub213ps_3 = "rrmoy:660F38VAArM",
  1630. vfmsub213sd_3 = "rrro:660F38VXABrM|rrx/ooq:",
  1631. vfmsub213ss_3 = "rrro:660F38VABrM|rrx/ood:",
  1632. vfmsub231pd_3 = "rrmoy:660F38VXBArM",
  1633. vfmsub231ps_3 = "rrmoy:660F38VBArM",
  1634. vfmsub231sd_3 = "rrro:660F38VXBBrM|rrx/ooq:",
  1635. vfmsub231ss_3 = "rrro:660F38VBBrM|rrx/ood:",
  1636. vfnmadd132pd_3 = "rrmoy:660F38VX9CrM",
  1637. vfnmadd132ps_3 = "rrmoy:660F38V9CrM",
  1638. vfnmadd132sd_3 = "rrro:660F38VX9DrM|rrx/ooq:",
  1639. vfnmadd132ss_3 = "rrro:660F38V9DrM|rrx/ood:",
  1640. vfnmadd213pd_3 = "rrmoy:660F38VXACrM",
  1641. vfnmadd213ps_3 = "rrmoy:660F38VACrM",
  1642. vfnmadd213sd_3 = "rrro:660F38VXADrM|rrx/ooq:",
  1643. vfnmadd213ss_3 = "rrro:660F38VADrM|rrx/ood:",
  1644. vfnmadd231pd_3 = "rrmoy:660F38VXBCrM",
  1645. vfnmadd231ps_3 = "rrmoy:660F38VBCrM",
  1646. vfnmadd231sd_3 = "rrro:660F38VXBDrM|rrx/ooq:",
  1647. vfnmadd231ss_3 = "rrro:660F38VBDrM|rrx/ood:",
  1648. vfnmsub132pd_3 = "rrmoy:660F38VX9ErM",
  1649. vfnmsub132ps_3 = "rrmoy:660F38V9ErM",
  1650. vfnmsub132sd_3 = "rrro:660F38VX9FrM|rrx/ooq:",
  1651. vfnmsub132ss_3 = "rrro:660F38V9FrM|rrx/ood:",
  1652. vfnmsub213pd_3 = "rrmoy:660F38VXAErM",
  1653. vfnmsub213ps_3 = "rrmoy:660F38VAErM",
  1654. vfnmsub213sd_3 = "rrro:660F38VXAFrM|rrx/ooq:",
  1655. vfnmsub213ss_3 = "rrro:660F38VAFrM|rrx/ood:",
  1656. vfnmsub231pd_3 = "rrmoy:660F38VXBErM",
  1657. vfnmsub231ps_3 = "rrmoy:660F38VBErM",
  1658. vfnmsub231sd_3 = "rrro:660F38VXBFrM|rrx/ooq:",
  1659. vfnmsub231ss_3 = "rrro:660F38VBFrM|rrx/ood:",
  1660. }
  1661. ------------------------------------------------------------------------------
  1662. -- Arithmetic ops.
  1663. for name,n in pairs{ add = 0, ["or"] = 1, adc = 2, sbb = 3,
  1664. ["and"] = 4, sub = 5, xor = 6, cmp = 7 } do
  1665. local n8 = shl(n, 3)
  1666. map_op[name.."_2"] = format(
  1667. "mr:%02XRm|rm:%02XrM|mI1qdw:81%XmI|mS1qdw:83%XmS|Ri1qdwb:%02Xri|mi1qdwb:81%Xmi",
  1668. 1+n8, 3+n8, n, n, 5+n8, n)
  1669. end
  1670. -- Shift ops.
  1671. for name,n in pairs{ rol = 0, ror = 1, rcl = 2, rcr = 3,
  1672. shl = 4, shr = 5, sar = 7, sal = 4 } do
  1673. map_op[name.."_2"] = format("m1:D1%Xm|mC1qdwb:D3%Xm|mi:C1%XmU", n, n, n)
  1674. end
  1675. -- Conditional ops.
  1676. for cc,n in pairs(map_cc) do
  1677. map_op["j"..cc.."_1"] = format("J.:n0F8%XJ", n) -- short: 7%X
  1678. map_op["set"..cc.."_1"] = format("mb:n0F9%X2m", n)
  1679. map_op["cmov"..cc.."_2"] = format("rmqdw:0F4%XrM", n) -- P6+
  1680. end
  1681. -- FP arithmetic ops.
  1682. for name,n in pairs{ add = 0, mul = 1, com = 2, comp = 3,
  1683. sub = 4, subr = 5, div = 6, divr = 7 } do
  1684. local nc = 0xc0 + shl(n, 3)
  1685. local nr = nc + (n < 4 and 0 or (n % 2 == 0 and 8 or -8))
  1686. local fn = "f"..name
  1687. map_op[fn.."_1"] = format("ff:D8%02Xr|xd:D8%Xm|xq:nDC%Xm", nc, n, n)
  1688. if n == 2 or n == 3 then
  1689. map_op[fn.."_2"] = format("Fff:D8%02XR|Fx2d:D8%XM|Fx2q:nDC%XM", nc, n, n)
  1690. else
  1691. map_op[fn.."_2"] = format("Fff:D8%02XR|fFf:DC%02Xr|Fx2d:D8%XM|Fx2q:nDC%XM", nc, nr, n, n)
  1692. map_op[fn.."p_1"] = format("ff:DE%02Xr", nr)
  1693. map_op[fn.."p_2"] = format("fFf:DE%02Xr", nr)
  1694. end
  1695. map_op["fi"..name.."_1"] = format("xd:DA%Xm|xw:nDE%Xm", n, n)
  1696. end
  1697. -- FP conditional moves.
  1698. for cc,n in pairs{ b=0, e=1, be=2, u=3, nb=4, ne=5, nbe=6, nu=7 } do
  1699. local nc = 0xdac0 + shl(band(n, 3), 3) + shl(band(n, 4), 6)
  1700. map_op["fcmov"..cc.."_1"] = format("ff:%04Xr", nc) -- P6+
  1701. map_op["fcmov"..cc.."_2"] = format("Fff:%04XR", nc) -- P6+
  1702. end
  1703. -- SSE / AVX FP arithmetic ops.
  1704. for name,n in pairs{ sqrt = 1, add = 8, mul = 9,
  1705. sub = 12, min = 13, div = 14, max = 15 } do
  1706. map_op[name.."ps_2"] = format("rmo:0F5%XrM", n)
  1707. map_op[name.."ss_2"] = format("rro:F30F5%XrM|rx/od:", n)
  1708. map_op[name.."pd_2"] = format("rmo:660F5%XrM", n)
  1709. map_op[name.."sd_2"] = format("rro:F20F5%XrM|rx/oq:", n)
  1710. if n ~= 1 then
  1711. map_op["v"..name.."ps_3"] = format("rrmoy:0FV5%XrM", n)
  1712. map_op["v"..name.."ss_3"] = format("rrro:F30FV5%XrM|rrx/ood:", n)
  1713. map_op["v"..name.."pd_3"] = format("rrmoy:660FV5%XrM", n)
  1714. map_op["v"..name.."sd_3"] = format("rrro:F20FV5%XrM|rrx/ooq:", n)
  1715. end
  1716. end
  1717. -- SSE2 / AVX / AVX2 integer arithmetic ops (66 0F leaf).
  1718. for name,n in pairs{
  1719. paddb = 0xFC, paddw = 0xFD, paddd = 0xFE, paddq = 0xD4,
  1720. paddsb = 0xEC, paddsw = 0xED, packssdw = 0x6B,
  1721. packsswb = 0x63, packuswb = 0x67, paddusb = 0xDC,
  1722. paddusw = 0xDD, pand = 0xDB, pandn = 0xDF, pavgb = 0xE0,
  1723. pavgw = 0xE3, pcmpeqb = 0x74, pcmpeqd = 0x76,
  1724. pcmpeqw = 0x75, pcmpgtb = 0x64, pcmpgtd = 0x66,
  1725. pcmpgtw = 0x65, pmaddwd = 0xF5, pmaxsw = 0xEE,
  1726. pmaxub = 0xDE, pminsw = 0xEA, pminub = 0xDA,
  1727. pmulhuw = 0xE4, pmulhw = 0xE5, pmullw = 0xD5,
  1728. pmuludq = 0xF4, por = 0xEB, psadbw = 0xF6, psubb = 0xF8,
  1729. psubw = 0xF9, psubd = 0xFA, psubq = 0xFB, psubsb = 0xE8,
  1730. psubsw = 0xE9, psubusb = 0xD8, psubusw = 0xD9,
  1731. punpckhbw = 0x68, punpckhwd = 0x69, punpckhdq = 0x6A,
  1732. punpckhqdq = 0x6D, punpcklbw = 0x60, punpcklwd = 0x61,
  1733. punpckldq = 0x62, punpcklqdq = 0x6C, pxor = 0xEF
  1734. } do
  1735. map_op[name.."_2"] = format("rmo:660F%02XrM", n)
  1736. map_op["v"..name.."_3"] = format("rrmoy:660FV%02XrM", n)
  1737. end
  1738. ------------------------------------------------------------------------------
  1739. local map_vexarg = { u = false, v = 1, V = 2, w = 3 }
  1740. -- Process pattern string.
  1741. local function dopattern(pat, args, sz, op, needrex)
  1742. local digit, addin, vex
  1743. local opcode = 0
  1744. local szov = sz
  1745. local narg = 1
  1746. local rex = 0
  1747. -- Limit number of section buffer positions used by a single dasm_put().
  1748. -- A single opcode needs a maximum of 6 positions.
  1749. if secpos+6 > maxsecpos then wflush() end
  1750. -- Process each character.
  1751. for c in gmatch(pat.."|", ".") do
  1752. if match(c, "%x") then -- Hex digit.
  1753. digit = byte(c) - 48
  1754. if digit > 48 then digit = digit - 39
  1755. elseif digit > 16 then digit = digit - 7 end
  1756. opcode = opcode*16 + digit
  1757. addin = nil
  1758. elseif c == "n" then -- Disable operand size mods for opcode.
  1759. szov = nil
  1760. elseif c == "X" then -- Force REX.W.
  1761. rex = 8
  1762. elseif c == "L" then -- Force VEX.L.
  1763. vex.l = true
  1764. elseif c == "r" then -- Merge 1st operand regno. into opcode.
  1765. addin = args[1]; opcode = opcode + (addin.reg % 8)
  1766. if narg < 2 then narg = 2 end
  1767. elseif c == "R" then -- Merge 2nd operand regno. into opcode.
  1768. addin = args[2]; opcode = opcode + (addin.reg % 8)
  1769. narg = 3
  1770. elseif c == "m" or c == "M" then -- Encode ModRM/SIB.
  1771. local s
  1772. if addin then
  1773. s = addin.reg
  1774. opcode = opcode - band(s, 7) -- Undo regno opcode merge.
  1775. else
  1776. s = band(opcode, 15) -- Undo last digit.
  1777. opcode = shr(opcode, 4)
  1778. end
  1779. local nn = c == "m" and 1 or 2
  1780. local t = args[nn]
  1781. if narg <= nn then narg = nn + 1 end
  1782. if szov == "q" and rex == 0 then rex = rex + 8 end
  1783. if t.reg and t.reg > 7 then rex = rex + 1 end
  1784. if t.xreg and t.xreg > 7 then rex = rex + 2 end
  1785. if s > 7 then rex = rex + 4 end
  1786. if needrex then rex = rex + 16 end
  1787. local psz, sk = wputop(szov, opcode, rex, vex, s < 0, t.vreg or t.vxreg)
  1788. opcode = nil
  1789. local imark = sub(pat, -1) -- Force a mark (ugly).
  1790. -- Put ModRM/SIB with regno/last digit as spare.
  1791. wputmrmsib(t, imark, s, addin and addin.vreg, psz, sk)
  1792. addin = nil
  1793. elseif map_vexarg[c] ~= nil then -- Encode using VEX prefix
  1794. local b = band(opcode, 255); opcode = shr(opcode, 8)
  1795. local m = 1
  1796. if b == 0x38 then m = 2
  1797. elseif b == 0x3a then m = 3 end
  1798. if m ~= 1 then b = band(opcode, 255); opcode = shr(opcode, 8) end
  1799. if b ~= 0x0f then
  1800. werror("expected `0F', `0F38', or `0F3A' to precede `"..c..
  1801. "' in pattern `"..pat.."' for `"..op.."'")
  1802. end
  1803. local v = map_vexarg[c]
  1804. if v then v = remove(args, v) end
  1805. b = band(opcode, 255)
  1806. local p = 0
  1807. if b == 0x66 then p = 1
  1808. elseif b == 0xf3 then p = 2
  1809. elseif b == 0xf2 then p = 3 end
  1810. if p ~= 0 then opcode = shr(opcode, 8) end
  1811. if opcode ~= 0 then wputop(nil, opcode, 0); opcode = 0 end
  1812. vex = { m = m, p = p, v = v }
  1813. else
  1814. if opcode then -- Flush opcode.
  1815. if szov == "q" and rex == 0 then rex = rex + 8 end
  1816. if needrex then rex = rex + 16 end
  1817. if addin and addin.reg == -1 then
  1818. local psz, sk = wputop(szov, opcode - 7, rex, vex, true)
  1819. wvreg("opcode", addin.vreg, psz, sk)
  1820. else
  1821. if addin and addin.reg > 7 then rex = rex + 1 end
  1822. wputop(szov, opcode, rex, vex)
  1823. end
  1824. opcode = nil
  1825. end
  1826. if c == "|" then break end
  1827. if c == "o" then -- Offset (pure 32 bit displacement).
  1828. wputdarg(args[1].disp); if narg < 2 then narg = 2 end
  1829. elseif c == "O" then
  1830. wputdarg(args[2].disp); narg = 3
  1831. else
  1832. -- Anything else is an immediate operand.
  1833. local a = args[narg]
  1834. narg = narg + 1
  1835. local mode, imm = a.mode, a.imm
  1836. if mode == "iJ" and not match(x64 and "J" or "iIJ", c) then
  1837. werror("bad operand size for label")
  1838. end
  1839. if c == "S" then
  1840. wputsbarg(imm)
  1841. elseif c == "U" then
  1842. wputbarg(imm)
  1843. elseif c == "W" then
  1844. wputwarg(imm)
  1845. elseif c == "i" or c == "I" then
  1846. if mode == "iJ" then
  1847. wputlabel("IMM_", imm, 1)
  1848. elseif mode == "iI" and c == "I" then
  1849. waction(sz == "w" and "IMM_WB" or "IMM_DB", imm)
  1850. else
  1851. wputszarg(sz, imm)
  1852. end
  1853. elseif c == "J" then
  1854. if mode == "iPJ" then
  1855. waction("REL_A", imm) -- !x64 (secpos)
  1856. else
  1857. wputlabel("REL_", imm, 2)
  1858. end
  1859. elseif c == "s" then
  1860. local reg = a.reg
  1861. if reg < 0 then
  1862. wputb(0)
  1863. wvreg("imm.hi", a.vreg)
  1864. else
  1865. wputb(shl(reg, 4))
  1866. end
  1867. else
  1868. werror("bad char `"..c.."' in pattern `"..pat.."' for `"..op.."'")
  1869. end
  1870. end
  1871. end
  1872. end
  1873. end
  1874. ------------------------------------------------------------------------------
  1875. -- Mapping of operand modes to short names. Suppress output with '#'.
  1876. local map_modename = {
  1877. r = "reg", R = "eax", C = "cl", x = "mem", m = "mrm", i = "imm",
  1878. f = "stx", F = "st0", J = "lbl", ["1"] = "1",
  1879. I = "#", S = "#", O = "#",
  1880. }
  1881. -- Return a table/string showing all possible operand modes.
  1882. local function templatehelp(template, nparams)
  1883. if nparams == 0 then return "" end
  1884. local t = {}
  1885. for tm in gmatch(template, "[^%|]+") do
  1886. local s = map_modename[sub(tm, 1, 1)]
  1887. s = s..gsub(sub(tm, 2, nparams), ".", function(c)
  1888. return ", "..map_modename[c]
  1889. end)
  1890. if not match(s, "#") then t[#t+1] = s end
  1891. end
  1892. return t
  1893. end
  1894. -- Match operand modes against mode match part of template.
  1895. local function matchtm(tm, args)
  1896. for i=1,#args do
  1897. if not match(args[i].mode, sub(tm, i, i)) then return end
  1898. end
  1899. return true
  1900. end
  1901. -- Handle opcodes defined with template strings.
  1902. map_op[".template__"] = function(params, template, nparams)
  1903. if not params then return templatehelp(template, nparams) end
  1904. local args = {}
  1905. -- Zero-operand opcodes have no match part.
  1906. if #params == 0 then
  1907. dopattern(template, args, "d", params.op, nil)
  1908. return
  1909. end
  1910. -- Determine common operand size (coerce undefined size) or flag as mixed.
  1911. local sz, szmix, needrex
  1912. for i,p in ipairs(params) do
  1913. args[i] = parseoperand(p)
  1914. local nsz = args[i].opsize
  1915. if nsz then
  1916. if sz and sz ~= nsz then szmix = true else sz = nsz end
  1917. end
  1918. local nrex = args[i].needrex
  1919. if nrex ~= nil then
  1920. if needrex == nil then
  1921. needrex = nrex
  1922. elseif needrex ~= nrex then
  1923. werror("bad mix of byte-addressable registers")
  1924. end
  1925. end
  1926. end
  1927. -- Try all match:pattern pairs (separated by '|').
  1928. local gotmatch, lastpat
  1929. for tm in gmatch(template, "[^%|]+") do
  1930. -- Split off size match (starts after mode match) and pattern string.
  1931. local szm, pat = match(tm, "^(.-):(.*)$", #args+1)
  1932. if pat == "" then pat = lastpat else lastpat = pat end
  1933. if matchtm(tm, args) then
  1934. local prefix = sub(szm, 1, 1)
  1935. if prefix == "/" then -- Exactly match leading operand sizes.
  1936. for i = #szm,1,-1 do
  1937. if i == 1 then
  1938. dopattern(pat, args, sz, params.op, needrex) -- Process pattern.
  1939. return
  1940. elseif args[i-1].opsize ~= sub(szm, i, i) then
  1941. break
  1942. end
  1943. end
  1944. else -- Match common operand size.
  1945. local szp = sz
  1946. if szm == "" then szm = x64 and "qdwb" or "dwb" end -- Default sizes.
  1947. if prefix == "1" then szp = args[1].opsize; szmix = nil
  1948. elseif prefix == "2" then szp = args[2].opsize; szmix = nil end
  1949. if not szmix and (prefix == "." or match(szm, szp or "#")) then
  1950. dopattern(pat, args, szp, params.op, needrex) -- Process pattern.
  1951. return
  1952. end
  1953. end
  1954. gotmatch = true
  1955. end
  1956. end
  1957. local msg = "bad operand mode"
  1958. if gotmatch then
  1959. if szmix then
  1960. msg = "mixed operand size"
  1961. else
  1962. msg = sz and "bad operand size" or "missing operand size"
  1963. end
  1964. end
  1965. werror(msg.." in `"..opmodestr(params.op, args).."'")
  1966. end
  1967. ------------------------------------------------------------------------------
  1968. -- x64-specific opcode for 64 bit immediates and displacements.
  1969. if x64 then
  1970. function map_op.mov64_2(params)
  1971. if not params then return { "reg, imm", "reg, [disp]", "[disp], reg" } end
  1972. if secpos+2 > maxsecpos then wflush() end
  1973. local opcode, op64, sz, rex, vreg
  1974. local op64 = match(params[1], "^%[%s*(.-)%s*%]$")
  1975. if op64 then
  1976. local a = parseoperand(params[2])
  1977. if a.mode ~= "rmR" then werror("bad operand mode") end
  1978. sz = a.opsize
  1979. rex = sz == "q" and 8 or 0
  1980. opcode = 0xa3
  1981. else
  1982. op64 = match(params[2], "^%[%s*(.-)%s*%]$")
  1983. local a = parseoperand(params[1])
  1984. if op64 then
  1985. if a.mode ~= "rmR" then werror("bad operand mode") end
  1986. sz = a.opsize
  1987. rex = sz == "q" and 8 or 0
  1988. opcode = 0xa1
  1989. else
  1990. if sub(a.mode, 1, 1) ~= "r" or a.opsize ~= "q" then
  1991. werror("bad operand mode")
  1992. end
  1993. op64 = params[2]
  1994. if a.reg == -1 then
  1995. vreg = a.vreg
  1996. opcode = 0xb8
  1997. else
  1998. opcode = 0xb8 + band(a.reg, 7)
  1999. end
  2000. rex = a.reg > 7 and 9 or 8
  2001. end
  2002. end
  2003. local psz, sk = wputop(sz, opcode, rex, nil, vreg)
  2004. wvreg("opcode", vreg, psz, sk)
  2005. waction("IMM_D", format("(unsigned int)(%s)", op64))
  2006. waction("IMM_D", format("(unsigned int)((%s)>>32)", op64))
  2007. end
  2008. end
  2009. ------------------------------------------------------------------------------
  2010. -- Pseudo-opcodes for data storage.
  2011. local function op_data(params)
  2012. if not params then return "imm..." end
  2013. local sz = sub(params.op, 2, 2)
  2014. if sz == "l" then sz = "d" elseif sz == "a" then sz = addrsize end
  2015. for _,p in ipairs(params) do
  2016. local a = parseoperand(p, sz == "q")
  2017. if sub(a.mode, 1, 1) ~= "i" or (a.opsize and a.opsize ~= sz) then
  2018. werror("bad mode or size in `"..p.."'")
  2019. end
  2020. if a.mode == "iJ" then
  2021. wputlabel("IMM_", a.imm, 1)
  2022. elseif sz == "q" then
  2023. wputqarg(a.imm)
  2024. else
  2025. wputszarg(sz, a.imm)
  2026. end
  2027. if secpos+2 > maxsecpos then wflush() end
  2028. end
  2029. end
  2030. map_op[".byte_*"] = op_data
  2031. map_op[".sbyte_*"] = op_data
  2032. map_op[".word_*"] = op_data
  2033. map_op[".dword_*"] = op_data
  2034. map_op[".qword_*"] = op_data
  2035. map_op[".aword_*"] = op_data
  2036. map_op[".long_*"] = op_data
  2037. map_op[".quad_*"] = op_data
  2038. map_op[".addr_*"] = op_data
  2039. ------------------------------------------------------------------------------
  2040. -- Pseudo-opcode to mark the position where the action list is to be emitted.
  2041. map_op[".actionlist_1"] = function(params)
  2042. if not params then return "cvar" end
  2043. local name = params[1] -- No syntax check. You get to keep the pieces.
  2044. wline(function(out) writeactions(out, name) end)
  2045. end
  2046. -- Pseudo-opcode to mark the position where the global enum is to be emitted.
  2047. map_op[".globals_1"] = function(params)
  2048. if not params then return "prefix" end
  2049. local prefix = params[1] -- No syntax check. You get to keep the pieces.
  2050. wline(function(out) writeglobals(out, prefix) end)
  2051. end
  2052. -- Pseudo-opcode to mark the position where the global names are to be emitted.
  2053. map_op[".globalnames_1"] = function(params)
  2054. if not params then return "cvar" end
  2055. local name = params[1] -- No syntax check. You get to keep the pieces.
  2056. wline(function(out) writeglobalnames(out, name) end)
  2057. end
  2058. -- Pseudo-opcode to mark the position where the extern names are to be emitted.
  2059. map_op[".externnames_1"] = function(params)
  2060. if not params then return "cvar" end
  2061. local name = params[1] -- No syntax check. You get to keep the pieces.
  2062. wline(function(out) writeexternnames(out, name) end)
  2063. end
  2064. ------------------------------------------------------------------------------
  2065. -- Label pseudo-opcode (converted from trailing colon form).
  2066. map_op[".label_2"] = function(params)
  2067. if not params then return "[1-9] | ->global | =>pcexpr [, addr]" end
  2068. if secpos+2 > maxsecpos then wflush() end
  2069. local a = parseoperand(params[1])
  2070. local mode, imm = a.mode, a.imm
  2071. if type(imm) == "number" and (mode == "iJ" or (imm >= 1 and imm <= 9)) then
  2072. -- Local label (1: ... 9:) or global label (->global:).
  2073. waction("LABEL_LG", nil, 1)
  2074. wputxb(imm)
  2075. elseif mode == "iJ" then
  2076. -- PC label (=>pcexpr:).
  2077. waction("LABEL_PC", imm)
  2078. else
  2079. werror("bad label definition")
  2080. end
  2081. -- SETLABEL must immediately follow LABEL_LG/LABEL_PC.
  2082. local addr = params[2]
  2083. if addr then
  2084. local a = parseoperand(addr)
  2085. if a.mode == "iPJ" then
  2086. waction("SETLABEL", a.imm)
  2087. else
  2088. werror("bad label assignment")
  2089. end
  2090. end
  2091. end
  2092. map_op[".label_1"] = map_op[".label_2"]
  2093. ------------------------------------------------------------------------------
  2094. -- Alignment pseudo-opcode.
  2095. map_op[".align_1"] = function(params)
  2096. if not params then return "numpow2" end
  2097. if secpos+1 > maxsecpos then wflush() end
  2098. local align = tonumber(params[1]) or map_opsizenum[map_opsize[params[1]]]
  2099. if align then
  2100. local x = align
  2101. -- Must be a power of 2 in the range (2 ... 256).
  2102. for i=1,8 do
  2103. x = x / 2
  2104. if x == 1 then
  2105. waction("ALIGN", nil, 1)
  2106. wputxb(align-1) -- Action byte is 2**n-1.
  2107. return
  2108. end
  2109. end
  2110. end
  2111. werror("bad alignment")
  2112. end
  2113. -- Spacing pseudo-opcode.
  2114. map_op[".space_2"] = function(params)
  2115. if not params then return "num [, filler]" end
  2116. if secpos+1 > maxsecpos then wflush() end
  2117. waction("SPACE", params[1])
  2118. local fill = params[2]
  2119. if fill then
  2120. fill = tonumber(fill)
  2121. if not fill or fill < 0 or fill > 255 then werror("bad filler") end
  2122. end
  2123. wputxb(fill or 0)
  2124. end
  2125. map_op[".space_1"] = map_op[".space_2"]
  2126. ------------------------------------------------------------------------------
  2127. -- Pseudo-opcode for (primitive) type definitions (map to C types).
  2128. map_op[".type_3"] = function(params, nparams)
  2129. if not params then
  2130. return nparams == 2 and "name, ctype" or "name, ctype, reg"
  2131. end
  2132. local name, ctype, reg = params[1], params[2], params[3]
  2133. if not match(name, "^[%a_][%w_]*$") then
  2134. werror("bad type name `"..name.."'")
  2135. end
  2136. local tp = map_type[name]
  2137. if tp then
  2138. werror("duplicate type `"..name.."'")
  2139. end
  2140. if reg and not map_reg_valid_base[reg] then
  2141. werror("bad base register `"..(map_reg_rev[reg] or reg).."'")
  2142. end
  2143. -- Add #type to defines. A bit unclean to put it in map_archdef.
  2144. map_archdef["#"..name] = "sizeof("..ctype..")"
  2145. -- Add new type and emit shortcut define.
  2146. local num = ctypenum + 1
  2147. map_type[name] = {
  2148. ctype = ctype,
  2149. ctypefmt = format("Dt%X(%%s)", num),
  2150. reg = reg,
  2151. }
  2152. wline(format("#define Dt%X(_V) (int)(ptrdiff_t)&(((%s *)0)_V)", num, ctype))
  2153. ctypenum = num
  2154. end
  2155. map_op[".type_2"] = map_op[".type_3"]
  2156. -- Dump type definitions.
  2157. local function dumptypes(out, lvl)
  2158. local t = {}
  2159. for name in pairs(map_type) do t[#t+1] = name end
  2160. sort(t)
  2161. out:write("Type definitions:\n")
  2162. for _,name in ipairs(t) do
  2163. local tp = map_type[name]
  2164. local reg = tp.reg and map_reg_rev[tp.reg] or ""
  2165. out:write(format(" %-20s %-20s %s\n", name, tp.ctype, reg))
  2166. end
  2167. out:write("\n")
  2168. end
  2169. ------------------------------------------------------------------------------
  2170. -- Set the current section.
  2171. function _M.section(num)
  2172. waction("SECTION")
  2173. wputxb(num)
  2174. wflush(true) -- SECTION is a terminal action.
  2175. end
  2176. ------------------------------------------------------------------------------
  2177. -- Dump architecture description.
  2178. function _M.dumparch(out)
  2179. out:write(format("DynASM %s version %s, released %s\n\n",
  2180. _info.arch, _info.version, _info.release))
  2181. dumpregs(out)
  2182. dumpactions(out)
  2183. end
  2184. -- Dump all user defined elements.
  2185. function _M.dumpdef(out, lvl)
  2186. dumptypes(out, lvl)
  2187. dumpglobals(out, lvl)
  2188. dumpexterns(out, lvl)
  2189. end
  2190. ------------------------------------------------------------------------------
  2191. -- Pass callbacks from/to the DynASM core.
  2192. function _M.passcb(wl, we, wf, ww)
  2193. wline, werror, wfatal, wwarn = wl, we, wf, ww
  2194. return wflush
  2195. end
  2196. -- Setup the arch-specific module.
  2197. function _M.setup(arch, opt)
  2198. g_arch, g_opt = arch, opt
  2199. end
  2200. -- Merge the core maps and the arch-specific maps.
  2201. function _M.mergemaps(map_coreop, map_def)
  2202. setmetatable(map_op, { __index = map_coreop })
  2203. setmetatable(map_def, { __index = map_archdef })
  2204. return map_op, map_def
  2205. end
  2206. return _M
  2207. ------------------------------------------------------------------------------