1------------------------------------------------------------------------------ 2-- DynASM ARM64 module. 3-- 4-- Copyright (C) 2005-2016 Mike Pall. All rights reserved. 5-- See dynasm.lua for full copyright notice. 6------------------------------------------------------------------------------ 7 8-- Module information: 9local _info = { 10 arch = "arm", 11 description = "DynASM ARM64 module", 12 version = "1.4.0", 13 vernum = 10400, 14 release = "2015-10-18", 15 author = "Mike Pall", 16 license = "MIT", 17} 18 19-- Exported glue functions for the arch-specific module. 20local _M = { _info = _info } 21 22-- Cache library functions. 23local type, tonumber, pairs, ipairs = type, tonumber, pairs, ipairs 24local assert, setmetatable, rawget = assert, setmetatable, rawget 25local _s = string 26local sub, format, byte, char = _s.sub, _s.format, _s.byte, _s.char 27local match, gmatch, gsub = _s.match, _s.gmatch, _s.gsub 28local concat, sort, insert = table.concat, table.sort, table.insert 29local bit = bit or require("bit") 30local band, shl, shr, sar = bit.band, bit.lshift, bit.rshift, bit.arshift 31local ror, tohex = bit.ror, bit.tohex 32 33-- Inherited tables and callbacks. 34local g_opt, g_arch 35local wline, werror, wfatal, wwarn 36 37-- Action name list. 38-- CHECK: Keep this in sync with the C code! 39local action_names = { 40 "STOP", "SECTION", "ESC", "REL_EXT", 41 "ALIGN", "REL_LG", "LABEL_LG", 42 "REL_PC", "LABEL_PC", "IMM", "IMM6", "IMM12", "IMM13W", "IMM13X", "IMML", 43} 44 45-- Maximum number of section buffer positions for dasm_put(). 46-- CHECK: Keep this in sync with the C code! 47local maxsecpos = 25 -- Keep this low, to avoid excessively long C lines. 48 49-- Action name -> action number. 50local map_action = {} 51for n,name in ipairs(action_names) do 52 map_action[name] = n-1 53end 54 55-- Action list buffer. 56local actlist = {} 57 58-- Argument list for next dasm_put(). Start with offset 0 into action list. 59local actargs = { 0 } 60 61-- Current number of section buffer positions for dasm_put(). 62local secpos = 1 63 64------------------------------------------------------------------------------ 65 66-- Dump action names and numbers. 67local function dumpactions(out) 68 out:write("DynASM encoding engine action codes:\n") 69 for n,name in ipairs(action_names) do 70 local num = map_action[name] 71 out:write(format(" %-10s %02X %d\n", name, num, num)) 72 end 73 out:write("\n") 74end 75 76-- Write action list buffer as a huge static C array. 77local function writeactions(out, name) 78 local nn = #actlist 79 if nn == 0 then nn = 1; actlist[0] = map_action.STOP end 80 out:write("static const unsigned int ", name, "[", nn, "] = {\n") 81 for i = 1,nn-1 do 82 assert(out:write("0x", tohex(actlist[i]), ",\n")) 83 end 84 assert(out:write("0x", tohex(actlist[nn]), "\n};\n\n")) 85end 86 87------------------------------------------------------------------------------ 88 89-- Add word to action list. 90local function wputxw(n) 91 assert(n >= 0 and n <= 0xffffffff and n % 1 == 0, "word out of range") 92 actlist[#actlist+1] = n 93end 94 95-- Add action to list with optional arg. Advance buffer pos, too. 96local function waction(action, val, a, num) 97 local w = assert(map_action[action], "bad action name `"..action.."'") 98 wputxw(w * 0x10000 + (val or 0)) 99 if a then actargs[#actargs+1] = a end 100 if a or num then secpos = secpos + (num or 1) end 101end 102 103-- Flush action list (intervening C code or buffer pos overflow). 104local function wflush(term) 105 if #actlist == actargs[1] then return end -- Nothing to flush. 106 if not term then waction("STOP") end -- Terminate action list. 107 wline(format("dasm_put(Dst, %s);", concat(actargs, ", ")), true) 108 actargs = { #actlist } -- Actionlist offset is 1st arg to next dasm_put(). 109 secpos = 1 -- The actionlist offset occupies a buffer position, too. 110end 111 112-- Put escaped word. 113local function wputw(n) 114 if n <= 0x000fffff then waction("ESC") end 115 wputxw(n) 116end 117 118-- Reserve position for word. 119local function wpos() 120 local pos = #actlist+1 121 actlist[pos] = "" 122 return pos 123end 124 125-- Store word to reserved position. 126local function wputpos(pos, n) 127 assert(n >= 0 and n <= 0xffffffff and n % 1 == 0, "word out of range") 128 if n <= 0x000fffff then 129 insert(actlist, pos+1, n) 130 n = map_action.ESC * 0x10000 131 end 132 actlist[pos] = n 133end 134 135------------------------------------------------------------------------------ 136 137-- Global label name -> global label number. With auto assignment on 1st use. 138local next_global = 20 139local map_global = setmetatable({}, { __index = function(t, name) 140 if not match(name, "^[%a_][%w_]*$") then werror("bad global label") end 141 local n = next_global 142 if n > 2047 then werror("too many global labels") end 143 next_global = n + 1 144 t[name] = n 145 return n 146end}) 147 148-- Dump global labels. 149local function dumpglobals(out, lvl) 150 local t = {} 151 for name, n in pairs(map_global) do t[n] = name end 152 out:write("Global labels:\n") 153 for i=20,next_global-1 do 154 out:write(format(" %s\n", t[i])) 155 end 156 out:write("\n") 157end 158 159-- Write global label enum. 160local function writeglobals(out, prefix) 161 local t = {} 162 for name, n in pairs(map_global) do t[n] = name end 163 out:write("enum {\n") 164 for i=20,next_global-1 do 165 out:write(" ", prefix, t[i], ",\n") 166 end 167 out:write(" ", prefix, "_MAX\n};\n") 168end 169 170-- Write global label names. 171local function writeglobalnames(out, name) 172 local t = {} 173 for name, n in pairs(map_global) do t[n] = name end 174 out:write("static const char *const ", name, "[] = {\n") 175 for i=20,next_global-1 do 176 out:write(" \"", t[i], "\",\n") 177 end 178 out:write(" (const char *)0\n};\n") 179end 180 181------------------------------------------------------------------------------ 182 183-- Extern label name -> extern label number. With auto assignment on 1st use. 184local next_extern = 0 185local map_extern_ = {} 186local map_extern = setmetatable({}, { __index = function(t, name) 187 -- No restrictions on the name for now. 188 local n = next_extern 189 if n > 2047 then werror("too many extern labels") end 190 next_extern = n + 1 191 t[name] = n 192 map_extern_[n] = name 193 return n 194end}) 195 196-- Dump extern labels. 197local function dumpexterns(out, lvl) 198 out:write("Extern labels:\n") 199 for i=0,next_extern-1 do 200 out:write(format(" %s\n", map_extern_[i])) 201 end 202 out:write("\n") 203end 204 205-- Write extern label names. 206local function writeexternnames(out, name) 207 out:write("static const char *const ", name, "[] = {\n") 208 for i=0,next_extern-1 do 209 out:write(" \"", map_extern_[i], "\",\n") 210 end 211 out:write(" (const char *)0\n};\n") 212end 213 214------------------------------------------------------------------------------ 215 216-- Arch-specific maps. 217 218-- Ext. register name -> int. name. 219local map_archdef = { xzr = "@x31", wzr = "@w31", lr = "x30", } 220 221-- Int. register name -> ext. name. 222local map_reg_rev = { ["@x31"] = "xzr", ["@w31"] = "wzr", x30 = "lr", } 223 224local map_type = {} -- Type name -> { ctype, reg } 225local ctypenum = 0 -- Type number (for Dt... macros). 226 227-- Reverse defines for registers. 228function _M.revdef(s) 229 return map_reg_rev[s] or s 230end 231 232local map_shift = { lsl = 0, lsr = 1, asr = 2, } 233 234local map_extend = { 235 uxtb = 0, uxth = 1, uxtw = 2, uxtx = 3, 236 sxtb = 4, sxth = 5, sxtw = 6, sxtx = 7, 237} 238 239local map_cond = { 240 eq = 0, ne = 1, cs = 2, cc = 3, mi = 4, pl = 5, vs = 6, vc = 7, 241 hi = 8, ls = 9, ge = 10, lt = 11, gt = 12, le = 13, al = 14, 242 hs = 2, lo = 3, 243} 244 245------------------------------------------------------------------------------ 246 247local parse_reg_type 248 249local function parse_reg(expr) 250 if not expr then werror("expected register name") end 251 local tname, ovreg = match(expr, "^([%w_]+):(@?%l%d+)$") 252 local tp = map_type[tname or expr] 253 if tp then 254 local reg = ovreg or tp.reg 255 if not reg then 256 werror("type `"..(tname or expr).."' needs a register override") 257 end 258 expr = reg 259 end 260 local ok31, rt, r = match(expr, "^(@?)([xwqdshb])([123]?[0-9])$") 261 if r then 262 r = tonumber(r) 263 if r <= 30 or (r == 31 and ok31 ~= "" or (rt ~= "w" and rt ~= "x")) then 264 if not parse_reg_type then 265 parse_reg_type = rt 266 elseif parse_reg_type ~= rt then 267 werror("register size mismatch") 268 end 269 return r, tp 270 end 271 end 272 werror("bad register name `"..expr.."'") 273end 274 275local function parse_reg_base(expr) 276 if expr == "sp" then return 0x3e0 end 277 local base, tp = parse_reg(expr) 278 if parse_reg_type ~= "x" then werror("bad register type") end 279 parse_reg_type = false 280 return shl(base, 5), tp 281end 282 283local parse_ctx = {} 284 285local loadenv = setfenv and function(s) 286 local code = loadstring(s, "") 287 if code then setfenv(code, parse_ctx) end 288 return code 289end or function(s) 290 return load(s, "", nil, parse_ctx) 291end 292 293-- Try to parse simple arithmetic, too, since some basic ops are aliases. 294local function parse_number(n) 295 local x = tonumber(n) 296 if x then return x end 297 local code = loadenv("return "..n) 298 if code then 299 local ok, y = pcall(code) 300 if ok then return y end 301 end 302 return nil 303end 304 305local function parse_imm(imm, bits, shift, scale, signed) 306 imm = match(imm, "^#(.*)$") 307 if not imm then werror("expected immediate operand") end 308 local n = parse_number(imm) 309 if n then 310 local m = sar(n, scale) 311 if shl(m, scale) == n then 312 if signed then 313 local s = sar(m, bits-1) 314 if s == 0 then return shl(m, shift) 315 elseif s == -1 then return shl(m + shl(1, bits), shift) end 316 else 317 if sar(m, bits) == 0 then return shl(m, shift) end 318 end 319 end 320 werror("out of range immediate `"..imm.."'") 321 else 322 waction("IMM", (signed and 32768 or 0)+scale*1024+bits*32+shift, imm) 323 return 0 324 end 325end 326 327local function parse_imm12(imm) 328 imm = match(imm, "^#(.*)$") 329 if not imm then werror("expected immediate operand") end 330 local n = parse_number(imm) 331 if n then 332 if shr(n, 12) == 0 then 333 return shl(n, 10) 334 elseif band(n, 0xff000fff) == 0 then 335 return shr(n, 2) + 0x00400000 336 end 337 werror("out of range immediate `"..imm.."'") 338 else 339 waction("IMM12", 0, imm) 340 return 0 341 end 342end 343 344local function parse_imm13(imm) 345 imm = match(imm, "^#(.*)$") 346 if not imm then werror("expected immediate operand") end 347 local n = parse_number(imm) 348 local r64 = parse_reg_type == "x" 349 if n and n % 1 == 0 and n >= 0 and n <= 0xffffffff then 350 local inv = false 351 if band(n, 1) == 1 then n = bit.bnot(n); inv = true end 352 local t = {} 353 for i=1,32 do t[i] = band(n, 1); n = shr(n, 1) end 354 local b = table.concat(t) 355 b = b..(r64 and (inv and "1" or "0"):rep(32) or b) 356 local p0, p1, p0a, p1a = b:match("^(0+)(1+)(0*)(1*)") 357 if p0 then 358 local w = p1a == "" and (r64 and 64 or 32) or #p1+#p0a 359 if band(w, w-1) == 0 and b == b:sub(1, w):rep(64/w) then 360 local s = band(-2*w, 0x3f) - 1 361 if w == 64 then s = s + 0x1000 end 362 if inv then 363 return shl(w-#p1-#p0, 16) + shl(s+w-#p1, 10) 364 else 365 return shl(w-#p0, 16) + shl(s+#p1, 10) 366 end 367 end 368 end 369 werror("out of range immediate `"..imm.."'") 370 elseif r64 then 371 waction("IMM13X", 0, format("(unsigned int)(%s)", imm)) 372 actargs[#actargs+1] = format("(unsigned int)((unsigned long long)(%s)>>32)", imm) 373 return 0 374 else 375 waction("IMM13W", 0, imm) 376 return 0 377 end 378end 379 380local function parse_imm6(imm) 381 imm = match(imm, "^#(.*)$") 382 if not imm then werror("expected immediate operand") end 383 local n = parse_number(imm) 384 if n then 385 if n >= 0 and n <= 63 then 386 return shl(band(n, 0x1f), 19) + (n >= 32 and 0x80000000 or 0) 387 end 388 werror("out of range immediate `"..imm.."'") 389 else 390 waction("IMM6", 0, imm) 391 return 0 392 end 393end 394 395local function parse_imm_load(imm, scale) 396 local n = parse_number(imm) 397 if n then 398 local m = sar(n, scale) 399 if shl(m, scale) == n and m >= 0 and m < 0x1000 then 400 return shl(m, 10) + 0x01000000 -- Scaled, unsigned 12 bit offset. 401 elseif n >= -256 and n < 256 then 402 return shl(band(n, 511), 12) -- Unscaled, signed 9 bit offset. 403 end 404 werror("out of range immediate `"..imm.."'") 405 else 406 waction("IMML", 0, imm) 407 return 0 408 end 409end 410 411local function parse_fpimm(imm) 412 imm = match(imm, "^#(.*)$") 413 if not imm then werror("expected immediate operand") end 414 local n = parse_number(imm) 415 if n then 416 local m, e = math.frexp(n) 417 local s, e2 = 0, band(e-2, 7) 418 if m < 0 then m = -m; s = 0x00100000 end 419 m = m*32-16 420 if m % 1 == 0 and m >= 0 and m <= 15 and sar(shl(e2, 29), 29)+2 == e then 421 return s + shl(e2, 17) + shl(m, 13) 422 end 423 werror("out of range immediate `"..imm.."'") 424 else 425 werror("NYI fpimm action") 426 end 427end 428 429local function parse_shift(expr) 430 local s, s2 = match(expr, "^(%S+)%s*(.*)$") 431 s = map_shift[s] 432 if not s then werror("expected shift operand") end 433 return parse_imm(s2, 6, 10, 0, false) + shl(s, 22) 434end 435 436local function parse_lslx16(expr) 437 local n = match(expr, "^lsl%s*#(%d+)$") 438 n = tonumber(n) 439 if not n then werror("expected shift operand") end 440 if band(n, parse_reg_type == "x" and 0xffffffcf or 0xffffffef) ~= 0 then 441 werror("bad shift amount") 442 end 443 return shl(n, 17) 444end 445 446local function parse_extend(expr) 447 local s, s2 = match(expr, "^(%S+)%s*(.*)$") 448 if s == "lsl" then 449 s = parse_reg_type == "x" and 3 or 2 450 else 451 s = map_extend[s] 452 end 453 if not s then werror("expected extend operand") end 454 return (s2 == "" and 0 or parse_imm(s2, 3, 10, 0, false)) + shl(s, 13) 455end 456 457local function parse_cond(expr, inv) 458 local c = map_cond[expr] 459 if not c then werror("expected condition operand") end 460 return shl(bit.bxor(c, inv), 12) 461end 462 463local function parse_load(params, nparams, n, op) 464 if params[n+2] then werror("too many operands") end 465 local pn, p2 = params[n], params[n+1] 466 local p1, wb = match(pn, "^%[%s*(.-)%s*%](!?)$") 467 if not p1 then 468 if not p2 then 469 local reg, tailr = match(pn, "^([%w_:]+)%s*(.*)$") 470 if reg and tailr ~= "" then 471 local base, tp = parse_reg_base(reg) 472 if tp then 473 waction("IMML", 0, format(tp.ctypefmt, tailr)) 474 return op + base 475 end 476 end 477 end 478 werror("expected address operand") 479 end 480 local scale = shr(op, 30) 481 if p2 then 482 if wb == "!" then werror("bad use of '!'") end 483 op = op + parse_reg_base(p1) + parse_imm(p2, 9, 12, 0, true) + 0x400 484 elseif wb == "!" then 485 local p1a, p2a = match(p1, "^([^,%s]*)%s*,%s*(.*)$") 486 if not p1a then werror("bad use of '!'") end 487 op = op + parse_reg_base(p1a) + parse_imm(p2a, 9, 12, 0, true) + 0xc00 488 else 489 local p1a, p2a = match(p1, "^([^,%s]*)%s*(.*)$") 490 op = op + parse_reg_base(p1a) 491 if p2a ~= "" then 492 local imm = match(p2a, "^,%s*#(.*)$") 493 if imm then 494 op = op + parse_imm_load(imm, scale) 495 else 496 local p2b, p3b, p3s = match(p2a, "^,%s*([^,%s]*)%s*,?%s*(%S*)%s*(.*)$") 497 op = op + shl(parse_reg(p2b), 16) + 0x00200800 498 if parse_reg_type ~= "x" and parse_reg_type ~= "w" then 499 werror("bad index register type") 500 end 501 if p3b == "" then 502 if parse_reg_type ~= "x" then werror("bad index register type") end 503 op = op + 0x6000 504 else 505 if p3s == "" or p3s == "#0" then 506 elseif p3s == "#"..scale then 507 op = op + 0x1000 508 else 509 werror("bad scale") 510 end 511 if parse_reg_type == "x" then 512 if p3b == "lsl" and p3s ~= "" then op = op + 0x6000 513 elseif p3b == "sxtx" then op = op + 0xe000 514 else 515 werror("bad extend/shift specifier") 516 end 517 else 518 if p3b == "uxtw" then op = op + 0x4000 519 elseif p3b == "sxtw" then op = op + 0xc000 520 else 521 werror("bad extend/shift specifier") 522 end 523 end 524 end 525 end 526 else 527 if wb == "!" then werror("bad use of '!'") end 528 op = op + 0x01000000 529 end 530 end 531 return op 532end 533 534local function parse_load_pair(params, nparams, n, op) 535 if params[n+2] then werror("too many operands") end 536 local pn, p2 = params[n], params[n+1] 537 local scale = shr(op, 30) == 0 and 2 or 3 538 local p1, wb = match(pn, "^%[%s*(.-)%s*%](!?)$") 539 if not p1 then 540 if not p2 then 541 local reg, tailr = match(pn, "^([%w_:]+)%s*(.*)$") 542 if reg and tailr ~= "" then 543 local base, tp = parse_reg_base(reg) 544 if tp then 545 waction("IMM", 32768+7*32+15+scale*1024, format(tp.ctypefmt, tailr)) 546 return op + base + 0x01000000 547 end 548 end 549 end 550 werror("expected address operand") 551 end 552 if p2 then 553 if wb == "!" then werror("bad use of '!'") end 554 op = op + 0x00800000 555 else 556 local p1a, p2a = match(p1, "^([^,%s]*)%s*,%s*(.*)$") 557 if p1a then p1, p2 = p1a, p2a else p2 = "#0" end 558 op = op + (wb == "!" and 0x01800000 or 0x01000000) 559 end 560 return op + parse_reg_base(p1) + parse_imm(p2, 7, 15, scale, true) 561end 562 563local function parse_label(label, def) 564 local prefix = sub(label, 1, 2) 565 -- =>label (pc label reference) 566 if prefix == "=>" then 567 return "PC", 0, sub(label, 3) 568 end 569 -- ->name (global label reference) 570 if prefix == "->" then 571 return "LG", map_global[sub(label, 3)] 572 end 573 if def then 574 -- [1-9] (local label definition) 575 if match(label, "^[1-9]$") then 576 return "LG", 10+tonumber(label) 577 end 578 else 579 -- [<>][1-9] (local label reference) 580 local dir, lnum = match(label, "^([<>])([1-9])$") 581 if dir then -- Fwd: 1-9, Bkwd: 11-19. 582 return "LG", lnum + (dir == ">" and 0 or 10) 583 end 584 -- extern label (extern label reference) 585 local extname = match(label, "^extern%s+(%S+)$") 586 if extname then 587 return "EXT", map_extern[extname] 588 end 589 end 590 werror("bad label `"..label.."'") 591end 592 593local function branch_type(op) 594 if band(op, 0x7c000000) == 0x14000000 then return 0 -- B, BL 595 elseif shr(op, 24) == 0x54 or band(op, 0x7e000000) == 0x34000000 or 596 band(op, 0x3b000000) == 0x18000000 then 597 return 0x800 -- B.cond, CBZ, CBNZ, LDR* literal 598 elseif band(op, 0x7e000000) == 0x36000000 then return 0x1000 -- TBZ, TBNZ 599 elseif band(op, 0x9f000000) == 0x10000000 then return 0x2000 -- ADR 600 elseif band(op, 0x9f000000) == band(0x90000000) then return 0x3000 -- ADRP 601 else 602 assert(false, "unknown branch type") 603 end 604end 605 606------------------------------------------------------------------------------ 607 608local map_op, op_template 609 610local function op_alias(opname, f) 611 return function(params, nparams) 612 if not params then return "-> "..opname:sub(1, -3) end 613 f(params, nparams) 614 op_template(params, map_op[opname], nparams) 615 end 616end 617 618local function alias_bfx(p) 619 p[4] = "#("..p[3]:sub(2)..")+("..p[4]:sub(2)..")-1" 620end 621 622local function alias_bfiz(p) 623 parse_reg(p[1]) 624 if parse_reg_type == "w" then 625 p[3] = "#-("..p[3]:sub(2)..")%32" 626 p[4] = "#("..p[4]:sub(2)..")-1" 627 else 628 p[3] = "#-("..p[3]:sub(2)..")%64" 629 p[4] = "#("..p[4]:sub(2)..")-1" 630 end 631end 632 633local alias_lslimm = op_alias("ubfm_4", function(p) 634 parse_reg(p[1]) 635 local sh = p[3]:sub(2) 636 if parse_reg_type == "w" then 637 p[3] = "#-("..sh..")%32" 638 p[4] = "#31-("..sh..")" 639 else 640 p[3] = "#-("..sh..")%64" 641 p[4] = "#63-("..sh..")" 642 end 643end) 644 645-- Template strings for ARM instructions. 646map_op = { 647 -- Basic data processing instructions. 648 add_3 = "0b000000DNMg|11000000pDpNIg|8b206000pDpNMx", 649 add_4 = "0b000000DNMSg|0b200000DNMXg|8b200000pDpNMXx|8b200000pDpNxMwX", 650 adds_3 = "2b000000DNMg|31000000DpNIg|ab206000DpNMx", 651 adds_4 = "2b000000DNMSg|2b200000DNMXg|ab200000DpNMXx|ab200000DpNxMwX", 652 cmn_2 = "2b00001fNMg|3100001fpNIg|ab20601fpNMx", 653 cmn_3 = "2b00001fNMSg|2b20001fNMXg|ab20001fpNMXx|ab20001fpNxMwX", 654 655 sub_3 = "4b000000DNMg|51000000pDpNIg|cb206000pDpNMx", 656 sub_4 = "4b000000DNMSg|4b200000DNMXg|cb200000pDpNMXx|cb200000pDpNxMwX", 657 subs_3 = "6b000000DNMg|71000000DpNIg|eb206000DpNMx", 658 subs_4 = "6b000000DNMSg|6b200000DNMXg|eb200000DpNMXx|eb200000DpNxMwX", 659 cmp_2 = "6b00001fNMg|7100001fpNIg|eb20601fpNMx", 660 cmp_3 = "6b00001fNMSg|6b20001fNMXg|eb20001fpNMXx|eb20001fpNxMwX", 661 662 neg_2 = "4b0003e0DMg", 663 neg_3 = "4b0003e0DMSg", 664 negs_2 = "6b0003e0DMg", 665 negs_3 = "6b0003e0DMSg", 666 667 adc_3 = "1a000000DNMg", 668 adcs_3 = "3a000000DNMg", 669 sbc_3 = "5a000000DNMg", 670 sbcs_3 = "7a000000DNMg", 671 ngc_2 = "5a0003e0DMg", 672 ngcs_2 = "7a0003e0DMg", 673 674 and_3 = "0a000000DNMg|12000000pDNig", 675 and_4 = "0a000000DNMSg", 676 orr_3 = "2a000000DNMg|32000000pDNig", 677 orr_4 = "2a000000DNMSg", 678 eor_3 = "4a000000DNMg|52000000pDNig", 679 eor_4 = "4a000000DNMSg", 680 ands_3 = "6a000000DNMg|72000000DNig", 681 ands_4 = "6a000000DNMSg", 682 tst_2 = "6a00001fNMg|7200001fNig", 683 tst_3 = "6a00001fNMSg", 684 685 bic_3 = "0a200000DNMg", 686 bic_4 = "0a200000DNMSg", 687 orn_3 = "2a200000DNMg", 688 orn_4 = "2a200000DNMSg", 689 eon_3 = "4a200000DNMg", 690 eon_4 = "4a200000DNMSg", 691 bics_3 = "6a200000DNMg", 692 bics_4 = "6a200000DNMSg", 693 694 movn_2 = "12800000DWg", 695 movn_3 = "12800000DWRg", 696 movz_2 = "52800000DWg", 697 movz_3 = "52800000DWRg", 698 movk_2 = "72800000DWg", 699 movk_3 = "72800000DWRg", 700 701 -- TODO: this doesn't cover all valid immediates for mov reg, #imm. 702 mov_2 = "2a0003e0DMg|52800000DW|320003e0pDig|11000000pDpNg", 703 mov_3 = "2a0003e0DMSg", 704 mvn_2 = "2a2003e0DMg", 705 mvn_3 = "2a2003e0DMSg", 706 707 adr_2 = "10000000DBx", 708 adrp_2 = "90000000DBx", 709 710 csel_4 = "1a800000DNMCg", 711 csinc_4 = "1a800400DNMCg", 712 csinv_4 = "5a800000DNMCg", 713 csneg_4 = "5a800400DNMCg", 714 cset_2 = "1a9f07e0Dcg", 715 csetm_2 = "5a9f03e0Dcg", 716 cinc_3 = "1a800400DNmcg", 717 cinv_3 = "5a800000DNmcg", 718 cneg_3 = "5a800400DNmcg", 719 720 ccmn_4 = "3a400000NMVCg|3a400800N5VCg", 721 ccmp_4 = "7a400000NMVCg|7a400800N5VCg", 722 723 madd_4 = "1b000000DNMAg", 724 msub_4 = "1b008000DNMAg", 725 mul_3 = "1b007c00DNMg", 726 mneg_3 = "1b00fc00DNMg", 727 728 smaddl_4 = "9b200000DxNMwAx", 729 smsubl_4 = "9b208000DxNMwAx", 730 smull_3 = "9b207c00DxNMw", 731 smnegl_3 = "9b20fc00DxNMw", 732 smulh_3 = "9b407c00DNMx", 733 umaddl_4 = "9ba00000DxNMwAx", 734 umsubl_4 = "9ba08000DxNMwAx", 735 umull_3 = "9ba07c00DxNMw", 736 umnegl_3 = "9ba0fc00DxNMw", 737 umulh_3 = "9bc07c00DNMx", 738 739 udiv_3 = "1ac00800DNMg", 740 sdiv_3 = "1ac00c00DNMg", 741 742 -- Bit operations. 743 sbfm_4 = "13000000DN12w|93400000DN12x", 744 bfm_4 = "33000000DN12w|b3400000DN12x", 745 ubfm_4 = "53000000DN12w|d3400000DN12x", 746 extr_4 = "13800000DNM2w|93c00000DNM2x", 747 748 sxtb_2 = "13001c00DNw|93401c00DNx", 749 sxth_2 = "13003c00DNw|93403c00DNx", 750 sxtw_2 = "93407c00DxNw", 751 uxtb_2 = "53001c00DNw", 752 uxth_2 = "53003c00DNw", 753 754 sbfx_4 = op_alias("sbfm_4", alias_bfx), 755 bfxil_4 = op_alias("bfm_4", alias_bfx), 756 ubfx_4 = op_alias("ubfm_4", alias_bfx), 757 sbfiz_4 = op_alias("sbfm_4", alias_bfiz), 758 bfi_4 = op_alias("bfm_4", alias_bfiz), 759 ubfiz_4 = op_alias("ubfm_4", alias_bfiz), 760 761 lsl_3 = function(params, nparams) 762 if params and params[3]:byte() == 35 then 763 return alias_lslimm(params, nparams) 764 else 765 return op_template(params, "1ac02000DNMg", nparams) 766 end 767 end, 768 lsr_3 = "1ac02400DNMg|53007c00DN1w|d340fc00DN1x", 769 asr_3 = "1ac02800DNMg|13007c00DN1w|9340fc00DN1x", 770 ror_3 = "1ac02c00DNMg|13800000DNm2w|93c00000DNm2x", 771 772 clz_2 = "5ac01000DNg", 773 cls_2 = "5ac01400DNg", 774 rbit_2 = "5ac00000DNg", 775 rev_2 = "5ac00800DNw|dac00c00DNx", 776 rev16_2 = "5ac00400DNg", 777 rev32_2 = "dac00800DNx", 778 779 -- Loads and stores. 780 ["strb_*"] = "38000000DwL", 781 ["ldrb_*"] = "38400000DwL", 782 ["ldrsb_*"] = "38c00000DwL|38800000DxL", 783 ["strh_*"] = "78000000DwL", 784 ["ldrh_*"] = "78400000DwL", 785 ["ldrsh_*"] = "78c00000DwL|78800000DxL", 786 ["str_*"] = "b8000000DwL|f8000000DxL|bc000000DsL|fc000000DdL", 787 ["ldr_*"] = "18000000DwB|58000000DxB|1c000000DsB|5c000000DdB|b8400000DwL|f8400000DxL|bc400000DsL|fc400000DdL", 788 ["ldrsw_*"] = "98000000DxB|b8800000DxL", 789 -- NOTE: ldur etc. are handled by ldr et al. 790 791 ["stp_*"] = "28000000DAwP|a8000000DAxP|2c000000DAsP|6c000000DAdP", 792 ["ldp_*"] = "28400000DAwP|a8400000DAxP|2c400000DAsP|6c400000DAdP", 793 ["ldpsw_*"] = "68400000DAxP", 794 795 -- Branches. 796 b_1 = "14000000B", 797 bl_1 = "94000000B", 798 blr_1 = "d63f0000Nx", 799 br_1 = "d61f0000Nx", 800 ret_0 = "d65f03c0", 801 ret_1 = "d65f0000Nx", 802 -- b.cond is added below. 803 cbz_2 = "34000000DBg", 804 cbnz_2 = "35000000DBg", 805 tbz_3 = "36000000DTBw|36000000DTBx", 806 tbnz_3 = "37000000DTBw|37000000DTBx", 807 808 -- Miscellaneous instructions. 809 -- TODO: hlt, hvc, smc, svc, eret, dcps[123], drps, mrs, msr 810 -- TODO: sys, sysl, ic, dc, at, tlbi 811 -- TODO: hint, yield, wfe, wfi, sev, sevl 812 -- TODO: clrex, dsb, dmb, isb 813 nop_0 = "d503201f", 814 brk_0 = "d4200000", 815 brk_1 = "d4200000W", 816 817 -- Floating point instructions. 818 fmov_2 = "1e204000DNf|1e260000DwNs|1e270000DsNw|9e660000DxNd|9e670000DdNx|1e201000DFf", 819 fabs_2 = "1e20c000DNf", 820 fneg_2 = "1e214000DNf", 821 fsqrt_2 = "1e21c000DNf", 822 823 fcvt_2 = "1e22c000DdNs|1e624000DsNd", 824 825 -- TODO: half-precision and fixed-point conversions. 826 fcvtas_2 = "1e240000DwNs|9e240000DxNs|1e640000DwNd|9e640000DxNd", 827 fcvtau_2 = "1e250000DwNs|9e250000DxNs|1e650000DwNd|9e650000DxNd", 828 fcvtms_2 = "1e300000DwNs|9e300000DxNs|1e700000DwNd|9e700000DxNd", 829 fcvtmu_2 = "1e310000DwNs|9e310000DxNs|1e710000DwNd|9e710000DxNd", 830 fcvtns_2 = "1e200000DwNs|9e200000DxNs|1e600000DwNd|9e600000DxNd", 831 fcvtnu_2 = "1e210000DwNs|9e210000DxNs|1e610000DwNd|9e610000DxNd", 832 fcvtps_2 = "1e280000DwNs|9e280000DxNs|1e680000DwNd|9e680000DxNd", 833 fcvtpu_2 = "1e290000DwNs|9e290000DxNs|1e690000DwNd|9e690000DxNd", 834 fcvtzs_2 = "1e380000DwNs|9e380000DxNs|1e780000DwNd|9e780000DxNd", 835 fcvtzu_2 = "1e390000DwNs|9e390000DxNs|1e790000DwNd|9e790000DxNd", 836 837 scvtf_2 = "1e220000DsNw|9e220000DsNx|1e620000DdNw|9e620000DdNx", 838 ucvtf_2 = "1e230000DsNw|9e230000DsNx|1e630000DdNw|9e630000DdNx", 839 840 frintn_2 = "1e244000DNf", 841 frintp_2 = "1e24c000DNf", 842 frintm_2 = "1e254000DNf", 843 frintz_2 = "1e25c000DNf", 844 frinta_2 = "1e264000DNf", 845 frintx_2 = "1e274000DNf", 846 frinti_2 = "1e27c000DNf", 847 848 fadd_3 = "1e202800DNMf", 849 fsub_3 = "1e203800DNMf", 850 fmul_3 = "1e200800DNMf", 851 fnmul_3 = "1e208800DNMf", 852 fdiv_3 = "1e201800DNMf", 853 854 fmadd_4 = "1f000000DNMAf", 855 fmsub_4 = "1f008000DNMAf", 856 fnmadd_4 = "1f200000DNMAf", 857 fnmsub_4 = "1f208000DNMAf", 858 859 fmax_3 = "1e204800DNMf", 860 fmaxnm_3 = "1e206800DNMf", 861 fmin_3 = "1e205800DNMf", 862 fminnm_3 = "1e207800DNMf", 863 864 fcmp_2 = "1e202000NMf|1e202008NZf", 865 fcmpe_2 = "1e202010NMf|1e202018NZf", 866 867 fccmp_4 = "1e200400NMVCf", 868 fccmpe_4 = "1e200410NMVCf", 869 870 fcsel_4 = "1e200c00DNMCf", 871 872 -- TODO: crc32*, aes*, sha*, pmull 873 -- TODO: SIMD instructions. 874} 875 876for cond,c in pairs(map_cond) do 877 map_op["b"..cond.."_1"] = tohex(0x54000000+c).."B" 878end 879 880------------------------------------------------------------------------------ 881 882-- Handle opcodes defined with template strings. 883local function parse_template(params, template, nparams, pos) 884 local op = tonumber(sub(template, 1, 8), 16) 885 local n = 1 886 local rtt = {} 887 888 parse_reg_type = false 889 890 -- Process each character. 891 for p in gmatch(sub(template, 9), ".") do 892 local q = params[n] 893 if p == "D" then 894 op = op + parse_reg(q); n = n + 1 895 elseif p == "N" then 896 op = op + shl(parse_reg(q), 5); n = n + 1 897 elseif p == "M" then 898 op = op + shl(parse_reg(q), 16); n = n + 1 899 elseif p == "A" then 900 op = op + shl(parse_reg(q), 10); n = n + 1 901 elseif p == "m" then 902 op = op + shl(parse_reg(params[n-1]), 16) 903 904 elseif p == "p" then 905 if q == "sp" then params[n] = "@x31" end 906 elseif p == "g" then 907 if parse_reg_type == "x" then 908 op = op + 0x80000000 909 elseif parse_reg_type ~= "w" then 910 werror("bad register type") 911 end 912 parse_reg_type = false 913 elseif p == "f" then 914 if parse_reg_type == "d" then 915 op = op + 0x00400000 916 elseif parse_reg_type ~= "s" then 917 werror("bad register type") 918 end 919 parse_reg_type = false 920 elseif p == "x" or p == "w" or p == "d" or p == "s" then 921 if parse_reg_type ~= p then 922 werror("register size mismatch") 923 end 924 parse_reg_type = false 925 926 elseif p == "L" then 927 op = parse_load(params, nparams, n, op) 928 elseif p == "P" then 929 op = parse_load_pair(params, nparams, n, op) 930 931 elseif p == "B" then 932 local mode, v, s = parse_label(q, false); n = n + 1 933 local m = branch_type(op) 934 waction("REL_"..mode, v+m, s, 1) 935 936 elseif p == "I" then 937 op = op + parse_imm12(q); n = n + 1 938 elseif p == "i" then 939 op = op + parse_imm13(q); n = n + 1 940 elseif p == "W" then 941 op = op + parse_imm(q, 16, 5, 0, false); n = n + 1 942 elseif p == "T" then 943 op = op + parse_imm6(q); n = n + 1 944 elseif p == "1" then 945 op = op + parse_imm(q, 6, 16, 0, false); n = n + 1 946 elseif p == "2" then 947 op = op + parse_imm(q, 6, 10, 0, false); n = n + 1 948 elseif p == "5" then 949 op = op + parse_imm(q, 5, 16, 0, false); n = n + 1 950 elseif p == "V" then 951 op = op + parse_imm(q, 4, 0, 0, false); n = n + 1 952 elseif p == "F" then 953 op = op + parse_fpimm(q); n = n + 1 954 elseif p == "Z" then 955 if q ~= "#0" and q ~= "#0.0" then werror("expected zero immediate") end 956 n = n + 1 957 958 elseif p == "S" then 959 op = op + parse_shift(q); n = n + 1 960 elseif p == "X" then 961 op = op + parse_extend(q); n = n + 1 962 elseif p == "R" then 963 op = op + parse_lslx16(q); n = n + 1 964 elseif p == "C" then 965 op = op + parse_cond(q, 0); n = n + 1 966 elseif p == "c" then 967 op = op + parse_cond(q, 1); n = n + 1 968 969 else 970 assert(false) 971 end 972 end 973 wputpos(pos, op) 974end 975 976function op_template(params, template, nparams) 977 if not params then return template:gsub("%x%x%x%x%x%x%x%x", "") end 978 979 -- Limit number of section buffer positions used by a single dasm_put(). 980 -- A single opcode needs a maximum of 3 positions. 981 if secpos+3 > maxsecpos then wflush() end 982 local pos = wpos() 983 local lpos, apos, spos = #actlist, #actargs, secpos 984 985 local ok, err 986 for t in gmatch(template, "[^|]+") do 987 ok, err = pcall(parse_template, params, t, nparams, pos) 988 if ok then return end 989 secpos = spos 990 actlist[lpos+1] = nil 991 actlist[lpos+2] = nil 992 actlist[lpos+3] = nil 993 actargs[apos+1] = nil 994 actargs[apos+2] = nil 995 actargs[apos+3] = nil 996 end 997 error(err, 0) 998end 999 1000map_op[".template__"] = op_template 1001 1002------------------------------------------------------------------------------ 1003 1004-- Pseudo-opcode to mark the position where the action list is to be emitted. 1005map_op[".actionlist_1"] = function(params) 1006 if not params then return "cvar" end 1007 local name = params[1] -- No syntax check. You get to keep the pieces. 1008 wline(function(out) writeactions(out, name) end) 1009end 1010 1011-- Pseudo-opcode to mark the position where the global enum is to be emitted. 1012map_op[".globals_1"] = function(params) 1013 if not params then return "prefix" end 1014 local prefix = params[1] -- No syntax check. You get to keep the pieces. 1015 wline(function(out) writeglobals(out, prefix) end) 1016end 1017 1018-- Pseudo-opcode to mark the position where the global names are to be emitted. 1019map_op[".globalnames_1"] = function(params) 1020 if not params then return "cvar" end 1021 local name = params[1] -- No syntax check. You get to keep the pieces. 1022 wline(function(out) writeglobalnames(out, name) end) 1023end 1024 1025-- Pseudo-opcode to mark the position where the extern names are to be emitted. 1026map_op[".externnames_1"] = function(params) 1027 if not params then return "cvar" end 1028 local name = params[1] -- No syntax check. You get to keep the pieces. 1029 wline(function(out) writeexternnames(out, name) end) 1030end 1031 1032------------------------------------------------------------------------------ 1033 1034-- Label pseudo-opcode (converted from trailing colon form). 1035map_op[".label_1"] = function(params) 1036 if not params then return "[1-9] | ->global | =>pcexpr" end 1037 if secpos+1 > maxsecpos then wflush() end 1038 local mode, n, s = parse_label(params[1], true) 1039 if mode == "EXT" then werror("bad label definition") end 1040 waction("LABEL_"..mode, n, s, 1) 1041end 1042 1043------------------------------------------------------------------------------ 1044 1045-- Pseudo-opcodes for data storage. 1046map_op[".long_*"] = function(params) 1047 if not params then return "imm..." end 1048 for _,p in ipairs(params) do 1049 local n = tonumber(p) 1050 if not n then werror("bad immediate `"..p.."'") end 1051 if n < 0 then n = n + 2^32 end 1052 wputw(n) 1053 if secpos+2 > maxsecpos then wflush() end 1054 end 1055end 1056 1057-- Alignment pseudo-opcode. 1058map_op[".align_1"] = function(params) 1059 if not params then return "numpow2" end 1060 if secpos+1 > maxsecpos then wflush() end 1061 local align = tonumber(params[1]) 1062 if align then 1063 local x = align 1064 -- Must be a power of 2 in the range (2 ... 256). 1065 for i=1,8 do 1066 x = x / 2 1067 if x == 1 then 1068 waction("ALIGN", align-1, nil, 1) -- Action byte is 2**n-1. 1069 return 1070 end 1071 end 1072 end 1073 werror("bad alignment") 1074end 1075 1076------------------------------------------------------------------------------ 1077 1078-- Pseudo-opcode for (primitive) type definitions (map to C types). 1079map_op[".type_3"] = function(params, nparams) 1080 if not params then 1081 return nparams == 2 and "name, ctype" or "name, ctype, reg" 1082 end 1083 local name, ctype, reg = params[1], params[2], params[3] 1084 if not match(name, "^[%a_][%w_]*$") then 1085 werror("bad type name `"..name.."'") 1086 end 1087 local tp = map_type[name] 1088 if tp then 1089 werror("duplicate type `"..name.."'") 1090 end 1091 -- Add #type to defines. A bit unclean to put it in map_archdef. 1092 map_archdef["#"..name] = "sizeof("..ctype..")" 1093 -- Add new type and emit shortcut define. 1094 local num = ctypenum + 1 1095 map_type[name] = { 1096 ctype = ctype, 1097 ctypefmt = format("Dt%X(%%s)", num), 1098 reg = reg, 1099 } 1100 wline(format("#define Dt%X(_V) (int)(ptrdiff_t)&(((%s *)0)_V)", num, ctype)) 1101 ctypenum = num 1102end 1103map_op[".type_2"] = map_op[".type_3"] 1104 1105-- Dump type definitions. 1106local function dumptypes(out, lvl) 1107 local t = {} 1108 for name in pairs(map_type) do t[#t+1] = name end 1109 sort(t) 1110 out:write("Type definitions:\n") 1111 for _,name in ipairs(t) do 1112 local tp = map_type[name] 1113 local reg = tp.reg or "" 1114 out:write(format(" %-20s %-20s %s\n", name, tp.ctype, reg)) 1115 end 1116 out:write("\n") 1117end 1118 1119------------------------------------------------------------------------------ 1120 1121-- Set the current section. 1122function _M.section(num) 1123 waction("SECTION", num) 1124 wflush(true) -- SECTION is a terminal action. 1125end 1126 1127------------------------------------------------------------------------------ 1128 1129-- Dump architecture description. 1130function _M.dumparch(out) 1131 out:write(format("DynASM %s version %s, released %s\n\n", 1132 _info.arch, _info.version, _info.release)) 1133 dumpactions(out) 1134end 1135 1136-- Dump all user defined elements. 1137function _M.dumpdef(out, lvl) 1138 dumptypes(out, lvl) 1139 dumpglobals(out, lvl) 1140 dumpexterns(out, lvl) 1141end 1142 1143------------------------------------------------------------------------------ 1144 1145-- Pass callbacks from/to the DynASM core. 1146function _M.passcb(wl, we, wf, ww) 1147 wline, werror, wfatal, wwarn = wl, we, wf, ww 1148 return wflush 1149end 1150 1151-- Setup the arch-specific module. 1152function _M.setup(arch, opt) 1153 g_arch, g_opt = arch, opt 1154end 1155 1156-- Merge the core maps and the arch-specific maps. 1157function _M.mergemaps(map_coreop, map_def) 1158 setmetatable(map_op, { __index = map_coreop }) 1159 setmetatable(map_def, { __index = map_archdef }) 1160 return map_op, map_def 1161end 1162 1163return _M 1164 1165------------------------------------------------------------------------------ 1166 1167