diff options
-rw-r--r-- | dynasm/dasm_x86.lua | 34 |
1 files changed, 24 insertions, 10 deletions
diff --git a/dynasm/dasm_x86.lua b/dynasm/dasm_x86.lua index e7f894d6..c51b8c5d 100644 --- a/dynasm/dasm_x86.lua +++ b/dynasm/dasm_x86.lua | |||
@@ -258,6 +258,7 @@ local map_reg_num = {} -- Int. register name -> register number. | |||
258 | local map_reg_opsize = {} -- Int. register name -> operand size. | 258 | local map_reg_opsize = {} -- Int. register name -> operand size. |
259 | local map_reg_valid_base = {} -- Int. register name -> valid base register? | 259 | local map_reg_valid_base = {} -- Int. register name -> valid base register? |
260 | local map_reg_valid_index = {} -- Int. register name -> valid index register? | 260 | local map_reg_valid_index = {} -- Int. register name -> valid index register? |
261 | local map_reg_needrex = {} -- Int. register name -> need rex vs. no rex. | ||
261 | local reg_list = {} -- Canonical list of int. register names. | 262 | local reg_list = {} -- Canonical list of int. register names. |
262 | 263 | ||
263 | local map_type = {} -- Type name -> { ctype, reg } | 264 | local map_type = {} -- Type name -> { ctype, reg } |
@@ -285,6 +286,7 @@ local function mkrmap(sz, cl, names) | |||
285 | map_reg_rev[iname] = name | 286 | map_reg_rev[iname] = name |
286 | map_reg_num[iname] = n-1 | 287 | map_reg_num[iname] = n-1 |
287 | map_reg_opsize[iname] = sz | 288 | map_reg_opsize[iname] = sz |
289 | if sz == "b" and n > 4 then map_reg_needrex[iname] = false end | ||
288 | if sz == addrsize or sz == "d" then | 290 | if sz == addrsize or sz == "d" then |
289 | map_reg_valid_base[iname] = true | 291 | map_reg_valid_base[iname] = true |
290 | map_reg_valid_index[iname] = true | 292 | map_reg_valid_index[iname] = true |
@@ -292,7 +294,9 @@ local function mkrmap(sz, cl, names) | |||
292 | end | 294 | end |
293 | end | 295 | end |
294 | for i=0,(x64 and sz ~= "f") and 15 or 7 do | 296 | for i=0,(x64 and sz ~= "f") and 15 or 7 do |
295 | local iname = format("@%s%x", sz, i) | 297 | local needrex = sz == "b" and i > 3 |
298 | local iname = format("@%s%x%s", sz, i, needrex and "R" or "") | ||
299 | if needrex then map_reg_needrex[iname] = true end | ||
296 | local name | 300 | local name |
297 | if sz == "o" then name = format("xmm%d", i) | 301 | if sz == "o" then name = format("xmm%d", i) |
298 | elseif sz == "f" then name = format("st%d", i) | 302 | elseif sz == "f" then name = format("st%d", i) |
@@ -319,7 +323,6 @@ end | |||
319 | mkrmap("d", "Rd", {"eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"}) | 323 | mkrmap("d", "Rd", {"eax", "ecx", "edx", "ebx", "esp", "ebp", "esi", "edi"}) |
320 | mkrmap("w", "Rw", {"ax", "cx", "dx", "bx", "sp", "bp", "si", "di"}) | 324 | mkrmap("w", "Rw", {"ax", "cx", "dx", "bx", "sp", "bp", "si", "di"}) |
321 | mkrmap("b", "Rb", {"al", "cl", "dl", "bl", "ah", "ch", "dh", "bh"}) | 325 | mkrmap("b", "Rb", {"al", "cl", "dl", "bl", "ah", "ch", "dh", "bh"}) |
322 | -- !x64: ah, ch, dh, bh not valid with REX, r4b-r15b require REX | ||
323 | map_reg_valid_index[map_archdef.esp] = false | 326 | map_reg_valid_index[map_archdef.esp] = false |
324 | if x64 then map_reg_valid_index[map_archdef.rsp] = false end | 327 | if x64 then map_reg_valid_index[map_archdef.rsp] = false end |
325 | map_archdef["Ra"] = "@"..addrsize | 328 | map_archdef["Ra"] = "@"..addrsize |
@@ -467,7 +470,7 @@ local function wputop(sz, op, rex) | |||
467 | if rex ~= 0 then | 470 | if rex ~= 0 then |
468 | local opc3 = op - op % 256 | 471 | local opc3 = op - op % 256 |
469 | if opc3 == 0x0f3a00 or opc3 == 0x0f3800 then | 472 | if opc3 == 0x0f3a00 or opc3 == 0x0f3800 then |
470 | wputb(64 + rex % 15); rex = 0 | 473 | wputb(64 + rex % 16); rex = 0 |
471 | end | 474 | end |
472 | end | 475 | end |
473 | r = op % 65536 wputb((op-r) / 65536) op = r | 476 | r = op % 65536 wputb((op-r) / 65536) op = r |
@@ -475,11 +478,11 @@ local function wputop(sz, op, rex) | |||
475 | if op >= 256 then | 478 | if op >= 256 then |
476 | r = op % 256 | 479 | r = op % 256 |
477 | local b = (op-r) / 256 | 480 | local b = (op-r) / 256 |
478 | if b == 15 and rex ~= 0 then wputb(64 + rex % 15); rex = 0 end | 481 | if b == 15 and rex ~= 0 then wputb(64 + rex % 16); rex = 0 end |
479 | wputb(b) | 482 | wputb(b) |
480 | op = r | 483 | op = r |
481 | end | 484 | end |
482 | if rex ~= 0 then wputb(64 + rex % 15) end | 485 | if rex ~= 0 then wputb(64 + rex % 16) end |
483 | if sz == "b" then op = op - 1 end | 486 | if sz == "b" then op = op - 1 end |
484 | wputb(op) | 487 | wputb(op) |
485 | end | 488 | end |
@@ -801,6 +804,7 @@ local function parseoperand(param) | |||
801 | end | 804 | end |
802 | t.mode = t.reg == 0 and "rmR" or (reg == "@b1" and "rmC" or "rm") | 805 | t.mode = t.reg == 0 and "rmR" or (reg == "@b1" and "rmC" or "rm") |
803 | end | 806 | end |
807 | t.needrex = map_reg_needrex[reg] | ||
804 | break | 808 | break |
805 | end | 809 | end |
806 | 810 | ||
@@ -1461,7 +1465,7 @@ end | |||
1461 | ------------------------------------------------------------------------------ | 1465 | ------------------------------------------------------------------------------ |
1462 | 1466 | ||
1463 | -- Process pattern string. | 1467 | -- Process pattern string. |
1464 | local function dopattern(pat, args, sz, op) | 1468 | local function dopattern(pat, args, sz, op, needrex) |
1465 | local digit, addin | 1469 | local digit, addin |
1466 | local opcode = 0 | 1470 | local opcode = 0 |
1467 | local szov = sz | 1471 | local szov = sz |
@@ -1506,6 +1510,7 @@ local function dopattern(pat, args, sz, op) | |||
1506 | if t.reg and t.reg > 7 then rex = rex + 1 end | 1510 | if t.reg and t.reg > 7 then rex = rex + 1 end |
1507 | if t.xreg and t.xreg > 7 then rex = rex + 2 end | 1511 | if t.xreg and t.xreg > 7 then rex = rex + 2 end |
1508 | if s > 7 then rex = rex + 4 end | 1512 | if s > 7 then rex = rex + 4 end |
1513 | if needrex then rex = rex + 16 end | ||
1509 | wputop(szov, opcode, rex); opcode = nil | 1514 | wputop(szov, opcode, rex); opcode = nil |
1510 | local imark = sub(pat, -1) -- Force a mark (ugly). | 1515 | local imark = sub(pat, -1) -- Force a mark (ugly). |
1511 | -- Put ModRM/SIB with regno/last digit as spare. | 1516 | -- Put ModRM/SIB with regno/last digit as spare. |
@@ -1514,6 +1519,7 @@ local function dopattern(pat, args, sz, op) | |||
1514 | else | 1519 | else |
1515 | if opcode then -- Flush opcode. | 1520 | if opcode then -- Flush opcode. |
1516 | if szov == "q" and rex == 0 then rex = rex + 8 end | 1521 | if szov == "q" and rex == 0 then rex = rex + 8 end |
1522 | if needrex then rex = rex + 16 end | ||
1517 | if addin and addin.reg == -1 then | 1523 | if addin and addin.reg == -1 then |
1518 | wputop(szov, opcode + 1, rex) | 1524 | wputop(szov, opcode + 1, rex) |
1519 | waction("VREG", addin.vreg); wputxb(0) | 1525 | waction("VREG", addin.vreg); wputxb(0) |
@@ -1602,18 +1608,26 @@ map_op[".template__"] = function(params, template, nparams) | |||
1602 | 1608 | ||
1603 | -- Zero-operand opcodes have no match part. | 1609 | -- Zero-operand opcodes have no match part. |
1604 | if #params == 0 then | 1610 | if #params == 0 then |
1605 | dopattern(template, args, "d", params.op) | 1611 | dopattern(template, args, "d", params.op, nil) |
1606 | return | 1612 | return |
1607 | end | 1613 | end |
1608 | 1614 | ||
1609 | -- Determine common operand size (coerce undefined size) or flag as mixed. | 1615 | -- Determine common operand size (coerce undefined size) or flag as mixed. |
1610 | local sz, szmix | 1616 | local sz, szmix, needrex |
1611 | for i,p in ipairs(params) do | 1617 | for i,p in ipairs(params) do |
1612 | args[i] = parseoperand(p) | 1618 | args[i] = parseoperand(p) |
1613 | local nsz = args[i].opsize | 1619 | local nsz = args[i].opsize |
1614 | if nsz then | 1620 | if nsz then |
1615 | if sz and sz ~= nsz then szmix = true else sz = nsz end | 1621 | if sz and sz ~= nsz then szmix = true else sz = nsz end |
1616 | end | 1622 | end |
1623 | local nrex = args[i].needrex | ||
1624 | if nrex ~= nil then | ||
1625 | if needrex == nil then | ||
1626 | needrex = nrex | ||
1627 | elseif needrex ~= nrex then | ||
1628 | werror("bad mix of byte-addressable registers") | ||
1629 | end | ||
1630 | end | ||
1617 | end | 1631 | end |
1618 | 1632 | ||
1619 | -- Try all match:pattern pairs (separated by '|'). | 1633 | -- Try all match:pattern pairs (separated by '|'). |
@@ -1627,7 +1641,7 @@ map_op[".template__"] = function(params, template, nparams) | |||
1627 | if prefix == "/" then -- Match both operand sizes. | 1641 | if prefix == "/" then -- Match both operand sizes. |
1628 | if args[1].opsize == sub(szm, 2, 2) and | 1642 | if args[1].opsize == sub(szm, 2, 2) and |
1629 | args[2].opsize == sub(szm, 3, 3) then | 1643 | args[2].opsize == sub(szm, 3, 3) then |
1630 | dopattern(pat, args, sz, params.op) -- Process pattern string. | 1644 | dopattern(pat, args, sz, params.op, needrex) -- Process pattern. |
1631 | return | 1645 | return |
1632 | end | 1646 | end |
1633 | else -- Match common operand size. | 1647 | else -- Match common operand size. |
@@ -1636,7 +1650,7 @@ map_op[".template__"] = function(params, template, nparams) | |||
1636 | if prefix == "1" then szp = args[1].opsize; szmix = nil | 1650 | if prefix == "1" then szp = args[1].opsize; szmix = nil |
1637 | elseif prefix == "2" then szp = args[2].opsize; szmix = nil end | 1651 | elseif prefix == "2" then szp = args[2].opsize; szmix = nil end |
1638 | if not szmix and (prefix == "." or match(szm, szp or "#")) then | 1652 | if not szmix and (prefix == "." or match(szm, szp or "#")) then |
1639 | dopattern(pat, args, szp, params.op) -- Process pattern string. | 1653 | dopattern(pat, args, szp, params.op, needrex) -- Process pattern. |
1640 | return | 1654 | return |
1641 | end | 1655 | end |
1642 | end | 1656 | end |