Skip to content

ARM:ASTI: add lifting support for LDMIB #219

New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Merged
merged 1 commit into from
May 2, 2025
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion chb/app/CHVersion.py
Original file line number Diff line number Diff line change
@@ -1 +1 @@
chbversion: str = "0.3.0-20250420"
chbversion: str = "0.3.0-20250502"
323 changes: 309 additions & 14 deletions chb/arm/opcodes/ARMLoadMultipleIncrementBefore.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
# ------------------------------------------------------------------------------
# The MIT License (MIT)
#
# Copyright (c) 2021-2023 Aarno Labs LLC
# Copyright (c) 2021-2025 Aarno Labs LLC
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
Expand All @@ -25,27 +25,187 @@
# SOFTWARE.
# ------------------------------------------------------------------------------

from typing import List, TYPE_CHECKING
from typing import Iterable, List, Tuple, TYPE_CHECKING

from chb.app.InstrXData import InstrXData

from chb.arm.ARMDictionaryRecord import armregistry
from chb.arm.ARMOpcode import ARMOpcode, simplify_result
from chb.arm.ARMOpcode import ARMOpcode, ARMOpcodeXData, simplify_result
from chb.arm.ARMOperand import ARMOperand

import chb.util.fileutil as UF
import chb.ast.ASTNode as AST
from chb.astinterface.ASTInterface import ASTInterface

import chb.invariants.XXprUtil as XU

import chb.util.fileutil as UF
from chb.util.IndexedTable import IndexedTableValue
from chb.util.loggingutil import chklogger

if TYPE_CHECKING:
from chb.arm.ARMDictionary import ARMDictionary
from chb.invariants.XVariable import XVariable
from chb.invariants.XXpr import XXpr


class ARMLoadMultipleIncrementBeforeXData(ARMOpcodeXData):
"""Data format:
- variables:
0: baselhs
1..n: lhsvars

- expressions:
0: baserhs
1..n: memrhss
n+1..2n: rmemrhss (memrhss, rewritten)
2n+1..3n: xaddrs

- c expressions:
0..n-1: cmemrhss
"""

def __init__(self, xdata: InstrXData) -> None:
ARMOpcodeXData.__init__(self, xdata)

@property
def regcount(self) -> int:
return len(self.xdata.vars_r) - 1

def has_index(self, index: int) -> bool:
"""returns true if index is between 1 and regcount (inclusive)."""

return index > 0 and index <= self.regcount

@property
def memrhs_range(self) -> Iterable[int]:
return range(1, self.regcount + 1)

@property
def rmemrhs_range(self) -> Iterable[int]:
return range(self.regcount + 1, (2 * self.regcount) + 1)

@property
def xaddr_range(self) -> Iterable[int]:
return range((2 * self.regcount) + 1, (3 * self.regcount) + 1)

@property
def baselhs(self) -> "XVariable":
return self.var(0, "baselhs")

@property
def lhsvars(self) -> List["XVariable"]:
return [self.var(i, "lhsvar") for i in range(1, self.regcount + 1)]

def lhsvar(self, index: int) -> "XVariable":
"""returns the lhsvar at (1-based) position index"""

if self.has_index(index):
return self.lhsvars[index]
else:
raise UF.CHBError("LDMIB: index out of bounds: " + str(index))

@property
def baserhs(self) -> "XXpr":
return self.xpr(0, "baserhs")

@property
def memrhss(self) -> List["XXpr"]:
return [self.xpr(i, "memrhs") for i in self.memrhs_range]

@property
def are_memrhss_ok(self) -> bool:
return all(self.is_xpr_ok(i) for i in self.memrhs_range)

def memrhs(self, index) -> "XXpr":
"""returns the rhs expression at (1-based) position index"""

if self.has_index(index):
if self.are_memrhss_ok:
return self.memrhss[index - 1]
else:
raise UF.CHBError("LDMIB: memrhss have error values")
else:
raise UF.CHBError("LDMIB: index out of bounds for memrhs")

@property
def rmemrhss(self) -> List["XXpr"]:
return [self.xpr(i, "rmemrhs") for i in self.rmemrhs_range]

@property
def are_rmemrhss_ok(self) -> bool:
return all(self.is_xpr_ok(i) for i in self.rmemrhs_range)

def rmemrhs(self, index) -> "XXpr":
"""returns the rewritten rhs expr at (1-based) position index"""

if self.has_index(index):
if self.are_rmemrhss_ok:
return self.rmemrhss[index - 1]
else:
raise UF.CHBError("LDMIB: rmemrhss have error values")
else:
raise UF.CHBError("LDMIB: index out of bounds for rmemrhs")

@property
def xaddrs(self) -> List["XXpr"]:
return [self.xpr(i, "xaddr") for i in self.xaddr_range]

@property
def are_xaddrs_ok(self) -> bool:
return all(self.is_xpr_ok(i) for i in self.xaddr_range)

def xaddr(self, index) -> "XXpr":
"""returns the rhs addr at (1-based) position index"""

if self.has_index(index):
if self.are_xaddrs_ok:
return self.xaddrs[index - 1]
else:
raise UF.CHBError("LDMIB: xaddrs have error values")
else:
raise UF.CHBError("LDMIB: index out of bounds for xaddr")

@property
def cmemrhss(self) -> List["XXpr"]:
return [self.cxpr(i, "cmemrhs") for i in range(0, self.regcount)]

@property
def are_cmemrhss_ok(self) -> bool:
return all(self.is_cxpr_ok(i) for i in range(0, self.regcount))

def cmemrhs(self, index) -> "XXpr":
"""returns the rhs addr at (1-based) position index"""

if self.has_index(index):
if self.are_cmemrhss_ok:
return self.cmemrhss[index - 1]
else:
raise UF.CHBError("LDMIB: cmemrhss have error values")
else:
raise UF.CHBError("LDMIB: index out of bounds cmemrhs")

@property
def annotation(self) -> str:
if self.are_rmemrhss_ok:
pairs = list(zip(self.lhsvars, self.rmemrhss))
elif self.are_memrhss_ok:
pairs = list(zip(self.lhsvars, self.memrhss))
else:
pairs = []
if len(pairs) > 0:
assigns = "; ".join(str(v) + " := " + str(x) for (x, v) in pairs)
else:
assigns = "unknown rhs memory"
wbu = self.writeback_update()
return self.add_instruction_condition(assigns + wbu)



@armregistry.register_tag("LDMIB", ARMOpcode)
class ARMLoadMultipleIncrementBefore(ARMOpcode):
"""Loads multiple registers from consecutive memory locations.

LDMDB<c> <Rn>, <registers>
LDMIB<c> <Rn>, <registers>

tags[1]: <c>
args[0]: writeback
Expand All @@ -63,19 +223,154 @@ def __init__(

@property
def operands(self) -> List[ARMOperand]:
return [self.armd.arm_operand(i) for i in self.args[1:-1]]
return [self.armd.arm_operand(i) for i in self.args[1:]]

@property
def opargs(self) -> List[ARMOperand]:
return [self.armd.arm_operand(i) for i in self.args[1:]]

@property
def operandstring(self) -> str:
return (
str(self.armd.arm_operand(self.args[1]))
+ ("!" if self.args[0] == 1 else "")
+ ", "
+ str(self.armd.arm_operand(self.args[2])))

@property
def writeback(self) -> bool:
return self.args[0] == 1

def is_load_instruction(self, xdata: InstrXData) -> bool:
return True

def annotation(self, xdata: InstrXData) -> str:
"""xdata format: a:v..x.. .
xd = ARMLoadMultipleIncrementBeforeXData(xdata)
return xd.annotation

vars[0..]: lhs variables
xprs[0..]: rhs expressions
"""
def ast_prov(
self,
astree: ASTInterface,
iaddr: str,
bytestring: str,
xdata: InstrXData) -> Tuple[
List[AST.ASTInstruction], List[AST.ASTInstruction]]:

return (
'; '.join(str(v)
+ " := "
+ str(x) for (v, x) in zip(xdata.vars, xdata.xprs)))
xd = ARMLoadMultipleIncrementBeforeXData(xdata)

if xd.are_cmemrhss_ok:
rhsexprs = xd.cmemrhss
elif xd.are_rmemrhss_ok:
rhsexprs = xd.rmemrhss
elif xd.are_memrhss_ok:
rhsexprs = xd.memrhss

else:
chklogger.logger.error(
"LDMIB: Error value encountered at address %s", iaddr)
return ([], [])

baselhs = xd.baselhs
lhsvars = xd.lhsvars
baserhs = xd.baserhs

baserdef = xdata.reachingdefs[0]
memrdefs = xdata.reachingdefs[1:]
baseuses = xdata.defuses[0]
reguses = xdata.defuses[1:]
baseuseshigh = xdata.defuseshigh[0]
reguseshigh = xdata.defuseshigh[1:]

annotations: List[str] = [iaddr, "LDMIB"]

ll_instrs: List[AST.ASTInstruction] = []
hl_instrs: List[AST.ASTInstruction] = []

# low-level assignments

(baselval, _, _) = self.opargs[0].ast_lvalue(astree)
(baserval, _, _) = self.opargs[0].ast_rvalue(astree)

regsop = self.opargs[1]
registers = regsop.registers
base_offset = 0
for (i, r) in enumerate(registers):

# low-level assignments

base_offset += 4

base_offset_c = astree.mk_integer_constant(base_offset)
addr = astree.mk_binary_op("plus", baserval, base_offset_c)
ll_lhs = astree.mk_variable_lval(r)
ll_rhs = astree.mk_memref_expr(addr)
ll_assign = astree.mk_assign(
ll_lhs,
ll_rhs,
iaddr=iaddr,
bytestring=bytestring,
annotations=annotations)
ll_instrs.append(ll_assign)

# high-level assignments

lhs = lhsvars[i]
rhs = rhsexprs[i]
hl_lhs = XU.xvariable_to_ast_lval(lhs, xdata, iaddr, astree)
hl_rhs = XU.xxpr_to_ast_def_expr(rhs, xdata, iaddr, astree)
hl_assign = astree.mk_assign(
hl_lhs,
hl_rhs,
iaddr=iaddr,
bytestring=bytestring,
annotations=annotations)
hl_instrs.append(hl_assign)

astree.add_instr_mapping(hl_assign, ll_assign)
astree.add_instr_address(hl_assign, [iaddr])
astree.add_expr_mapping(hl_rhs, ll_rhs)
astree.add_lval_mapping(hl_lhs, ll_lhs)
astree.add_expr_reachingdefs(ll_rhs, [memrdefs[i]])
astree.add_lval_defuses(hl_lhs, reguses[i])
astree.add_lval_defuses_high(hl_lhs, reguseshigh[i])

if self.writeback:

# low-level base assignment

baseincr = 4 * xd.regcount
baseincr_c = astree.mk_integer_constant(baseincr)

ll_base_lhs = baselval
ll_base_rhs = astree.mk_binary_op("plus", baserval, baseincr_c)
ll_base_assign = astree.mk_assign(
ll_base_lhs,
ll_base_rhs,
iaddr=iaddr,
bytestring=bytestring,
annotations=annotations)
ll_instrs.append(ll_base_assign)

# high-level base assignment

baseresult = xd.get_base_update_xpr()
hl_base_lhs = XU.xvariable_to_ast_lval(baselhs, xdata, iaddr, astree)
hl_base_rhs = XU.xxpr_to_ast_def_expr(
baseresult, xdata, iaddr, astree)
hl_base_assign = astree.mk_assign(
hl_base_lhs,
hl_base_rhs,
iaddr=iaddr,
bytestring=bytestring,
annotations=annotations)
hl_instrs.append(hl_base_assign)

astree.add_instr_mapping(hl_base_assign, ll_base_assign)
astree.add_instr_address(hl_base_assign, [iaddr])
astree.add_expr_mapping(hl_base_rhs, ll_base_rhs)
astree.add_lval_mapping(hl_base_lhs, ll_base_lhs)
astree.add_expr_reachingdefs(ll_base_rhs, [baserdef])
astree.add_lval_defuses(hl_base_lhs, baseuses)
astree.add_lval_defuses_high(hl_base_lhs, baseuseshigh)

return (hl_instrs, ll_instrs)