mirror of
https://github.com/NationalSecurityAgency/ghidra.git
synced 2025-10-05 02:39:44 +02:00
963 lines
28 KiB
C++
963 lines
28 KiB
C++
/* ###
|
|
* IP: GHIDRA
|
|
*
|
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
|
* you may not use this file except in compliance with the License.
|
|
* You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
#include "address.hh"
|
|
#include "translate.hh"
|
|
|
|
namespace ghidra {
|
|
|
|
AttributeId ATTRIB_FIRST = AttributeId("first",27);
|
|
AttributeId ATTRIB_LAST = AttributeId("last",28);
|
|
AttributeId ATTRIB_UNIQ = AttributeId("uniq",29);
|
|
|
|
ElementId ELEM_ADDR = ElementId("addr",11);
|
|
ElementId ELEM_RANGE = ElementId("range",12);
|
|
ElementId ELEM_RANGELIST = ElementId("rangelist",13);
|
|
ElementId ELEM_REGISTER = ElementId("register",14);
|
|
ElementId ELEM_SEQNUM = ElementId("seqnum",15);
|
|
ElementId ELEM_VARNODE = ElementId("varnode",16);
|
|
|
|
ostream &operator<<(ostream &s,const SeqNum &sq)
|
|
|
|
{
|
|
sq.pc.printRaw(s);
|
|
s << ':' << sq.uniq;
|
|
return s;
|
|
}
|
|
|
|
/// This allows an Address to be written to a stream using
|
|
/// the standard '<<' operator. This is a wrapper for the
|
|
/// printRaw method and is intended for debugging and console
|
|
/// mode uses.
|
|
/// \param s is the stream being written to
|
|
/// \param addr is the Address to write
|
|
/// \return the output stream
|
|
ostream &operator<<(ostream &s,const Address &addr)
|
|
|
|
{
|
|
addr.printRaw(s);
|
|
return s;
|
|
}
|
|
|
|
SeqNum::SeqNum(Address::mach_extreme ex) : pc(ex)
|
|
|
|
{
|
|
uniq = (ex == Address::m_minimal) ? 0 : ~((uintm)0);
|
|
}
|
|
|
|
void SeqNum::encode(Encoder &encoder) const
|
|
|
|
{
|
|
encoder.openElement(ELEM_SEQNUM);
|
|
pc.getSpace()->encodeAttributes(encoder,pc.getOffset());
|
|
encoder.writeUnsignedInteger(ATTRIB_UNIQ, uniq);
|
|
encoder.closeElement(ELEM_SEQNUM);
|
|
}
|
|
|
|
SeqNum SeqNum::decode(Decoder &decoder)
|
|
|
|
{
|
|
uintm uniq = ~((uintm)0);
|
|
uint4 elemId = decoder.openElement(ELEM_SEQNUM);
|
|
Address pc = Address::decode(decoder); // Recover address
|
|
for(;;) {
|
|
uint4 attribId = decoder.getNextAttributeId();
|
|
if (attribId == 0) break;
|
|
if (attribId == ATTRIB_UNIQ) {
|
|
uniq = decoder.readUnsignedInteger();
|
|
break;
|
|
}
|
|
}
|
|
decoder.closeElement(elemId);
|
|
return SeqNum(pc,uniq);
|
|
}
|
|
|
|
/// Some data structures sort on an Address, and it is convenient
|
|
/// to be able to create an Address that is either bigger than
|
|
/// or smaller than all other Addresses.
|
|
/// \param ex is either \e m_minimal or \e m_maximal
|
|
Address::Address(mach_extreme ex)
|
|
|
|
{
|
|
if (ex == m_minimal) {
|
|
base = (AddrSpace *)0;
|
|
offset = 0;
|
|
}
|
|
else {
|
|
base = (AddrSpace *) ~((uintp)0);
|
|
offset = ~((uintb)0);
|
|
}
|
|
}
|
|
|
|
/// Return \b true if the range starting at \b this extending the given number of bytes
|
|
/// is contained by the second given range.
|
|
/// \param sz is the given number of bytes in \b this range
|
|
/// \param op2 is the start of the second given range
|
|
/// \param sz2 is the number of bytes in the second given range
|
|
/// \return \b true if the second given range contains \b this range
|
|
bool Address::containedBy(int4 sz,const Address &op2,int4 sz2) const
|
|
|
|
{
|
|
if (base != op2.base) return false;
|
|
if (op2.offset > offset) return false;
|
|
uintb off1 = offset + (sz-1);
|
|
uintb off2 = op2.offset + (sz2-1);
|
|
return (off2 >= off1);
|
|
}
|
|
|
|
/// Return -1 if (\e op2,\e sz2) is not properly contained in (\e this,\e sz).
|
|
/// If it is contained, return the endian aware offset of (\e op2,\e sz2)
|
|
/// I.e. if the least significant byte of the \e op2 range falls on the least significant
|
|
/// byte of the \e this range, return 0. If it intersects the second least significant, return 1, etc.
|
|
/// The -forceleft- toggle causes the check to be made against the left (lowest address) side
|
|
/// of the container, regardless of the endianness. I.e. it forces a little endian interpretation.
|
|
/// \param sz is the size of \e this range
|
|
/// \param op2 is the address of the second range
|
|
/// \param sz2 is the size of the second range
|
|
/// \param forceleft is \b true if containments is forced to be on the left even for big endian
|
|
/// \return the endian aware offset, or -1
|
|
int4 Address::justifiedContain(int4 sz,const Address &op2,int4 sz2,bool forceleft) const
|
|
|
|
{ if (base != op2.base) return -1;
|
|
if (op2.offset < offset) return -1;
|
|
uintb off1 = offset + (sz-1);
|
|
uintb off2 = op2.offset + (sz2-1);
|
|
if (off2 > off1) return -1;
|
|
if (base->isBigEndian()&&(!forceleft)) {
|
|
return (int4)(off1 - off2);
|
|
}
|
|
return (int4)(op2.offset - offset);
|
|
}
|
|
|
|
/// If \e this + \e skip falls in the range
|
|
/// \e op to \e op + \e size, then a non-negative integer is
|
|
/// returned indicating where in the interval it falls. I.e.
|
|
/// if \e this + \e skip == \e op, then 0 is returned. Otherwise
|
|
/// -1 is returned.
|
|
/// \param skip is an adjust to \e this address
|
|
/// \param op is the start of the range to check
|
|
/// \param size is the size of the range
|
|
/// \return an integer indicating how overlap occurs
|
|
int4 Address::overlap(int4 skip,const Address &op,int4 size) const
|
|
|
|
{
|
|
uintb dist;
|
|
|
|
if (base != op.base) return -1; // Must be in same address space to overlap
|
|
if (base->getType()==IPTR_CONSTANT) return -1; // Must not be constants
|
|
|
|
dist = base->wrapOffset(offset+skip-op.offset);
|
|
|
|
if (dist >= size) return -1; // but must fall before op+size
|
|
return (int4) dist;
|
|
}
|
|
|
|
/// Does the location \e this, \e sz form a contiguous region to \e loaddr, \e losz,
|
|
/// where \e this forms the most significant piece of the logical whole
|
|
/// \param sz is the size of \e this hi region
|
|
/// \param loaddr is the starting address of the low region
|
|
/// \param losz is the size of the low region
|
|
/// \return \b true if the pieces form a contiguous whole
|
|
bool Address::isContiguous(int4 sz,const Address &loaddr,int4 losz) const
|
|
|
|
{
|
|
if (base != loaddr.base) return false;
|
|
if (base->isBigEndian()) {
|
|
uintb nextoff = base->wrapOffset(offset+sz);
|
|
if (nextoff == loaddr.offset) return true;
|
|
}
|
|
else {
|
|
uintb nextoff = base->wrapOffset(loaddr.offset+losz);
|
|
if (nextoff == offset) return true;
|
|
}
|
|
return false;
|
|
}
|
|
|
|
/// If \b this is (originally) a \e join address, reevaluate it in terms of its new
|
|
/// \e offset and \e size, changing the space and offset if necessary.
|
|
/// \param size is the new size in bytes of the underlying object
|
|
void Address::renormalize(int4 size) {
|
|
if (base->getType() == IPTR_JOIN)
|
|
base->getManager()->renormalizeJoinAddress(*this,size);
|
|
}
|
|
|
|
/// This is usually used to decode an address from an \b \<addr\>
|
|
/// element, but any element can be used if it has the appropriate attributes
|
|
/// - \e space indicates the address space of the tag
|
|
/// - \e offset indicates the offset within the space
|
|
///
|
|
/// or a \e name attribute can be used to recover an address
|
|
/// based on a register name.
|
|
/// \param decoder is the stream decoder
|
|
/// \return the resulting Address
|
|
Address Address::decode(Decoder &decoder)
|
|
|
|
{
|
|
VarnodeData var;
|
|
|
|
var.decode(decoder);
|
|
return Address(var.space,var.offset);
|
|
}
|
|
|
|
/// This is usually used to decode an address from an \b \<addr\>
|
|
/// element, but any element can be used if it has the appropriate attributes
|
|
/// - \e space indicates the address space of the tag
|
|
/// - \e offset indicates the offset within the space
|
|
/// - \e size indicates the size of an address range
|
|
///
|
|
/// or a \e name attribute can be used to recover an address
|
|
/// and size based on a register name. If a size is recovered
|
|
/// it is stored in \e size reference.
|
|
/// \param decoder is the stream decoder
|
|
/// \param size is the reference to any recovered size
|
|
/// \return the resulting Address
|
|
Address Address::decode(Decoder &decoder,int4 &size)
|
|
|
|
{
|
|
VarnodeData var;
|
|
|
|
var.decode(decoder);
|
|
size = var.size;
|
|
return Address(var.space,var.offset);
|
|
}
|
|
|
|
Range::Range(const RangeProperties &properties,const AddrSpaceManager *manage)
|
|
|
|
{
|
|
if (properties.isRegister) {
|
|
const Translate *trans = manage->getDefaultCodeSpace()->getTrans();
|
|
const VarnodeData &point(trans->getRegister(properties.spaceName));
|
|
spc = point.space;
|
|
first = point.offset;
|
|
last = (first-1) + point.size;
|
|
return;
|
|
}
|
|
spc = manage->getSpaceByName(properties.spaceName);
|
|
if (spc == (AddrSpace *)0)
|
|
throw LowlevelError("Undefined space: "+properties.spaceName);
|
|
|
|
if (spc == (AddrSpace *)0)
|
|
throw LowlevelError("No address space indicated in range tag");
|
|
first = properties.first;
|
|
last = properties.last;
|
|
if (!properties.seenLast) {
|
|
last = spc->getHighest();
|
|
}
|
|
if (first > spc->getHighest() || last > spc->getHighest() || last < first)
|
|
throw LowlevelError("Illegal range tag");
|
|
}
|
|
|
|
/// Get the last address +1, updating the space, or returning
|
|
/// the extremal address if necessary
|
|
/// \param manage is used to fetch the next address space
|
|
Address Range::getLastAddrOpen(const AddrSpaceManager *manage) const
|
|
|
|
{
|
|
AddrSpace *curspc = spc;
|
|
uintb curlast = last;
|
|
if (curlast == curspc->getHighest()) {
|
|
curspc = manage->getNextSpaceInOrder(curspc);
|
|
curlast = 0;
|
|
}
|
|
else
|
|
curlast += 1;
|
|
if (curspc == (AddrSpace *)0)
|
|
return Address(Address::m_maximal);
|
|
return Address(curspc,curlast);
|
|
}
|
|
|
|
/// Output a description of this Range like: ram: 7f-9c
|
|
/// \param s is the output stream
|
|
void Range::printBounds(ostream &s) const
|
|
|
|
{
|
|
s << spc->getName() << ": ";
|
|
s << hex << first << '-' << last;
|
|
}
|
|
|
|
/// Encode \b this to a stream as a \<range> element.
|
|
/// \param encoder is the stream encoder
|
|
void Range::encode(Encoder &encoder) const
|
|
|
|
{
|
|
encoder.openElement(ELEM_RANGE);
|
|
encoder.writeSpace(ATTRIB_SPACE, spc);
|
|
encoder.writeUnsignedInteger(ATTRIB_FIRST, first);
|
|
encoder.writeUnsignedInteger(ATTRIB_LAST, last);
|
|
encoder.closeElement(ELEM_RANGE);
|
|
}
|
|
|
|
/// Reconstruct this object from a \<range> or \<register> element
|
|
/// \param decoder is the stream decoder
|
|
void Range::decode(Decoder &decoder)
|
|
|
|
{
|
|
uint4 elemId = decoder.openElement();
|
|
if (elemId != ELEM_RANGE && elemId != ELEM_REGISTER)
|
|
throw DecoderError("Expecting <range> or <register> element");
|
|
decodeFromAttributes(decoder);
|
|
decoder.closeElement(elemId);
|
|
}
|
|
|
|
/// Reconstruct from attributes that may not be part of a \<range> element.
|
|
/// \param decoder is the stream decoder
|
|
void Range::decodeFromAttributes(Decoder &decoder)
|
|
|
|
{
|
|
spc = (AddrSpace *)0;
|
|
bool seenLast = false;
|
|
first = 0;
|
|
last = 0;
|
|
for(;;) {
|
|
uint4 attribId = decoder.getNextAttributeId();
|
|
if (attribId == 0) break;
|
|
if (attribId == ATTRIB_SPACE) {
|
|
spc = decoder.readSpace();
|
|
}
|
|
else if (attribId == ATTRIB_FIRST) {
|
|
first = decoder.readUnsignedInteger();
|
|
}
|
|
else if (attribId == ATTRIB_LAST) {
|
|
last = decoder.readUnsignedInteger();
|
|
seenLast = true;
|
|
}
|
|
else if (attribId == ATTRIB_NAME) {
|
|
const Translate *trans = decoder.getAddrSpaceManager()->getDefaultCodeSpace()->getTrans();
|
|
const VarnodeData &point(trans->getRegister(decoder.readString()));
|
|
spc = point.space;
|
|
first = point.offset;
|
|
last = (first-1) + point.size;
|
|
return; // There should be no (space,first,last) attributes
|
|
}
|
|
}
|
|
if (spc == (AddrSpace *)0)
|
|
throw LowlevelError("No address space indicated in range tag");
|
|
if (!seenLast) {
|
|
last = spc->getHighest();
|
|
}
|
|
if (first > spc->getHighest() || last > spc->getHighest() || last < first)
|
|
throw LowlevelError("Illegal range tag");
|
|
}
|
|
|
|
void RangeProperties::decode(Decoder &decoder)
|
|
|
|
{
|
|
uint4 elemId = decoder.openElement();
|
|
if (elemId != ELEM_RANGE && elemId != ELEM_REGISTER)
|
|
throw DecoderError("Expecting <range> or <register> element");
|
|
for(;;) {
|
|
uint4 attribId = decoder.getNextAttributeId();
|
|
if (attribId == 0) break;
|
|
if (attribId == ATTRIB_SPACE)
|
|
spaceName = decoder.readString();
|
|
else if (attribId == ATTRIB_FIRST)
|
|
first = decoder.readUnsignedInteger();
|
|
else if (attribId == ATTRIB_LAST) {
|
|
last = decoder.readUnsignedInteger();
|
|
seenLast = true;
|
|
}
|
|
else if (attribId == ATTRIB_NAME) {
|
|
spaceName = decoder.readString();
|
|
isRegister = true;
|
|
}
|
|
}
|
|
decoder.closeElement(elemId);
|
|
}
|
|
|
|
/// Insert a new Range merging as appropriate to maintain the disjoint cover
|
|
/// \param spc is the address space containing the new range
|
|
/// \param first is the offset of the first byte in the new range
|
|
/// \param last is the offset of the last byte in the new range
|
|
void RangeList::insertRange(AddrSpace *spc,uintb first,uintb last)
|
|
|
|
{
|
|
set<Range>::iterator iter1,iter2;
|
|
|
|
// we must have iter1.first > first
|
|
iter1 = tree.upper_bound(Range(spc,first,first));
|
|
|
|
// Set iter1 to first range with range.last >=first
|
|
// It is either current iter1 or the one before
|
|
if (iter1 != tree.begin()) {
|
|
--iter1;
|
|
if (((*iter1).spc!=spc)||((*iter1).last < first))
|
|
++iter1;
|
|
}
|
|
|
|
// Set iter2 to first range with range.first > last
|
|
iter2 = tree.upper_bound(Range(spc,last,last));
|
|
|
|
while(iter1!=iter2) {
|
|
if ((*iter1).first < first)
|
|
first = (*iter1).first;
|
|
if ((*iter1).last > last)
|
|
last = (*iter1).last;
|
|
tree.erase(iter1++);
|
|
}
|
|
tree.insert(Range(spc,first,last));
|
|
}
|
|
|
|
/// Remove/narrow/split existing Range objects to eliminate the indicated addresses
|
|
/// while still maintaining a disjoint cover.
|
|
/// \param spc is the address space of the address range to remove
|
|
/// \param first is the offset of the first byte of the range
|
|
/// \param last is the offset of the last byte of the range
|
|
void RangeList::removeRange(AddrSpace *spc,uintb first,uintb last)
|
|
|
|
{ // remove a range
|
|
set<Range>::iterator iter1,iter2;
|
|
|
|
if (tree.empty()) return; // Nothing to do
|
|
|
|
// we must have iter1.first > first
|
|
iter1 = tree.upper_bound(Range(spc,first,first));
|
|
|
|
// Set iter1 to first range with range.last >=first
|
|
// It is either current iter1 or the one before
|
|
if (iter1 != tree.begin()) {
|
|
--iter1;
|
|
if (((*iter1).spc!=spc)||((*iter1).last < first))
|
|
++iter1;
|
|
}
|
|
|
|
// Set iter2 to first range with range.first > last
|
|
iter2 = tree.upper_bound(Range(spc,last,last));
|
|
|
|
while(iter1!=iter2) {
|
|
uintb a,b;
|
|
|
|
a = (*iter1).first;
|
|
b = (*iter1).last;
|
|
tree.erase(iter1++);
|
|
if (a <first)
|
|
tree.insert(Range(spc,a,first-1));
|
|
if (b > last)
|
|
tree.insert(Range(spc,last+1,b));
|
|
}
|
|
}
|
|
|
|
void RangeList::merge(const RangeList &op2)
|
|
|
|
{ // Merge -op2- into this rangelist
|
|
set<Range>::const_iterator iter1,iter2;
|
|
iter1 = op2.tree.begin();
|
|
iter2 = op2.tree.end();
|
|
while(iter1 != iter2) {
|
|
const Range &range( *iter1 );
|
|
++iter1;
|
|
insertRange(range.spc, range.first, range.last);
|
|
}
|
|
}
|
|
|
|
/// Make sure indicated range of addresses is \e contained in \b this RangeList
|
|
/// \param addr is the first Address in the target range
|
|
/// \param size is the number of bytes in the target range
|
|
/// \return \b true is the range is fully contained by this RangeList
|
|
bool RangeList::inRange(const Address &addr,int4 size) const
|
|
|
|
{
|
|
set<Range>::const_iterator iter;
|
|
|
|
if (addr.isInvalid()) return true; // We don't really care
|
|
if (tree.empty()) return false;
|
|
|
|
// iter = first range with its first > addr
|
|
iter = tree.upper_bound(Range(addr.getSpace(),addr.getOffset(),addr.getOffset()));
|
|
if (iter == tree.begin()) return false;
|
|
// Set iter to last range with range.first <= addr
|
|
--iter;
|
|
// if (iter == tree.end()) // iter can't be end if non-empty
|
|
// return false;
|
|
if ((*iter).spc != addr.getSpace()) return false;
|
|
if ((*iter).last >= addr.getOffset()+size-1)
|
|
return true;
|
|
return false;
|
|
}
|
|
|
|
/// If \b this RangeList contains the specific address (spaceid,offset), return it
|
|
/// \return the containing Range or NULL
|
|
const Range *RangeList::getRange(AddrSpace *spaceid,uintb offset) const
|
|
|
|
{
|
|
if (tree.empty()) return (const Range *)0;
|
|
|
|
// iter = first range with its first > offset
|
|
set<Range>::const_iterator iter = tree.upper_bound(Range(spaceid,offset,offset));
|
|
if (iter == tree.begin()) return (const Range *)0;
|
|
// Set iter to last range with range.first <= offset
|
|
--iter;
|
|
if ((*iter).spc != spaceid) return (const Range *)0;
|
|
if ((*iter).last >= offset)
|
|
return &(*iter);
|
|
return (const Range *)0;
|
|
}
|
|
|
|
/// Return the size of the biggest contiguous sequence of addresses in
|
|
/// \b this RangeList which contain the given address
|
|
/// \param addr is the given address
|
|
/// \param maxsize is the large range to consider before giving up
|
|
/// \return the size (in bytes) of the biggest range
|
|
uintb RangeList::longestFit(const Address &addr,uintb maxsize) const
|
|
|
|
{
|
|
set<Range>::const_iterator iter;
|
|
|
|
if (addr.isInvalid()) return 0;
|
|
if (tree.empty()) return 0;
|
|
|
|
// iter = first range with its first > addr
|
|
uintb offset = addr.getOffset();
|
|
iter = tree.upper_bound(Range(addr.getSpace(),offset,offset));
|
|
if (iter == tree.begin()) return 0;
|
|
// Set iter to last range with range.first <= addr
|
|
--iter;
|
|
uintb sizeres = 0;
|
|
if ((*iter).last < offset) return sizeres;
|
|
do {
|
|
if ((*iter).spc != addr.getSpace()) break;
|
|
if ((*iter).first > offset) break;
|
|
sizeres += ((*iter).last + 1 - offset); // Size extends to end of range
|
|
offset = (*iter).last + 1; // Try to chain on the next range
|
|
if (sizeres >= maxsize) break; // Don't bother if past maxsize
|
|
++iter; // Next range in the chain
|
|
} while(iter != tree.end());
|
|
return sizeres;
|
|
}
|
|
|
|
/// \return the first contiguous range of addresses or NULL if empty
|
|
const Range *RangeList::getFirstRange(void) const
|
|
|
|
{
|
|
if (tree.empty()) return (const Range *)0;
|
|
return &(*tree.begin());
|
|
}
|
|
|
|
/// \return the last contiguous range of addresses or NULL if empty
|
|
const Range *RangeList::getLastRange(void) const
|
|
|
|
{
|
|
if (tree.empty()) return (const Range *)0;
|
|
set<Range>::const_iterator iter = tree.end();
|
|
--iter;
|
|
return &(*iter);
|
|
}
|
|
|
|
/// Treating offsets with their high-bits set as coming \e before
|
|
/// offset where the high-bit is clear, return the last/latest contiguous
|
|
/// Range within the given address space
|
|
/// \param spaceid is the given address space
|
|
/// \return indicated Range or NULL if empty
|
|
const Range *RangeList::getLastSignedRange(AddrSpace *spaceid) const
|
|
|
|
{
|
|
uintb midway = spaceid->getHighest() / 2; // Maximal signed value
|
|
Range range(spaceid,midway,midway);
|
|
set<Range>::const_iterator iter = tree.upper_bound(range); // First element greater than -range- (should be MOST negative)
|
|
|
|
if (iter!=tree.begin()) {
|
|
--iter;
|
|
if ((*iter).getSpace() == spaceid)
|
|
return &(*iter);
|
|
}
|
|
|
|
// If there were no "positive" ranges, search for biggest negative range
|
|
range = Range(spaceid,spaceid->getHighest(),spaceid->getHighest());
|
|
iter = tree.upper_bound(range);
|
|
if (iter != tree.begin()) {
|
|
--iter;
|
|
if ((*iter).getSpace() == spaceid)
|
|
return &(*iter);
|
|
}
|
|
return (const Range *)0;
|
|
}
|
|
|
|
/// Print a one line description of each disjoint Range making up \b this RangeList
|
|
/// \param s is the output stream
|
|
void RangeList::printBounds(ostream &s) const
|
|
|
|
{
|
|
if (tree.empty())
|
|
s << "all" << endl;
|
|
else {
|
|
set<Range>::const_iterator iter;
|
|
for(iter=tree.begin();iter!=tree.end();++iter) {
|
|
(*iter).printBounds(s);
|
|
s << endl;
|
|
}
|
|
}
|
|
}
|
|
|
|
/// Encode \b this as a \<rangelist> element
|
|
/// \param encoder is the stream encoder
|
|
void RangeList::encode(Encoder &encoder) const
|
|
|
|
{
|
|
set<Range>::const_iterator iter;
|
|
|
|
encoder.openElement(ELEM_RANGELIST);
|
|
for(iter=tree.begin();iter!=tree.end();++iter) {
|
|
(*iter).encode(encoder);
|
|
}
|
|
encoder.closeElement(ELEM_RANGELIST);
|
|
}
|
|
|
|
/// Recover each individual disjoint Range for \b this RangeList.
|
|
/// \param decoder is the stream decoder
|
|
void RangeList::decode(Decoder &decoder)
|
|
|
|
{
|
|
uint4 elemId = decoder.openElement(ELEM_RANGELIST);
|
|
while(decoder.peekElement() != 0) {
|
|
Range range;
|
|
range.decode(decoder);
|
|
tree.insert(range);
|
|
}
|
|
decoder.closeElement(elemId);
|
|
}
|
|
|
|
#ifdef UINTB4
|
|
uintb uintbmasks[9] = { 0, 0xff, 0xffff, 0xffffff, 0xffffffff, 0xffffffff, 0xffffffff, 0xffffffff, 0xffffffff };
|
|
#else
|
|
uintb uintbmasks[9] = { 0, 0xff, 0xffff, 0xffffff, 0xffffffff, 0xffffffffffLL,
|
|
0xffffffffffffLL, 0xffffffffffffffLL, 0xffffffffffffffffLL };
|
|
#endif
|
|
|
|
/// Treat the given \b val as a constant of \b size bytes
|
|
/// \param val is the given value
|
|
/// \param size is the size in bytes
|
|
/// \return \b true if the constant (as sized) has its sign bit set
|
|
bool signbit_negative(uintb val,int4 size)
|
|
|
|
{ // Return true if signbit is set (negative)
|
|
uintb mask = 0x80;
|
|
mask <<= 8*(size-1);
|
|
return ((val&mask) != 0);
|
|
}
|
|
|
|
/// Treat the given \b in as a constant of \b size bytes.
|
|
/// Negate this constant keeping the upper bytes zero.
|
|
/// \param in is the given value
|
|
/// \param size is the size in bytes
|
|
/// \return the negation of the sized constant
|
|
uintb uintb_negate(uintb in,int4 size)
|
|
|
|
{ // Invert bits
|
|
return ((~in)&calc_mask(size));
|
|
}
|
|
|
|
/// Take the first \b sizein bytes of the given \b in and sign-extend
|
|
/// this to \b sizeout bytes, keeping any more significant bytes zero
|
|
/// \param in is the given value
|
|
/// \param sizein is the size to treat that value as an input
|
|
/// \param sizeout is the size to sign-extend the value to
|
|
/// \return the sign-extended value
|
|
uintb sign_extend(uintb in,int4 sizein,int4 sizeout)
|
|
|
|
{
|
|
intb sval = in;
|
|
sval <<= (sizeof(intb) - sizein) * 8;
|
|
uintb res = (uintb)(sval >> (sizeout - sizein) * 8);
|
|
res >>= (sizeof(uintb) - sizeout)*8;
|
|
return res;
|
|
}
|
|
|
|
/// Swap the least significant \b size bytes in \b val
|
|
/// \param val is a reference to the value to swap
|
|
/// \param size is the number of bytes to swap
|
|
void byte_swap(intb &val,int4 size)
|
|
|
|
{
|
|
intb res = 0;
|
|
while(size>0) {
|
|
res <<= 8;
|
|
res |= (val&0xff);
|
|
val >>= 8;
|
|
size -= 1;
|
|
}
|
|
val = res;
|
|
}
|
|
|
|
/// Swap the least significant \b size bytes in \b val
|
|
/// \param val is the value to swap
|
|
/// \param size is the number of bytes to swap
|
|
/// \return the swapped value
|
|
uintb byte_swap(uintb val,int4 size)
|
|
|
|
{
|
|
uintb res=0;
|
|
while(size>0) {
|
|
res <<= 8;
|
|
res |= (val&0xff);
|
|
val >>= 8;
|
|
size -= 1;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
/// The least significant bit is index 0.
|
|
/// \param val is the given value
|
|
/// \return the index of the least significant set bit, or -1 if none are set
|
|
int4 leastsigbit_set(uintb val)
|
|
|
|
{
|
|
if (val==0) return -1;
|
|
int4 res = 0;
|
|
int4 sz = 4*sizeof(uintb);
|
|
uintb mask = ~((uintb)0);
|
|
do {
|
|
mask >>= sz;
|
|
if ((mask&val)==0) {
|
|
res += sz;
|
|
val >>= sz;
|
|
}
|
|
sz >>= 1;
|
|
} while(sz!=0);
|
|
return res;
|
|
}
|
|
|
|
/// The least significant bit is index 0.
|
|
/// \param val is the given value
|
|
/// \return the index of the most significant set bit, or -1 if none are set
|
|
int4 mostsigbit_set(uintb val)
|
|
|
|
{
|
|
if (val==0) return -1;
|
|
int4 res = 8*sizeof(uintb)-1;
|
|
int4 sz = 4*sizeof(uintb);
|
|
uintb mask = ~((uintb)0);
|
|
do {
|
|
mask <<= sz;
|
|
if ((mask&val)==0) {
|
|
res -= sz;
|
|
val <<= sz;
|
|
}
|
|
sz >>= 1;
|
|
} while(sz != 0);
|
|
return res;
|
|
}
|
|
|
|
/// Count the number (population) bits set.
|
|
/// \param val is the given value
|
|
/// \return the number of one bits
|
|
int4 popcount(uintb val)
|
|
|
|
{
|
|
val = (val & 0x5555555555555555L) + ((val >> 1) & 0x5555555555555555L);
|
|
val = (val & 0x3333333333333333L) + ((val >> 2) & 0x3333333333333333L);
|
|
val = (val & 0x0f0f0f0f0f0f0f0fL) + ((val >> 4) & 0x0f0f0f0f0f0f0f0fL);
|
|
val = (val & 0x00ff00ff00ff00ffL) + ((val >> 8) & 0x00ff00ff00ff00ffL);
|
|
val = (val & 0x0000ffff0000ffffL) + ((val >> 16) & 0x0000ffff0000ffffL);
|
|
int4 res = (int4)(val & 0xff);
|
|
res += (int4)((val >> 32) & 0xff);
|
|
return res;
|
|
}
|
|
|
|
/// Count the number of more significant zero bits before the most significant
|
|
/// one bit in the representation of the given value;
|
|
/// \param val is the given value
|
|
/// \return the number of zero bits
|
|
int4 count_leading_zeros(uintb val)
|
|
|
|
{
|
|
if (val == 0)
|
|
return 8*sizeof(uintb);
|
|
uintb mask = ~((uintb)0);
|
|
int4 maskSize = 4*sizeof(uintb);
|
|
mask &= (mask << maskSize);
|
|
int4 bit = 0;
|
|
|
|
do {
|
|
if ((mask & val)==0) {
|
|
bit += maskSize;
|
|
maskSize >>= 1;
|
|
mask |= (mask >> maskSize);
|
|
}
|
|
else {
|
|
maskSize >>= 1;
|
|
mask &= (mask << maskSize);
|
|
}
|
|
} while(maskSize != 0);
|
|
return bit;
|
|
}
|
|
|
|
/// Return smallest number of form 2^n-1, bigger or equal to the given value
|
|
/// \param val is the given value
|
|
/// \return the mask
|
|
uintb coveringmask(uintb val)
|
|
|
|
{
|
|
uintb res = val;
|
|
int4 sz = 1;
|
|
while(sz < 8*sizeof(uintb)) {
|
|
res = res | (res>>sz);
|
|
sz <<= 1;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
/// Treat \b val as a constant of size \b sz.
|
|
/// Scanning across the bits of \b val return the number of transitions (from 0->1 or 1->0)
|
|
/// If there are 2 or less transitions, this is an indication of a bit flag or a mask
|
|
/// \param val is the given value
|
|
/// \param sz is the size to treat the value as
|
|
/// \return the number of transitions
|
|
int4 bit_transitions(uintb val,int4 sz)
|
|
|
|
{
|
|
int4 res = 0;
|
|
int4 last = val & 1;
|
|
int4 cur;
|
|
for(int4 i=1;i<8*sz;++i) {
|
|
val >>= 1;
|
|
cur = val & 1;
|
|
if (cur != last) {
|
|
res += 1;
|
|
last = cur;
|
|
}
|
|
if (val==0) break;
|
|
}
|
|
return res;
|
|
}
|
|
|
|
/// \brief Multiply 2 unsigned 64-bit values, producing a 128-bit value
|
|
///
|
|
/// TODO: Remove once we import a full multiprecision library.
|
|
/// \param res points to the result array (2 uint8 pieces)
|
|
/// \param x is the first 64-bit value
|
|
/// \param y is the second 64-bit value
|
|
void mult64to128(uint8 *res,uint8 x,uint8 y)
|
|
|
|
{
|
|
uint8 f = x & 0xffffffff;
|
|
uint8 e = x >> 32;
|
|
uint8 d = y & 0xffffffff;
|
|
uint8 c = y >> 32;
|
|
uint8 fd = f * d;
|
|
uint8 fc = f * c;
|
|
uint8 ed = e * d;
|
|
uint8 ec = e * c;
|
|
uint8 tmp = (fd >> 32) + (fc & 0xffffffff) + (ed & 0xffffffff);
|
|
res[1] = (tmp>>32) + (fc>>32) + (ed>>32) + ec;
|
|
res[0] = (tmp<<32) + (fd & 0xffffffff);
|
|
}
|
|
|
|
/// \brief Subtract (in-place) a 128-bit value from a base 128-value
|
|
///
|
|
/// The base value is altered in place.
|
|
/// TODO: Remove once we import a full multiprecision library.
|
|
/// \param a is the base 128-bit value being subtracted from in-place
|
|
/// \param b is the other 128-bit value being subtracted
|
|
void unsignedSubtract128(uint8 *a,uint8 *b)
|
|
|
|
{
|
|
bool borrow = (a[0] < b[0]);
|
|
a[0] -= b[0];
|
|
a[1] -= b[1];
|
|
if (borrow)
|
|
a[1] -= 1;
|
|
}
|
|
|
|
/// \brief Compare two unsigned 128-bit values
|
|
///
|
|
/// TODO: Remove once we import a full multiprecision library.
|
|
/// Given a first and second value, return -1, 0, or 1 depending on whether the first value
|
|
/// is \e less, \e equal, or \e greater than the second value.
|
|
/// \param a is the first 128-bit value (as an array of 2 uint8 elements)
|
|
/// \param b is the second 128-bit value
|
|
/// \return the comparison code
|
|
int4 unsignedCompare128(uint8 *a,uint8 *b)
|
|
|
|
{
|
|
if (a[1] != b[1])
|
|
return (a[1] < b[1]) ? -1 : 1;
|
|
if (a[0] != b[0])
|
|
return (a[0] < b[0]) ? -1 : 1;
|
|
return 0;
|
|
}
|
|
|
|
/// \brief Unsigned division of a power of 2 (upto 2^127) by a 64-bit divisor
|
|
///
|
|
/// The result must be less than 2^64. The remainder is calculated.
|
|
/// \param n is the power of 2 for the numerand
|
|
/// \param divisor is the 64-bit divisor
|
|
/// \param q is the passed back 64-bit quotient
|
|
/// \param r is the passed back 64-bit remainder
|
|
/// \return 0 if successful, 1 if result is too big, 2 if divide by 0
|
|
int4 power2Divide(int4 n,uint8 divisor,uint8 &q,uint8 &r)
|
|
|
|
{
|
|
if (divisor == 0) return 2;
|
|
uint8 power = 1;
|
|
if (n < 64) {
|
|
power <<= n;
|
|
q = power / divisor;
|
|
r = power % divisor;
|
|
return 0;
|
|
}
|
|
// Divide numerand and divisor by 2^(n-63) to get approximation of result
|
|
uint8 y = divisor >> (n-64); // Most of the way on divisor
|
|
if (y == 0) return 1; // Check if result will be too big
|
|
y >>= 1; // Divide divisor by final bit
|
|
power <<= 63;
|
|
uint8 max;
|
|
if (y == 0) {
|
|
max = 0;
|
|
max -= 1; // Could be maximal
|
|
// Check if divisor is a power of 2
|
|
if ((((uint8)1) << (n-64)) == divisor)
|
|
return 1;
|
|
}
|
|
else
|
|
max = power / y + 1;
|
|
uint8 min = power / (y+1);
|
|
if (min != 0)
|
|
min -= 1;
|
|
uint8 fullpower[2];
|
|
fullpower[1] = ((uint8)1)<<(n-64);
|
|
fullpower[0] = 0;
|
|
uint8 mult[2];
|
|
mult[0] = 0;
|
|
mult[1] = 0;
|
|
uint8 tmpq = 0;
|
|
while(max > min+1) {
|
|
tmpq = max + min;
|
|
if (tmpq < min) {
|
|
tmpq = (tmpq>>1) + 0x8000000000000000L;
|
|
}
|
|
else
|
|
tmpq >>= 1;
|
|
mult64to128(mult,divisor,tmpq);
|
|
if (unsignedCompare128(fullpower,mult) < 0)
|
|
max = tmpq-1;
|
|
else
|
|
min = tmpq;
|
|
}
|
|
// min is now our putative quotient
|
|
if (tmpq != min)
|
|
mult64to128(mult,divisor,min);
|
|
unsignedSubtract128(fullpower,mult); // Calculate remainder
|
|
// min might be 1 too small
|
|
if (fullpower[1] != 0 || fullpower[0] >= divisor) {
|
|
q = min + 1;
|
|
r = fullpower[0] - divisor;
|
|
}
|
|
else {
|
|
q = min;
|
|
r = fullpower[0];
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
} // End namespace ghidra
|