ghidra/Ghidra/Features/Decompiler/src/decompile/cpp/userop.hh
2019-03-26 13:46:51 -04:00

297 lines
15 KiB
C++

/* ###
* IP: GHIDRA
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/// \file userop.hh
/// \brief Classes for more detailed definitions of user defined p-code operations
#ifndef __CPUI_USEROP__
#define __CPUI_USEROP__
#include "typeop.hh"
/// \brief The base class for a detailed definition of a user-defined p-code operation
///
/// Within the raw p-code framework, the CALLOTHER opcode represents a user defined
/// operation. At this level, the operation is just a placeholder for inputs and outputs
/// to same black-box procedure. The first input parameter (index 0) must be a constant
/// id associated with the particular procedure. Classes derived off of this base class
/// provide a more specialized definition of an operation/procedure. The specialized classes
/// are managed via UserOpManage and are associated with CALLOTHER ops via the constant id.
///
/// The derived classes can in principle implement any functionality, tailored to the architecture
/// or program. At this base level, the only commonality is a formal \b name of the operator and
/// its CALLOTHER index. A facility for reading in implementation details is provided via restoreXml().
class UserPcodeOp {
protected:
string name; ///< Low-level name of p-code operator
int4 useropindex; ///< Index passed in the CALLOTHER op
Architecture *glb; ///< Architecture owning the user defined op
public:
UserPcodeOp(Architecture *g,const string &nm,int4 ind) {
name = nm; useropindex = ind; glb = g; } ///< Construct from name and index
const string &getName(void) const { return name; } ///< Get the low-level name of the p-code op
int4 getIndex(void) const { return useropindex; } ///< Get the constant id of the op
virtual ~UserPcodeOp(void) {} ///< Destructor
/// \brief Get the symbol representing this operation in decompiled code
///
/// This will return the symbol formally displayed in source code, which can be
/// tailored more than the low-level name
/// \param op is the operation (in context) where a symbol is needed
/// \return the symbol as a string
virtual string getOperatorName(const PcodeOp *op) const {
return name; }
/// \brief Restore the detailed description from an XML stream
///
/// The details of how a user defined operation behaves can be dynamically configured
/// from an XML tag.
/// \param el is the root XML element describing the op
virtual void restoreXml(const Element *el)=0;
};
/// \brief A user defined p-code op with no specialization
///
/// This class is used by the manager for CALLOTHER indices that have not been
/// mapped to a specialization. The p-code operation has the (SLEIGH assigned) name,
/// but still has an unknown effect.
class UnspecializedPcodeOp : public UserPcodeOp {
public:
UnspecializedPcodeOp(Architecture *g,const string &nm,int4 ind)
: UserPcodeOp(g,nm,ind) {} ///< Constructor
virtual void restoreXml(const Element *el) {}
};
/// \brief A user defined operation that is injected with other p-code
///
/// The system can configure user defined p-code ops as a hook point within the
/// control-flow where other p-code is injected during analysis. This class maps
/// the raw CALLOTHER p-code op, via its constant id, to its injection object.
/// The injection object is also referenced by an id and is managed by PcodeInjectLibrary.
class InjectedUserOp : public UserPcodeOp {
uint4 injectid; ///< The id of the injection object (to which this op maps)
public:
InjectedUserOp(Architecture *g,const string &nm,int4 ind,int4 injid)
: UserPcodeOp(g,nm,ind) { injectid = injid; } ///< Constructor
uint4 getInjectId(void) const { return injectid; } ///< Get the id of the injection object
virtual void restoreXml(const Element *el);
};
/// \brief A base class for operations that access volatile memory
///
/// The decompiler models volatile memory by converting any direct read or write of
/// the memory to a function that \e accesses the memory. This class and its derived
/// classes model such functions. Within the p-code control-flow, dedicated user defined
/// ops serve as a placeholder for the (possibly unknown) effects of modifying/accessing the
/// memory and prevent accidental constant propagation.
class VolatileOp : public UserPcodeOp {
protected:
static string appendSize(const string &base,int4 size); ///< Append a suffix to a string encoding a specific size
public:
VolatileOp(Architecture *g,const string &nm,int4 ind)
: UserPcodeOp(g,nm,ind) { } ///< Constructor
};
/// \brief An operation that reads from volatile memory
///
/// This CALLOTHER p-code operation takes as its input parameter, after the constant id,
/// a reference Varnode to the memory being read. The output returned by this operation
/// is the actual value read from memory.
class VolatileReadOp : public VolatileOp {
public:
VolatileReadOp(Architecture *g,const string &nm,int4 ind)
: VolatileOp(g,nm,ind) {} ///< Constructor
virtual string getOperatorName(const PcodeOp *op) const;
virtual void restoreXml(const Element *el);
};
/// \brief An operation that writes to volatile memory
///
/// This CALLOTHER p-code operation takes as its input parameters:
/// - Constant id
/// - Reference Varnode to the memory being written
/// - The Varnode value being written to the memory
class VolatileWriteOp : public VolatileOp {
public:
VolatileWriteOp(Architecture *g,const string &nm,int4 ind)
: VolatileOp(g,nm,ind) {} ///< Constructor
virtual string getOperatorName(const PcodeOp *op) const;
virtual void restoreXml(const Element *el);
};
/// \brief A user defined p-code op that has a dynamically defined procedure
///
/// The behavior of this op on constant inputs can be dynamically defined.
/// This class defines a unify() method that picks out the input varnodes to the
/// operation, given the root PcodeOp. The input varnodes would generally just be
/// the input varnodes to the raw CALLOTHER after the constant id, but skipping, reordering,
/// or other tree traversal is possible.
///
/// This class also defines an execute() method that computes the output given
/// constant inputs (matching the format determined by unify()).
class TermPatternOp : public UserPcodeOp {
public:
TermPatternOp(Architecture *g,const string &nm,int4 ind) : UserPcodeOp(g,nm,ind) {} ///< Constructor
virtual int4 getNumVariableTerms(void) const=0; ///< Get the number of input Varnodes expected
/// \brief Gather the formal input Varnode objects given the root PcodeOp
///
/// \param data is the function being analyzed
/// \param op is the root operation
/// \param bindlist will hold the ordered list of input Varnodes
/// \return \b true if the requisite inputs were found
virtual bool unify(Funcdata &data,PcodeOp *op,vector<Varnode *> &bindlist) const=0;
/// \brief Compute the output value of \b this operation, given constant inputs
///
/// \param input is the ordered list of constant inputs
/// \return the resulting value as a constant
virtual uintb execute(const vector<uintb> &input) const=0;
};
/// \brief A simple node used to dynamically define a sequence of operations
///
/// This should be deprecated in favor of ExecutablePcode objects. This
/// class holds a single operation (within a sequence). It acts on the output
/// of the previous operation with an optional constant value as the second input.
struct OpFollow {
OpCode opc; ///< The particular p-code operation
uintb val; ///< A possible constant second input
int4 slot; ///< Slot to follow
OpFollow(void) {} ///< Construct an empty object
void restoreXml(const Element *el); ///< Restore \b this node from an XML stream
};
/// \brief The \e segmented \e address operator
///
/// This op is a placeholder for address mappings involving \b segments.
///The map goes between a \b high-level view of a pointer, consisting of multiple pieces,
/// and a \b low-level view, where there is only a single absolute pointer.
/// The mapping could be
/// - a virtual to physical mapping for instance or
/// - a segment + near pointer to a full address
///
/// The output of the operator is always a full low-level pointer.
/// The operator takes two inputs:
/// - the \b base or \b segment and
/// - the high-level \b near pointer
///
/// High-level analysis can ignore the base/segment and any
/// normalization on the near pointer.
/// Emitted expressions involving \b this segment op prints only the \b near portion.
/// Data-type information propagates only through this high-level side.
///
/// The decompiler looks for the term-tree defined in SegmentOp
/// and replaces it with the SEGMENTOP operator in any p-code it analyzes.
/// The core routine that looks for the term-tree is unify().
class SegmentOp : public TermPatternOp {
AddrSpace *spc; ///< The physical address space into which a segmented pointer points
int4 baseinsize; ///< The size in bytes of the \e base or \e segment value
int4 innerinsize; ///< The size in bytes of the \e near pointer value
bool basepresent; ///< Is \b true is a base value must be present in the raw p-code
bool forcesegment; ///< Is \b true if an exception is thrown when a segment op can't be unified
bool supportsfarpointer; ///< Is \b true if the joined pair base:near acts as a \b far pointer
vector<OpFollow> basefollow; ///< Sequence of operations performed on the \b base value
vector<OpFollow> innerfollow; ///< Sequence of operations performed on the \b near value
VarnodeData constresolve; ///< How to resolve constant near pointers
static uintb executeSide(const vector<OpFollow> &follow,uintb input);
public:
SegmentOp(Architecture *g,const string &nm,int4 ind); ///< Constructor
AddrSpace *getSpace(void) const { return spc; } ///< Get the address space being pointed to
bool hasFarPointerSupport(void) const { return supportsfarpointer; } ///< Return \b true, if \b this op supports far pointers
bool isForced(void) const { return forcesegment; } ///< Return \b true if exceptions are thrown for bad unification
int4 getBaseSize(void) const { return baseinsize; } ///< Get size in bytes of the base/segment value
int4 getInnerSize(void) const { return innerinsize; } ///< Get size in bytes of the near value
const VarnodeData &getResolve(void) const { return constresolve; } ///< Get the default register for resolving indirect segments
virtual int4 getNumVariableTerms(void) const { if (basepresent) return 2; return 1; }
virtual bool unify(Funcdata &data,PcodeOp *op,vector<Varnode *> &bindlist) const;
virtual uintb execute(const vector<uintb> &input) const;
virtual void restoreXml(const Element *el);
};
/// \brief A user defined p-code op for assisting the recovery of jump tables.
///
/// An instance of this class refers to p-code script(s)
/// that describe how to parse the jump table from the load image. Possible scripts include:
/// - (if present) \b index2case describes how to get case values from an index 0..size-1
/// - \b index2addr describes how to get address values from the same index range
/// - \b defaultaddr describes how to calculate the switch's default address
/// - (if present) \b calcsize recovers the number of indices in the table
///
/// This class stores injection ids. The scripts themselves are managed by PcodeInjectLibrary.
class JumpAssistOp : public UserPcodeOp {
int4 index2case; ///< Id of p-code script performing index2case (== -1 if no script and index==case)
int4 index2addr; ///< Id of p-code script performing index2addr (must be present)
int4 defaultaddr; ///< Id of p-code script performing calculation of default address (must be present)
int4 calcsize; ///< Id of p-code script that calculates number of indices (== -1 if no script)
public:
JumpAssistOp(Architecture *g); ///< Constructor
int4 getIndex2Case(void) const { return index2case; } ///< Get the injection id for \b index2case
int4 getIndex2Addr(void) const { return index2addr; } ///< Get the injection id for \b index2addr
int4 getDefaultAddr(void) const { return defaultaddr; } ///< Get the injection id for \b defaultaddr
int4 getCalcSize(void) const { return calcsize; } ///< Get the injection id for \b calcsize
virtual void restoreXml(const Element *el);
};
/// \brief Manager/container for description objects (UserPcodeOp) of user defined p-code ops
///
/// The description objects are referenced by the CALLOTHER constant id, (or by name during initialization).
/// During initialize(), every user defined p-code op presented by the Architecture is
/// assigned a default UnspecializedPcodeOp description. Further processing of the .cspec or .pspec
/// may reassign a more specialized description object by parsing specific tags using
/// on of \b this class's parse* methods.
class UserOpManage {
vector<UserPcodeOp *> useroplist; ///< Description objects indexed by CALLOTHER constant id
map<string,UserPcodeOp *> useropmap; ///< A map from the name of the user defined operation to a description object
vector<SegmentOp *> segmentop; ///< Segment operations supported by this Architecture
VolatileReadOp *vol_read; ///< (Single) volatile read operation
VolatileWriteOp *vol_write; ///< (Single) volatile write operation
void registerOp(UserPcodeOp *op); ///< Insert a new UserPcodeOp description object in the map(s)
public:
UserOpManage(void); ///< Construct an empty manager
~UserOpManage(void); ///< Destructor
void initialize(Architecture *glb); ///< Initialize description objects for all user defined ops
void setDefaults(Architecture *glb); ///< Create any required operations if they weren't explicitly defined
int4 numSegmentOps(void) const { return segmentop.size(); } ///< Number of segment operations supported
/// Retrieve a user-op description object by index
/// \param i is the index
/// \return the indicated user-op description
UserPcodeOp *getOp(int4 i) const {
if (i>=useroplist.size()) return (UserPcodeOp *)0;
return useroplist[i];
}
UserPcodeOp *getOp(const string &nm) const; ///< Retrieve description by name
/// Retrieve a segment-op description object by index
/// \param i is the index
/// \return the indicated segment-op description
SegmentOp *getSegmentOp(int4 i) const {
if (i>=segmentop.size()) return (SegmentOp *)0;
return segmentop[i];
}
VolatileReadOp *getVolatileRead(void) const { return vol_read; } ///< Get (the) volatile read description
VolatileWriteOp *getVolatileWrite(void) const { return vol_write; } ///< Get (the) volatile write description
void parseSegmentOp(const Element *el,Architecture *glb); ///< Parse a \<segmentop> XML tag
void parseVolatile(const Element *el,Architecture *glb); ///< Parse a \<volatile> XML tag
void parseCallOtherFixup(const Element *el,Architecture *glb); ///< Parse a \<callotherfixup> XML tag
void parseJumpAssist(const Element *el,Architecture *glb); ///< Parse a \<jumpassist> XML tag
void manualCallOtherFixup(const string &useropname,const string &outname,
const vector<string> &inname,const string &snippet,Architecture *glb);
};
#endif