ROSE 0.11.145.272
Partitioner.h
1#ifndef ROSE_BinaryAnalysis_Partitioner2_Partitioner_H
2#define ROSE_BinaryAnalysis_Partitioner2_Partitioner_H
3#include <featureTests.h>
4#ifdef ROSE_ENABLE_BINARY_ANALYSIS
5#include <Rose/BinaryAnalysis/Partitioner2/BasicTypes.h>
6
7#include <Rose/BinaryAnalysis/Partitioner2/AddressUsageMap.h>
8#include <Rose/BinaryAnalysis/Partitioner2/Configuration.h>
9#include <Rose/BinaryAnalysis/Partitioner2/ControlFlowGraph.h>
10#include <Rose/BinaryAnalysis/Partitioner2/IndirectControlFlow.h>
11#include <Rose/BinaryAnalysis/Partitioner2/Semantics.h>
12
13#include <Rose/BinaryAnalysis/Architecture/BasicTypes.h>
14#include <Rose/BinaryAnalysis/InstructionProvider.h>
15#include <Rose/BinaryAnalysis/InstructionSemantics/SymbolicSemantics.h>
16#include <Rose/BinaryAnalysis/SerialIo.h>
17#include <Rose/BinaryAnalysis/SourceLocations.h>
18#include <Rose/BinaryAnalysis/Unparser/Settings.h>
19#include <Rose/Progress.h>
20
21#include <Sawyer/Attribute.h>
22#include <Sawyer/Callbacks.h>
23#include <Sawyer/IntervalSet.h>
24#include <Sawyer/Map.h>
25#include <Sawyer/Message.h>
26#include <Sawyer/Optional.h>
27#include <Sawyer/ProgressBar.h>
28#include <Sawyer/SharedObject.h>
29#include <Sawyer/SharedPointer.h>
30
31#include <boost/filesystem.hpp>
32#include <boost/format.hpp>
33#include <boost/move/utility_core.hpp>
34#ifdef ROSE_ENABLE_BOOST_SERIALIZATION
35#include <boost/serialization/access.hpp>
36#endif
37
38#include <ostream>
39#include <set>
40#include <string>
41#include <vector>
42
43// [Robb Matzke 2022-06-22]: deprecated. Needed because some user code doesn't include the old InstructionSemantics2 header
44// files where this same thing is defined, yet they use InstructionSemantics2 because such things were once declared by this
45// header file due to it originally including InstructionSemantics2 headers (which it no longer does).
46namespace Rose { namespace BinaryAnalysis { namespace InstructionSemantics2 = InstructionSemantics; }}
47
48namespace Rose {
49namespace BinaryAnalysis {
50namespace Partitioner2 {
51
264class ROSE_DLL_API Partitioner /*final*/
265 : public Sawyer::SharedObject, public Sawyer::SharedFromThis<Partitioner>, public Sawyer::Attribute::Storage<> {
266 BOOST_MOVABLE_BUT_NOT_COPYABLE(Partitioner)
267
268
270 //
271 // Types
272 //
275public:
283 // Callback list types
286 typedef std::vector<FunctionPrologueMatcherPtr> FunctionPrologueMatchers;
287 typedef std::vector<FunctionPaddingMatcherPtr> FunctionPaddingMatchers;
290 struct Thunk {
293 Thunk(const BasicBlockPtr&, Address target);
294 ~Thunk();
295 };
296
299
302 //
303 // Data members
304 //
307private:
308 BasePartitionerSettings settings_; // settings adjustable from the command-line
309 Configuration config_; // configuration information about functions, blocks, etc.
310 Architecture::BaseConstPtr architecture_; // architecture information such as the ISA, word size, etc.
311 InstructionProvider::Ptr instructionProvider_; // cache for all disassembled instructions
312 MemoryMap::Ptr memoryMap_; // description of memory, especially insns and non-writable
313 SgAsmInterpretation *interpretation_ = nullptr; // Interpretation corresponding to the memory map
314 ControlFlowGraph cfg_; // basic blocks that will become part of the ROSE AST
315 CfgVertexIndex vertexIndex_; // Vertex-by-address index for the CFG
316 AddressUsageMap aum_; // How addresses are used for each address represented by the CFG
317 SmtSolverPtr solver_; // Satisfiable modulo theory solver used by semantic expressions
318 Functions functions_; // List of all attached functions by entry address
319 bool autoAddCallReturnEdges_ = false; // Add E_CALL_RETURN edges when blocks are attached to CFG?
320 bool assumeFunctionsReturn_ = true; // Assume that unproven functions return to caller?
321 size_t stackDeltaInterproceduralLimit_ = 1; // Max depth of call stack when computing stack deltas
322 AddressNameMap addressNames_; // Names for various addresses
323 SourceLocations sourceLocations_; // Mapping between source locations and addresses
324 SemanticMemoryParadigm semanticMemoryParadigm_ = LIST_BASED_MEMORY; // Slow and precise, or fast and imprecise?
325 Unparser::BasePtr unparser_; // For unparsing things to pseudo-assembly
326 Unparser::BasePtr insnUnparser_; // For unparsing single instructions in diagnostics
327 Unparser::BasePtr insnPlainUnparser_; // For unparsing just instruction mnemonic and operands
328 IndirectControlFlow::State icf_; // State for various indirect control flow recovery analyses
329
330 // Callback lists
331 CfgAdjustmentCallbacks cfgAdjustmentCallbacks_;
332 BasicBlockCallbacks basicBlockCallbacks_;
333 FunctionPrologueMatchers functionPrologueMatchers_;
334 FunctionPaddingMatchers functionPaddingMatchers_;
335
336 // Special CFG vertices.
337 ControlFlowGraph::VertexIterator undiscoveredVertex_;
338 ControlFlowGraph::VertexIterator indeterminateVertex_;
339 ControlFlowGraph::VertexIterator nonexistingVertex_;
340 static const size_t nSpecialVertices = 3;
341
342 // Optional cached information
343 Sawyer::Optional<Address> elfGotVa_; // address of ELF GOT, set by findElfGotVa
344
345 // Protects the following data members
346 mutable SAWYER_THREAD_TRAITS::Mutex mutex_;
347 Progress::Ptr progress_; // Progress reporter to update, or null
348 mutable size_t cfgProgressTotal_ = 0; // Expected total for the CFG progress bar; initialized at first report
349
352 //
353 // Serialization
354 //
357#ifdef ROSE_ENABLE_BOOST_SERIALIZATION
358private:
359 friend class boost::serialization::access;
360 template<class Archive> void serializeCommon(Archive&, unsigned);
361 template<class Archive> void save(Archive&, unsigned) const;
362 template<class Archive> void load(Archive&, unsigned);
363 BOOST_SERIALIZATION_SPLIT_MEMBER();
364#endif
365
368 //
369 // Constructors
370 //
373private:
374 Partitioner(); // needed for Boost serialization
375
376 // Partitioner objects are reference counted and always allocated on the heap. Use the `instance` methods to construct
377 // these objects. Also, since the Partitioner class is final, we make the constructors private instead of the usual
378 // protected constructors elsewhere in ROSE.
381public:
382 ~Partitioner();
383
384public:
390
396
401 static PartitionerPtr instanceFromRbaFile(const boost::filesystem::path&, SerialIo::Format = SerialIo::BINARY);
402
404 void saveAsRbaFile(const boost::filesystem::path &name, SerialIo::Format fmt) const;
405
407 Partitioner(BOOST_RV_REF(Partitioner));
408
411
419
421 void clear();
422
438
456
468
469
472 //
473 // Unparsing
474 //
477public:
506
511
520 std::string unparse(SgAsmInstruction*) const;
521 void unparse(std::ostream&, SgAsmInstruction*) const;
522 void unparse(std::ostream&, const BasicBlockPtr&) const;
523 void unparse(std::ostream&, const DataBlockPtr&) const;
524 void unparse(std::ostream&, const FunctionPtr&) const;
525 void unparse(std::ostream&) const;
531 std::string unparsePlain(SgAsmInstruction*) const;
532
535 //
536 // Partitioner CFG queries
537 //
540public:
546 size_t nBytes() const;
547
555 ControlFlowGraph::VertexIterator undiscoveredVertex();
556 ControlFlowGraph::ConstVertexIterator undiscoveredVertex() const;
569 ControlFlowGraph::VertexIterator indeterminateVertex();
570 ControlFlowGraph::ConstVertexIterator indeterminateVertex() const;
582 ControlFlowGraph::VertexIterator nonexistingVertex();
583 ControlFlowGraph::ConstVertexIterator nonexistingVertex() const;
592 const ControlFlowGraph& cfg() const;
593
600 const AddressUsageMap& aum() const;
601
604
609 std::vector<AddressUser> users(Address) const;
610
618 std::set<Address> ghostSuccessors() const;
619
648 bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr&) const;
649 bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr&) const;
650 bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge) const;
651 bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge) const;
688 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge) const;
689 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction) const;
690 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction,
691 const FunctionPtr &targetFunction) const;
692
693 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge) const;
694 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction) const;
695 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction,
696 const FunctionPtr &targetFunction) const;
703 //
704 // Partitioner instruction operations
705 //
708public:
714 size_t nInstructions() const;
715
735 ControlFlowGraph::ConstVertexIterator instructionVertex(Address insnVa) const;
736
745 std::vector<SgAsmInstruction*> instructionsOverlapping(const AddressInterval&) const;
746
755 std::vector<SgAsmInstruction*> instructionsSpanning(const AddressInterval&) const;
756
766 std::vector<SgAsmInstruction*> instructionsContainedIn(const AddressInterval&) const;
767
776
790
796
797
798
801 //
802 // Partitioner basic block placeholder operations
803 //
806public:
816 size_t nPlaceholders() const;
817
826 bool placeholderExists(Address startVa) const;
827
838 ControlFlowGraph::VertexIterator findPlaceholder(Address startVa);
839 ControlFlowGraph::ConstVertexIterator findPlaceholder(Address startVa) const;
858 ControlFlowGraph::VertexIterator insertPlaceholder(Address startVa);
859
873 BasicBlockPtr erasePlaceholder(const ControlFlowGraph::ConstVertexIterator &placeholder) /*final*/;
881 //
882 // Partitioner basic block operations
883 //
886public:
913
922 size_t nBasicBlocks() const;
923
931 std::vector<BasicBlockPtr> basicBlocks() const;
932
967 std::vector<BasicBlockPtr> basicBlocksOverlapping(const AddressInterval&) const;
968
979 std::vector<BasicBlockPtr> basicBlocksSpanning(const AddressInterval&) const;
980
990 std::vector<BasicBlockPtr> basicBlocksContainedIn(const AddressInterval&) const;
991
999
1010
1017
1044 BasicBlockPtr detachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder);
1058 ControlFlowGraph::VertexIterator truncateBasicBlock(const ControlFlowGraph::ConstVertexIterator &basicBlock,
1059 SgAsmInstruction *insn);
1060
1094 void attachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder, const BasicBlockPtr&);
1183 BasicBlockPtr discoverBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder) const;
1201
1210 std::vector<Address> basicBlockConcreteSuccessors(const BasicBlockPtr&, bool *isComplete=NULL) const;
1211
1230 std::set<Address> basicBlockGhostSuccessors(const BasicBlockPtr&) const;
1231
1241 bool basicBlockIsFunctionCall(const BasicBlockPtr&, Precision::Level precision = Precision::HIGH) const;
1242
1254
1260
1302 basicBlockStackDeltaIn(const BasicBlockPtr&, const FunctionPtr &function) const;
1303
1305 basicBlockStackDeltaOut(const BasicBlockPtr&, const FunctionPtr &function) const;
1316 void forgetStackDeltas() const;
1317 void forgetStackDeltas(const FunctionPtr&) const;
1384 Sawyer::Optional<bool> basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator&) const;
1394
1395private:
1396 // Per-vertex data used during may-return analysis
1397 struct MayReturnVertexInfo {
1398 enum State {INIT, CALCULATING, FINISHED};
1399 State state; // current state of vertex
1400 bool processedCallees; // have we processed BBs this vertex calls?
1401 boost::logic::tribool anyCalleesReturn; // do any of those called BBs have a true may-return value?
1402 boost::logic::tribool result; // final result (eventually cached in BB)
1403 MayReturnVertexInfo(): state(INIT), processedCallees(false), anyCalleesReturn(false), result(boost::indeterminate) {}
1404 };
1405
1406 // Is edge significant for analysis? See .C file for full documentation.
1407 bool mayReturnIsSignificantEdge(const ControlFlowGraph::ConstEdgeIterator &edge,
1408 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1409
1410 // Determine (and cache in vertexInfo) whether any callees return.
1411 boost::logic::tribool mayReturnDoesCalleeReturn(const ControlFlowGraph::ConstVertexIterator &vertex,
1412 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1413
1414 // Maximum may-return result from significant successors including phantom call-return edge.
1415 boost::logic::tribool mayReturnDoesSuccessorReturn(const ControlFlowGraph::ConstVertexIterator &vertex,
1416 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1417
1418 // The guts of the may-return analysis
1419 Sawyer::Optional<bool> basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator &start,
1420 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1421
1422
1423
1426 //
1427 // Partitioner data block operations
1428 //
1431public:
1437 size_t nDataBlocks() const;
1438
1446
1456
1469
1477
1488
1502
1512 std::vector<DataBlockPtr> dataBlocksOverlapping(const AddressInterval&) const;
1513
1523 std::vector<DataBlockPtr> dataBlocksSpanning(const AddressInterval&) const;
1524
1534 std::vector<DataBlockPtr> dataBlocksContainedIn(const AddressInterval&) const;
1535
1543
1549 std::vector<DataBlockPtr> dataBlocks() const;
1550
1551
1552
1555 //
1556 // Partitioner function operations
1557 //
1560public:
1566 size_t nFunctions() const;
1567
1587 FunctionPtr functionExists(const BasicBlockPtr &entryBlock) const;
1596 std::vector<FunctionPtr> functions() const;
1597
1607 std::vector<FunctionPtr> functionsOverlapping(const AddressInterval&) const;
1608
1619 std::vector<FunctionPtr> functionsSpanning(const AddressInterval&) const;
1620
1630 std::vector<FunctionPtr> functionsContainedIn(const AddressInterval&) const;
1631
1649 void functionExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1651 void functionBasicBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1653 void functionDataBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1693
1728
1734 std::vector<Function::Ptr> entryFunctions();
1735
1770 std::vector<FunctionPtr>
1771 functionsOwningBasicBlock(const ControlFlowGraph::Vertex&, bool doSort = true) const;
1772
1773 std::vector<FunctionPtr>
1774 functionsOwningBasicBlock(const ControlFlowGraph::ConstVertexIterator&, bool doSort = true) const;
1775
1776 std::vector<FunctionPtr>
1777 functionsOwningBasicBlock(Address bblockVa, bool doSort = true) const;
1778
1779 std::vector<FunctionPtr>
1780 functionsOwningBasicBlock(const BasicBlockPtr&, bool doSort = true) const;
1781
1782 template<class Container> // container can hold any type accepted by functionsOwningBasicBlock
1783 std::vector<FunctionPtr>
1784 functionsOwningBasicBlocks(const Container &bblocks) const {
1785 std::vector<FunctionPtr> retval;
1786 for (const typename Container::value_type& bblock: bblocks) {
1787 for (const FunctionPtr &function: functionsOwningBasicBlock(bblock, false))
1788 insertUnique(retval, function, sortFunctionsByAddress);
1789 }
1790 return retval;
1791 }
1803 std::vector<FunctionPtr> discoverCalledFunctions() const;
1804
1816 std::vector<FunctionPtr> discoverFunctionEntryVertices() const;
1817
1828
1839 void discoverFunctionBasicBlocks(const FunctionPtr &function) const;
1840
1847 std::set<Address> functionGhostSuccessors(const FunctionPtr&) const;
1848
1857
1878
1883
1891
1896
1932 const CallingConvention::Definition::Ptr &dflt) const;
1951
2013 void fixInterFunctionEdge(const ControlFlowGraph::ConstEdgeIterator&);
2032 bool functionIsNoop(const FunctionPtr&) const;
2033
2039 void allFunctionIsNoop() const;
2040
2056 std::set<Address> functionDataFlowConstants(const FunctionPtr&) const;
2057
2058
2059
2062 //
2063 // Callbacks
2064 //
2067public:
2101public:
2137 std::vector<FunctionPtr> nextFunctionPrologue(Address startVa);
2138 std::vector<FunctionPtr> nextFunctionPrologue(Address startVa, Address &lastSearchedVa /*out*/);
2141public:
2159
2160
2161
2164 //
2165 // Partitioner miscellaneous
2166 //
2169public:
2181 void dumpCfg(std::ostream&, const std::string &prefix="", bool showBlocks=true, bool computeProperties=true) const;
2182
2196 void cfgGraphViz(std::ostream&, const AddressInterval &restrict = AddressInterval::whole(), bool showNeighbors=true) const;
2197
2203 static std::string vertexName(const ControlFlowGraph::Vertex&);
2204 std::string vertexName(const ControlFlowGraph::ConstVertexIterator&) const;
2210 static std::string vertexNameEnd(const ControlFlowGraph::Vertex&);
2211
2217 static std::string edgeNameSrc(const ControlFlowGraph::Edge&);
2218 std::string edgeNameSrc(const ControlFlowGraph::ConstEdgeIterator&) const;
2226 static std::string edgeNameDst(const ControlFlowGraph::Edge&);
2227 std::string edgeNameDst(const ControlFlowGraph::ConstEdgeIterator&) const;
2235 static std::string edgeName(const ControlFlowGraph::Edge&);
2236 std::string edgeName(const ControlFlowGraph::ConstEdgeIterator&) const;
2242 static std::string basicBlockName(const BasicBlockPtr&);
2243
2247 static std::string dataBlockName(const DataBlockPtr&);
2248
2252 static std::string functionName(const FunctionPtr&);
2253
2259
2285 void updateProgress(const std::string &phase, double completion) const;
2286
2288 void showStatistics() const;
2289
2290 // Checks consistency of internal data structures when debugging is enable (when NDEBUG is not defined).
2291 void checkConsistency() const;
2292
2299
2304
2315 //
2316 // Settings
2317 //
2320public:
2321
2341 void enableSymbolicSemantics(bool = true);
2398 void addressName(Address, const std::string&);
2399 const std::string& addressName(Address) const;
2428 //
2429 // Instruction semantics
2430 //
2433public:
2454
2478
2479
2480
2483 //
2484 // Python API support functions
2485 //
2488#ifdef ROSE_ENABLE_PYTHON_API
2489 void pythonUnparse() const;
2490#endif
2491
2492
2493
2496 //
2497 // Partitioner internal utilities
2498 //
2501private:
2502 void init(const MemoryMap::Ptr&);
2503 void init(const Partitioner&);
2504 void updateCfgProgress();
2505
2506private:
2507 // Convert a CFG vertex iterator from one partitioner to another. This is called during copy construction when the source
2508 // and destination CFGs are identical.
2509 ControlFlowGraph::VertexIterator convertFrom(const Partitioner &other,
2510 ControlFlowGraph::ConstVertexIterator otherIter);
2511
2512 // Adjusts edges for a placeholder vertex. This method erases all outgoing edges for the specified placeholder vertex and
2513 // then inserts a single edge from the placeholder to the special "undiscovered" vertex. */
2514 ControlFlowGraph::EdgeIterator adjustPlaceholderEdges(const ControlFlowGraph::VertexIterator &placeholder);
2515
2516 // Adjusts edges for a non-existing basic block. This method erases all outgoing edges for the specified vertex and
2517 // then inserts a single edge from the vertex to the special "non-existing" vertex. */
2518 ControlFlowGraph::EdgeIterator adjustNonexistingEdges(const ControlFlowGraph::VertexIterator &vertex);
2519
2520 // Implementation for the discoverBasicBlock methods. The startVa must not be the address of an existing placeholder.
2521 BasicBlockPtr discoverBasicBlockInternal(Address startVa) const;
2522
2523 // This method is called whenever a new placeholder is inserted into the CFG or a new basic block is attached to the
2524 // CFG/AUM. The call happens immediately after the CFG/AUM are updated.
2525 void bblockAttached(const ControlFlowGraph::VertexIterator &newVertex);
2526
2527 // This method is called whenever a basic block is detached from the CFG/AUM or when a placeholder is erased from the CFG.
2528 // The call happens immediately after the CFG/AUM are updated.
2529 void bblockDetached(Address startVa, const BasicBlockPtr &removedBlock);
2530
2531 // Rebuild the vertexIndex_ and other cache-like data members from the control flow graph
2532 void rebuildVertexIndices();
2533};
2534
2535} // namespace
2536} // namespace
2537} // namespace
2538
2539#endif
2540#endif
Provides and caches instructions.
Partitions instructions into basic blocks and functions.
AddressIntervalSet basicBlockInstructionExtent(const BasicBlockPtr &) const
Returns the addresses used by basic block instructions.
Sawyer::Callbacks< CfgAdjustmentCallback::Ptr > CfgAdjustmentCallbacks
See cfgAdjustmentCallbacks.
const Configuration & configuration() const
Property: Configuration information.
ControlFlowGraph::VertexIterator nonexistingVertex()
Returns the special "non-existing" vertex.
ControlFlowGraph::ConstVertexIterator nonexistingVertex() const
Returns the special "non-existing" vertex.
static std::string dataBlockName(const DataBlockPtr &)
Name of a data block.
bool basicBlockIsFunctionReturn(const BasicBlockPtr &) const
Determine if a basic block looks like a function return.
std::vector< Function::Ptr > entryFunctions()
Entry points of the binary.
std::vector< BasicBlockPtr > basicBlocksContainedIn(const AddressInterval &) const
Returns basic blocks that are fully contained in an address interval.
FunctionPrologueMatchers & functionPrologueMatchers()
Ordered list of function prologue matchers.
void addressName(Address, const std::string &)
Property: Name for address.
ControlFlowGraph::VertexIterator undiscoveredVertex()
Returns the special "undiscovered" vertex.
void basicBlockDropSemantics() const
Immediately drop semantic information for all attached basic blocks.
size_t nDataBlocks() const
Returns the number of data blocks attached to the CFG/AUM.
ControlFlowGraph::ConstVertexIterator indeterminateVertex() const
Returns the special "indeterminate" vertex.
void allFunctionCallingConvention() const
Compute calling conventions for all functions.
InstructionSemantics::BaseSemantics::SValuePtr functionStackDelta(const FunctionPtr &function) const
Stack delta analysis for one function.
void interpretation(SgAsmInterpretation *)
Property: Interpretation corresponding to the memory map.
BasicBlockPtr erasePlaceholder(Address startVa)
Remove a basic block placeholder from the CFG/AUM.
Unparser::BasePtr unparser() const
Returns an unparser.
void forgetFunctionIsNoop() const
Clears cached function no-op analysis results.
CfgAdjustmentCallbacks & cfgAdjustmentCallbacks()
List of all callbacks invoked when the CFG is adjusted.
Sawyer::Optional< bool > functionOptionalMayReturn(const FunctionPtr &function) const
May-return analysis for one function.
std::vector< SgAsmInstruction * > instructionsContainedIn(const AddressInterval &) const
Returns instructions that are fully contained in an address interval.
Sawyer::Optional< bool > basicBlockOptionalMayReturn(const BasicBlockPtr &) const
Determine if part of the CFG can pop the top stack frame.
BasicBlockSuccessors basicBlockSuccessors(const BasicBlockPtr &, Precision::Level precision=Precision::HIGH) const
Determine successors for a basic block.
std::vector< DataBlockPtr > dataBlocksContainedIn(const AddressInterval &) const
Returns data blocks that are fully contained in an address interval.
SemanticMemoryParadigm semanticMemoryParadigm() const
Property: Whether to use map- or list-based memory states.
void allFunctionCallingConvention(const CallingConvention::Definition::Ptr &dflt) const
Compute calling conventions for all functions.
FunctionCallGraph functionCallGraph(AllowParallelEdges::Type allowParallelEdges) const
Returns a function call graph.
size_t stackDeltaInterproceduralLimit() const
Property: max depth for inter-procedural stack delta analysis.
void stackDeltaInterproceduralLimit(size_t)
Property: max depth for inter-procedural stack delta analysis.
ControlFlowGraph::VertexIterator insertPlaceholder(Address startVa)
Insert a basic-block placeholder.
FunctionPtr functionExists(const FunctionPtr &function) const
Determines whether a function exists in the CFG/AUM.
void forgetStackDeltas(const FunctionPtr &) const
Clears all cached stack deltas.
void unparse(std::ostream &, const DataBlockPtr &) const
Unparse some entity.
std::vector< FunctionPtr > functionsOverlapping(const AddressInterval &) const
Returns functions that overlap with specified address interval.
DataBlockPtr matchFunctionPadding(const FunctionPtr &)
Finds function padding.
void configureInsnPlainUnparser(const Unparser::BasePtr &) const
Configure plain single-instruction unparser.
SgAsmInstruction * discoverInstruction(Address startVa) const
Discover an instruction.
bool functionIsNoop(const FunctionPtr &) const
Function no-op analysis.
void fixInterFunctionEdge(const ControlFlowGraph::ConstEdgeIterator &)
Adjust inter-function edge types.
ControlFlowGraph::VertexIterator truncateBasicBlock(const ControlFlowGraph::ConstVertexIterator &basicBlock, SgAsmInstruction *insn)
Truncate an attached basic-block.
Sawyer::Optional< Thunk > functionIsThunk(const FunctionPtr &) const
True if function is a thunk.
size_t attachFunctionBasicBlocks(const Functions &)
Create placeholders for function basic blocks.
const ControlFlowGraph & cfg() const
Returns the control flow graph.
const CallingConvention::Analysis & functionCallingConvention(const FunctionPtr &, const CallingConvention::Definition::Ptr &dflt) const
Calling convention analysis for one function.
const SourceLocations & sourceLocations() const
Property: Source locations.
Partitioner & operator=(BOOST_RV_REF(Partitioner))
Move assignment.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge) const
Determine if an edge is inter-procedural.
void checkingCallBranch(bool)
Property: Whether to look for function calls used as branches.
std::vector< BasicBlockPtr > basicBlocksSpanning(const AddressInterval &) const
Returns basic blocks that span an entire address interval.
Configuration & configuration()
Property: Configuration information.
AddressUsageMap aum(const FunctionPtr &) const
Returns the address usage map for a single function.
std::vector< FunctionPaddingMatcherPtr > FunctionPaddingMatchers
See functionPaddingMatchers.
SgAsmGenericSection * elfGot(SgAsmElfFileHeader *)
Find the ELF global offset table and save its address.
std::vector< Address > basicBlockConcreteSuccessors(const BasicBlockPtr &, bool *isComplete=NULL) const
Determines concrete successors for a basic block.
std::vector< DataBlockPtr > dataBlocksSpanning(const AddressInterval &) const
Returns data blocks that span an entire address interval.
DataBlockPtr findBestDataBlock(const AddressInterval &) const
Find an existing data block.
void forgetStackDeltas() const
Clears all cached stack deltas.
void allFunctionStackDelta() const
Compute stack delta analysis for all functions.
bool assumeFunctionsReturn() const
Property: Assume (or not) that function calls return.
static std::string basicBlockName(const BasicBlockPtr &)
Name of a basic block.
void unparse(std::ostream &, const BasicBlockPtr &) const
Unparse some entity.
FunctionPtr functionExists(Address entryVa) const
Determines whether a function exists in the CFG/AUM.
AddressIntervalSet basicBlockDataExtent(const BasicBlockPtr &) const
Returns the addresses used by basic block data.
size_t nPlaceholders() const
Returns the number of basic basic block placeholders in the CFG.
AddressIntervalSet functionExtent(const FunctionPtr &) const
Returns the addresses used by a function.
std::vector< BasicBlockPtr > basicBlocks() const
Returns all basic blocks attached to the CFG.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction) const
Determine if an edge is inter-procedural.
size_t nFunctions() const
Returns the number of functions attached to the CFG/AUM.
std::vector< FunctionPtr > discoverCalledFunctions() const
Scans the CFG to find function calls.
bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge) const
Determine if an edge is intra-procedural.
BasicBlockPtr basicBlockExists(const BasicBlockPtr &) const
Determines whether a discovered basic block exists in the CFG/AUM.
void settings(const BasePartitionerSettings &)
Partitioner settings.
std::set< Address > ghostSuccessors() const
Determine all ghost successors in the control flow graph.
bool autoAddCallReturnEdges() const
Property: Insert (or not) function call return edges.
Architecture::BaseConstPtr architecture() const
Property: Architecture information.
void unparse(std::ostream &, SgAsmInstruction *) const
Unparse some entity.
std::set< Address > functionGhostSuccessors(const FunctionPtr &) const
Returns ghost successors for a single function.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction, const FunctionPtr &targetFunction) const
Determine if an edge is inter-procedural.
std::string edgeName(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an edge.
void unparse(std::ostream &, const FunctionPtr &) const
Unparse some entity.
ControlFlowGraph::VertexIterator indeterminateVertex()
Returns the special "indeterminate" vertex.
bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &) const
Determine if an edge is intra-procedural.
ControlFlowGraph::ConstVertexIterator instructionVertex(Address insnVa) const
Returns the CFG vertex containing specified instruction.
size_t nBytes() const
Returns the number of bytes represented by the CFG.
BasicBlockPtr basicBlockContainingInstruction(Address insnVa) const
Returns the basic block that contains a specific instruction address.
bool basicBlockIsFunctionCall(const BasicBlockPtr &, Precision::Level precision=Precision::HIGH) const
Determine if a basic block looks like a function call.
void attachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder, const BasicBlockPtr &)
Attach a basic block to the CFG/AUM.
InstructionSemantics::BaseSemantics::RiscOperatorsPtr newOperators(SemanticMemoryParadigm) const
Obtain new RiscOperators.
void basicBlockMayReturnReset() const
Clear all may-return properties.
BasicBlockPtr detachBasicBlock(Address startVa)
Detach a basic block from the CFG/AUM.
const std::string & addressName(Address) const
Property: Name for address.
void discoverFunctionBasicBlocks(const FunctionPtr &function) const
Adds basic blocks to a function.
IndirectControlFlow::State & icf()
Internal data structures for indirect control flow recovery.
const CallingConvention::Analysis & functionCallingConvention(const FunctionPtr &) const
Calling convention analysis for one function.
bool usingSymbolicSemantics() const
Use or not use symbolic semantics.
std::vector< FunctionPtr > functionsOwningBasicBlocks(const Container &bblocks) const
Finds functions that own the specified basic block.
bool checkingCallBranch() const
Property: Whether to look for function calls used as branches.
void cfgGraphViz(std::ostream &, const AddressInterval &restrict=AddressInterval::whole(), bool showNeighbors=true) const
Output CFG as GraphViz.
const BasicBlockCallbacks & basicBlockCallbacks() const
Callbacks for adjusting basic block during discovery.
std::vector< SgAsmInstruction * > instructionsSpanning(const AddressInterval &) const
Returns instructions that span an entire address interval.
AddressUser instructionExists(Address startVa) const
Determines whether an instruction is attached to the CFG/AUM.
ControlFlowGraph::VertexIterator findPlaceholder(Address startVa)
Find the CFG vertex for a basic block placeholder.
static std::string functionName(const FunctionPtr &)
Name of a function.
std::vector< FunctionPtr > functionsOwningBasicBlock(const BasicBlockPtr &, bool doSort=true) const
Finds functions that own the specified basic block.
void expandIndeterminateCalls()
Expands indeterminate function calls.
BasicBlockPtr discoverBasicBlock(Address startVa) const
Discover instructions for a detached basic block.
void unparse(std::ostream &) const
Unparse some entity.
bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge) const
Determine if an edge is intra-procedural.
DataBlockPtr attachDataBlock(const DataBlockPtr &)
Attach a data block to the CFG/AUM.
size_t attachFunctionBasicBlocks(const FunctionPtr &)
Create placeholders for function basic blocks.
void dumpCfg(std::ostream &, const std::string &prefix="", bool showBlocks=true, bool computeProperties=true) const
Output the control flow graph.
InstructionSemantics::BaseSemantics::RiscOperatorsPtr newOperators() const
Obtain new RiscOperators.
void assumeFunctionsReturn(bool)
Property: Assume (or not) that function calls return.
DataBlockPtr dataBlockExists(const DataBlockPtr &) const
Determine if a data block or its equivalent is attached to the CFG/AUM.
DataBlockPtr attachDataBlockToBasicBlock(const DataBlockPtr &, const BasicBlockPtr &)
Attach a data block to a basic block.
bool basicBlockSemanticsAutoDrop() const
Property: Automatically drop semantics for attached basic blocks.
std::vector< AddressUser > users(Address) const
Entities that exist at a particular address.
std::vector< DataBlockPtr > dataBlocksOverlapping(const AddressInterval &) const
Returns data blocks that overlap with specified address interval.
Partitioner(BOOST_RV_REF(Partitioner))
Move constructor.
BasicBlockPtr detachBasicBlock(const BasicBlockPtr &basicBlock)
Detach a basic block from the CFG/AUM.
std::vector< FunctionPtr > nextFunctionPrologue(Address startVa)
Finds the next function by searching for a function prologue.
InstructionSemantics::BaseSemantics::DispatcherPtr newDispatcher(const InstructionSemantics::BaseSemantics::RiscOperatorsPtr &) const
Obtain a new instruction semantics dispatcher.
std::vector< BasicBlockPtr > basicBlocksOverlapping(const AddressInterval &) const
Returns basic blocks that overlap with specified address interval.
void attachBasicBlock(const BasicBlockPtr &)
Attach a basic block to the CFG/AUM.
SgAsmInterpretation * interpretation() const
Property: Interpretation corresponding to the memory map.
std::string unparsePlain(SgAsmInstruction *) const
Unparse an instruction in a plain way.
Progress::Ptr progress() const
Property: How to report progress.
void detachFunction(const FunctionPtr &)
Detaches a function from the CFG/AUM.
static std::string vertexNameEnd(const ControlFlowGraph::Vertex &)
Name of last instruction in vertex.
void insnUnparser(const Unparser::BasePtr &)
Returns an unparser.
bool addressIsExecutable(Address) const
Returns true if address is executable.
void detachDataBlock(const DataBlockPtr &)
Detaches a data block from the CFG/AUM.
std::string vertexName(const ControlFlowGraph::ConstVertexIterator &) const
Name of a vertex.
void showStatistics() const
Print some partitioner performance statistics.
static Ptr instance(const Architecture::BaseConstPtr &)
Default allocating constructor.
void disableSymbolicSemantics()
Use or not use symbolic semantics.
const AddressUsageMap & aum() const
Returns the address usage map.
const IndirectControlFlow::State & icf() const
Internal data structures for indirect control flow recovery.
std::set< Address > basicBlockGhostSuccessors(const BasicBlockPtr &) const
Determine ghost successors for a basic block.
std::vector< FunctionPtr > functions() const
All functions attached to the CFG/AUM.
void saveAsRbaFile(const boost::filesystem::path &name, SerialIo::Format fmt) const
Save this partitioner as an RBA file.
BasicBlockPtr erasePlaceholder(const ControlFlowGraph::ConstVertexIterator &placeholder)
Remove a basic block placeholder from the CFG/AUM.
void progress(const Progress::Ptr &)
Property: How to report progress.
std::vector< FunctionPtr > functionsSpanning(const AddressInterval &) const
Returns functions that span an entire address interval.
std::vector< SgAsmInstruction * > instructionsOverlapping(const AddressInterval &) const
Returns instructions that overlap with specified address interval.
void enableSymbolicSemantics(bool=true)
Use or not use symbolic semantics.
ControlFlowGraph::ConstVertexIterator findPlaceholder(Address startVa) const
Find the CFG vertex for a basic block placeholder.
const FunctionPrologueMatchers & functionPrologueMatchers() const
Ordered list of function prologue matchers.
Sawyer::Optional< Address > elfGotVa() const
Returns a previously cached ELF GOT address.
Sawyer::Container::Map< Address, std::string > AddressNameMap
Map address to name.
size_t nInstructions() const
Returns the number of instructions attached to the CFG/AUM.
void unparser(const Unparser::BasePtr &)
Returns an unparser.
static Ptr instance(const Architecture::BaseConstPtr &, const MemoryMap::Ptr &)
Construct a partitioner.
void autoAddCallReturnEdges(bool)
Property: Insert (or not) function call return edges.
InstructionSemantics::BaseSemantics::SValuePtr basicBlockStackDeltaOut(const BasicBlockPtr &, const FunctionPtr &function) const
Return the stack delta expression.
void clear()
Reset CFG/AUM to initial state.
BasicBlockPtr discoverBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder) const
Discover instructions for a detached basic block.
std::vector< FunctionPtr > nextFunctionPrologue(Address startVa, Address &lastSearchedVa)
Finds the next function by searching for a function prologue.
bool isDefaultConstructed() const
Return true if this is a default constructed partitioner.
void allFunctionMayReturn() const
Compute may-return analysis for all functions.
std::vector< FunctionPrologueMatcherPtr > FunctionPrologueMatchers
See functionPrologueMatchers.
Unparser::BasePtr insnUnparser() const
Returns an unparser.
SmtSolverPtr smtSolver() const
SMT solver.
std::vector< FunctionPtr > functionsOwningBasicBlock(const ControlFlowGraph::Vertex &, bool doSort=true) const
Finds functions that own the specified basic block.
bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &) const
Determine if an edge is intra-procedural.
FunctionPtr attachOrMergeFunction(const FunctionPtr &)
Attaches or merges a function into the CFG/AUM.
DataBlockPtr attachDataBlockToFunction(const DataBlockPtr &, const FunctionPtr &)
Attach a data block to an attached or detached function.
BasicBlockPtr basicBlockExists(Address startVa) const
Determines whether a discovered basic block exists in the CFG/AUM.
size_t attachFunctions(const Functions &)
Attaches a function to the CFG/AUM.
BasicBlockPtr detachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder)
Detach a basic block from the CFG/AUM.
std::set< Address > functionDataFlowConstants(const FunctionPtr &) const
Find constants in function using data-flow.
void functionBasicBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
size_t nBasicBlocks() const
Returns the number of basic blocks attached to the CFG/AUM.
const AddressNameMap & addressNames() const
Property: Name for address.
std::string edgeNameDst(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an outgoing edge.
void configureInsnUnparser(const Unparser::BasePtr &) const
Configure the single-instruction unparser.
CallingConvention::Dictionary functionCallingConventionDefinitions(const FunctionPtr &) const
Return list of matching calling conventions.
bool basicBlockPopsStack(const BasicBlockPtr &) const
Determine if the basic block pops at least one byte from the stack.
std::vector< FunctionPtr > functionsOwningBasicBlock(const ControlFlowGraph::ConstVertexIterator &, bool doSort=true) const
Finds functions that own the specified basic block.
void fixInterFunctionEdges()
Adjust inter-function edge types.
void allFunctionIsNoop() const
Analyze all functions for whether they are effectivly no-ops.
std::vector< DataBlockPtr > dataBlocks() const
Returns the list of all attached data blocks.
void functionDataBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction, const FunctionPtr &targetFunction) const
Determine if an edge is inter-procedural.
bool placeholderExists(Address startVa) const
Determines whether a basic block placeholder exists in the CFG.
const FunctionPaddingMatchers & functionPaddingMatchers() const
Ordered list of function padding matchers.
std::string edgeNameSrc(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an incoming edge.
static std::string vertexName(const ControlFlowGraph::Vertex &)
Name of a vertex.
void semanticMemoryParadigm(SemanticMemoryParadigm)
Property: Whether to use map- or list-based memory states.
BasicBlockCallbacks & basicBlockCallbacks()
Callbacks for adjusting basic block during discovery.
FunctionPtr functionExists(const BasicBlockPtr &entryBlock) const
Determines whether a function exists in the CFG/AUM.
AddressIntervalSet functionDataBlockExtent(const FunctionPtr &function) const
Returns the addresses used by a function.
InstructionProvider & instructionProvider()
Returns the instruction provider.
Sawyer::Callbacks< BasicBlockCallbackPtr > BasicBlockCallbacks
See basicBlockCallbacks.
void sourceLocations(const SourceLocations &)
Property: Source locations.
size_t attachFunction(const FunctionPtr &)
Attaches a function to the CFG/AUM.
void forgetFunctionIsNoop(const FunctionPtr &) const
Clears cached function no-op analysis results.
static std::string edgeName(const ControlFlowGraph::Edge &)
Name of an edge.
static std::string edgeNameDst(const ControlFlowGraph::Edge &)
Name of an outgoing edge.
const CfgAdjustmentCallbacks & cfgAdjustmentCallbacks() const
List of all callbacks invoked when the CFG is adjusted.
void functionExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
AddressInterval instructionExtent(SgAsmInstruction *) const
Returns the address interval for an instruction.
void basicBlockSemanticsAutoDrop(bool)
Property: Automatically drop semantics for attached basic blocks.
MemoryMap::Ptr memoryMap() const
Returns the memory map.
CrossReferences instructionCrossReferences(const AddressIntervalSet &restriction) const
Cross references.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction) const
Determine if an edge is inter-procedural.
std::vector< FunctionPtr > functionsContainedIn(const AddressInterval &) const
Returns functions that are fully contained in an address interval.
std::vector< FunctionPtr > discoverFunctionEntryVertices() const
Scans the CFG to find function entry basic blocks.
void allFunctionCallingConventionDefinition(const CallingConvention::Definition::Ptr &) const
Analyzes calling conventions and saves results.
SourceLocations & sourceLocations()
Property: Source locations.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge) const
Determine if an edge is inter-procedural.
AddressIntervalSet functionBasicBlockExtent(const FunctionPtr &function) const
Returns the addresses used by a function.
std::vector< FunctionPtr > functionsOwningBasicBlock(Address bblockVa, bool doSort=true) const
Finds functions that own the specified basic block.
const InstructionProvider & instructionProvider() const
Returns the instruction provider.
FunctionPaddingMatchers & functionPaddingMatchers()
Ordered list of function padding matchers.
Sawyer::Optional< bool > basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator &) const
Determine if part of the CFG can pop the top stack frame.
const BasePartitionerSettings & settings() const
Partitioner settings.
static std::string edgeNameSrc(const ControlFlowGraph::Edge &)
Name of an incoming edge.
ControlFlowGraph::ConstVertexIterator undiscoveredVertex() const
Returns the special "undiscovered" vertex.
std::string unparse(SgAsmInstruction *) const
Unparse some entity.
void updateProgress(const std::string &phase, double completion) const
Update partitioner with a new progress report.
CallingConvention::Dictionary functionCallingConventionDefinitions(const FunctionPtr &, const CallingConvention::Definition::Ptr &) const
Return list of matching calling conventions.
void allFunctionCallingConventionDefinition() const
Analyzes calling conventions and saves results.
AddressInterval dataBlockExtent(const DataBlockPtr &) const
Returns the addresses used by a data block.
static PartitionerPtr instanceFromRbaFile(const boost::filesystem::path &, SerialIo::Format=SerialIo::BINARY)
Construct a partitioner by loading it and an AST from a file.
InstructionSemantics::BaseSemantics::SValuePtr basicBlockStackDeltaIn(const BasicBlockPtr &, const FunctionPtr &function) const
Return the stack delta expression.
AddressUser instructionExists(SgAsmInstruction *insn) const
Determines whether an instruction is attached to the CFG/AUM.
Format
Format of the state file.
Definition SerialIo.h:102
Bidirectional mapping between addresses and source locations.
API and storage for attributes.
Definition Attribute.h:215
Container associating values with keys.
Definition Sawyer/Map.h:72
Holds a value or nothing.
Definition Optional.h:56
Creates SharedPointer from this.
Base class for reference counted objects.
Reference-counting intrusive smart pointer.
Represents the file header of an ELF binary container.
Contiguous region of a file.
Base class for machine instructions.
Represents an interpretation of a binary container.
std::shared_ptr< const Base > BaseConstPtr
Reference counted pointer for Architecture::Base.
std::vector< DefinitionPtr > Dictionary
An ordered collection of calling convention definitions.
boost::shared_ptr< RiscOperators > RiscOperatorsPtr
Shared-ownership pointer to a RISC operators object.
boost::shared_ptr< Dispatcher > DispatcherPtr
Shared-ownership pointer to a semantics instruction dispatcher.
std::vector< BasicBlockSuccessor > BasicBlockSuccessors
All successors in no particular order.
std::uint64_t Address
Address.
Definition Address.h:11
std::shared_ptr< SmtSolver > SmtSolverPtr
Reference counting pointer.
The ROSE library.
Represents information about a thunk.
Address target
The one and only successor for the basic block.
BasicBlockPtr bblock
The one and only basic block for the thunk.