ROSE 2.1.0
Loading...
Searching...
No Matches
Partitioner.h
1#ifndef ROSE_BinaryAnalysis_Partitioner2_Partitioner_H
2#define ROSE_BinaryAnalysis_Partitioner2_Partitioner_H
3#include <featureTests.h>
4#ifdef ROSE_ENABLE_BINARY_ANALYSIS
5#include <Rose/BinaryAnalysis/Partitioner2/BasicTypes.h>
6
7#include <Rose/BinaryAnalysis/Partitioner2/AddressUsageMap.h>
8#include <Rose/BinaryAnalysis/Partitioner2/Configuration.h>
9#include <Rose/BinaryAnalysis/Partitioner2/ControlFlowGraph.h>
10#include <Rose/BinaryAnalysis/Partitioner2/IndirectControlFlow.h>
11#include <Rose/BinaryAnalysis/Partitioner2/Semantics.h>
12
13#include <Rose/BinaryAnalysis/Architecture/BasicTypes.h>
14#include <Rose/BinaryAnalysis/InstructionProvider.h>
15#include <Rose/BinaryAnalysis/InstructionSemantics/SymbolicSemantics.h>
16#include <Rose/BinaryAnalysis/SerialIo.h>
17#include <Rose/BinaryAnalysis/SourceLocations.h>
18#include <Rose/BinaryAnalysis/Unparser/Settings.h>
19#include <Rose/Progress.h>
20
21#include <Sawyer/Attribute.h>
22#include <Sawyer/Callbacks.h>
23#include <Sawyer/IntervalSet.h>
24#include <Sawyer/Map.h>
25#include <Sawyer/Message.h>
26#include <Sawyer/Optional.h>
27#include <Sawyer/ProgressBar.h>
28#include <Sawyer/SharedObject.h>
29#include <Sawyer/SharedPointer.h>
30
31#include <boost/filesystem.hpp>
32#include <boost/format.hpp>
33#include <boost/move/utility_core.hpp>
34#ifdef ROSE_ENABLE_BOOST_SERIALIZATION
35#include <boost/serialization/access.hpp>
36#endif
37
38#ifdef ROSE_ENABLE_FLATBUFFERS
39#include <Rose/BinaryAnalysis/Serialization/FlatBuffers.h>
40#endif
41
42#include <ostream>
43#include <set>
44#include <string>
45#include <vector>
46
47namespace Rose {
48namespace BinaryAnalysis {
49namespace Partitioner2 {
50
263class ROSE_DLL_API Partitioner /*final*/
264 : public Sawyer::SharedObject, public Sawyer::SharedFromThis<Partitioner>, public Sawyer::Attribute::Storage<> {
265 BOOST_MOVABLE_BUT_NOT_COPYABLE(Partitioner)
266
267
269 //
270 // Types
271 //
274public:
282 // Callback list types
285 typedef std::vector<FunctionPrologueMatcherPtr> FunctionPrologueMatchers;
286 typedef std::vector<FunctionPaddingMatcherPtr> FunctionPaddingMatchers;
289 struct Thunk {
292 Thunk(const BasicBlockPtr&, Address target);
293 ~Thunk();
294 };
295
298
301 //
302 // Data members
303 //
306private:
307 friend class Rose::BinaryAnalysis::Serialization::FlatBuffers::Deserializer;
308
309 BasePartitionerSettings settings_; // settings adjustable from the command-line
310 Configuration config_; // configuration information about functions, blocks, etc.
311 Architecture::BaseConstPtr architecture_; // architecture information such as the ISA, word size, etc.
312 InstructionProvider::Ptr instructionProvider_; // cache for all disassembled instructions
313 MemoryMap::Ptr memoryMap_; // description of memory, especially insns and non-writable
314 SgAsmInterpretation *interpretation_ = nullptr; // Interpretation corresponding to the memory map
315 ControlFlowGraph cfg_; // basic blocks that will become part of the ROSE AST
316 CfgVertexIndex vertexIndex_; // Vertex-by-address index for the CFG
317 AddressUsageMap aum_; // How addresses are used for each address represented by the CFG
318 SmtSolverPtr solver_; // Satisfiable modulo theory solver used by semantic expressions
319 Functions functions_; // List of all attached functions by entry address
320 bool autoAddCallReturnEdges_ = false; // Add E_CALL_RETURN edges when blocks are attached to CFG?
321 bool assumeFunctionsReturn_ = true; // Assume that unproven functions return to caller?
322 size_t stackDeltaInterproceduralLimit_ = 1; // Max depth of call stack when computing stack deltas
323 AddressNameMap addressNames_; // Names for various addresses
324 SourceLocations sourceLocations_; // Mapping between source locations and addresses
325 SemanticMemoryParadigm semanticMemoryParadigm_ = LIST_BASED_MEMORY; // Slow and precise, or fast and imprecise?
326 Unparser::BasePtr unparser_; // For unparsing things to pseudo-assembly
327 Unparser::BasePtr insnUnparser_; // For unparsing single instructions in diagnostics
328 Unparser::BasePtr insnPlainUnparser_; // For unparsing just instruction mnemonic and operands
329 IndirectControlFlow::State icf_; // State for various indirect control flow recovery analyses
330
331 // Callback lists
332 CfgAdjustmentCallbacks cfgAdjustmentCallbacks_;
333 BasicBlockCallbacks basicBlockCallbacks_;
334 FunctionPrologueMatchers functionPrologueMatchers_;
335 FunctionPaddingMatchers functionPaddingMatchers_;
336
337 // Special CFG vertices.
338 ControlFlowGraph::VertexIterator undiscoveredVertex_;
339 ControlFlowGraph::VertexIterator indeterminateVertex_;
340 ControlFlowGraph::VertexIterator nonexistingVertex_;
341 static const size_t nSpecialVertices = 3;
342
343 // Optional cached information
344 Sawyer::Optional<Address> elfGotVa_; // address of ELF GOT, set by findElfGotVa
345
346 // Protects the following data members
347 mutable SAWYER_THREAD_TRAITS::Mutex mutex_;
348 Progress::Ptr progress_; // Progress reporter to update, or null
349 mutable size_t cfgProgressTotal_ = 0; // Expected total for the CFG progress bar; initialized at first report
350
353 //
354 // Serialization
355 //
358#ifdef ROSE_ENABLE_BOOST_SERIALIZATION
359private:
360 friend class boost::serialization::access;
361 template<class Archive> void serializeCommon(Archive&, unsigned);
362 template<class Archive> void save(Archive&, unsigned) const;
363 template<class Archive> void load(Archive&, unsigned);
364 BOOST_SERIALIZATION_SPLIT_MEMBER();
365#endif
366
367#ifdef ROSE_ENABLE_FLATBUFFERS
368private:
369 friend class Rose::BinaryAnalysis::Serialization::FlatBuffers::Deserializer;
370#endif
371
374 //
375 // Constructors
376 //
379private:
380 Partitioner(); // needed for Boost serialization
381
382 // Partitioner objects are reference counted and always allocated on the heap. Use the `instance` methods to construct
383 // these objects. Also, since the Partitioner class is final, we make the constructors private instead of the usual
384 // protected constructors elsewhere in ROSE.
387public:
388 ~Partitioner();
389
390public:
396
402
407 static PartitionerPtr instanceFromRbaFile(const boost::filesystem::path&, Serialization::Format = Serialization::BINARY);
408
410 void saveAsRbaFile(const boost::filesystem::path &name, Serialization::Format fmt) const;
411
413 Partitioner(BOOST_RV_REF(Partitioner));
414
417
425
427 void clear();
428
444
462
474
475
478 //
479 // Unparsing
480 //
483public:
512
517
526 std::string unparse(SgAsmInstruction*) const;
527 void unparse(std::ostream&, SgAsmInstruction*) const;
528 void unparse(std::ostream&, const BasicBlockPtr&) const;
529 void unparse(std::ostream&, const DataBlockPtr&) const;
530 void unparse(std::ostream&, const FunctionPtr&) const;
531 void unparse(std::ostream&) const;
537 std::string unparsePlain(SgAsmInstruction*) const;
538
541 //
542 // Partitioner CFG queries
543 //
546public:
552 size_t nBytes() const;
553
561 ControlFlowGraph::VertexIterator undiscoveredVertex();
562 ControlFlowGraph::ConstVertexIterator undiscoveredVertex() const;
575 ControlFlowGraph::VertexIterator indeterminateVertex();
576 ControlFlowGraph::ConstVertexIterator indeterminateVertex() const;
588 ControlFlowGraph::VertexIterator nonexistingVertex();
589 ControlFlowGraph::ConstVertexIterator nonexistingVertex() const;
598 const ControlFlowGraph& cfg() const;
599
606 const AddressUsageMap& aum() const;
607
610
615 std::vector<AddressUser> users(Address) const;
616
624 std::set<Address> ghostSuccessors() const;
625
654 bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr&) const;
655 bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr&) const;
656 bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge) const;
657 bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge) const;
694 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge) const;
695 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction) const;
696 bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction,
697 const FunctionPtr &targetFunction) const;
698
699 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge) const;
700 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction) const;
701 bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction,
702 const FunctionPtr &targetFunction) const;
709 //
710 // Partitioner instruction operations
711 //
714public:
720 size_t nInstructions() const;
721
741 ControlFlowGraph::ConstVertexIterator instructionVertex(Address insnVa) const;
742
751 std::vector<SgAsmInstruction*> instructionsOverlapping(const AddressInterval&) const;
752
761 std::vector<SgAsmInstruction*> instructionsSpanning(const AddressInterval&) const;
762
772 std::vector<SgAsmInstruction*> instructionsContainedIn(const AddressInterval&) const;
773
782
796
802
803
804
807 //
808 // Partitioner basic block placeholder operations
809 //
812public:
822 size_t nPlaceholders() const;
823
832 bool placeholderExists(Address startVa) const;
833
844 ControlFlowGraph::VertexIterator findPlaceholder(Address startVa);
845 ControlFlowGraph::ConstVertexIterator findPlaceholder(Address startVa) const;
864 ControlFlowGraph::VertexIterator insertPlaceholder(Address startVa);
865
879 BasicBlockPtr erasePlaceholder(const ControlFlowGraph::ConstVertexIterator &placeholder) /*final*/;
887 //
888 // Partitioner basic block operations
889 //
892public:
919
928 size_t nBasicBlocks() const;
929
937 std::vector<BasicBlockPtr> basicBlocks() const;
938
973 std::vector<BasicBlockPtr> basicBlocksOverlapping(const AddressInterval&) const;
974
985 std::vector<BasicBlockPtr> basicBlocksSpanning(const AddressInterval&) const;
986
996 std::vector<BasicBlockPtr> basicBlocksContainedIn(const AddressInterval&) const;
997
1005
1016
1023
1050 BasicBlockPtr detachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder);
1064 ControlFlowGraph::VertexIterator truncateBasicBlock(const ControlFlowGraph::ConstVertexIterator &basicBlock,
1065 SgAsmInstruction *insn);
1066
1100 void attachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder, const BasicBlockPtr&);
1189 BasicBlockPtr discoverBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder) const;
1207
1216 std::vector<Address> basicBlockConcreteSuccessors(const BasicBlockPtr&, bool *isComplete=NULL) const;
1217
1236 std::set<Address> basicBlockGhostSuccessors(const BasicBlockPtr&) const;
1237
1247 bool basicBlockIsFunctionCall(const BasicBlockPtr&, Precision::Level precision = Precision::HIGH) const;
1248
1260
1266
1308 basicBlockStackDeltaIn(const BasicBlockPtr&, const FunctionPtr &function) const;
1309
1311 basicBlockStackDeltaOut(const BasicBlockPtr&, const FunctionPtr &function) const;
1322 void forgetStackDeltas() const;
1323 void forgetStackDeltas(const FunctionPtr&) const;
1390 Sawyer::Optional<bool> basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator&) const;
1400
1401private:
1402 // Per-vertex data used during may-return analysis
1403 struct MayReturnVertexInfo {
1404 enum State {INIT, CALCULATING, FINISHED};
1405 State state; // current state of vertex
1406 bool processedCallees; // have we processed BBs this vertex calls?
1407 boost::logic::tribool anyCalleesReturn; // do any of those called BBs have a true may-return value?
1408 boost::logic::tribool result; // final result (eventually cached in BB)
1409 MayReturnVertexInfo(): state(INIT), processedCallees(false), anyCalleesReturn(false), result(boost::indeterminate) {}
1410 };
1411
1412 // Is edge significant for analysis? See .C file for full documentation.
1413 bool mayReturnIsSignificantEdge(const ControlFlowGraph::ConstEdgeIterator &edge,
1414 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1415
1416 // Determine (and cache in vertexInfo) whether any callees return.
1417 boost::logic::tribool mayReturnDoesCalleeReturn(const ControlFlowGraph::ConstVertexIterator &vertex,
1418 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1419
1420 // Maximum may-return result from significant successors including phantom call-return edge.
1421 boost::logic::tribool mayReturnDoesSuccessorReturn(const ControlFlowGraph::ConstVertexIterator &vertex,
1422 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1423
1424 // The guts of the may-return analysis
1425 Sawyer::Optional<bool> basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator &start,
1426 std::vector<MayReturnVertexInfo> &vertexInfo) const;
1427
1428
1429
1432 //
1433 // Partitioner data block operations
1434 //
1437public:
1443 size_t nDataBlocks() const;
1444
1452
1462
1475
1483
1494
1508
1518 std::vector<DataBlockPtr> dataBlocksOverlapping(const AddressInterval&) const;
1519
1529 std::vector<DataBlockPtr> dataBlocksSpanning(const AddressInterval&) const;
1530
1540 std::vector<DataBlockPtr> dataBlocksContainedIn(const AddressInterval&) const;
1541
1549
1555 std::vector<DataBlockPtr> dataBlocks() const;
1556
1557
1558
1561 //
1562 // Partitioner function operations
1563 //
1566public:
1572 size_t nFunctions() const;
1573
1593 FunctionPtr functionExists(const BasicBlockPtr &entryBlock) const;
1602 std::vector<FunctionPtr> functions() const;
1603
1613 std::vector<FunctionPtr> functionsOverlapping(const AddressInterval&) const;
1614
1625 std::vector<FunctionPtr> functionsSpanning(const AddressInterval&) const;
1626
1636 std::vector<FunctionPtr> functionsContainedIn(const AddressInterval&) const;
1637
1655 void functionExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1657 void functionBasicBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1659 void functionDataBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval /*in,out*/) const;
1699
1734
1740 std::vector<Function::Ptr> entryFunctions();
1741
1776 std::vector<FunctionPtr>
1777 functionsOwningBasicBlock(const ControlFlowGraph::Vertex&, bool doSort = true) const;
1778
1779 std::vector<FunctionPtr>
1780 functionsOwningBasicBlock(const ControlFlowGraph::ConstVertexIterator&, bool doSort = true) const;
1781
1782 std::vector<FunctionPtr>
1783 functionsOwningBasicBlock(Address bblockVa, bool doSort = true) const;
1784
1785 std::vector<FunctionPtr>
1786 functionsOwningBasicBlock(const BasicBlockPtr&, bool doSort = true) const;
1787
1788 template<class Container> // container can hold any type accepted by functionsOwningBasicBlock
1789 std::vector<FunctionPtr>
1790 functionsOwningBasicBlocks(const Container &bblocks) const {
1791 std::vector<FunctionPtr> retval;
1792 for (const typename Container::value_type& bblock: bblocks) {
1793 for (const FunctionPtr &function: functionsOwningBasicBlock(bblock, false))
1794 insertUnique(retval, function, sortFunctionsByAddress);
1795 }
1796 return retval;
1797 }
1809 std::vector<FunctionPtr> discoverCalledFunctions() const;
1810
1822 std::vector<FunctionPtr> discoverFunctionEntryVertices() const;
1823
1834
1845 void discoverFunctionBasicBlocks(const FunctionPtr &function) const;
1846
1853 std::set<Address> functionGhostSuccessors(const FunctionPtr&) const;
1854
1863
1884
1889
1897
1902
1938 const CallingConvention::Definition::Ptr &dflt) const;
1957
2019 void fixInterFunctionEdge(const ControlFlowGraph::ConstEdgeIterator&);
2038 bool functionIsNoop(const FunctionPtr&) const;
2039
2045 void allFunctionIsNoop() const;
2046
2062 std::set<Address> functionDataFlowConstants(const FunctionPtr&) const;
2063
2064
2065
2068 //
2069 // Callbacks
2070 //
2073public:
2107public:
2143 std::vector<FunctionPtr> nextFunctionPrologue(Address startVa);
2144 std::vector<FunctionPtr> nextFunctionPrologue(Address startVa, Address &lastSearchedVa /*out*/);
2147public:
2165
2166
2167
2170 //
2171 // Partitioner miscellaneous
2172 //
2175public:
2187 void dumpCfg(std::ostream&, const std::string &prefix="", bool showBlocks=true, bool computeProperties=true) const;
2188
2202 void cfgGraphViz(std::ostream&, const AddressInterval &restrict = AddressInterval::whole(), bool showNeighbors=true) const;
2203
2209 static std::string vertexName(const ControlFlowGraph::Vertex&);
2210 std::string vertexName(const ControlFlowGraph::ConstVertexIterator&) const;
2216 static std::string vertexNameEnd(const ControlFlowGraph::Vertex&);
2217
2223 static std::string edgeNameSrc(const ControlFlowGraph::Edge&);
2224 std::string edgeNameSrc(const ControlFlowGraph::ConstEdgeIterator&) const;
2232 static std::string edgeNameDst(const ControlFlowGraph::Edge&);
2233 std::string edgeNameDst(const ControlFlowGraph::ConstEdgeIterator&) const;
2241 static std::string edgeName(const ControlFlowGraph::Edge&);
2242 std::string edgeName(const ControlFlowGraph::ConstEdgeIterator&) const;
2248 static std::string basicBlockName(const BasicBlockPtr&);
2249
2253 static std::string dataBlockName(const DataBlockPtr&);
2254
2258 static std::string functionName(const FunctionPtr&);
2259
2265
2291 void updateProgress(const std::string &phase, double completion) const;
2292
2294 void showStatistics() const;
2295
2296 // Checks consistency of internal data structures when debugging is enable (when NDEBUG is not defined).
2297 void checkConsistency() const;
2298
2305
2310
2321 //
2322 // Settings
2323 //
2326public:
2327
2347 void enableSymbolicSemantics(bool = true);
2404 void addressName(Address, const std::string&);
2405 const std::string& addressName(Address) const;
2434 //
2435 // Instruction semantics
2436 //
2439public:
2460
2484
2485
2486
2489 //
2490 // Python API support functions
2491 //
2494#ifdef ROSE_ENABLE_PYTHON_API
2495 void pythonUnparse() const;
2496#endif
2497
2498
2499
2502 //
2503 // Partitioner internal utilities
2504 //
2507private:
2508 void init(const MemoryMap::Ptr&);
2509 void init(const Partitioner&);
2510 void updateCfgProgress();
2511
2512private:
2513 // Convert a CFG vertex iterator from one partitioner to another. This is called during copy construction when the source
2514 // and destination CFGs are identical.
2515 ControlFlowGraph::VertexIterator convertFrom(const Partitioner &other,
2516 ControlFlowGraph::ConstVertexIterator otherIter);
2517
2518 // Adjusts edges for a placeholder vertex. This method erases all outgoing edges for the specified placeholder vertex and
2519 // then inserts a single edge from the placeholder to the special "undiscovered" vertex. */
2520 ControlFlowGraph::EdgeIterator adjustPlaceholderEdges(const ControlFlowGraph::VertexIterator &placeholder);
2521
2522 // Adjusts edges for a non-existing basic block. This method erases all outgoing edges for the specified vertex and
2523 // then inserts a single edge from the vertex to the special "non-existing" vertex. */
2524 ControlFlowGraph::EdgeIterator adjustNonexistingEdges(const ControlFlowGraph::VertexIterator &vertex);
2525
2526 // Implementation for the discoverBasicBlock methods. The startVa must not be the address of an existing placeholder.
2527 BasicBlockPtr discoverBasicBlockInternal(Address startVa) const;
2528
2529 // This method is called whenever a new placeholder is inserted into the CFG or a new basic block is attached to the
2530 // CFG/AUM. The call happens immediately after the CFG/AUM are updated.
2531 void bblockAttached(const ControlFlowGraph::VertexIterator &newVertex);
2532
2533 // This method is called whenever a basic block is detached from the CFG/AUM or when a placeholder is erased from the CFG.
2534 // The call happens immediately after the CFG/AUM are updated.
2535 void bblockDetached(Address startVa, const BasicBlockPtr &removedBlock);
2536
2537 // Rebuild the vertexIndex_ and other cache-like data members from the control flow graph
2538 void rebuildVertexIndices();
2539};
2540
2541} // namespace
2542} // namespace
2543} // namespace
2544
2545#endif
2546#endif
Provides and caches instructions.
Partitions instructions into basic blocks and functions.
AddressIntervalSet basicBlockInstructionExtent(const BasicBlockPtr &) const
Returns the addresses used by basic block instructions.
Sawyer::Callbacks< CfgAdjustmentCallback::Ptr > CfgAdjustmentCallbacks
See cfgAdjustmentCallbacks.
const Configuration & configuration() const
Property: Configuration information.
ControlFlowGraph::VertexIterator nonexistingVertex()
Returns the special "non-existing" vertex.
ControlFlowGraph::ConstVertexIterator nonexistingVertex() const
Returns the special "non-existing" vertex.
static std::string dataBlockName(const DataBlockPtr &)
Name of a data block.
bool basicBlockIsFunctionReturn(const BasicBlockPtr &) const
Determine if a basic block looks like a function return.
std::vector< Function::Ptr > entryFunctions()
Entry points of the binary.
std::vector< BasicBlockPtr > basicBlocksContainedIn(const AddressInterval &) const
Returns basic blocks that are fully contained in an address interval.
FunctionPrologueMatchers & functionPrologueMatchers()
Ordered list of function prologue matchers.
void addressName(Address, const std::string &)
Property: Name for address.
ControlFlowGraph::VertexIterator undiscoveredVertex()
Returns the special "undiscovered" vertex.
void basicBlockDropSemantics() const
Immediately drop semantic information for all attached basic blocks.
size_t nDataBlocks() const
Returns the number of data blocks attached to the CFG/AUM.
ControlFlowGraph::ConstVertexIterator indeterminateVertex() const
Returns the special "indeterminate" vertex.
void allFunctionCallingConvention() const
Compute calling conventions for all functions.
InstructionSemantics::BaseSemantics::SValuePtr functionStackDelta(const FunctionPtr &function) const
Stack delta analysis for one function.
void interpretation(SgAsmInterpretation *)
Property: Interpretation corresponding to the memory map.
BasicBlockPtr erasePlaceholder(Address startVa)
Remove a basic block placeholder from the CFG/AUM.
Unparser::BasePtr unparser() const
Returns an unparser.
void forgetFunctionIsNoop() const
Clears cached function no-op analysis results.
CfgAdjustmentCallbacks & cfgAdjustmentCallbacks()
List of all callbacks invoked when the CFG is adjusted.
Sawyer::Optional< bool > functionOptionalMayReturn(const FunctionPtr &function) const
May-return analysis for one function.
std::vector< SgAsmInstruction * > instructionsContainedIn(const AddressInterval &) const
Returns instructions that are fully contained in an address interval.
Sawyer::Optional< bool > basicBlockOptionalMayReturn(const BasicBlockPtr &) const
Determine if part of the CFG can pop the top stack frame.
BasicBlockSuccessors basicBlockSuccessors(const BasicBlockPtr &, Precision::Level precision=Precision::HIGH) const
Determine successors for a basic block.
std::vector< DataBlockPtr > dataBlocksContainedIn(const AddressInterval &) const
Returns data blocks that are fully contained in an address interval.
SemanticMemoryParadigm semanticMemoryParadigm() const
Property: Whether to use map- or list-based memory states.
void allFunctionCallingConvention(const CallingConvention::Definition::Ptr &dflt) const
Compute calling conventions for all functions.
FunctionCallGraph functionCallGraph(AllowParallelEdges::Type allowParallelEdges) const
Returns a function call graph.
size_t stackDeltaInterproceduralLimit() const
Property: max depth for inter-procedural stack delta analysis.
void stackDeltaInterproceduralLimit(size_t)
Property: max depth for inter-procedural stack delta analysis.
ControlFlowGraph::VertexIterator insertPlaceholder(Address startVa)
Insert a basic-block placeholder.
FunctionPtr functionExists(const FunctionPtr &function) const
Determines whether a function exists in the CFG/AUM.
void forgetStackDeltas(const FunctionPtr &) const
Clears all cached stack deltas.
void unparse(std::ostream &, const DataBlockPtr &) const
Unparse some entity.
std::vector< FunctionPtr > functionsOverlapping(const AddressInterval &) const
Returns functions that overlap with specified address interval.
DataBlockPtr matchFunctionPadding(const FunctionPtr &)
Finds function padding.
void configureInsnPlainUnparser(const Unparser::BasePtr &) const
Configure plain single-instruction unparser.
SgAsmInstruction * discoverInstruction(Address startVa) const
Discover an instruction.
bool functionIsNoop(const FunctionPtr &) const
Function no-op analysis.
void fixInterFunctionEdge(const ControlFlowGraph::ConstEdgeIterator &)
Adjust inter-function edge types.
ControlFlowGraph::VertexIterator truncateBasicBlock(const ControlFlowGraph::ConstVertexIterator &basicBlock, SgAsmInstruction *insn)
Truncate an attached basic-block.
Sawyer::Optional< Thunk > functionIsThunk(const FunctionPtr &) const
True if function is a thunk.
size_t attachFunctionBasicBlocks(const Functions &)
Create placeholders for function basic blocks.
const ControlFlowGraph & cfg() const
Returns the control flow graph.
const CallingConvention::Analysis & functionCallingConvention(const FunctionPtr &, const CallingConvention::Definition::Ptr &dflt) const
Calling convention analysis for one function.
const SourceLocations & sourceLocations() const
Property: Source locations.
Partitioner & operator=(BOOST_RV_REF(Partitioner))
Move assignment.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge) const
Determine if an edge is inter-procedural.
void checkingCallBranch(bool)
Property: Whether to look for function calls used as branches.
std::vector< BasicBlockPtr > basicBlocksSpanning(const AddressInterval &) const
Returns basic blocks that span an entire address interval.
Configuration & configuration()
Property: Configuration information.
AddressUsageMap aum(const FunctionPtr &) const
Returns the address usage map for a single function.
std::vector< FunctionPaddingMatcherPtr > FunctionPaddingMatchers
See functionPaddingMatchers.
SgAsmGenericSection * elfGot(SgAsmElfFileHeader *)
Find the ELF global offset table and save its address.
std::vector< Address > basicBlockConcreteSuccessors(const BasicBlockPtr &, bool *isComplete=NULL) const
Determines concrete successors for a basic block.
std::vector< DataBlockPtr > dataBlocksSpanning(const AddressInterval &) const
Returns data blocks that span an entire address interval.
DataBlockPtr findBestDataBlock(const AddressInterval &) const
Find an existing data block.
void forgetStackDeltas() const
Clears all cached stack deltas.
void allFunctionStackDelta() const
Compute stack delta analysis for all functions.
bool assumeFunctionsReturn() const
Property: Assume (or not) that function calls return.
static std::string basicBlockName(const BasicBlockPtr &)
Name of a basic block.
void unparse(std::ostream &, const BasicBlockPtr &) const
Unparse some entity.
FunctionPtr functionExists(Address entryVa) const
Determines whether a function exists in the CFG/AUM.
AddressIntervalSet basicBlockDataExtent(const BasicBlockPtr &) const
Returns the addresses used by basic block data.
size_t nPlaceholders() const
Returns the number of basic basic block placeholders in the CFG.
AddressIntervalSet functionExtent(const FunctionPtr &) const
Returns the addresses used by a function.
std::vector< BasicBlockPtr > basicBlocks() const
Returns all basic blocks attached to the CFG.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction) const
Determine if an edge is inter-procedural.
size_t nFunctions() const
Returns the number of functions attached to the CFG/AUM.
std::vector< FunctionPtr > discoverCalledFunctions() const
Scans the CFG to find function calls.
bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge) const
Determine if an edge is intra-procedural.
BasicBlockPtr basicBlockExists(const BasicBlockPtr &) const
Determines whether a discovered basic block exists in the CFG/AUM.
void settings(const BasePartitionerSettings &)
Partitioner settings.
std::set< Address > ghostSuccessors() const
Determine all ghost successors in the control flow graph.
bool autoAddCallReturnEdges() const
Property: Insert (or not) function call return edges.
Architecture::BaseConstPtr architecture() const
Property: Architecture information.
void unparse(std::ostream &, SgAsmInstruction *) const
Unparse some entity.
std::set< Address > functionGhostSuccessors(const FunctionPtr &) const
Returns ghost successors for a single function.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &sourceFunction, const FunctionPtr &targetFunction) const
Determine if an edge is inter-procedural.
std::string edgeName(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an edge.
void unparse(std::ostream &, const FunctionPtr &) const
Unparse some entity.
ControlFlowGraph::VertexIterator indeterminateVertex()
Returns the special "indeterminate" vertex.
bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge, const FunctionPtr &) const
Determine if an edge is intra-procedural.
ControlFlowGraph::ConstVertexIterator instructionVertex(Address insnVa) const
Returns the CFG vertex containing specified instruction.
size_t nBytes() const
Returns the number of bytes represented by the CFG.
BasicBlockPtr basicBlockContainingInstruction(Address insnVa) const
Returns the basic block that contains a specific instruction address.
bool basicBlockIsFunctionCall(const BasicBlockPtr &, Precision::Level precision=Precision::HIGH) const
Determine if a basic block looks like a function call.
void attachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder, const BasicBlockPtr &)
Attach a basic block to the CFG/AUM.
InstructionSemantics::BaseSemantics::RiscOperatorsPtr newOperators(SemanticMemoryParadigm) const
Obtain new RiscOperators.
void basicBlockMayReturnReset() const
Clear all may-return properties.
BasicBlockPtr detachBasicBlock(Address startVa)
Detach a basic block from the CFG/AUM.
const std::string & addressName(Address) const
Property: Name for address.
void discoverFunctionBasicBlocks(const FunctionPtr &function) const
Adds basic blocks to a function.
IndirectControlFlow::State & icf()
Internal data structures for indirect control flow recovery.
const CallingConvention::Analysis & functionCallingConvention(const FunctionPtr &) const
Calling convention analysis for one function.
bool usingSymbolicSemantics() const
Use or not use symbolic semantics.
std::vector< FunctionPtr > functionsOwningBasicBlocks(const Container &bblocks) const
Finds functions that own the specified basic block.
bool checkingCallBranch() const
Property: Whether to look for function calls used as branches.
void cfgGraphViz(std::ostream &, const AddressInterval &restrict=AddressInterval::whole(), bool showNeighbors=true) const
Output CFG as GraphViz.
const BasicBlockCallbacks & basicBlockCallbacks() const
Callbacks for adjusting basic block during discovery.
std::vector< SgAsmInstruction * > instructionsSpanning(const AddressInterval &) const
Returns instructions that span an entire address interval.
AddressUser instructionExists(Address startVa) const
Determines whether an instruction is attached to the CFG/AUM.
ControlFlowGraph::VertexIterator findPlaceholder(Address startVa)
Find the CFG vertex for a basic block placeholder.
static std::string functionName(const FunctionPtr &)
Name of a function.
std::vector< FunctionPtr > functionsOwningBasicBlock(const BasicBlockPtr &, bool doSort=true) const
Finds functions that own the specified basic block.
void expandIndeterminateCalls()
Expands indeterminate function calls.
BasicBlockPtr discoverBasicBlock(Address startVa) const
Discover instructions for a detached basic block.
void unparse(std::ostream &) const
Unparse some entity.
bool isEdgeIntraProcedural(const ControlFlowGraph::Edge &edge) const
Determine if an edge is intra-procedural.
DataBlockPtr attachDataBlock(const DataBlockPtr &)
Attach a data block to the CFG/AUM.
size_t attachFunctionBasicBlocks(const FunctionPtr &)
Create placeholders for function basic blocks.
void dumpCfg(std::ostream &, const std::string &prefix="", bool showBlocks=true, bool computeProperties=true) const
Output the control flow graph.
InstructionSemantics::BaseSemantics::RiscOperatorsPtr newOperators() const
Obtain new RiscOperators.
void assumeFunctionsReturn(bool)
Property: Assume (or not) that function calls return.
DataBlockPtr dataBlockExists(const DataBlockPtr &) const
Determine if a data block or its equivalent is attached to the CFG/AUM.
DataBlockPtr attachDataBlockToBasicBlock(const DataBlockPtr &, const BasicBlockPtr &)
Attach a data block to a basic block.
bool basicBlockSemanticsAutoDrop() const
Property: Automatically drop semantics for attached basic blocks.
std::vector< AddressUser > users(Address) const
Entities that exist at a particular address.
std::vector< DataBlockPtr > dataBlocksOverlapping(const AddressInterval &) const
Returns data blocks that overlap with specified address interval.
Partitioner(BOOST_RV_REF(Partitioner))
Move constructor.
BasicBlockPtr detachBasicBlock(const BasicBlockPtr &basicBlock)
Detach a basic block from the CFG/AUM.
std::vector< FunctionPtr > nextFunctionPrologue(Address startVa)
Finds the next function by searching for a function prologue.
InstructionSemantics::BaseSemantics::DispatcherPtr newDispatcher(const InstructionSemantics::BaseSemantics::RiscOperatorsPtr &) const
Obtain a new instruction semantics dispatcher.
std::vector< BasicBlockPtr > basicBlocksOverlapping(const AddressInterval &) const
Returns basic blocks that overlap with specified address interval.
void attachBasicBlock(const BasicBlockPtr &)
Attach a basic block to the CFG/AUM.
SgAsmInterpretation * interpretation() const
Property: Interpretation corresponding to the memory map.
std::string unparsePlain(SgAsmInstruction *) const
Unparse an instruction in a plain way.
Progress::Ptr progress() const
Property: How to report progress.
void detachFunction(const FunctionPtr &)
Detaches a function from the CFG/AUM.
static std::string vertexNameEnd(const ControlFlowGraph::Vertex &)
Name of last instruction in vertex.
void insnUnparser(const Unparser::BasePtr &)
Returns an unparser.
bool addressIsExecutable(Address) const
Returns true if address is executable.
void detachDataBlock(const DataBlockPtr &)
Detaches a data block from the CFG/AUM.
std::string vertexName(const ControlFlowGraph::ConstVertexIterator &) const
Name of a vertex.
void showStatistics() const
Print some partitioner performance statistics.
static Ptr instance(const Architecture::BaseConstPtr &)
Default allocating constructor.
void disableSymbolicSemantics()
Use or not use symbolic semantics.
const AddressUsageMap & aum() const
Returns the address usage map.
const IndirectControlFlow::State & icf() const
Internal data structures for indirect control flow recovery.
std::set< Address > basicBlockGhostSuccessors(const BasicBlockPtr &) const
Determine ghost successors for a basic block.
std::vector< FunctionPtr > functions() const
All functions attached to the CFG/AUM.
BasicBlockPtr erasePlaceholder(const ControlFlowGraph::ConstVertexIterator &placeholder)
Remove a basic block placeholder from the CFG/AUM.
void progress(const Progress::Ptr &)
Property: How to report progress.
std::vector< FunctionPtr > functionsSpanning(const AddressInterval &) const
Returns functions that span an entire address interval.
std::vector< SgAsmInstruction * > instructionsOverlapping(const AddressInterval &) const
Returns instructions that overlap with specified address interval.
void enableSymbolicSemantics(bool=true)
Use or not use symbolic semantics.
ControlFlowGraph::ConstVertexIterator findPlaceholder(Address startVa) const
Find the CFG vertex for a basic block placeholder.
const FunctionPrologueMatchers & functionPrologueMatchers() const
Ordered list of function prologue matchers.
Sawyer::Optional< Address > elfGotVa() const
Returns a previously cached ELF GOT address.
Sawyer::Container::Map< Address, std::string > AddressNameMap
Map address to name.
size_t nInstructions() const
Returns the number of instructions attached to the CFG/AUM.
void unparser(const Unparser::BasePtr &)
Returns an unparser.
static Ptr instance(const Architecture::BaseConstPtr &, const MemoryMap::Ptr &)
Construct a partitioner.
void autoAddCallReturnEdges(bool)
Property: Insert (or not) function call return edges.
InstructionSemantics::BaseSemantics::SValuePtr basicBlockStackDeltaOut(const BasicBlockPtr &, const FunctionPtr &function) const
Return the stack delta expression.
void clear()
Reset CFG/AUM to initial state.
BasicBlockPtr discoverBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder) const
Discover instructions for a detached basic block.
std::vector< FunctionPtr > nextFunctionPrologue(Address startVa, Address &lastSearchedVa)
Finds the next function by searching for a function prologue.
bool isDefaultConstructed() const
Return true if this is a default constructed partitioner.
void allFunctionMayReturn() const
Compute may-return analysis for all functions.
std::vector< FunctionPrologueMatcherPtr > FunctionPrologueMatchers
See functionPrologueMatchers.
Unparser::BasePtr insnUnparser() const
Returns an unparser.
SmtSolverPtr smtSolver() const
SMT solver.
std::vector< FunctionPtr > functionsOwningBasicBlock(const ControlFlowGraph::Vertex &, bool doSort=true) const
Finds functions that own the specified basic block.
bool isEdgeIntraProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &) const
Determine if an edge is intra-procedural.
FunctionPtr attachOrMergeFunction(const FunctionPtr &)
Attaches or merges a function into the CFG/AUM.
DataBlockPtr attachDataBlockToFunction(const DataBlockPtr &, const FunctionPtr &)
Attach a data block to an attached or detached function.
BasicBlockPtr basicBlockExists(Address startVa) const
Determines whether a discovered basic block exists in the CFG/AUM.
size_t attachFunctions(const Functions &)
Attaches a function to the CFG/AUM.
BasicBlockPtr detachBasicBlock(const ControlFlowGraph::ConstVertexIterator &placeholder)
Detach a basic block from the CFG/AUM.
std::set< Address > functionDataFlowConstants(const FunctionPtr &) const
Find constants in function using data-flow.
void functionBasicBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
size_t nBasicBlocks() const
Returns the number of basic blocks attached to the CFG/AUM.
const AddressNameMap & addressNames() const
Property: Name for address.
std::string edgeNameDst(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an outgoing edge.
void configureInsnUnparser(const Unparser::BasePtr &) const
Configure the single-instruction unparser.
CallingConvention::Dictionary functionCallingConventionDefinitions(const FunctionPtr &) const
Return list of matching calling conventions.
bool basicBlockPopsStack(const BasicBlockPtr &) const
Determine if the basic block pops at least one byte from the stack.
std::vector< FunctionPtr > functionsOwningBasicBlock(const ControlFlowGraph::ConstVertexIterator &, bool doSort=true) const
Finds functions that own the specified basic block.
void fixInterFunctionEdges()
Adjust inter-function edge types.
void allFunctionIsNoop() const
Analyze all functions for whether they are effectivly no-ops.
std::vector< DataBlockPtr > dataBlocks() const
Returns the list of all attached data blocks.
void functionDataBlockExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction, const FunctionPtr &targetFunction) const
Determine if an edge is inter-procedural.
bool placeholderExists(Address startVa) const
Determines whether a basic block placeholder exists in the CFG.
const FunctionPaddingMatchers & functionPaddingMatchers() const
Ordered list of function padding matchers.
static PartitionerPtr instanceFromRbaFile(const boost::filesystem::path &, Serialization::Format=Serialization::BINARY)
Construct a partitioner by loading it and an AST from a file.
std::string edgeNameSrc(const ControlFlowGraph::ConstEdgeIterator &) const
Name of an incoming edge.
static std::string vertexName(const ControlFlowGraph::Vertex &)
Name of a vertex.
void semanticMemoryParadigm(SemanticMemoryParadigm)
Property: Whether to use map- or list-based memory states.
BasicBlockCallbacks & basicBlockCallbacks()
Callbacks for adjusting basic block during discovery.
FunctionPtr functionExists(const BasicBlockPtr &entryBlock) const
Determines whether a function exists in the CFG/AUM.
AddressIntervalSet functionDataBlockExtent(const FunctionPtr &function) const
Returns the addresses used by a function.
InstructionProvider & instructionProvider()
Returns the instruction provider.
Sawyer::Callbacks< BasicBlockCallbackPtr > BasicBlockCallbacks
See basicBlockCallbacks.
void sourceLocations(const SourceLocations &)
Property: Source locations.
size_t attachFunction(const FunctionPtr &)
Attaches a function to the CFG/AUM.
void forgetFunctionIsNoop(const FunctionPtr &) const
Clears cached function no-op analysis results.
static std::string edgeName(const ControlFlowGraph::Edge &)
Name of an edge.
static std::string edgeNameDst(const ControlFlowGraph::Edge &)
Name of an outgoing edge.
const CfgAdjustmentCallbacks & cfgAdjustmentCallbacks() const
List of all callbacks invoked when the CFG is adjusted.
void functionExtent(const FunctionPtr &function, AddressIntervalSet &retval) const
Returns the addresses used by a function.
AddressInterval instructionExtent(SgAsmInstruction *) const
Returns the address interval for an instruction.
void basicBlockSemanticsAutoDrop(bool)
Property: Automatically drop semantics for attached basic blocks.
MemoryMap::Ptr memoryMap() const
Returns the memory map.
CrossReferences instructionCrossReferences(const AddressIntervalSet &restriction) const
Cross references.
bool isEdgeInterProcedural(ControlFlowGraph::ConstEdgeIterator edge, const FunctionPtr &sourceFunction) const
Determine if an edge is inter-procedural.
std::vector< FunctionPtr > functionsContainedIn(const AddressInterval &) const
Returns functions that are fully contained in an address interval.
std::vector< FunctionPtr > discoverFunctionEntryVertices() const
Scans the CFG to find function entry basic blocks.
void allFunctionCallingConventionDefinition(const CallingConvention::Definition::Ptr &) const
Analyzes calling conventions and saves results.
SourceLocations & sourceLocations()
Property: Source locations.
bool isEdgeInterProcedural(const ControlFlowGraph::Edge &edge) const
Determine if an edge is inter-procedural.
AddressIntervalSet functionBasicBlockExtent(const FunctionPtr &function) const
Returns the addresses used by a function.
std::vector< FunctionPtr > functionsOwningBasicBlock(Address bblockVa, bool doSort=true) const
Finds functions that own the specified basic block.
const InstructionProvider & instructionProvider() const
Returns the instruction provider.
FunctionPaddingMatchers & functionPaddingMatchers()
Ordered list of function padding matchers.
Sawyer::Optional< bool > basicBlockOptionalMayReturn(const ControlFlowGraph::ConstVertexIterator &) const
Determine if part of the CFG can pop the top stack frame.
const BasePartitionerSettings & settings() const
Partitioner settings.
static std::string edgeNameSrc(const ControlFlowGraph::Edge &)
Name of an incoming edge.
void saveAsRbaFile(const boost::filesystem::path &name, Serialization::Format fmt) const
Save this partitioner as an RBA file.
ControlFlowGraph::ConstVertexIterator undiscoveredVertex() const
Returns the special "undiscovered" vertex.
std::string unparse(SgAsmInstruction *) const
Unparse some entity.
void updateProgress(const std::string &phase, double completion) const
Update partitioner with a new progress report.
CallingConvention::Dictionary functionCallingConventionDefinitions(const FunctionPtr &, const CallingConvention::Definition::Ptr &) const
Return list of matching calling conventions.
void allFunctionCallingConventionDefinition() const
Analyzes calling conventions and saves results.
AddressInterval dataBlockExtent(const DataBlockPtr &) const
Returns the addresses used by a data block.
InstructionSemantics::BaseSemantics::SValuePtr basicBlockStackDeltaIn(const BasicBlockPtr &, const FunctionPtr &function) const
Return the stack delta expression.
AddressUser instructionExists(SgAsmInstruction *insn) const
Determines whether an instruction is attached to the CFG/AUM.
Bidirectional mapping between addresses and source locations.
API and storage for attributes.
Definition Attribute.h:215
Container associating values with keys.
Definition Sawyer/Map.h:72
Holds a value or nothing.
Definition Optional.h:54
Creates SharedPointer from this.
Base class for reference counted objects.
Reference-counting intrusive smart pointer.
Represents the file header of an ELF binary container.
Contiguous region of a file.
Base class for machine instructions.
Represents an interpretation of a binary container.
std::shared_ptr< const Base > BaseConstPtr
Reference counted pointer for Architecture::Base.
std::vector< DefinitionPtr > Dictionary
An ordered collection of calling convention definitions.
boost::shared_ptr< RiscOperators > RiscOperatorsPtr
Shared-ownership pointer to a RISC operators object.
boost::shared_ptr< Dispatcher > DispatcherPtr
Shared-ownership pointer to a semantics instruction dispatcher.
std::vector< BasicBlockSuccessor > BasicBlockSuccessors
All successors in no particular order.
std::uint64_t Address
Address.
Definition Address.h:11
std::shared_ptr< SmtSolver > SmtSolverPtr
Reference counting pointer.
The ROSE library.
Represents information about a thunk.
Address target
The one and only successor for the basic block.
BasicBlockPtr bblock
The one and only basic block for the thunk.