git.siccegge.de Git - frida/frida.git/commitdiff
Split disassemble()
author Christoph Egger <christoph@anonymous.siccegge.de>
Fri, 12 Dec 2014 23:40:37 +0000 (00:40 +0100)
committer Christoph Egger <christoph@anonymous.siccegge.de>
Fri, 12 Dec 2014 23:42:37 +0000 (00:42 +0100)
disassemble() still takes care of the initial disassembling of the
binary. However, the parts needed to (interactively) start disassembling
further parts are now separated out.

src/disassembler/llvm/LLVMDisassembler.cxx
src/disassembler/llvm/LLVMDisassembler.hxx

index 1ae024a5aea39f9ef6dd786e3933768e8cc6cf5c..3642c5ed74b7492665d385b540bb0444234461e5 100644 (file)
@@ -128,12 +128,106 @@ LLVMDisassembler::~LLVMDisassembler() {
                   });
 }
 
-void LLVMDisassembler::disassemble() {
-    std::stack<LLVMFunction*> remaining_functions;
+Function* LLVMDisassembler::disassembleFunctionAt(uint64_t address, const std::string& name) {
+    if (functions.find(address) != functions.end()) {
+        return functions[address];
+    }
+
+    LLVMFunction * function;
+    if (name == "") {
+        std::stringstream s;
+        s << "<Unnamed 0x" << std::hex << address << ">";
+        function = new LLVMFunction(s.str(), address);
+    } else {
+        function = new LLVMFunction(name, address);
+    }
+    functions.insert(std::make_pair(address, function));
+
+    disassembleFunction(function);
+
+    return function;
+}
+
+void LLVMDisassembler::disassembleFunction(LLVMFunction* function) {
     std::stack<LLVMBasicBlock*> remaining_blocks;
     SectionRef text_section = sections[".text"];
+    StringRef bytes;
+    text_section.getContents(bytes);
+    StringRefMemoryObject ref(bytes);
+
+    LOG4CXX_DEBUG(logger, "Handling function " << function->getName());
+
+    LLVMBasicBlock * block = new LLVMBasicBlock(function->getStartAddress(), this);
+    remaining_blocks.push(block);
+    blocks.insert(std::make_pair(block->getStartAddress(), block));
+
+    while (remaining_blocks.size()) {
+        LLVMBasicBlock * current_block = remaining_blocks.top();
+        remaining_blocks.pop();
+
+        LOG4CXX_DEBUG(logger, "Handling Block starting at " << std::hex << current_block->getStartAddress());
+
+        uint64_t inst_size;
+        uint64_t base_address;
+        text_section.getAddress(base_address);
+        uint64_t current_address = current_block->getStartAddress() - base_address;
+        while(true) {
+            MCInst inst;
+            std::string buf;
+            llvm::raw_string_ostream s(buf);
+
+            if(llvm::MCDisassembler::Success ==
+               DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
+                uint64_t jmptarget;
+
+                if (MIA->evaluateBranch(inst, current_address, inst_size, jmptarget)) {
+                    jmptarget += base_address;
+                    if (!MIA->isIndirectBranch(inst)) {
+                        if (MIA->isCall(inst)) {
+                            if (functions.find(jmptarget) == functions.end()) {
+                                disassembleFunctionAt(jmptarget);
+                            }
+                        } else {
+                            current_block->setNextBlock(0, jmptarget);
+                            if (blocks.find(jmptarget) == blocks.end()) {
+                                LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
+                                blocks.insert(std::make_pair(block->getStartAddress(), block));
+                                remaining_blocks.push(block);
+                            }
+                            if (MIA->isConditionalBranch(inst)) {
+                                jmptarget = base_address + current_address + inst_size;
+                                current_block->setNextBlock(1, jmptarget);
+                                if (blocks.find(jmptarget) == blocks.end()) {
+                                    LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
+                                    blocks.insert(std::make_pair(block->getStartAddress(), block));
+                                    remaining_blocks.push(block);
+                                }
+                            }
+                        }
+                    }
+                }
+            } else {
+                inst_size = 0;
+            }
+
+
+            if (inst_size == 0 || MIA->isTerminator(inst) || MIA->isBranch(inst)) {
+                current_block->setEndAddress(current_address + base_address + inst_size);
+                LOG4CXX_DEBUG(logger, "Finished Block at " << std::hex <<
+                              current_block->getEndAddress());
+                break;
+            }
+            current_address += inst_size;
+        }
+    }
+    LOG4CXX_DEBUG(logger, "Finished function " << function->getName());
+}
+
+void LLVMDisassembler::disassemble() {
+    SectionRef text_section = sections[".text"];
+    std::vector<LLVMFunction*> remaining_functions;
 
-       // Assume all function symbols actually start a real function
+    // Assume all function symbols actually start a real function
     for (auto x = symbols.begin(); x != symbols.end(); ++x) {
         uint64_t result;
         bool contains;
@@ -149,12 +243,16 @@ void LLVMDisassembler::disassemble() {
 
         if (!x->second.getAddress(result)) {
             LLVMFunction * fun = new LLVMFunction(x->first, result);
-            remaining_functions.push(fun);
+            remaining_functions.push_back(fun);
             functions.insert(std::make_pair(result, fun));
             LOG4CXX_DEBUG(logger, "Disasembling " << x->first);
         }
     }
 
+    for (LLVMFunction* function : remaining_functions) {
+        disassembleFunction(function);
+    }
+
     if (binary->isELF()) {
         bool is64bit = (binary->getData()[4] == 0x02);
 
@@ -167,143 +265,64 @@ void LLVMDisassembler::disassemble() {
                 entry |= (unsigned char)binary->getData()[0x18 + i];
             }
         }
-        if (functions.find(entry) == functions.end()) {
-            LOG4CXX_DEBUG(logger, "Adding entry at: " << std::hex << entry);
-            std::stringstream s;
-            s << "<_start 0x" << std::hex << entry << ">";
-            LLVMFunction * fun = new LLVMFunction(s.str(), entry);
-            functions.insert(std::make_pair(entry, fun));
-            remaining_functions.push(fun);
-        }
+        LOG4CXX_DEBUG(logger, "Adding entry at: " << std::hex << entry);
+        std::stringstream s;
+        s << "<_start 0x" << std::hex << entry << ">";
+
+        disassembleFunctionAt(entry, s.str());
     }
 
     if (functions.empty()) {
         uint64_t text_entry;
         text_section.getAddress(text_entry);
         LOG4CXX_INFO(logger, "No Symbols found, starting at the beginning of the text segment");
-
-        std::stringstream s;
-        s << "<Unnamed 0x" << std::hex << text_entry << ">";
-        LLVMFunction * fun = new LLVMFunction(s.str(), text_entry);
-        functions.insert(std::make_pair(text_entry, fun));
-        remaining_functions.push(fun);
+        disassembleFunctionAt(text_entry);
     }
 
+    splitBlocks();
+}
+
+void LLVMDisassembler::splitBlocks() {
+    SectionRef text_section = sections[".text"];
     StringRef bytes;
     text_section.getContents(bytes);
     StringRefMemoryObject ref(bytes);
 
-    while (remaining_functions.size()) {
-        LLVMFunction * current_function = remaining_functions.top();
-        remaining_functions.pop();
-
-        LOG4CXX_DEBUG(logger, "Handling function " << current_function->getName());
-
-        LLVMBasicBlock * block = new LLVMBasicBlock(current_function->getStartAddress(), this);
-        remaining_blocks.push(block);
-        blocks.insert(std::make_pair(block->getStartAddress(), block));
-
-        while (remaining_blocks.size()) {
-            LLVMBasicBlock * current_block = remaining_blocks.top();
-            remaining_blocks.pop();
-
-            LOG4CXX_DEBUG(logger, "Handling Block starting at " << std::hex << current_block->getStartAddress());
-
-            uint64_t inst_size;
-            uint64_t base_address;
-            text_section.getAddress(base_address);
-            uint64_t current_address = current_block->getStartAddress() - base_address;
-            while(true) {
-                MCInst inst;
-                std::string buf;
-                llvm::raw_string_ostream s(buf);
-
-                if(llvm::MCDisassembler::Success ==
-                   DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
-
-                    uint64_t jmptarget;
-                    if (MIA->evaluateBranch(inst, current_address, inst_size, jmptarget)) {
-                        jmptarget += base_address;
-                        if (!MIA->isIndirectBranch(inst)) {
-                            if (MIA->isCall(inst)) {
-                                if (functions.find(jmptarget) == functions.end()) {
-                                    std::stringstream s;
-                                    s << "<Unnamed 0x" << std::hex << jmptarget << ">";
-                                    LLVMFunction * fun = new LLVMFunction(s.str(), jmptarget);
-                                    functions.insert(std::make_pair(jmptarget, fun));
-                                    remaining_functions.push(fun);
-                                }
-                            } else {
-                                                               current_block->setNextBlock(0, jmptarget);
-                                if (blocks.find(jmptarget) == blocks.end()) {
-                                    LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
-                                    blocks.insert(std::make_pair(block->getStartAddress(), block));
-                                    remaining_blocks.push(block);
-                                }
-                                if (MIA->isConditionalBranch(inst)) {
-                                    jmptarget = base_address + current_address + inst_size;
-                                                                       current_block->setNextBlock(1, jmptarget);
-                                    if (blocks.find(jmptarget) == blocks.end()) {
-                                        LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
-                                        blocks.insert(std::make_pair(block->getStartAddress(), block));
-                                        remaining_blocks.push(block);
-                                    }
-                                }
-                            }
-                        }
+    // Split blocks where jumps are going inside the block
+    for (auto it = blocks.begin(); it != blocks.end(); ++it) {
+        LLVMBasicBlock * current_block = it->second;
+        uint64_t inst_size;
+        uint64_t base_address;
+        text_section.getAddress(base_address);
+        uint64_t current_address = current_block->getStartAddress() - base_address;
+        while(current_block->getEndAddress() - base_address > current_address) {
+            MCInst inst;
+            std::string buf;
+            llvm::raw_string_ostream s(buf);
+
+            if(llvm::MCDisassembler::Success ==
+               DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
+                auto other = blocks.find(current_address + inst_size + base_address);
+
+                if (other != blocks.end()) {
+                    uint64_t endaddress = current_address + inst_size + base_address;
+                    if (endaddress != current_block->getEndAddress()) {
+                        LOG4CXX_DEBUG(logger, "Shortening block starting at "
+                                      << std::hex
+                                      << current_block->getStartAddress()
+                                      << " now ending at "
+                                      << other->first);
+                        current_block->setEndAddress(endaddress);
+                        current_block->setNextBlock(0, other->first);
+                        current_block->setNextBlock(1, 0);
                     }
-                } else {
-                    inst_size = 0;
-                }
-
-
-                if (inst_size == 0 || MIA->isTerminator(inst) || MIA->isBranch(inst)) {
-                    current_block->setEndAddress(current_address + base_address + inst_size);
-                    LOG4CXX_DEBUG(logger, "Finished Block at " << std::hex <<
-                                  current_block->getEndAddress());
-                    break;
                 }
-                current_address += inst_size;
+            } else {
+                inst_size = 1;
             }
+            current_address += inst_size;
         }
-        LOG4CXX_DEBUG(logger, "Finished function " << current_function->getName());
     }
-
-       // Split blocks where jumps are going inside the block
-       for (auto it = blocks.begin(); it != blocks.end(); ++it) {
-               LLVMBasicBlock * current_block = it->second;
-               uint64_t inst_size;
-               uint64_t base_address;
-               text_section.getAddress(base_address);
-               uint64_t current_address = current_block->getStartAddress() - base_address;
-               while(current_block->getEndAddress() - base_address > current_address) {
-                       MCInst inst;
-                       std::string buf;
-                       llvm::raw_string_ostream s(buf);
-
-                       if(llvm::MCDisassembler::Success ==
-                          DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
-                               auto other = blocks.find(current_address + inst_size + base_address);
-
-                               if (other != blocks.end()) {
-                                       uint64_t endaddress = current_address + inst_size + base_address;
-                                       if (endaddress != current_block->getEndAddress()) {
-                                               LOG4CXX_DEBUG(logger, "Shortening block starting at "
-                                                                         << std::hex
-                                                                         << current_block->getStartAddress()
-                                                                         << " now ending at "
-                                                                         << other->first);
-                                               current_block->setEndAddress(endaddress);
-                                               current_block->setNextBlock(0, other->first);
-                                               current_block->setNextBlock(1, 0);
-                                       }
-                               }
-                       } else {
-                               inst_size = 1;
-                       }
-                       current_address += inst_size;
-               }
-       }
 }
 
 void LLVMDisassembler::readSymbols() {
index 6ed3c8c86936b75c383097e3ff841fd0db8ad027..f2baecb33a2e44904322f298d429ef05852a2654 100644 (file)
@@ -31,13 +31,17 @@ public:
                return blocks[address];
        }
 
+    Function * disassembleFunctionAt(uint64_t address, const std::string& name = "");
+
 protected:
     bool isFunctionCall(uint64_t address) {return false;}
     bool isJump(uint64_t address) {return false;}
 
 private:
     // http://llvm.org/docs/doxygen/html/MCObjectDisassembler_8cpp_source.html +197
-       void disassemble();
+    void disassembleFunction(LLVMFunction* function);
+    void splitBlocks();
+    void disassemble();
 
        void readSymbols();
        void readSections();