});
}
-void LLVMDisassembler::disassemble() {
- std::stack<LLVMFunction*> remaining_functions;
+Function* LLVMDisassembler::disassembleFunctionAt(uint64_t address, const std::string& name) { // Returns the function registered at `address`; if there is none, creates one, registers it and disassembles it.
+ if (functions.find(address) != functions.end()) { // Already registered: return the existing entry (`name` is ignored in that case).
+ return functions[address];
+ }
+ // An empty `name` selects a generated "<Unnamed 0x...>" name that embeds the address in hex.
+ LLVMFunction * function;
+ if (name == "") {
+ std::stringstream s;
+ s << "<Unnamed 0x" << std::hex << address << ">";
+ function = new LLVMFunction(s.str(), address);
+ } else {
+ function = new LLVMFunction(name, address);
+ }
+ functions.insert(std::make_pair(address, function)); // Registered before disassembly so that a call back to `address` found while disassembling resolves to this entry.
+
+ disassembleFunction(function);
+
+ return function;
+}
+
+void LLVMDisassembler::disassembleFunction(LLVMFunction* function) { // Discovers the basic blocks reachable from the start of `function` via direct branches; direct call targets are disassembled as functions of their own.
std::stack<LLVMBasicBlock*> remaining_blocks;
SectionRef text_section = sections[".text"];
+ StringRef bytes;
+ text_section.getContents(bytes);
+ StringRefMemoryObject ref(bytes);
+ // `ref` wraps the contents of .text; instructions are fetched from it using section-relative offsets.
+ LOG4CXX_DEBUG(logger, "Handling function " << function->getName());
+
+ LLVMBasicBlock * block = new LLVMBasicBlock(function->getStartAddress(), this);
+ remaining_blocks.push(block);
+ blocks.insert(std::make_pair(block->getStartAddress(), block));
+ // Worklist loop: every popped block is decoded until the block-end condition further down is met.
+ while (remaining_blocks.size()) {
+ LLVMBasicBlock * current_block = remaining_blocks.top();
+ remaining_blocks.pop();
+
+ LOG4CXX_DEBUG(logger, "Handling Block starting at " << std::hex << current_block->getStartAddress());
+ // current_address is relative to the start of .text; base_address is added back whenever an absolute address is stored.
+ uint64_t inst_size;
+ uint64_t base_address;
+ text_section.getAddress(base_address);
+ uint64_t current_address = current_block->getStartAddress() - base_address;
+ while(true) {
+ MCInst inst;
+ std::string buf;
+ llvm::raw_string_ostream s(buf);
+ // A failed decode is reported to the block-end check below by forcing inst_size to 0.
+ if(llvm::MCDisassembler::Success ==
+ DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
+ uint64_t jmptarget;
+ // The branch is evaluated at a section-relative address, so the target is rebased to an absolute address below.
+ if (MIA->evaluateBranch(inst, current_address, inst_size, jmptarget)) {
+ jmptarget += base_address;
+ if (!MIA->isIndirectBranch(inst)) {
+ if (MIA->isCall(inst)) { // Direct call: disassemble the callee as its own function unless it is already registered.
+ if (functions.find(jmptarget) == functions.end()) {
+ disassembleFunctionAt(jmptarget);
+ }
+ } else { // Direct jump: successor slot 0 is the branch target.
+ current_block->setNextBlock(0, jmptarget);
+ if (blocks.find(jmptarget) == blocks.end()) { // Create and queue a block only if none starts at the target yet.
+ LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
+ blocks.insert(std::make_pair(block->getStartAddress(), block));
+ remaining_blocks.push(block);
+ }
+ if (MIA->isConditionalBranch(inst)) { // Conditional branch: successor slot 1 is the instruction following the branch.
+ jmptarget = base_address + current_address + inst_size;
+ current_block->setNextBlock(1, jmptarget);
+ if (blocks.find(jmptarget) == blocks.end()) {
+ LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
+ blocks.insert(std::make_pair(block->getStartAddress(), block));
+ remaining_blocks.push(block);
+ }
+ }
+ }
+ }
+ }
+ } else {
+ inst_size = 0;
+ }
+ // The block ends at an undecodable instruction, a terminator or any branch.
+ // The stored end address is absolute and points just past the last decoded instruction.
+ if (inst_size == 0 || MIA->isTerminator(inst) || MIA->isBranch(inst)) {
+ current_block->setEndAddress(current_address + base_address + inst_size);
+ LOG4CXX_DEBUG(logger, "Finished Block at " << std::hex <<
+ current_block->getEndAddress());
+ break;
+ }
+ current_address += inst_size;
+ }
+ }
+ LOG4CXX_DEBUG(logger, "Finished function " << function->getName());
+}
+
+void LLVMDisassembler::disassemble() { // Disassembles every function that has a symbol, then the ELF entry point, falls back to the start of .text if no function is known, and finally splits blocks.
+ SectionRef text_section = sections[".text"];
+ std::vector<LLVMFunction*> remaining_functions;
- // Assume all function symbols actually start a real function
+ // Assume all function symbols actually start a real function
for (auto x = symbols.begin(); x != symbols.end(); ++x) {
uint64_t result;
bool contains;
if (!x->second.getAddress(result)) {
LLVMFunction * fun = new LLVMFunction(x->first, result);
- remaining_functions.push(fun);
+ remaining_functions.push_back(fun);
functions.insert(std::make_pair(result, fun));
LOG4CXX_DEBUG(logger, "Disasembling " << x->first);
}
}
+ for (LLVMFunction* function : remaining_functions) { // Every symbol function was registered in the loop above, so calls between them resolve to the existing entries.
+ disassembleFunction(function);
+ }
+ // For ELF binaries `entry` is assembled from header bytes starting at offset 0x18.
if (binary->isELF()) {
bool is64bit = (binary->getData()[4] == 0x02);
entry |= (unsigned char)binary->getData()[0x18 + i];
}
}
- if (functions.find(entry) == functions.end()) {
- LOG4CXX_DEBUG(logger, "Adding entry at: " << std::hex << entry);
- std::stringstream s;
- s << "<_start 0x" << std::hex << entry << ">";
- LLVMFunction * fun = new LLVMFunction(s.str(), entry);
- functions.insert(std::make_pair(entry, fun));
- remaining_functions.push(fun);
- }
+ LOG4CXX_DEBUG(logger, "Adding entry at: " << std::hex << entry);
+ std::stringstream s;
+ s << "<_start 0x" << std::hex << entry << ">";
+ // disassembleFunctionAt returns the existing function untouched when `entry` is already registered, so no explicit check is needed here.
+ disassembleFunctionAt(entry, s.str());
}
if (functions.empty()) {
uint64_t text_entry;
text_section.getAddress(text_entry);
LOG4CXX_INFO(logger, "No Symbols found, starting at the beginning of the text segment");
-
- std::stringstream s;
- s << "<Unnamed 0x" << std::hex << text_entry << ">";
- LLVMFunction * fun = new LLVMFunction(s.str(), text_entry);
- functions.insert(std::make_pair(text_entry, fun));
- remaining_functions.push(fun);
+ disassembleFunctionAt(text_entry); // Name omitted: presumably defaults to an empty name, which yields the "<Unnamed 0x...>" placeholder - confirm against the declaration.
}
+ splitBlocks(); // Runs last, once every block has been created.
+}
+
+void LLVMDisassembler::splitBlocks() { // Shortens every block that runs past the start of another block so that it ends there and continues into that block.
+ SectionRef text_section = sections[".text"];
StringRef bytes;
text_section.getContents(bytes);
StringRefMemoryObject ref(bytes);
- while (remaining_functions.size()) {
- LLVMFunction * current_function = remaining_functions.top();
- remaining_functions.pop();
-
- LOG4CXX_DEBUG(logger, "Handling function " << current_function->getName());
-
- LLVMBasicBlock * block = new LLVMBasicBlock(current_function->getStartAddress(), this);
- remaining_blocks.push(block);
- blocks.insert(std::make_pair(block->getStartAddress(), block));
-
- while (remaining_blocks.size()) {
- LLVMBasicBlock * current_block = remaining_blocks.top();
- remaining_blocks.pop();
-
- LOG4CXX_DEBUG(logger, "Handling Block starting at " << std::hex << current_block->getStartAddress());
-
- uint64_t inst_size;
- uint64_t base_address;
- text_section.getAddress(base_address);
- uint64_t current_address = current_block->getStartAddress() - base_address;
- while(true) {
- MCInst inst;
- std::string buf;
- llvm::raw_string_ostream s(buf);
-
- if(llvm::MCDisassembler::Success ==
- DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
-
- uint64_t jmptarget;
- if (MIA->evaluateBranch(inst, current_address, inst_size, jmptarget)) {
- jmptarget += base_address;
- if (!MIA->isIndirectBranch(inst)) {
- if (MIA->isCall(inst)) {
- if (functions.find(jmptarget) == functions.end()) {
- std::stringstream s;
- s << "<Unnamed 0x" << std::hex << jmptarget << ">";
- LLVMFunction * fun = new LLVMFunction(s.str(), jmptarget);
- functions.insert(std::make_pair(jmptarget, fun));
- remaining_functions.push(fun);
- }
- } else {
- current_block->setNextBlock(0, jmptarget);
- if (blocks.find(jmptarget) == blocks.end()) {
- LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
- blocks.insert(std::make_pair(block->getStartAddress(), block));
- remaining_blocks.push(block);
- }
- if (MIA->isConditionalBranch(inst)) {
- jmptarget = base_address + current_address + inst_size;
- current_block->setNextBlock(1, jmptarget);
- if (blocks.find(jmptarget) == blocks.end()) {
- LLVMBasicBlock * block = new LLVMBasicBlock(jmptarget, this);
- blocks.insert(std::make_pair(block->getStartAddress(), block));
- remaining_blocks.push(block);
- }
- }
- }
- }
+ // Split blocks where jumps are going inside the block
+ for (auto it = blocks.begin(); it != blocks.end(); ++it) {
+ LLVMBasicBlock * current_block = it->second;
+ uint64_t inst_size;
+ uint64_t base_address;
+ text_section.getAddress(base_address);
+ uint64_t current_address = current_block->getStartAddress() - base_address;
+ while(current_block->getEndAddress() - base_address > current_address) { // Walk the block instruction by instruction, using offsets relative to the start of .text.
+ MCInst inst;
+ std::string buf;
+ llvm::raw_string_ostream s(buf);
+
+ if(llvm::MCDisassembler::Success ==
+ DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
+ auto other = blocks.find(current_address + inst_size + base_address); // Does another block start right after this instruction?
+ // If so, and this block's recorded end lies elsewhere, the block is cut at that start address.
+ if (other != blocks.end()) {
+ uint64_t endaddress = current_address + inst_size + base_address;
+ if (endaddress != current_block->getEndAddress()) { // Nothing to do when the block already ends exactly here.
+ LOG4CXX_DEBUG(logger, "Shortening block starting at "
+ << std::hex
+ << current_block->getStartAddress()
+ << " now ending at "
+ << other->first);
+ current_block->setEndAddress(endaddress); // The loop condition re-reads the end address, so the scan of this block stops after this iteration.
+ current_block->setNextBlock(0, other->first); // Successor slot 0 becomes the block that starts here.
+ current_block->setNextBlock(1, 0); // Slot 1 is set to 0 - presumably meaning "no second successor"; confirm in LLVMBasicBlock.
}
- } else {
- inst_size = 0;
- }
-
-
- if (inst_size == 0 || MIA->isTerminator(inst) || MIA->isBranch(inst)) {
- current_block->setEndAddress(current_address + base_address + inst_size);
- LOG4CXX_DEBUG(logger, "Finished Block at " << std::hex <<
- current_block->getEndAddress());
- break;
}
- current_address += inst_size;
+ } else {
+ inst_size = 1; // Decode failed: advance by one byte so the scan still makes progress.
}
+ current_address += inst_size;
}
- LOG4CXX_DEBUG(logger, "Finished function " << current_function->getName());
}
-
- // Split blocks where jumps are going inside the block
- for (auto it = blocks.begin(); it != blocks.end(); ++it) {
- LLVMBasicBlock * current_block = it->second;
- uint64_t inst_size;
- uint64_t base_address;
- text_section.getAddress(base_address);
- uint64_t current_address = current_block->getStartAddress() - base_address;
- while(current_block->getEndAddress() - base_address > current_address) {
- MCInst inst;
- std::string buf;
- llvm::raw_string_ostream s(buf);
-
- if(llvm::MCDisassembler::Success ==
- DisAsm->getInstruction(inst, inst_size, ref, current_address, nulls(), nulls())) {
- auto other = blocks.find(current_address + inst_size + base_address);
-
- if (other != blocks.end()) {
- uint64_t endaddress = current_address + inst_size + base_address;
- if (endaddress != current_block->getEndAddress()) {
- LOG4CXX_DEBUG(logger, "Shortening block starting at "
- << std::hex
- << current_block->getStartAddress()
- << " now ending at "
- << other->first);
- current_block->setEndAddress(endaddress);
- current_block->setNextBlock(0, other->first);
- current_block->setNextBlock(1, 0);
- }
- }
- } else {
- inst_size = 1;
- }
- current_address += inst_size;
- }
- }
}
void LLVMDisassembler::readSymbols() {