1 //===- COFFObjectFile.cpp - COFF object file implementation -----*- C++ -*-===//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file implements the COFFObjectFile class.
12 //===----------------------------------------------------------------------===//
14 #include "llvm/Object/COFF.h"
15 #include "llvm/ADT/SmallString.h"
16 #include "llvm/ADT/StringSwitch.h"
17 #include "llvm/ADT/Triple.h"
20 using namespace object;
23 using support::ulittle8_t;
24 using support::ulittle16_t;
25 using support::ulittle32_t;
26 using support::little16_t;
30 // Returns false if size is greater than the buffer size. And sets ec.
31 bool checkSize(const MemoryBuffer *m, error_code &ec, uint64_t size) {
32 if (m->getBufferSize() < size) {
33 ec = object_error::unexpected_eof;
39 // Returns false if any bytes in [addr, addr + size) fall outside of m.
// On failure ec is set to object_error::unexpected_eof.
40 bool checkAddr(const MemoryBuffer *m,
// A sum smaller than addr means addr + size wrapped around; the range is
// also rejected when its end lies beyond the end of the buffer.
44 if (addr + size < addr ||
46 addr + size > uintptr_t(m->getBufferEnd())) {
47 ec = object_error::unexpected_eof;
// Converts the opaque handle stored in Symb.p into a coff_symbol pointer.
// The checks below report a fatal error when the pointer lies outside the
// symbol table and assert that it sits on a symbol record boundary.
54 const coff_symbol *COFFObjectFile::toSymb(DataRefImpl Symb) const {
55 const coff_symbol *addr = reinterpret_cast<const coff_symbol*>(Symb.p);
58 // Verify that the symbol points to a valid entry in the symbol table.
// offset is the byte distance of the symbol from base(), which is the same
// origin that Header->PointerToSymbolTable is compared against.
59 uintptr_t offset = uintptr_t(addr) - uintptr_t(base());
60 if (offset < Header->PointerToSymbolTable
61 || offset >= Header->PointerToSymbolTable
62 + (Header->NumberOfSymbols * sizeof(coff_symbol)))
63 report_fatal_error("Symbol was outside of symbol table.");
// The distance into the table must be a whole number of symbol records.
65 assert((offset - Header->PointerToSymbolTable) % sizeof(coff_symbol)
66 == 0 && "Symbol did not point to the beginning of a symbol");
// Converts the opaque handle stored in Sec.p into a coff_section pointer.
// The checks below report a fatal error when the pointer lies outside
// [SectionTable, SectionTable + NumberOfSections) and assert that it sits on
// a section header boundary.
72 const coff_section *COFFObjectFile::toSec(DataRefImpl Sec) const {
73 const coff_section *addr = reinterpret_cast<const coff_section*>(Sec.p);
76 // Verify that the section points to a valid entry in the section table.
77 if (addr < SectionTable
78 || addr >= (SectionTable + Header->NumberOfSections))
79 report_fatal_error("Section was outside of section table.");
// The byte distance from the table start must be a whole number of headers.
81 uintptr_t offset = uintptr_t(addr) - uintptr_t(SectionTable);
82 assert(offset % sizeof(coff_section) == 0 &&
83 "Section did not point to the beginning of a section");
89 error_code COFFObjectFile::getSymbolNext(DataRefImpl Symb,
90 SymbolRef &Result) const {
91 const coff_symbol *symb = toSymb(Symb);
92 symb += 1 + symb->NumberOfAuxSymbols;
93 Symb.p = reinterpret_cast<uintptr_t>(symb);
94 Result = SymbolRef(Symb, this);
95 return object_error::success;
98 error_code COFFObjectFile::getSymbolName(DataRefImpl Symb,
99 StringRef &Result) const {
100 const coff_symbol *symb = toSymb(Symb);
101 // Check for string table entry. First 4 bytes are 0.
102 if (symb->Name.Offset.Zeroes == 0) {
103 uint32_t Offset = symb->Name.Offset.Offset;
104 if (error_code ec = getString(Offset, Result))
106 return object_error::success;
109 if (symb->Name.ShortName[7] == 0)
110 // Null terminated, let ::strlen figure out the length.
111 Result = StringRef(symb->Name.ShortName);
113 // Not null terminated, use all 8 bytes.
114 Result = StringRef(symb->Name.ShortName, 8);
115 return object_error::success;
// Computes a symbol's offset value into Result.
// Symbols whose nm type character is 'U' or 'w' get UnknownAddressOrSize;
// otherwise Result is either the owning section's VirtualAddress plus the
// symbol's Value, or the bare Value.
// NOTE(review): the condition that selects between those two forms is not
// shown here — presumably whether getSection produced a section; confirm.
118 error_code COFFObjectFile::getSymbolOffset(DataRefImpl Symb,
119 uint64_t &Result) const {
120 const coff_symbol *symb = toSymb(Symb);
121 const coff_section *Section = NULL;
122 if (error_code ec = getSection(symb->SectionNumber, Section))
// The nm-style type character decides whether the symbol has a known value.
125 if (error_code ec = getSymbolNMTypeChar(Symb, Type))
127 if (Type == 'U' || Type == 'w')
128 Result = UnknownAddressOrSize;
130 Result = Section->VirtualAddress + symb->Value;
132 Result = symb->Value;
133 return object_error::success;
// Computes an address for a symbol into Result.
// Symbols whose nm type character is 'U' or 'w' get UnknownAddressOrSize.
// The other visible forms are pointers derived from base(), converted to an
// integer: one built from the section's PointerToRawData, one from the
// symbol's Value alone.
// NOTE(review): the branch conditions and the final operand of the first
// form are not shown here; confirm against the full source.
136 error_code COFFObjectFile::getSymbolAddress(DataRefImpl Symb,
137 uint64_t &Result) const {
138 const coff_symbol *symb = toSymb(Symb);
139 const coff_section *Section = NULL;
140 if (error_code ec = getSection(symb->SectionNumber, Section))
143 if (error_code ec = getSymbolNMTypeChar(Symb, Type))
145 if (Type == 'U' || Type == 'w')
146 Result = UnknownAddressOrSize;
148 Result = reinterpret_cast<uintptr_t>(base() +
149 Section->PointerToRawData +
152 Result = reinterpret_cast<uintptr_t>(base() + symb->Value);
153 return object_error::success;
// Classifies a symbol into a SymbolRef::SymbolType.
// Result starts as ST_Other. The visible cases are:
//   - external storage class with an undefined section -> ST_External
//   - complex type "function"                          -> ST_Function
//   - nm type character 'r' or 'R'                     -> ST_Data
// NOTE(review): how these cases nest (else-chains) is not shown here.
156 error_code COFFObjectFile::getSymbolType(DataRefImpl Symb,
157 SymbolRef::SymbolType &Result) const {
158 const coff_symbol *symb = toSymb(Symb);
159 Result = SymbolRef::ST_Other;
160 if (symb->StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL &&
161 symb->SectionNumber == COFF::IMAGE_SYM_UNDEFINED) {
162 Result = SymbolRef::ST_External;
164 if (symb->Type.ComplexType == COFF::IMAGE_SYM_DTYPE_FUNCTION) {
165 Result = SymbolRef::ST_Function;
168 if (error_code ec = getSymbolNMTypeChar(Symb, Type))
170 if (Type == 'r' || Type == 'R') {
171 Result = SymbolRef::ST_Data;
175 return object_error::success;
178 error_code COFFObjectFile::isSymbolGlobal(DataRefImpl Symb,
179 bool &Result) const {
180 const coff_symbol *symb = toSymb(Symb);
181 Result = (symb->StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL);
182 return object_error::success;
// Estimates the size of a symbol into Result.
// Symbols whose nm type character is 'U' or 'w' get UnknownAddressOrSize.
// The other visible form is the number of raw-data bytes from the symbol's
// Value to the end of its section, which is an upper bound rather than the
// true size (see the FIXME below).
// NOTE(review): the condition guarding the Section dereference is not shown.
185 error_code COFFObjectFile::getSymbolSize(DataRefImpl Symb,
186 uint64_t &Result) const {
187 // FIXME: Return the correct size. This requires looking at all the symbols
188 // in the same section as this symbol, and looking for either the next
189 // symbol, or the end of the section.
190 const coff_symbol *symb = toSymb(Symb);
191 const coff_section *Section = NULL;
192 if (error_code ec = getSection(symb->SectionNumber, Section))
195 if (error_code ec = getSymbolNMTypeChar(Symb, Type))
197 if (Type == 'U' || Type == 'w')
198 Result = UnknownAddressOrSize;
200 Result = Section->SizeOfRawData - symb->Value;
203 return object_error::success;
// Derives the nm-style type character for a symbol.
// Steps visible below:
//   1. Names starting with ".debug" or ".sxdata" map to 'N'.
//   2. For symbols with a positive section number, the section's
//      Characteristics flags are loaded.
//   3. The section number (undefined / absolute / debug / a real section)
//      and those flags select the character.
//   4. Symbols with external storage class get the upper-case form, except
//      the weak-external case, which returns before the ::toupper call.
// NOTE(review): the concrete characters assigned in each branch are not
// shown here; confirm against the full source.
206 error_code COFFObjectFile::getSymbolNMTypeChar(DataRefImpl Symb,
207 char &Result) const {
208 const coff_symbol *symb = toSymb(Symb);
210 if (error_code ec = getSymbolName(Symb, name))
// Name-based classification takes precedence over section-based rules.
212 char ret = StringSwitch<char>(name)
213 .StartsWith(".debug", 'N')
214 .StartsWith(".sxdata", 'N')
219 return object_error::success;
// Characteristics stays 0 for the special (non-positive) section numbers.
222 uint32_t Characteristics = 0;
223 if (symb->SectionNumber > 0) {
224 const coff_section *Section = NULL;
225 if (error_code ec = getSection(symb->SectionNumber, Section))
227 Characteristics = Section->Characteristics;
230 switch (symb->SectionNumber) {
231 case COFF::IMAGE_SYM_UNDEFINED:
232 // Check storage classes.
233 if (symb->StorageClass == COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL) {
235 return object_error::success; // Don't do ::toupper.
239 case COFF::IMAGE_SYM_ABSOLUTE:
242 case COFF::IMAGE_SYM_DEBUG:
246 // Check section type.
247 if (Characteristics & COFF::IMAGE_SCN_CNT_CODE)
249 else if ( Characteristics & COFF::IMAGE_SCN_MEM_READ
250 && ~Characteristics & COFF::IMAGE_SCN_MEM_WRITE) // Read only.
252 else if (Characteristics & COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
254 else if (Characteristics & COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
256 else if (Characteristics & COFF::IMAGE_SCN_LNK_INFO)
259 // Check for section symbol.
260 else if ( symb->StorageClass == COFF::IMAGE_SYM_CLASS_STATIC
// External symbols are reported with the upper-case form of the character.
265 if (symb->StorageClass == COFF::IMAGE_SYM_CLASS_EXTERNAL)
266 ret = ::toupper(ret);
269 return object_error::success;
// Query for whether Symb is an internal symbol. Always reports success.
// NOTE(review): the statement that assigns Result is not shown here.
272 error_code COFFObjectFile::isSymbolInternal(DataRefImpl Symb,
273 bool &Result) const {
275 return object_error::success;
// Produces the section iterator position that follows Sec and stores it in
// Result. Always reports success.
// NOTE(review): the statement that advances `sec` is not shown here.
278 error_code COFFObjectFile::getSectionNext(DataRefImpl Sec,
279 SectionRef &Result) const {
280 const coff_section *sec = toSec(Sec);
// Store the section pointer back into the opaque handle.
282 Sec.p = reinterpret_cast<uintptr_t>(sec);
283 Result = SectionRef(Sec, this);
284 return object_error::success;
287 error_code COFFObjectFile::getSectionName(DataRefImpl Sec,
288 StringRef &Result) const {
289 const coff_section *sec = toSec(Sec);
291 if (sec->Name[7] == 0)
292 // Null terminated, let ::strlen figure out the length.
295 // Not null terminated, use all 8 bytes.
296 name = StringRef(sec->Name, 8);
298 // Check for string table entry. First byte is '/'.
299 if (name[0] == '/') {
301 name.substr(1).getAsInteger(10, Offset);
302 if (error_code ec = getString(Offset, name))
307 return object_error::success;
310 error_code COFFObjectFile::getSectionAddress(DataRefImpl Sec,
311 uint64_t &Result) const {
312 const coff_section *sec = toSec(Sec);
313 Result = sec->VirtualAddress;
314 return object_error::success;
317 error_code COFFObjectFile::getSectionSize(DataRefImpl Sec,
318 uint64_t &Result) const {
319 const coff_section *sec = toSec(Sec);
320 Result = sec->SizeOfRawData;
321 return object_error::success;
324 error_code COFFObjectFile::getSectionContents(DataRefImpl Sec,
325 StringRef &Result) const {
326 const coff_section *sec = toSec(Sec);
327 // The only thing that we need to verify is that the contents is contained
328 // within the file bounds. We don't need to make sure it doesn't cover other
329 // data, as there's nothing that says that is not allowed.
330 uintptr_t con_start = uintptr_t(base()) + sec->PointerToRawData;
331 uintptr_t con_end = con_start + sec->SizeOfRawData;
332 if (con_end >= uintptr_t(Data->getBufferEnd()))
333 return object_error::parse_failed;
334 Result = StringRef(reinterpret_cast<const char*>(con_start),
336 return object_error::success;
339 error_code COFFObjectFile::isSectionText(DataRefImpl Sec,
340 bool &Result) const {
341 const coff_section *sec = toSec(Sec);
342 Result = sec->Characteristics & COFF::IMAGE_SCN_CNT_CODE;
343 return object_error::success;
346 error_code COFFObjectFile::isSectionData(DataRefImpl Sec,
347 bool &Result) const {
348 const coff_section *sec = toSec(Sec);
349 Result = sec->Characteristics & COFF::IMAGE_SCN_CNT_INITIALIZED_DATA;
350 return object_error::success;
353 error_code COFFObjectFile::isSectionBSS(DataRefImpl Sec,
354 bool &Result) const {
355 const coff_section *sec = toSec(Sec);
356 Result = sec->Characteristics & COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA;
357 return object_error::success;
// Query for whether a section contains a given symbol. Marked unimplemented
// below; always reports success.
// NOTE(review): the statement that assigns Result is not shown here.
360 error_code COFFObjectFile::sectionContainsSymbol(DataRefImpl Sec,
362 bool &Result) const {
363 // FIXME: Unimplemented.
365 return object_error::success;
// Returns an iterator at the first relocation of a section. The handle is
// zero-filled first; for a section with relocations its pointer member is
// set to base() + PointerToRelocations.
// NOTE(review): the value used when NumberOfRelocations is 0 is not shown.
368 relocation_iterator COFFObjectFile::getSectionRelBegin(DataRefImpl Sec) const {
369 const coff_section *sec = toSec(Sec);
371 std::memset(&ret, 0, sizeof(ret));
372 if (sec->NumberOfRelocations == 0)
375 ret.p = reinterpret_cast<uintptr_t>(base() + sec->PointerToRelocations);
377 return relocation_iterator(RelocationRef(ret, this));
// Returns an iterator one past the last relocation of a section. The handle
// is zero-filled first; for a section with relocations its pointer member is
// set NumberOfRelocations records past base() + PointerToRelocations.
// NOTE(review): the value used when NumberOfRelocations is 0 is not shown.
380 relocation_iterator COFFObjectFile::getSectionRelEnd(DataRefImpl Sec) const {
381 const coff_section *sec = toSec(Sec);
383 std::memset(&ret, 0, sizeof(ret));
384 if (sec->NumberOfRelocations == 0)
// Pointer arithmetic is done in units of coff_relocation records.
387 ret.p = reinterpret_cast<uintptr_t>(
388 reinterpret_cast<const coff_relocation*>(
389 base() + sec->PointerToRelocations)
390 + sec->NumberOfRelocations);
392 return relocation_iterator(RelocationRef(ret, this));
395 COFFObjectFile::COFFObjectFile(MemoryBuffer *Object, error_code &ec)
396 : ObjectFile(Binary::isCOFF, Object, ec) {
397 // Check that we at least have enough room for a header.
398 if (!checkSize(Data, ec, sizeof(coff_file_header))) return;
400 // The actual starting location of the COFF header in the file. This can be
401 // non-zero in PE/COFF files.
402 uint64_t HeaderStart = 0;
404 // Check if this is a PE/COFF file.
405 if (base()[0] == 0x4d && base()[1] == 0x5a) {
406 // PE/COFF, seek through MS-DOS compatibility stub and 4-byte
407 // PE signature to find 'normal' COFF header.
408 if (!checkSize(Data, ec, 0x3c + 8)) return;
409 HeaderStart += *reinterpret_cast<const ulittle32_t *>(base() + 0x3c);
410 // Check the PE header. ("PE\0\0")
411 if (std::memcmp(base() + HeaderStart, "PE\0\0", 4) != 0) {
412 ec = object_error::parse_failed;
415 HeaderStart += 4; // Skip the PE Header.
418 Header = reinterpret_cast<const coff_file_header *>(base() + HeaderStart);
419 if (!checkAddr(Data, ec, uintptr_t(Header), sizeof(coff_file_header)))
423 reinterpret_cast<const coff_section *>( base()
425 + sizeof(coff_file_header)
426 + Header->SizeOfOptionalHeader);
427 if (!checkAddr(Data, ec, uintptr_t(SectionTable),
428 Header->NumberOfSections * sizeof(coff_section)))
432 reinterpret_cast<const coff_symbol *>(base()
433 + Header->PointerToSymbolTable);
434 if (!checkAddr(Data, ec, uintptr_t(SymbolTable),
435 Header->NumberOfSymbols * sizeof(coff_symbol)))
438 // Find string table.
439 StringTable = reinterpret_cast<const char *>(base())
440 + Header->PointerToSymbolTable
441 + Header->NumberOfSymbols * sizeof(coff_symbol);
442 if (!checkAddr(Data, ec, uintptr_t(StringTable), sizeof(ulittle32_t)))
445 StringTableSize = *reinterpret_cast<const ulittle32_t *>(StringTable);
446 if (!checkAddr(Data, ec, uintptr_t(StringTable), StringTableSize))
448 // Check that the string table is null terminated if has any in it.
449 if (StringTableSize < 4
450 || (StringTableSize > 4 && StringTable[StringTableSize - 1] != 0)) {
451 ec = object_error::parse_failed;
455 ec = object_error::success;
458 symbol_iterator COFFObjectFile::begin_symbols() const {
460 std::memset(&ret, 0, sizeof(DataRefImpl));
461 ret.p = reinterpret_cast<intptr_t>(SymbolTable);
462 return symbol_iterator(SymbolRef(ret, this));
465 symbol_iterator COFFObjectFile::end_symbols() const {
466 // The symbol table ends where the string table begins.
468 std::memset(&ret, 0, sizeof(DataRefImpl));
469 ret.p = reinterpret_cast<intptr_t>(StringTable);
470 return symbol_iterator(SymbolRef(ret, this));
473 section_iterator COFFObjectFile::begin_sections() const {
475 std::memset(&ret, 0, sizeof(DataRefImpl));
476 ret.p = reinterpret_cast<intptr_t>(SectionTable);
477 return section_iterator(SectionRef(ret, this));
480 section_iterator COFFObjectFile::end_sections() const {
482 std::memset(&ret, 0, sizeof(DataRefImpl));
483 ret.p = reinterpret_cast<intptr_t>(SectionTable + Header->NumberOfSections);
484 return section_iterator(SectionRef(ret, this));
487 uint8_t COFFObjectFile::getBytesInAddress() const {
488 return getArch() == Triple::x86_64 ? 8 : 4;
// Returns a human-readable format name chosen from the header's Machine
// field; unrecognised machines yield "COFF-<unknown arch>".
// NOTE(review): the string returned for IMAGE_FILE_MACHINE_I386 is not
// shown here.
491 StringRef COFFObjectFile::getFileFormatName() const {
492 switch(Header->Machine) {
493 case COFF::IMAGE_FILE_MACHINE_I386:
495 case COFF::IMAGE_FILE_MACHINE_AMD64:
496 return "COFF-x86-64";
498 return "COFF-<unknown arch>";
// Maps the header's Machine field to a Triple architecture value;
// unrecognised machines yield Triple::UnknownArch.
// NOTE(review): the value returned for IMAGE_FILE_MACHINE_I386 is not
// shown here.
502 unsigned COFFObjectFile::getArch() const {
503 switch(Header->Machine) {
504 case COFF::IMAGE_FILE_MACHINE_I386:
506 case COFF::IMAGE_FILE_MACHINE_AMD64:
507 return Triple::x86_64;
509 return Triple::UnknownArch;
// Looks up a section header by its 1-based section number.
// The special values IMAGE_SYM_UNDEFINED, IMAGE_SYM_ABSOLUTE and
// IMAGE_SYM_DEBUG are accepted without naming a real section. An index in
// [1, NumberOfSections] yields the matching section table entry. Any other
// index returns object_error::parse_failed.
// NOTE(review): the value stored in Result for the special indices is not
// shown here.
513 error_code COFFObjectFile::getSection(int32_t index,
514 const coff_section *&Result) const {
515 // Check for special index values.
516 if (index == COFF::IMAGE_SYM_UNDEFINED ||
517 index == COFF::IMAGE_SYM_ABSOLUTE ||
518 index == COFF::IMAGE_SYM_DEBUG)
520 else if (index > 0 && index <= Header->NumberOfSections)
521 // We already verified the section table data, so no need to check again.
// Section numbers are 1-based, hence the index - 1.
522 Result = SectionTable + (index - 1);
524 return object_error::parse_failed;
525 return object_error::success;
528 error_code COFFObjectFile::getString(uint32_t offset,
529 StringRef &Result) const {
530 if (StringTableSize <= 4)
531 // Tried to get a string from an empty string table.
532 return object_error::parse_failed;
533 if (offset >= StringTableSize)
534 return object_error::unexpected_eof;
535 Result = StringRef(StringTable + offset);
536 return object_error::success;
539 error_code COFFObjectFile::getSymbol(uint32_t index,
540 const coff_symbol *&Result) const {
541 if (index > 0 && index < Header->NumberOfSymbols)
542 Result = SymbolTable + index;
544 return object_error::parse_failed;
545 return object_error::success;
548 const coff_relocation *COFFObjectFile::toRel(DataRefImpl Rel) const {
549 return reinterpret_cast<const coff_relocation*>(Rel.p);
551 error_code COFFObjectFile::getRelocationNext(DataRefImpl Rel,
552 RelocationRef &Res) const {
553 Rel.p = reinterpret_cast<uintptr_t>(
554 reinterpret_cast<const coff_relocation*>(Rel.p) + 1);
555 Res = RelocationRef(Rel, this);
556 return object_error::success;
558 error_code COFFObjectFile::getRelocationAddress(DataRefImpl Rel,
559 uint64_t &Res) const {
560 Res = toRel(Rel)->VirtualAddress;
561 return object_error::success;
563 error_code COFFObjectFile::getRelocationSymbol(DataRefImpl Rel,
564 SymbolRef &Res) const {
565 const coff_relocation* R = toRel(Rel);
567 Symb.p = reinterpret_cast<uintptr_t>(SymbolTable + R->SymbolTableIndex);
568 Res = SymbolRef(Symb, this);
569 return object_error::success;
// Query for the numeric type of a relocation. Always reports success.
// NOTE(review): the statement that assigns Res is not shown here.
571 error_code COFFObjectFile::getRelocationType(DataRefImpl Rel,
572 uint32_t &Res) const {
573 const coff_relocation* R = toRel(Rel);
575 return object_error::success;
// Helper macro: expands to a switch case that stores the enumerator's own
// spelling (stringized with #enum) in `res`. It is undefined again right
// after getRelocationTypeName.
578 #define LLVM_COFF_SWITCH_RELOC_TYPE_NAME(enum) \
579 case COFF::enum: res = #enum; break;
// Appends the symbolic name of a relocation's type to Result.
// The name table is selected by the header's Machine field (AMD64 or I386)
// and then by the relocation record's Type field. Always reports success.
// NOTE(review): the handling of unknown machines and types is not shown here.
581 error_code COFFObjectFile::getRelocationTypeName(DataRefImpl Rel,
582 SmallVectorImpl<char> &Result) const {
583 const coff_relocation *reloc = toRel(Rel);
585 switch (Header->Machine) {
586 case COFF::IMAGE_FILE_MACHINE_AMD64:
587 switch (reloc->Type) {
588 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_ABSOLUTE);
589 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_ADDR64);
590 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_ADDR32);
591 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_ADDR32NB);
592 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32);
593 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32_1);
594 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32_2);
595 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32_3);
596 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32_4);
597 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_REL32_5);
598 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_SECTION);
599 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_SECREL);
600 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_SECREL7);
601 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_TOKEN);
602 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_SREL32);
603 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_PAIR);
604 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_AMD64_SSPAN32);
609 case COFF::IMAGE_FILE_MACHINE_I386:
610 switch (reloc->Type) {
611 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_ABSOLUTE);
612 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_DIR16);
613 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_REL16);
614 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_DIR32);
615 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_DIR32NB);
616 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_SEG12);
617 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_SECTION);
618 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_SECREL);
619 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_TOKEN);
620 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_SECREL7);
621 LLVM_COFF_SWITCH_RELOC_TYPE_NAME(IMAGE_REL_I386_REL32);
// The chosen name is appended to, not assigned over, the caller's buffer.
629 Result.append(res.begin(), res.end());
630 return object_error::success;
633 #undef LLVM_COFF_SWITCH_RELOC_TYPE_NAME
// Query for additional information attached to a relocation. Always reports
// success.
// NOTE(review): the statement that assigns Res is not shown here.
635 error_code COFFObjectFile::getRelocationAdditionalInfo(DataRefImpl Rel,
636 int64_t &Res) const {
638 return object_error::success;
640 error_code COFFObjectFile::getRelocationValueString(DataRefImpl Rel,
641 SmallVectorImpl<char> &Result) const {
642 const coff_relocation *reloc = toRel(Rel);
643 const coff_symbol *symb = 0;
644 if (error_code ec = getSymbol(reloc->SymbolTableIndex, symb)) return ec;
646 ::memset(&sym, 0, sizeof(sym));
647 sym.p = reinterpret_cast<uintptr_t>(symb);
649 if (error_code ec = getSymbolName(sym, symname)) return ec;
650 Result.append(symname.begin(), symname.end());
651 return object_error::success;
// Factory: heap-allocates a COFFObjectFile that parses Object and returns it
// as a raw pointer.
// NOTE(review): nothing visible here inspects the error_code filled in by
// the constructor — confirm how callers learn about parse failures.
656 ObjectFile *ObjectFile::createCOFFObjectFile(MemoryBuffer *Object) {
658 return new COFFObjectFile(Object, ec);
661 } // end namespace llvm