1//===- yaml2obj - Convert YAML to a binary object file --------------------===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This program takes a YAML description of an object file and outputs the
11// binary equivalent.
12//
13// This is used for writing tests that require binary files.
14//
15//===----------------------------------------------------------------------===//
16
17#include "llvm/ADT/SmallString.h"
18#include "llvm/ADT/StringExtras.h"
19#include "llvm/ADT/StringMap.h"
20#include "llvm/ADT/StringSwitch.h"
21#include "llvm/Support/COFF.h"
22#include "llvm/Support/Casting.h"
23#include "llvm/Support/CommandLine.h"
24#include "llvm/Support/Endian.h"
25#include "llvm/Support/ManagedStatic.h"
26#include "llvm/Support/MemoryBuffer.h"
27#include "llvm/Support/PrettyStackTrace.h"
28#include "llvm/Support/Signals.h"
29#include "llvm/Support/SourceMgr.h"
30#include "llvm/Support/YAMLParser.h"
31#include "llvm/Support/raw_ostream.h"
32#include "llvm/Support/system_error.h"
33#include <vector>
34
35using namespace llvm;
36
37static cl::opt<std::string>
38  Input(cl::Positional, cl::desc("<input>"), cl::init("-"));
39
40template<class T>
41typename llvm::enable_if_c<std::numeric_limits<T>::is_integer, bool>::type
42getAs(const llvm::yaml::ScalarNode *SN, T &Result) {
43  SmallString<4> Storage;
44  StringRef Value = SN->getValue(Storage);
45  if (Value.getAsInteger(0, Result))
46    return false;
47  return true;
48}
49
50// Given a container with begin and end with ::value_type of a character type.
51// Iterate through pairs of characters in the the set of [a-fA-F0-9] ignoring
52// all other characters.
53struct hex_pair_iterator {
54  StringRef::const_iterator Current, End;
55  typedef SmallVector<char, 2> value_type;
56  value_type Pair;
57  bool IsDone;
58
59  hex_pair_iterator(StringRef C)
60    : Current(C.begin()), End(C.end()), IsDone(false) {
61    // Initalize Pair.
62    ++*this;
63  }
64
65  // End iterator.
66  hex_pair_iterator() : Current(), End(), IsDone(true) {}
67
68  value_type operator *() const {
69    return Pair;
70  }
71
72  hex_pair_iterator operator ++() {
73    // We're at the end of the input.
74    if (Current == End) {
75      IsDone = true;
76      return *this;
77    }
78    Pair = value_type();
79    for (; Current != End && Pair.size() != 2; ++Current) {
80      // Is a valid hex digit.
81      if ((*Current >= '0' && *Current <= '9') ||
82          (*Current >= 'a' && *Current <= 'f') ||
83          (*Current >= 'A' && *Current <= 'F'))
84        Pair.push_back(*Current);
85    }
86    // Hit the end without getting 2 hex digits. Pair is invalid.
87    if (Pair.size() != 2)
88      IsDone = true;
89    return *this;
90  }
91
92  bool operator ==(const hex_pair_iterator Other) {
93    return (IsDone == Other.IsDone) ||
94           (Current == Other.Current && End == Other.End);
95  }
96
97  bool operator !=(const hex_pair_iterator Other) {
98    return !(*this == Other);
99  }
100};
101
102template <class ContainerOut>
103static bool hexStringToByteArray(StringRef Str, ContainerOut &Out) {
104  for (hex_pair_iterator I(Str), E; I != E; ++I) {
105    typename hex_pair_iterator::value_type Pair = *I;
106    typename ContainerOut::value_type Byte;
107    if (StringRef(Pair.data(), 2).getAsInteger(16, Byte))
108      return false;
109    Out.push_back(Byte);
110  }
111  return true;
112}
113
114/// This parses a yaml stream that represents a COFF object file.
115/// See docs/yaml2obj for the yaml scheema.
116struct COFFParser {
117  COFFParser(yaml::Stream &Input) : YS(Input) {
118    std::memset(&Header, 0, sizeof(Header));
119    // A COFF string table always starts with a 4 byte size field. Offsets into
120    // it include this size, so allocate it now.
121    StringTable.append(4, 0);
122  }
123
124  bool parseHeader(yaml::Node *HeaderN) {
125    yaml::MappingNode *MN = dyn_cast<yaml::MappingNode>(HeaderN);
126    if (!MN) {
127      YS.printError(HeaderN, "header's value must be a mapping node");
128      return false;
129    }
130    for (yaml::MappingNode::iterator i = MN->begin(), e = MN->end();
131                                     i != e; ++i) {
132      yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey());
133      if (!Key) {
134        YS.printError(i->getKey(), "Keys must be scalar values");
135        return false;
136      }
137      SmallString<32> Storage;
138      StringRef KeyValue = Key->getValue(Storage);
139      if (KeyValue == "Characteristics") {
140        if (!parseHeaderCharacteristics(i->getValue()))
141          return false;
142      } else {
143        yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(i->getValue());
144        if (!Value) {
145          YS.printError(Value,
146            Twine(KeyValue) + " must be a scalar value");
147          return false;
148        }
149        if (KeyValue == "Machine") {
150          uint16_t Machine = COFF::MT_Invalid;
151          if (!getAs(Value, Machine)) {
152            // It's not a raw number, try matching the string.
153            StringRef ValueValue = Value->getValue(Storage);
154            Machine = StringSwitch<COFF::MachineTypes>(ValueValue)
155              .Case( "IMAGE_FILE_MACHINE_UNKNOWN"
156                   , COFF::IMAGE_FILE_MACHINE_UNKNOWN)
157              .Case( "IMAGE_FILE_MACHINE_AM33"
158                   , COFF::IMAGE_FILE_MACHINE_AM33)
159              .Case( "IMAGE_FILE_MACHINE_AMD64"
160                   , COFF::IMAGE_FILE_MACHINE_AMD64)
161              .Case( "IMAGE_FILE_MACHINE_ARM"
162                   , COFF::IMAGE_FILE_MACHINE_ARM)
163              .Case( "IMAGE_FILE_MACHINE_ARMV7"
164                   , COFF::IMAGE_FILE_MACHINE_ARMV7)
165              .Case( "IMAGE_FILE_MACHINE_EBC"
166                   , COFF::IMAGE_FILE_MACHINE_EBC)
167              .Case( "IMAGE_FILE_MACHINE_I386"
168                   , COFF::IMAGE_FILE_MACHINE_I386)
169              .Case( "IMAGE_FILE_MACHINE_IA64"
170                   , COFF::IMAGE_FILE_MACHINE_IA64)
171              .Case( "IMAGE_FILE_MACHINE_M32R"
172                   , COFF::IMAGE_FILE_MACHINE_M32R)
173              .Case( "IMAGE_FILE_MACHINE_MIPS16"
174                   , COFF::IMAGE_FILE_MACHINE_MIPS16)
175              .Case( "IMAGE_FILE_MACHINE_MIPSFPU"
176                   , COFF::IMAGE_FILE_MACHINE_MIPSFPU)
177              .Case( "IMAGE_FILE_MACHINE_MIPSFPU16"
178                   , COFF::IMAGE_FILE_MACHINE_MIPSFPU16)
179              .Case( "IMAGE_FILE_MACHINE_POWERPC"
180                   , COFF::IMAGE_FILE_MACHINE_POWERPC)
181              .Case( "IMAGE_FILE_MACHINE_POWERPCFP"
182                   , COFF::IMAGE_FILE_MACHINE_POWERPCFP)
183              .Case( "IMAGE_FILE_MACHINE_R4000"
184                   , COFF::IMAGE_FILE_MACHINE_R4000)
185              .Case( "IMAGE_FILE_MACHINE_SH3"
186                   , COFF::IMAGE_FILE_MACHINE_SH3)
187              .Case( "IMAGE_FILE_MACHINE_SH3DSP"
188                   , COFF::IMAGE_FILE_MACHINE_SH3DSP)
189              .Case( "IMAGE_FILE_MACHINE_SH4"
190                   , COFF::IMAGE_FILE_MACHINE_SH4)
191              .Case( "IMAGE_FILE_MACHINE_SH5"
192                   , COFF::IMAGE_FILE_MACHINE_SH5)
193              .Case( "IMAGE_FILE_MACHINE_THUMB"
194                   , COFF::IMAGE_FILE_MACHINE_THUMB)
195              .Case( "IMAGE_FILE_MACHINE_WCEMIPSV2"
196                   , COFF::IMAGE_FILE_MACHINE_WCEMIPSV2)
197              .Default(COFF::MT_Invalid);
198            if (Machine == COFF::MT_Invalid) {
199              YS.printError(Value, "Invalid value for Machine");
200              return false;
201            }
202          }
203          Header.Machine = Machine;
204        } else if (KeyValue == "NumberOfSections") {
205          if (!getAs(Value, Header.NumberOfSections)) {
206              YS.printError(Value, "Invalid value for NumberOfSections");
207              return false;
208          }
209        } else if (KeyValue == "TimeDateStamp") {
210          if (!getAs(Value, Header.TimeDateStamp)) {
211              YS.printError(Value, "Invalid value for TimeDateStamp");
212              return false;
213          }
214        } else if (KeyValue == "PointerToSymbolTable") {
215          if (!getAs(Value, Header.PointerToSymbolTable)) {
216              YS.printError(Value, "Invalid value for PointerToSymbolTable");
217              return false;
218          }
219        } else if (KeyValue == "NumberOfSymbols") {
220          if (!getAs(Value, Header.NumberOfSymbols)) {
221              YS.printError(Value, "Invalid value for NumberOfSymbols");
222              return false;
223          }
224        } else if (KeyValue == "SizeOfOptionalHeader") {
225          if (!getAs(Value, Header.SizeOfOptionalHeader)) {
226              YS.printError(Value, "Invalid value for SizeOfOptionalHeader");
227              return false;
228          }
229        } else {
230          YS.printError(Key, "Unrecognized key in header");
231          return false;
232        }
233      }
234    }
235    return true;
236  }
237
238  bool parseHeaderCharacteristics(yaml::Node *Characteristics) {
239    yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(Characteristics);
240    yaml::SequenceNode *SeqValue
241      = dyn_cast<yaml::SequenceNode>(Characteristics);
242    if (!Value && !SeqValue) {
243      YS.printError(Characteristics,
244        "Characteristics must either be a number or sequence");
245      return false;
246    }
247    if (Value) {
248      if (!getAs(Value, Header.Characteristics)) {
249        YS.printError(Value, "Invalid value for Characteristics");
250        return false;
251      }
252    } else {
253      for (yaml::SequenceNode::iterator ci = SeqValue->begin(),
254                                        ce = SeqValue->end();
255                                        ci != ce; ++ci) {
256        yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci);
257        if (!CharValue) {
258          YS.printError(CharValue,
259            "Characteristics must be scalar values");
260          return false;
261        }
262        SmallString<32> Storage;
263        StringRef Char = CharValue->getValue(Storage);
264        uint16_t Characteristic = StringSwitch<COFF::Characteristics>(Char)
265          .Case( "IMAGE_FILE_RELOCS_STRIPPED"
266                , COFF::IMAGE_FILE_RELOCS_STRIPPED)
267          .Case( "IMAGE_FILE_EXECUTABLE_IMAGE"
268                , COFF::IMAGE_FILE_EXECUTABLE_IMAGE)
269          .Case( "IMAGE_FILE_LINE_NUMS_STRIPPED"
270                , COFF::IMAGE_FILE_LINE_NUMS_STRIPPED)
271          .Case( "IMAGE_FILE_LOCAL_SYMS_STRIPPED"
272                , COFF::IMAGE_FILE_LOCAL_SYMS_STRIPPED)
273          .Case( "IMAGE_FILE_AGGRESSIVE_WS_TRIM"
274                , COFF::IMAGE_FILE_AGGRESSIVE_WS_TRIM)
275          .Case( "IMAGE_FILE_LARGE_ADDRESS_AWARE"
276                , COFF::IMAGE_FILE_LARGE_ADDRESS_AWARE)
277          .Case( "IMAGE_FILE_BYTES_REVERSED_LO"
278                , COFF::IMAGE_FILE_BYTES_REVERSED_LO)
279          .Case( "IMAGE_FILE_32BIT_MACHINE"
280                , COFF::IMAGE_FILE_32BIT_MACHINE)
281          .Case( "IMAGE_FILE_DEBUG_STRIPPED"
282                , COFF::IMAGE_FILE_DEBUG_STRIPPED)
283          .Case( "IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP"
284                , COFF::IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP)
285          .Case( "IMAGE_FILE_SYSTEM"
286                , COFF::IMAGE_FILE_SYSTEM)
287          .Case( "IMAGE_FILE_DLL"
288                , COFF::IMAGE_FILE_DLL)
289          .Case( "IMAGE_FILE_UP_SYSTEM_ONLY"
290                , COFF::IMAGE_FILE_UP_SYSTEM_ONLY)
291          .Default(COFF::C_Invalid);
292        if (Characteristic == COFF::C_Invalid) {
293          // TODO: Typo-correct.
294          YS.printError(CharValue,
295            "Invalid value for Characteristic");
296          return false;
297        }
298        Header.Characteristics |= Characteristic;
299      }
300    }
301    return true;
302  }
303
304  bool parseSections(yaml::Node *SectionsN) {
305    yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SectionsN);
306    if (!SN) {
307      YS.printError(SectionsN, "Sections must be a sequence");
308      return false;
309    }
310    for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end();
311                                      i != e; ++i) {
312      Section Sec;
313      std::memset(&Sec.Header, 0, sizeof(Sec.Header));
314      yaml::MappingNode *SecMap = dyn_cast<yaml::MappingNode>(&*i);
315      if (!SecMap) {
316        YS.printError(&*i, "Section entry must be a map");
317        return false;
318      }
319      for (yaml::MappingNode::iterator si = SecMap->begin(), se = SecMap->end();
320                                       si != se; ++si) {
321        yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey());
322        if (!Key) {
323          YS.printError(si->getKey(), "Keys must be scalar values");
324          return false;
325        }
326        SmallString<32> Storage;
327        StringRef KeyValue = Key->getValue(Storage);
328
329        yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
330        if (KeyValue == "Name") {
331          // If the name is less than 8 bytes, store it in place, otherwise
332          // store it in the string table.
333          StringRef Name = Value->getValue(Storage);
334          std::fill_n(Sec.Header.Name, unsigned(COFF::NameSize), 0);
335          if (Name.size() <= COFF::NameSize) {
336            std::copy(Name.begin(), Name.end(), Sec.Header.Name);
337          } else {
338            // Add string to the string table and format the index for output.
339            unsigned Index = getStringIndex(Name);
340            std::string str = utostr(Index);
341            if (str.size() > 7) {
342              YS.printError(Value, "String table got too large");
343              return false;
344            }
345            Sec.Header.Name[0] = '/';
346            std::copy(str.begin(), str.end(), Sec.Header.Name + 1);
347          }
348        } else if (KeyValue == "VirtualSize") {
349          if (!getAs(Value, Sec.Header.VirtualSize)) {
350            YS.printError(Value, "Invalid value for VirtualSize");
351            return false;
352          }
353        } else if (KeyValue == "VirtualAddress") {
354          if (!getAs(Value, Sec.Header.VirtualAddress)) {
355            YS.printError(Value, "Invalid value for VirtualAddress");
356            return false;
357          }
358        } else if (KeyValue == "SizeOfRawData") {
359          if (!getAs(Value, Sec.Header.SizeOfRawData)) {
360            YS.printError(Value, "Invalid value for SizeOfRawData");
361            return false;
362          }
363        } else if (KeyValue == "PointerToRawData") {
364          if (!getAs(Value, Sec.Header.PointerToRawData)) {
365            YS.printError(Value, "Invalid value for PointerToRawData");
366            return false;
367          }
368        } else if (KeyValue == "PointerToRelocations") {
369          if (!getAs(Value, Sec.Header.PointerToRelocations)) {
370            YS.printError(Value, "Invalid value for PointerToRelocations");
371            return false;
372          }
373        } else if (KeyValue == "PointerToLineNumbers") {
374          if (!getAs(Value, Sec.Header.PointerToLineNumbers)) {
375            YS.printError(Value, "Invalid value for PointerToLineNumbers");
376            return false;
377          }
378        } else if (KeyValue == "NumberOfRelocations") {
379          if (!getAs(Value, Sec.Header.NumberOfRelocations)) {
380            YS.printError(Value, "Invalid value for NumberOfRelocations");
381            return false;
382          }
383        } else if (KeyValue == "NumberOfLineNumbers") {
384          if (!getAs(Value, Sec.Header.NumberOfLineNumbers)) {
385            YS.printError(Value, "Invalid value for NumberOfLineNumbers");
386            return false;
387          }
388        } else if (KeyValue == "Characteristics") {
389          yaml::SequenceNode *SeqValue
390            = dyn_cast<yaml::SequenceNode>(si->getValue());
391          if (!Value && !SeqValue) {
392            YS.printError(si->getValue(),
393              "Characteristics must either be a number or sequence");
394            return false;
395          }
396          if (Value) {
397            if (!getAs(Value, Sec.Header.Characteristics)) {
398              YS.printError(Value, "Invalid value for Characteristics");
399              return false;
400            }
401          } else {
402            for (yaml::SequenceNode::iterator ci = SeqValue->begin(),
403                                              ce = SeqValue->end();
404                                              ci != ce; ++ci) {
405              yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci);
406              if (!CharValue) {
407                YS.printError(CharValue, "Invalid value for Characteristics");
408                return false;
409              }
410              StringRef Char = CharValue->getValue(Storage);
411              uint32_t Characteristic =
412                StringSwitch<COFF::SectionCharacteristics>(Char)
413                .Case( "IMAGE_SCN_TYPE_NO_PAD"
414                     , COFF::IMAGE_SCN_TYPE_NO_PAD)
415                .Case( "IMAGE_SCN_CNT_CODE"
416                     , COFF::IMAGE_SCN_CNT_CODE)
417                .Case( "IMAGE_SCN_CNT_INITIALIZED_DATA"
418                     , COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
419                .Case( "IMAGE_SCN_CNT_UNINITIALIZED_DATA"
420                     , COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
421                .Case( "IMAGE_SCN_LNK_OTHER"
422                     , COFF::IMAGE_SCN_LNK_OTHER)
423                .Case( "IMAGE_SCN_LNK_INFO"
424                     , COFF::IMAGE_SCN_LNK_INFO)
425                .Case( "IMAGE_SCN_LNK_REMOVE"
426                     , COFF::IMAGE_SCN_LNK_REMOVE)
427                .Case( "IMAGE_SCN_LNK_COMDAT"
428                     , COFF::IMAGE_SCN_LNK_COMDAT)
429                .Case( "IMAGE_SCN_GPREL"
430                     , COFF::IMAGE_SCN_GPREL)
431                .Case( "IMAGE_SCN_MEM_PURGEABLE"
432                     , COFF::IMAGE_SCN_MEM_PURGEABLE)
433                .Case( "IMAGE_SCN_MEM_16BIT"
434                     , COFF::IMAGE_SCN_MEM_16BIT)
435                .Case( "IMAGE_SCN_MEM_LOCKED"
436                     , COFF::IMAGE_SCN_MEM_LOCKED)
437                .Case( "IMAGE_SCN_MEM_PRELOAD"
438                     , COFF::IMAGE_SCN_MEM_PRELOAD)
439                .Case( "IMAGE_SCN_ALIGN_1BYTES"
440                     , COFF::IMAGE_SCN_ALIGN_1BYTES)
441                .Case( "IMAGE_SCN_ALIGN_2BYTES"
442                     , COFF::IMAGE_SCN_ALIGN_2BYTES)
443                .Case( "IMAGE_SCN_ALIGN_4BYTES"
444                     , COFF::IMAGE_SCN_ALIGN_4BYTES)
445                .Case( "IMAGE_SCN_ALIGN_8BYTES"
446                     , COFF::IMAGE_SCN_ALIGN_8BYTES)
447                .Case( "IMAGE_SCN_ALIGN_16BYTES"
448                     , COFF::IMAGE_SCN_ALIGN_16BYTES)
449                .Case( "IMAGE_SCN_ALIGN_32BYTES"
450                     , COFF::IMAGE_SCN_ALIGN_32BYTES)
451                .Case( "IMAGE_SCN_ALIGN_64BYTES"
452                     , COFF::IMAGE_SCN_ALIGN_64BYTES)
453                .Case( "IMAGE_SCN_ALIGN_128BYTES"
454                     , COFF::IMAGE_SCN_ALIGN_128BYTES)
455                .Case( "IMAGE_SCN_ALIGN_256BYTES"
456                     , COFF::IMAGE_SCN_ALIGN_256BYTES)
457                .Case( "IMAGE_SCN_ALIGN_512BYTES"
458                     , COFF::IMAGE_SCN_ALIGN_512BYTES)
459                .Case( "IMAGE_SCN_ALIGN_1024BYTES"
460                     , COFF::IMAGE_SCN_ALIGN_1024BYTES)
461                .Case( "IMAGE_SCN_ALIGN_2048BYTES"
462                     , COFF::IMAGE_SCN_ALIGN_2048BYTES)
463                .Case( "IMAGE_SCN_ALIGN_4096BYTES"
464                     , COFF::IMAGE_SCN_ALIGN_4096BYTES)
465                .Case( "IMAGE_SCN_ALIGN_8192BYTES"
466                     , COFF::IMAGE_SCN_ALIGN_8192BYTES)
467                .Case( "IMAGE_SCN_LNK_NRELOC_OVFL"
468                     , COFF::IMAGE_SCN_LNK_NRELOC_OVFL)
469                .Case( "IMAGE_SCN_MEM_DISCARDABLE"
470                     , COFF::IMAGE_SCN_MEM_DISCARDABLE)
471                .Case( "IMAGE_SCN_MEM_NOT_CACHED"
472                     , COFF::IMAGE_SCN_MEM_NOT_CACHED)
473                .Case( "IMAGE_SCN_MEM_NOT_PAGED"
474                     , COFF::IMAGE_SCN_MEM_NOT_PAGED)
475                .Case( "IMAGE_SCN_MEM_SHARED"
476                     , COFF::IMAGE_SCN_MEM_SHARED)
477                .Case( "IMAGE_SCN_MEM_EXECUTE"
478                     , COFF::IMAGE_SCN_MEM_EXECUTE)
479                .Case( "IMAGE_SCN_MEM_READ"
480                     , COFF::IMAGE_SCN_MEM_READ)
481                .Case( "IMAGE_SCN_MEM_WRITE"
482                     , COFF::IMAGE_SCN_MEM_WRITE)
483                .Default(COFF::SC_Invalid);
484              if (Characteristic == COFF::SC_Invalid) {
485                YS.printError(CharValue, "Invalid value for Characteristic");
486                return false;
487              }
488              Sec.Header.Characteristics |= Characteristic;
489            }
490          }
491        } else if (KeyValue == "SectionData") {
492          yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
493          SmallString<32> Storage;
494          StringRef Data = Value->getValue(Storage);
495          if (!hexStringToByteArray(Data, Sec.Data)) {
496            YS.printError(Value, "SectionData must be a collection of pairs of"
497                                 "hex bytes");
498            return false;
499          }
500        } else
501          si->skip();
502      }
503      Sections.push_back(Sec);
504    }
505    return true;
506  }
507
508  bool parseSymbols(yaml::Node *SymbolsN) {
509    yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SymbolsN);
510    if (!SN) {
511      YS.printError(SymbolsN, "Symbols must be a sequence");
512      return false;
513    }
514    for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end();
515                                      i != e; ++i) {
516      Symbol Sym;
517      std::memset(&Sym.Header, 0, sizeof(Sym.Header));
518      yaml::MappingNode *SymMap = dyn_cast<yaml::MappingNode>(&*i);
519      if (!SymMap) {
520        YS.printError(&*i, "Symbol must be a map");
521        return false;
522      }
523      for (yaml::MappingNode::iterator si = SymMap->begin(), se = SymMap->end();
524                                       si != se; ++si) {
525        yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey());
526        if (!Key) {
527          YS.printError(si->getKey(), "Keys must be scalar values");
528          return false;
529        }
530        SmallString<32> Storage;
531        StringRef KeyValue = Key->getValue(Storage);
532
533        yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
534        if (!Value) {
535          YS.printError(si->getValue(), "Must be a scalar value");
536          return false;
537        }
538        if (KeyValue == "Name") {
539          // If the name is less than 8 bytes, store it in place, otherwise
540          // store it in the string table.
541          StringRef Name = Value->getValue(Storage);
542          std::fill_n(Sym.Header.Name, unsigned(COFF::NameSize), 0);
543          if (Name.size() <= COFF::NameSize) {
544            std::copy(Name.begin(), Name.end(), Sym.Header.Name);
545          } else {
546            // Add string to the string table and format the index for output.
547            unsigned Index = getStringIndex(Name);
548            *reinterpret_cast<support::aligned_ulittle32_t*>(
549              Sym.Header.Name + 4) = Index;
550          }
551        } else if (KeyValue == "Value") {
552          if (!getAs(Value, Sym.Header.Value)) {
553            YS.printError(Value, "Invalid value for Value");
554            return false;
555          }
556        } else if (KeyValue == "SimpleType") {
557          Sym.Header.Type |= StringSwitch<COFF::SymbolBaseType>(
558            Value->getValue(Storage))
559            .Case("IMAGE_SYM_TYPE_NULL", COFF::IMAGE_SYM_TYPE_NULL)
560            .Case("IMAGE_SYM_TYPE_VOID", COFF::IMAGE_SYM_TYPE_VOID)
561            .Case("IMAGE_SYM_TYPE_CHAR", COFF::IMAGE_SYM_TYPE_CHAR)
562            .Case("IMAGE_SYM_TYPE_SHORT", COFF::IMAGE_SYM_TYPE_SHORT)
563            .Case("IMAGE_SYM_TYPE_INT", COFF::IMAGE_SYM_TYPE_INT)
564            .Case("IMAGE_SYM_TYPE_LONG", COFF::IMAGE_SYM_TYPE_LONG)
565            .Case("IMAGE_SYM_TYPE_FLOAT", COFF::IMAGE_SYM_TYPE_FLOAT)
566            .Case("IMAGE_SYM_TYPE_DOUBLE", COFF::IMAGE_SYM_TYPE_DOUBLE)
567            .Case("IMAGE_SYM_TYPE_STRUCT", COFF::IMAGE_SYM_TYPE_STRUCT)
568            .Case("IMAGE_SYM_TYPE_UNION", COFF::IMAGE_SYM_TYPE_UNION)
569            .Case("IMAGE_SYM_TYPE_ENUM", COFF::IMAGE_SYM_TYPE_ENUM)
570            .Case("IMAGE_SYM_TYPE_MOE", COFF::IMAGE_SYM_TYPE_MOE)
571            .Case("IMAGE_SYM_TYPE_BYTE", COFF::IMAGE_SYM_TYPE_BYTE)
572            .Case("IMAGE_SYM_TYPE_WORD", COFF::IMAGE_SYM_TYPE_WORD)
573            .Case("IMAGE_SYM_TYPE_UINT", COFF::IMAGE_SYM_TYPE_UINT)
574            .Case("IMAGE_SYM_TYPE_DWORD", COFF::IMAGE_SYM_TYPE_DWORD)
575            .Default(COFF::IMAGE_SYM_TYPE_NULL);
576        } else if (KeyValue == "ComplexType") {
577          Sym.Header.Type |= StringSwitch<COFF::SymbolComplexType>(
578            Value->getValue(Storage))
579            .Case("IMAGE_SYM_DTYPE_NULL", COFF::IMAGE_SYM_DTYPE_NULL)
580            .Case("IMAGE_SYM_DTYPE_POINTER", COFF::IMAGE_SYM_DTYPE_POINTER)
581            .Case("IMAGE_SYM_DTYPE_FUNCTION", COFF::IMAGE_SYM_DTYPE_FUNCTION)
582            .Case("IMAGE_SYM_DTYPE_ARRAY", COFF::IMAGE_SYM_DTYPE_ARRAY)
583            .Default(COFF::IMAGE_SYM_DTYPE_NULL)
584            << COFF::SCT_COMPLEX_TYPE_SHIFT;
585        } else if (KeyValue == "StorageClass") {
586          Sym.Header.StorageClass = StringSwitch<COFF::SymbolStorageClass>(
587            Value->getValue(Storage))
588            .Case( "IMAGE_SYM_CLASS_END_OF_FUNCTION"
589                 , COFF::IMAGE_SYM_CLASS_END_OF_FUNCTION)
590            .Case( "IMAGE_SYM_CLASS_NULL"
591                 , COFF::IMAGE_SYM_CLASS_NULL)
592            .Case( "IMAGE_SYM_CLASS_AUTOMATIC"
593                 , COFF::IMAGE_SYM_CLASS_AUTOMATIC)
594            .Case( "IMAGE_SYM_CLASS_EXTERNAL"
595                 , COFF::IMAGE_SYM_CLASS_EXTERNAL)
596            .Case( "IMAGE_SYM_CLASS_STATIC"
597                 , COFF::IMAGE_SYM_CLASS_STATIC)
598            .Case( "IMAGE_SYM_CLASS_REGISTER"
599                 , COFF::IMAGE_SYM_CLASS_REGISTER)
600            .Case( "IMAGE_SYM_CLASS_EXTERNAL_DEF"
601                 , COFF::IMAGE_SYM_CLASS_EXTERNAL_DEF)
602            .Case( "IMAGE_SYM_CLASS_LABEL"
603                 , COFF::IMAGE_SYM_CLASS_LABEL)
604            .Case( "IMAGE_SYM_CLASS_UNDEFINED_LABEL"
605                 , COFF::IMAGE_SYM_CLASS_UNDEFINED_LABEL)
606            .Case( "IMAGE_SYM_CLASS_MEMBER_OF_STRUCT"
607                 , COFF::IMAGE_SYM_CLASS_MEMBER_OF_STRUCT)
608            .Case( "IMAGE_SYM_CLASS_ARGUMENT"
609                 , COFF::IMAGE_SYM_CLASS_ARGUMENT)
610            .Case( "IMAGE_SYM_CLASS_STRUCT_TAG"
611                 , COFF::IMAGE_SYM_CLASS_STRUCT_TAG)
612            .Case( "IMAGE_SYM_CLASS_MEMBER_OF_UNION"
613                 , COFF::IMAGE_SYM_CLASS_MEMBER_OF_UNION)
614            .Case( "IMAGE_SYM_CLASS_UNION_TAG"
615                 , COFF::IMAGE_SYM_CLASS_UNION_TAG)
616            .Case( "IMAGE_SYM_CLASS_TYPE_DEFINITION"
617                 , COFF::IMAGE_SYM_CLASS_TYPE_DEFINITION)
618            .Case( "IMAGE_SYM_CLASS_UNDEFINED_STATIC"
619                 , COFF::IMAGE_SYM_CLASS_UNDEFINED_STATIC)
620            .Case( "IMAGE_SYM_CLASS_ENUM_TAG"
621                 , COFF::IMAGE_SYM_CLASS_ENUM_TAG)
622            .Case( "IMAGE_SYM_CLASS_MEMBER_OF_ENUM"
623                 , COFF::IMAGE_SYM_CLASS_MEMBER_OF_ENUM)
624            .Case( "IMAGE_SYM_CLASS_REGISTER_PARAM"
625                 , COFF::IMAGE_SYM_CLASS_REGISTER_PARAM)
626            .Case( "IMAGE_SYM_CLASS_BIT_FIELD"
627                 , COFF::IMAGE_SYM_CLASS_BIT_FIELD)
628            .Case( "IMAGE_SYM_CLASS_BLOCK"
629                 , COFF::IMAGE_SYM_CLASS_BLOCK)
630            .Case( "IMAGE_SYM_CLASS_FUNCTION"
631                 , COFF::IMAGE_SYM_CLASS_FUNCTION)
632            .Case( "IMAGE_SYM_CLASS_END_OF_STRUCT"
633                 , COFF::IMAGE_SYM_CLASS_END_OF_STRUCT)
634            .Case( "IMAGE_SYM_CLASS_FILE"
635                 , COFF::IMAGE_SYM_CLASS_FILE)
636            .Case( "IMAGE_SYM_CLASS_SECTION"
637                 , COFF::IMAGE_SYM_CLASS_SECTION)
638            .Case( "IMAGE_SYM_CLASS_WEAK_EXTERNAL"
639                 , COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL)
640            .Case( "IMAGE_SYM_CLASS_CLR_TOKEN"
641                 , COFF::IMAGE_SYM_CLASS_CLR_TOKEN)
642            .Default(COFF::SSC_Invalid);
643          if (Sym.Header.StorageClass == COFF::SSC_Invalid) {
644            YS.printError(Value, "Invalid value for StorageClass");
645            return false;
646          }
647        } else if (KeyValue == "SectionNumber") {
648          if (!getAs(Value, Sym.Header.SectionNumber)) {
649              YS.printError(Value, "Invalid value for SectionNumber");
650              return false;
651          }
652        } else if (KeyValue == "AuxillaryData") {
653          StringRef Data = Value->getValue(Storage);
654          if (!hexStringToByteArray(Data, Sym.AuxSymbols)) {
655            YS.printError(Value, "AuxillaryData must be a collection of pairs"
656                                 "of hex bytes");
657            return false;
658          }
659        } else
660          si->skip();
661      }
662      Symbols.push_back(Sym);
663    }
664    return true;
665  }
666
667  bool parse() {
668    yaml::Document &D = *YS.begin();
669    yaml::MappingNode *Root = dyn_cast<yaml::MappingNode>(D.getRoot());
670    if (!Root) {
671      YS.printError(D.getRoot(), "Root node must be a map");
672      return false;
673    }
674    for (yaml::MappingNode::iterator i = Root->begin(), e = Root->end();
675                                     i != e; ++i) {
676      yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey());
677      if (!Key) {
678        YS.printError(i->getKey(), "Keys must be scalar values");
679        return false;
680      }
681      SmallString<32> Storage;
682      StringRef KeyValue = Key->getValue(Storage);
683      if (KeyValue == "header") {
684        if (!parseHeader(i->getValue()))
685          return false;
686      } else if (KeyValue == "sections") {
687        if (!parseSections(i->getValue()))
688          return false;
689      } else if (KeyValue == "symbols") {
690        if (!parseSymbols(i->getValue()))
691          return false;
692      }
693    }
694    return !YS.failed();
695  }
696
697  unsigned getStringIndex(StringRef Str) {
698    StringMap<unsigned>::iterator i = StringTableMap.find(Str);
699    if (i == StringTableMap.end()) {
700      unsigned Index = StringTable.size();
701      StringTable.append(Str.begin(), Str.end());
702      StringTable.push_back(0);
703      StringTableMap[Str] = Index;
704      return Index;
705    }
706    return i->second;
707  }
708
709  yaml::Stream &YS;
710  COFF::header Header;
711
712  struct Section {
713    COFF::section Header;
714    std::vector<uint8_t> Data;
715    std::vector<COFF::relocation> Relocations;
716  };
717
718  struct Symbol {
719    COFF::symbol Header;
720    std::vector<uint8_t> AuxSymbols;
721  };
722
723  std::vector<Section> Sections;
724  std::vector<Symbol> Symbols;
725  StringMap<unsigned> StringTableMap;
726  std::string StringTable;
727};
728
729// Take a CP and assign addresses and sizes to everything. Returns false if the
730// layout is not valid to do.
731static bool layoutCOFF(COFFParser &CP) {
732  uint32_t SectionTableStart = 0;
733  uint32_t SectionTableSize  = 0;
734
735  // The section table starts immediately after the header, including the
736  // optional header.
737  SectionTableStart = sizeof(COFF::header) + CP.Header.SizeOfOptionalHeader;
738  SectionTableSize = sizeof(COFF::section) * CP.Sections.size();
739
740  uint32_t CurrentSectionDataOffset = SectionTableStart + SectionTableSize;
741
742  // Assign each section data address consecutively.
743  for (std::vector<COFFParser::Section>::iterator i = CP.Sections.begin(),
744                                                  e = CP.Sections.end();
745                                                  i != e; ++i) {
746    if (!i->Data.empty()) {
747      i->Header.SizeOfRawData = i->Data.size();
748      i->Header.PointerToRawData = CurrentSectionDataOffset;
749      CurrentSectionDataOffset += i->Header.SizeOfRawData;
750      // TODO: Handle alignment.
751    } else {
752      i->Header.SizeOfRawData = 0;
753      i->Header.PointerToRawData = 0;
754    }
755  }
756
757  uint32_t SymbolTableStart = CurrentSectionDataOffset;
758
759  // Calculate number of symbols.
760  uint32_t NumberOfSymbols = 0;
761  for (std::vector<COFFParser::Symbol>::iterator i = CP.Symbols.begin(),
762                                                 e = CP.Symbols.end();
763                                                 i != e; ++i) {
764    if (i->AuxSymbols.size() % COFF::SymbolSize != 0) {
765      errs() << "AuxillaryData size not a multiple of symbol size!\n";
766      return false;
767    }
768    i->Header.NumberOfAuxSymbols = i->AuxSymbols.size() / COFF::SymbolSize;
769    NumberOfSymbols += 1 + i->Header.NumberOfAuxSymbols;
770  }
771
772  // Store all the allocated start addresses in the header.
773  CP.Header.NumberOfSections = CP.Sections.size();
774  CP.Header.NumberOfSymbols = NumberOfSymbols;
775  CP.Header.PointerToSymbolTable = SymbolTableStart;
776
777  *reinterpret_cast<support::ulittle32_t *>(&CP.StringTable[0])
778    = CP.StringTable.size();
779
780  return true;
781}
782
783template <typename value_type>
784struct binary_le_impl {
785  value_type Value;
786  binary_le_impl(value_type V) : Value(V) {}
787};
788
789template <typename value_type>
790raw_ostream &operator <<( raw_ostream &OS
791                        , const binary_le_impl<value_type> &BLE) {
792  char Buffer[sizeof(BLE.Value)];
793  support::endian::write<value_type, support::little, support::unaligned>(
794    Buffer, BLE.Value);
795  OS.write(Buffer, sizeof(BLE.Value));
796  return OS;
797}
798
799template <typename value_type>
800binary_le_impl<value_type> binary_le(value_type V) {
801  return binary_le_impl<value_type>(V);
802}
803
804void writeCOFF(COFFParser &CP, raw_ostream &OS) {
805  OS << binary_le(CP.Header.Machine)
806     << binary_le(CP.Header.NumberOfSections)
807     << binary_le(CP.Header.TimeDateStamp)
808     << binary_le(CP.Header.PointerToSymbolTable)
809     << binary_le(CP.Header.NumberOfSymbols)
810     << binary_le(CP.Header.SizeOfOptionalHeader)
811     << binary_le(CP.Header.Characteristics);
812
813  // Output section table.
814  for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(),
815                                                        e = CP.Sections.end();
816                                                        i != e; ++i) {
817    OS.write(i->Header.Name, COFF::NameSize);
818    OS << binary_le(i->Header.VirtualSize)
819       << binary_le(i->Header.VirtualAddress)
820       << binary_le(i->Header.SizeOfRawData)
821       << binary_le(i->Header.PointerToRawData)
822       << binary_le(i->Header.PointerToRelocations)
823       << binary_le(i->Header.PointerToLineNumbers)
824       << binary_le(i->Header.NumberOfRelocations)
825       << binary_le(i->Header.NumberOfLineNumbers)
826       << binary_le(i->Header.Characteristics);
827  }
828
829  // Output section data.
830  for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(),
831                                                        e = CP.Sections.end();
832                                                        i != e; ++i) {
833    if (!i->Data.empty())
834      OS.write(reinterpret_cast<const char*>(&i->Data[0]), i->Data.size());
835  }
836
837  // Output symbol table.
838
839  for (std::vector<COFFParser::Symbol>::const_iterator i = CP.Symbols.begin(),
840                                                       e = CP.Symbols.end();
841                                                       i != e; ++i) {
842    OS.write(i->Header.Name, COFF::NameSize);
843    OS << binary_le(i->Header.Value)
844       << binary_le(i->Header.SectionNumber)
845       << binary_le(i->Header.Type)
846       << binary_le(i->Header.StorageClass)
847       << binary_le(i->Header.NumberOfAuxSymbols);
848    if (!i->AuxSymbols.empty())
849      OS.write( reinterpret_cast<const char*>(&i->AuxSymbols[0])
850              , i->AuxSymbols.size());
851  }
852
853  // Output string table.
854  OS.write(&CP.StringTable[0], CP.StringTable.size());
855}
856
857int main(int argc, char **argv) {
858  cl::ParseCommandLineOptions(argc, argv);
859  sys::PrintStackTraceOnErrorSignal();
860  PrettyStackTraceProgram X(argc, argv);
861  llvm_shutdown_obj Y;  // Call llvm_shutdown() on exit.
862
863  OwningPtr<MemoryBuffer> Buf;
864  if (MemoryBuffer::getFileOrSTDIN(Input, Buf))
865    return 1;
866
867  SourceMgr SM;
868  yaml::Stream S(Buf->getBuffer(), SM);
869  COFFParser CP(S);
870  if (!CP.parse()) {
871    errs() << "yaml2obj: Failed to parse YAML file!\n";
872    return 1;
873  }
874  if (!layoutCOFF(CP)) {
875    errs() << "yaml2obj: Failed to layout COFF file!\n";
876    return 1;
877  }
878  writeCOFF(CP, outs());
879}
880