c9436090dd65fadf79d9ccfeb7776d91bb40ed84
[oota-llvm.git] / utils / yaml2obj / yaml2obj.cpp
1 //===- yaml2obj - Convert YAML to a binary object file --------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This program takes a YAML description of an object file and outputs the
11 // binary equivalent.
12 //
13 // This is used for writing tests that require binary files.
14 //
15 //===----------------------------------------------------------------------===//
16
17 #include "llvm/ADT/SmallString.h"
18 #include "llvm/ADT/StringExtras.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/ADT/StringSwitch.h"
21 #include "llvm/Support/COFF.h"
22 #include "llvm/Support/Casting.h"
23 #include "llvm/Support/CommandLine.h"
24 #include "llvm/Support/Endian.h"
25 #include "llvm/Support/ManagedStatic.h"
26 #include "llvm/Support/MemoryBuffer.h"
27 #include "llvm/Support/PrettyStackTrace.h"
28 #include "llvm/Support/Signals.h"
29 #include "llvm/Support/SourceMgr.h"
30 #include "llvm/Support/YAMLParser.h"
31 #include "llvm/Support/raw_ostream.h"
32 #include "llvm/Support/system_error.h"
33 #include <vector>
34
35 using namespace llvm;
36
37 static cl::opt<std::string>
38   Input(cl::Positional, cl::desc("<input>"), cl::init("-"));
39
40 template<class T>
41 typename llvm::enable_if_c<std::numeric_limits<T>::is_integer, bool>::type
42 getAs(const llvm::yaml::ScalarNode *SN, T &Result) {
43   SmallString<4> Storage;
44   StringRef Value = SN->getValue(Storage);
45   if (Value.getAsInteger(0, Result))
46     return false;
47   return true;
48 }
49
50 // Given a container with begin and end with ::value_type of a character type.
51 // Iterate through pairs of characters in the the set of [a-fA-F0-9] ignoring
52 // all other characters.
53 struct hex_pair_iterator {
54   StringRef::const_iterator Current, End;
55   typedef SmallVector<char, 2> value_type;
56   value_type Pair;
57   bool IsDone;
58
59   hex_pair_iterator(StringRef C)
60     : Current(C.begin()), End(C.end()), IsDone(false) {
61     // Initalize Pair.
62     ++*this;
63   }
64
65   // End iterator.
66   hex_pair_iterator() : Current(), End(), IsDone(true) {}
67
68   value_type operator *() const {
69     return Pair;
70   }
71
72   hex_pair_iterator operator ++() {
73     // We're at the end of the input.
74     if (Current == End) {
75       IsDone = true;
76       return *this;
77     }
78     Pair = value_type();
79     for (; Current != End && Pair.size() != 2; ++Current) {
80       // Is a valid hex digit.
81       if ((*Current >= '0' && *Current <= '9') ||
82           (*Current >= 'a' && *Current <= 'f') ||
83           (*Current >= 'A' && *Current <= 'F'))
84         Pair.push_back(*Current);
85     }
86     // Hit the end without getting 2 hex digits. Pair is invalid.
87     if (Pair.size() != 2)
88       IsDone = true;
89     return *this;
90   }
91
92   bool operator ==(const hex_pair_iterator Other) {
93     return (IsDone == Other.IsDone) ||
94            (Current == Other.Current && End == Other.End);
95   }
96
97   bool operator !=(const hex_pair_iterator Other) {
98     return !(*this == Other);
99   }
100 };
101
102 template <class ContainerOut>
103 static bool hexStringToByteArray(StringRef Str, ContainerOut &Out) {
104   for (hex_pair_iterator I(Str), E; I != E; ++I) {
105     typename hex_pair_iterator::value_type Pair = *I;
106     typename ContainerOut::value_type Byte;
107     if (StringRef(Pair.data(), 2).getAsInteger(16, Byte))
108       return false;
109     Out.push_back(Byte);
110   }
111   return true;
112 }
113
114 /// This parses a yaml stream that represents a COFF object file.
115 /// See docs/yaml2obj for the yaml scheema.
116 struct COFFParser {
117   COFFParser(yaml::Stream &Input) : YS(Input) {
118     std::memset(&Header, 0, sizeof(Header));
119     // A COFF string table always starts with a 4 byte size field. Offsets into
120     // it include this size, so allocate it now.
121     StringTable.append(4, 0);
122   }
123
124   bool parseHeader(yaml::Node *HeaderN) {
125     yaml::MappingNode *MN = dyn_cast<yaml::MappingNode>(HeaderN);
126     if (!MN) {
127       YS.printError(HeaderN, "header's value must be a mapping node");
128       return false;
129     }
130     for (yaml::MappingNode::iterator i = MN->begin(), e = MN->end();
131                                      i != e; ++i) {
132       yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey());
133       if (!Key) {
134         YS.printError(i->getKey(), "Keys must be scalar values");
135         return false;
136       }
137       SmallString<32> Storage;
138       StringRef KeyValue = Key->getValue(Storage);
139       if (KeyValue == "Characteristics") {
140         if (!parseHeaderCharacteristics(i->getValue()))
141           return false;
142       } else {
143         yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(i->getValue());
144         if (!Value) {
145           YS.printError(Value,
146             Twine(KeyValue) + " must be a scalar value");
147           return false;
148         }
149         if (KeyValue == "Machine") {
150           uint16_t Machine = COFF::MT_Invalid;
151           if (!getAs(Value, Machine)) {
152             // It's not a raw number, try matching the string.
153             StringRef ValueValue = Value->getValue(Storage);
154             Machine = StringSwitch<COFF::MachineTypes>(ValueValue)
155               .Case( "IMAGE_FILE_MACHINE_UNKNOWN"
156                    , COFF::IMAGE_FILE_MACHINE_UNKNOWN)
157               .Case( "IMAGE_FILE_MACHINE_AM33"
158                    , COFF::IMAGE_FILE_MACHINE_AM33)
159               .Case( "IMAGE_FILE_MACHINE_AMD64"
160                    , COFF::IMAGE_FILE_MACHINE_AMD64)
161               .Case( "IMAGE_FILE_MACHINE_ARM"
162                    , COFF::IMAGE_FILE_MACHINE_ARM)
163               .Case( "IMAGE_FILE_MACHINE_ARMV7"
164                    , COFF::IMAGE_FILE_MACHINE_ARMV7)
165               .Case( "IMAGE_FILE_MACHINE_EBC"
166                    , COFF::IMAGE_FILE_MACHINE_EBC)
167               .Case( "IMAGE_FILE_MACHINE_I386"
168                    , COFF::IMAGE_FILE_MACHINE_I386)
169               .Case( "IMAGE_FILE_MACHINE_IA64"
170                    , COFF::IMAGE_FILE_MACHINE_IA64)
171               .Case( "IMAGE_FILE_MACHINE_M32R"
172                    , COFF::IMAGE_FILE_MACHINE_M32R)
173               .Case( "IMAGE_FILE_MACHINE_MIPS16"
174                    , COFF::IMAGE_FILE_MACHINE_MIPS16)
175               .Case( "IMAGE_FILE_MACHINE_MIPSFPU"
176                    , COFF::IMAGE_FILE_MACHINE_MIPSFPU)
177               .Case( "IMAGE_FILE_MACHINE_MIPSFPU16"
178                    , COFF::IMAGE_FILE_MACHINE_MIPSFPU16)
179               .Case( "IMAGE_FILE_MACHINE_POWERPC"
180                    , COFF::IMAGE_FILE_MACHINE_POWERPC)
181               .Case( "IMAGE_FILE_MACHINE_POWERPCFP"
182                    , COFF::IMAGE_FILE_MACHINE_POWERPCFP)
183               .Case( "IMAGE_FILE_MACHINE_R4000"
184                    , COFF::IMAGE_FILE_MACHINE_R4000)
185               .Case( "IMAGE_FILE_MACHINE_SH3"
186                    , COFF::IMAGE_FILE_MACHINE_SH3)
187               .Case( "IMAGE_FILE_MACHINE_SH3DSP"
188                    , COFF::IMAGE_FILE_MACHINE_SH3DSP)
189               .Case( "IMAGE_FILE_MACHINE_SH4"
190                    , COFF::IMAGE_FILE_MACHINE_SH4)
191               .Case( "IMAGE_FILE_MACHINE_SH5"
192                    , COFF::IMAGE_FILE_MACHINE_SH5)
193               .Case( "IMAGE_FILE_MACHINE_THUMB"
194                    , COFF::IMAGE_FILE_MACHINE_THUMB)
195               .Case( "IMAGE_FILE_MACHINE_WCEMIPSV2"
196                    , COFF::IMAGE_FILE_MACHINE_WCEMIPSV2)
197               .Default(COFF::MT_Invalid);
198             if (Machine == COFF::MT_Invalid) {
199               YS.printError(Value, "Invalid value for Machine");
200               return false;
201             }
202           }
203           Header.Machine = Machine;
204         } else if (KeyValue == "NumberOfSections") {
205           if (!getAs(Value, Header.NumberOfSections)) {
206               YS.printError(Value, "Invalid value for NumberOfSections");
207               return false;
208           }
209         } else if (KeyValue == "TimeDateStamp") {
210           if (!getAs(Value, Header.TimeDateStamp)) {
211               YS.printError(Value, "Invalid value for TimeDateStamp");
212               return false;
213           }
214         } else if (KeyValue == "PointerToSymbolTable") {
215           if (!getAs(Value, Header.PointerToSymbolTable)) {
216               YS.printError(Value, "Invalid value for PointerToSymbolTable");
217               return false;
218           }
219         } else if (KeyValue == "NumberOfSymbols") {
220           if (!getAs(Value, Header.NumberOfSymbols)) {
221               YS.printError(Value, "Invalid value for NumberOfSymbols");
222               return false;
223           }
224         } else if (KeyValue == "SizeOfOptionalHeader") {
225           if (!getAs(Value, Header.SizeOfOptionalHeader)) {
226               YS.printError(Value, "Invalid value for SizeOfOptionalHeader");
227               return false;
228           }
229         } else {
230           YS.printError(Key, "Unrecognized key in header");
231           return false;
232         }
233       }
234     }
235     return true;
236   }
237
238   bool parseHeaderCharacteristics(yaml::Node *Characteristics) {
239     yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(Characteristics);
240     yaml::SequenceNode *SeqValue
241       = dyn_cast<yaml::SequenceNode>(Characteristics);
242     if (!Value && !SeqValue) {
243       YS.printError(Characteristics,
244         "Characteristics must either be a number or sequence");
245       return false;
246     }
247     if (Value) {
248       if (!getAs(Value, Header.Characteristics)) {
249         YS.printError(Value, "Invalid value for Characteristics");
250         return false;
251       }
252     } else {
253       for (yaml::SequenceNode::iterator ci = SeqValue->begin(),
254                                         ce = SeqValue->end();
255                                         ci != ce; ++ci) {
256         yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci);
257         if (!CharValue) {
258           YS.printError(CharValue,
259             "Characteristics must be scalar values");
260           return false;
261         }
262         SmallString<32> Storage;
263         StringRef Char = CharValue->getValue(Storage);
264         uint16_t Characteristic = StringSwitch<COFF::Characteristics>(Char)
265           .Case( "IMAGE_FILE_RELOCS_STRIPPED"
266                 , COFF::IMAGE_FILE_RELOCS_STRIPPED)
267           .Case( "IMAGE_FILE_EXECUTABLE_IMAGE"
268                 , COFF::IMAGE_FILE_EXECUTABLE_IMAGE)
269           .Case( "IMAGE_FILE_LINE_NUMS_STRIPPED"
270                 , COFF::IMAGE_FILE_LINE_NUMS_STRIPPED)
271           .Case( "IMAGE_FILE_LOCAL_SYMS_STRIPPED"
272                 , COFF::IMAGE_FILE_LOCAL_SYMS_STRIPPED)
273           .Case( "IMAGE_FILE_AGGRESSIVE_WS_TRIM"
274                 , COFF::IMAGE_FILE_AGGRESSIVE_WS_TRIM)
275           .Case( "IMAGE_FILE_LARGE_ADDRESS_AWARE"
276                 , COFF::IMAGE_FILE_LARGE_ADDRESS_AWARE)
277           .Case( "IMAGE_FILE_BYTES_REVERSED_LO"
278                 , COFF::IMAGE_FILE_BYTES_REVERSED_LO)
279           .Case( "IMAGE_FILE_32BIT_MACHINE"
280                 , COFF::IMAGE_FILE_32BIT_MACHINE)
281           .Case( "IMAGE_FILE_DEBUG_STRIPPED"
282                 , COFF::IMAGE_FILE_DEBUG_STRIPPED)
283           .Case( "IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP"
284                 , COFF::IMAGE_FILE_REMOVABLE_RUN_FROM_SWAP)
285           .Case( "IMAGE_FILE_SYSTEM"
286                 , COFF::IMAGE_FILE_SYSTEM)
287           .Case( "IMAGE_FILE_DLL"
288                 , COFF::IMAGE_FILE_DLL)
289           .Case( "IMAGE_FILE_UP_SYSTEM_ONLY"
290                 , COFF::IMAGE_FILE_UP_SYSTEM_ONLY)
291           .Default(COFF::C_Invalid);
292         if (Characteristic == COFF::C_Invalid) {
293           // TODO: Typo-correct.
294           YS.printError(CharValue,
295             "Invalid value for Characteristic");
296           return false;
297         }
298         Header.Characteristics |= Characteristic;
299       }
300     }
301     return true;
302   }
303
304   bool parseSections(yaml::Node *SectionsN) {
305     yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SectionsN);
306     if (!SN) {
307       YS.printError(SectionsN, "Sections must be a sequence");
308       return false;
309     }
310     for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end();
311                                       i != e; ++i) {
312       Section Sec;
313       std::memset(&Sec.Header, 0, sizeof(Sec.Header));
314       yaml::MappingNode *SecMap = dyn_cast<yaml::MappingNode>(&*i);
315       if (!SecMap) {
316         YS.printError(&*i, "Section entry must be a map");
317         return false;
318       }
319       for (yaml::MappingNode::iterator si = SecMap->begin(), se = SecMap->end();
320                                        si != se; ++si) {
321         yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey());
322         if (!Key) {
323           YS.printError(si->getKey(), "Keys must be scalar values");
324           return false;
325         }
326         SmallString<32> Storage;
327         StringRef KeyValue = Key->getValue(Storage);
328
329         yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
330         if (KeyValue == "Name") {
331           // If the name is less than 8 bytes, store it in place, otherwise
332           // store it in the string table.
333           StringRef Name = Value->getValue(Storage);
334           std::fill_n(Sec.Header.Name, unsigned(COFF::NameSize), 0);
335           if (Name.size() <= COFF::NameSize) {
336             std::copy(Name.begin(), Name.end(), Sec.Header.Name);
337           } else {
338             // Add string to the string table and format the index for output.
339             unsigned Index = getStringIndex(Name);
340             std::string str = utostr(Index);
341             if (str.size() > 7) {
342               YS.printError(Value, "String table got too large");
343               return false;
344             }
345             Sec.Header.Name[0] = '/';
346             std::copy(str.begin(), str.end(), Sec.Header.Name + 1);
347           }
348         } else if (KeyValue == "VirtualSize") {
349           if (!getAs(Value, Sec.Header.VirtualSize)) {
350             YS.printError(Value, "Invalid value for VirtualSize");
351             return false;
352           }
353         } else if (KeyValue == "VirtualAddress") {
354           if (!getAs(Value, Sec.Header.VirtualAddress)) {
355             YS.printError(Value, "Invalid value for VirtualAddress");
356             return false;
357           }
358         } else if (KeyValue == "SizeOfRawData") {
359           if (!getAs(Value, Sec.Header.SizeOfRawData)) {
360             YS.printError(Value, "Invalid value for SizeOfRawData");
361             return false;
362           }
363         } else if (KeyValue == "PointerToRawData") {
364           if (!getAs(Value, Sec.Header.PointerToRawData)) {
365             YS.printError(Value, "Invalid value for PointerToRawData");
366             return false;
367           }
368         } else if (KeyValue == "PointerToRelocations") {
369           if (!getAs(Value, Sec.Header.PointerToRelocations)) {
370             YS.printError(Value, "Invalid value for PointerToRelocations");
371             return false;
372           }
373         } else if (KeyValue == "PointerToLineNumbers") {
374           if (!getAs(Value, Sec.Header.PointerToLineNumbers)) {
375             YS.printError(Value, "Invalid value for PointerToLineNumbers");
376             return false;
377           }
378         } else if (KeyValue == "NumberOfRelocations") {
379           if (!getAs(Value, Sec.Header.NumberOfRelocations)) {
380             YS.printError(Value, "Invalid value for NumberOfRelocations");
381             return false;
382           }
383         } else if (KeyValue == "NumberOfLineNumbers") {
384           if (!getAs(Value, Sec.Header.NumberOfLineNumbers)) {
385             YS.printError(Value, "Invalid value for NumberOfLineNumbers");
386             return false;
387           }
388         } else if (KeyValue == "Characteristics") {
389           yaml::SequenceNode *SeqValue
390             = dyn_cast<yaml::SequenceNode>(si->getValue());
391           if (!Value && !SeqValue) {
392             YS.printError(si->getValue(),
393               "Characteristics must either be a number or sequence");
394             return false;
395           }
396           if (Value) {
397             if (!getAs(Value, Sec.Header.Characteristics)) {
398               YS.printError(Value, "Invalid value for Characteristics");
399               return false;
400             }
401           } else {
402             for (yaml::SequenceNode::iterator ci = SeqValue->begin(),
403                                               ce = SeqValue->end();
404                                               ci != ce; ++ci) {
405               yaml::ScalarNode *CharValue = dyn_cast<yaml::ScalarNode>(&*ci);
406               if (!CharValue) {
407                 YS.printError(CharValue, "Invalid value for Characteristics");
408                 return false;
409               }
410               StringRef Char = CharValue->getValue(Storage);
411               uint32_t Characteristic =
412                 StringSwitch<COFF::SectionCharacteristics>(Char)
413                 .Case( "IMAGE_SCN_TYPE_NO_PAD"
414                      , COFF::IMAGE_SCN_TYPE_NO_PAD)
415                 .Case( "IMAGE_SCN_CNT_CODE"
416                      , COFF::IMAGE_SCN_CNT_CODE)
417                 .Case( "IMAGE_SCN_CNT_INITIALIZED_DATA"
418                      , COFF::IMAGE_SCN_CNT_INITIALIZED_DATA)
419                 .Case( "IMAGE_SCN_CNT_UNINITIALIZED_DATA"
420                      , COFF::IMAGE_SCN_CNT_UNINITIALIZED_DATA)
421                 .Case( "IMAGE_SCN_LNK_OTHER"
422                      , COFF::IMAGE_SCN_LNK_OTHER)
423                 .Case( "IMAGE_SCN_LNK_INFO"
424                      , COFF::IMAGE_SCN_LNK_INFO)
425                 .Case( "IMAGE_SCN_LNK_REMOVE"
426                      , COFF::IMAGE_SCN_LNK_REMOVE)
427                 .Case( "IMAGE_SCN_LNK_COMDAT"
428                      , COFF::IMAGE_SCN_LNK_COMDAT)
429                 .Case( "IMAGE_SCN_GPREL"
430                      , COFF::IMAGE_SCN_GPREL)
431                 .Case( "IMAGE_SCN_MEM_PURGEABLE"
432                      , COFF::IMAGE_SCN_MEM_PURGEABLE)
433                 .Case( "IMAGE_SCN_MEM_16BIT"
434                      , COFF::IMAGE_SCN_MEM_16BIT)
435                 .Case( "IMAGE_SCN_MEM_LOCKED"
436                      , COFF::IMAGE_SCN_MEM_LOCKED)
437                 .Case( "IMAGE_SCN_MEM_PRELOAD"
438                      , COFF::IMAGE_SCN_MEM_PRELOAD)
439                 .Case( "IMAGE_SCN_ALIGN_1BYTES"
440                      , COFF::IMAGE_SCN_ALIGN_1BYTES)
441                 .Case( "IMAGE_SCN_ALIGN_2BYTES"
442                      , COFF::IMAGE_SCN_ALIGN_2BYTES)
443                 .Case( "IMAGE_SCN_ALIGN_4BYTES"
444                      , COFF::IMAGE_SCN_ALIGN_4BYTES)
445                 .Case( "IMAGE_SCN_ALIGN_8BYTES"
446                      , COFF::IMAGE_SCN_ALIGN_8BYTES)
447                 .Case( "IMAGE_SCN_ALIGN_16BYTES"
448                      , COFF::IMAGE_SCN_ALIGN_16BYTES)
449                 .Case( "IMAGE_SCN_ALIGN_32BYTES"
450                      , COFF::IMAGE_SCN_ALIGN_32BYTES)
451                 .Case( "IMAGE_SCN_ALIGN_64BYTES"
452                      , COFF::IMAGE_SCN_ALIGN_64BYTES)
453                 .Case( "IMAGE_SCN_ALIGN_128BYTES"
454                      , COFF::IMAGE_SCN_ALIGN_128BYTES)
455                 .Case( "IMAGE_SCN_ALIGN_256BYTES"
456                      , COFF::IMAGE_SCN_ALIGN_256BYTES)
457                 .Case( "IMAGE_SCN_ALIGN_512BYTES"
458                      , COFF::IMAGE_SCN_ALIGN_512BYTES)
459                 .Case( "IMAGE_SCN_ALIGN_1024BYTES"
460                      , COFF::IMAGE_SCN_ALIGN_1024BYTES)
461                 .Case( "IMAGE_SCN_ALIGN_2048BYTES"
462                      , COFF::IMAGE_SCN_ALIGN_2048BYTES)
463                 .Case( "IMAGE_SCN_ALIGN_4096BYTES"
464                      , COFF::IMAGE_SCN_ALIGN_4096BYTES)
465                 .Case( "IMAGE_SCN_ALIGN_8192BYTES"
466                      , COFF::IMAGE_SCN_ALIGN_8192BYTES)
467                 .Case( "IMAGE_SCN_LNK_NRELOC_OVFL"
468                      , COFF::IMAGE_SCN_LNK_NRELOC_OVFL)
469                 .Case( "IMAGE_SCN_MEM_DISCARDABLE"
470                      , COFF::IMAGE_SCN_MEM_DISCARDABLE)
471                 .Case( "IMAGE_SCN_MEM_NOT_CACHED"
472                      , COFF::IMAGE_SCN_MEM_NOT_CACHED)
473                 .Case( "IMAGE_SCN_MEM_NOT_PAGED"
474                      , COFF::IMAGE_SCN_MEM_NOT_PAGED)
475                 .Case( "IMAGE_SCN_MEM_SHARED"
476                      , COFF::IMAGE_SCN_MEM_SHARED)
477                 .Case( "IMAGE_SCN_MEM_EXECUTE"
478                      , COFF::IMAGE_SCN_MEM_EXECUTE)
479                 .Case( "IMAGE_SCN_MEM_READ"
480                      , COFF::IMAGE_SCN_MEM_READ)
481                 .Case( "IMAGE_SCN_MEM_WRITE"
482                      , COFF::IMAGE_SCN_MEM_WRITE)
483                 .Default(COFF::SC_Invalid);
484               if (Characteristic == COFF::SC_Invalid) {
485                 YS.printError(CharValue, "Invalid value for Characteristic");
486                 return false;
487               }
488               Sec.Header.Characteristics |= Characteristic;
489             }
490           }
491         } else if (KeyValue == "SectionData") {
492           yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
493           SmallString<32> Storage;
494           StringRef Data = Value->getValue(Storage);
495           if (!hexStringToByteArray(Data, Sec.Data)) {
496             YS.printError(Value, "SectionData must be a collection of pairs of"
497                                  "hex bytes");
498             return false;
499           }
500         } else
501           si->skip();
502       }
503       Sections.push_back(Sec);
504     }
505     return true;
506   }
507
508   bool parseSymbols(yaml::Node *SymbolsN) {
509     yaml::SequenceNode *SN = dyn_cast<yaml::SequenceNode>(SymbolsN);
510     if (!SN) {
511       YS.printError(SymbolsN, "Symbols must be a sequence");
512       return false;
513     }
514     for (yaml::SequenceNode::iterator i = SN->begin(), e = SN->end();
515                                       i != e; ++i) {
516       Symbol Sym;
517       std::memset(&Sym.Header, 0, sizeof(Sym.Header));
518       yaml::MappingNode *SymMap = dyn_cast<yaml::MappingNode>(&*i);
519       if (!SymMap) {
520         YS.printError(&*i, "Symbol must be a map");
521         return false;
522       }
523       for (yaml::MappingNode::iterator si = SymMap->begin(), se = SymMap->end();
524                                        si != se; ++si) {
525         yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(si->getKey());
526         if (!Key) {
527           YS.printError(si->getKey(), "Keys must be scalar values");
528           return false;
529         }
530         SmallString<32> Storage;
531         StringRef KeyValue = Key->getValue(Storage);
532
533         yaml::ScalarNode *Value = dyn_cast<yaml::ScalarNode>(si->getValue());
534         if (!Value) {
535           YS.printError(si->getValue(), "Must be a scalar value");
536           return false;
537         }
538         if (KeyValue == "Name") {
539           // If the name is less than 8 bytes, store it in place, otherwise
540           // store it in the string table.
541           StringRef Name = Value->getValue(Storage);
542           std::fill_n(Sym.Header.Name, unsigned(COFF::NameSize), 0);
543           if (Name.size() <= COFF::NameSize) {
544             std::copy(Name.begin(), Name.end(), Sym.Header.Name);
545           } else {
546             // Add string to the string table and format the index for output.
547             unsigned Index = getStringIndex(Name);
548             *reinterpret_cast<support::aligned_ulittle32_t*>(
549               Sym.Header.Name + 4) = Index;
550           }
551         } else if (KeyValue == "Value") {
552           if (!getAs(Value, Sym.Header.Value)) {
553             YS.printError(Value, "Invalid value for Value");
554             return false;
555           }
556         } else if (KeyValue == "SimpleType") {
557           Sym.Header.Type |= StringSwitch<COFF::SymbolBaseType>(
558             Value->getValue(Storage))
559             .Case("IMAGE_SYM_TYPE_NULL", COFF::IMAGE_SYM_TYPE_NULL)
560             .Case("IMAGE_SYM_TYPE_VOID", COFF::IMAGE_SYM_TYPE_VOID)
561             .Case("IMAGE_SYM_TYPE_CHAR", COFF::IMAGE_SYM_TYPE_CHAR)
562             .Case("IMAGE_SYM_TYPE_SHORT", COFF::IMAGE_SYM_TYPE_SHORT)
563             .Case("IMAGE_SYM_TYPE_INT", COFF::IMAGE_SYM_TYPE_INT)
564             .Case("IMAGE_SYM_TYPE_LONG", COFF::IMAGE_SYM_TYPE_LONG)
565             .Case("IMAGE_SYM_TYPE_FLOAT", COFF::IMAGE_SYM_TYPE_FLOAT)
566             .Case("IMAGE_SYM_TYPE_DOUBLE", COFF::IMAGE_SYM_TYPE_DOUBLE)
567             .Case("IMAGE_SYM_TYPE_STRUCT", COFF::IMAGE_SYM_TYPE_STRUCT)
568             .Case("IMAGE_SYM_TYPE_UNION", COFF::IMAGE_SYM_TYPE_UNION)
569             .Case("IMAGE_SYM_TYPE_ENUM", COFF::IMAGE_SYM_TYPE_ENUM)
570             .Case("IMAGE_SYM_TYPE_MOE", COFF::IMAGE_SYM_TYPE_MOE)
571             .Case("IMAGE_SYM_TYPE_BYTE", COFF::IMAGE_SYM_TYPE_BYTE)
572             .Case("IMAGE_SYM_TYPE_WORD", COFF::IMAGE_SYM_TYPE_WORD)
573             .Case("IMAGE_SYM_TYPE_UINT", COFF::IMAGE_SYM_TYPE_UINT)
574             .Case("IMAGE_SYM_TYPE_DWORD", COFF::IMAGE_SYM_TYPE_DWORD)
575             .Default(COFF::IMAGE_SYM_TYPE_NULL);
576         } else if (KeyValue == "ComplexType") {
577           Sym.Header.Type |= StringSwitch<COFF::SymbolComplexType>(
578             Value->getValue(Storage))
579             .Case("IMAGE_SYM_DTYPE_NULL", COFF::IMAGE_SYM_DTYPE_NULL)
580             .Case("IMAGE_SYM_DTYPE_POINTER", COFF::IMAGE_SYM_DTYPE_POINTER)
581             .Case("IMAGE_SYM_DTYPE_FUNCTION", COFF::IMAGE_SYM_DTYPE_FUNCTION)
582             .Case("IMAGE_SYM_DTYPE_ARRAY", COFF::IMAGE_SYM_DTYPE_ARRAY)
583             .Default(COFF::IMAGE_SYM_DTYPE_NULL)
584             << COFF::SCT_COMPLEX_TYPE_SHIFT;
585         } else if (KeyValue == "StorageClass") {
586           Sym.Header.StorageClass = StringSwitch<COFF::SymbolStorageClass>(
587             Value->getValue(Storage))
588             .Case( "IMAGE_SYM_CLASS_END_OF_FUNCTION"
589                  , COFF::IMAGE_SYM_CLASS_END_OF_FUNCTION)
590             .Case( "IMAGE_SYM_CLASS_NULL"
591                  , COFF::IMAGE_SYM_CLASS_NULL)
592             .Case( "IMAGE_SYM_CLASS_AUTOMATIC"
593                  , COFF::IMAGE_SYM_CLASS_AUTOMATIC)
594             .Case( "IMAGE_SYM_CLASS_EXTERNAL"
595                  , COFF::IMAGE_SYM_CLASS_EXTERNAL)
596             .Case( "IMAGE_SYM_CLASS_STATIC"
597                  , COFF::IMAGE_SYM_CLASS_STATIC)
598             .Case( "IMAGE_SYM_CLASS_REGISTER"
599                  , COFF::IMAGE_SYM_CLASS_REGISTER)
600             .Case( "IMAGE_SYM_CLASS_EXTERNAL_DEF"
601                  , COFF::IMAGE_SYM_CLASS_EXTERNAL_DEF)
602             .Case( "IMAGE_SYM_CLASS_LABEL"
603                  , COFF::IMAGE_SYM_CLASS_LABEL)
604             .Case( "IMAGE_SYM_CLASS_UNDEFINED_LABEL"
605                  , COFF::IMAGE_SYM_CLASS_UNDEFINED_LABEL)
606             .Case( "IMAGE_SYM_CLASS_MEMBER_OF_STRUCT"
607                  , COFF::IMAGE_SYM_CLASS_MEMBER_OF_STRUCT)
608             .Case( "IMAGE_SYM_CLASS_ARGUMENT"
609                  , COFF::IMAGE_SYM_CLASS_ARGUMENT)
610             .Case( "IMAGE_SYM_CLASS_STRUCT_TAG"
611                  , COFF::IMAGE_SYM_CLASS_STRUCT_TAG)
612             .Case( "IMAGE_SYM_CLASS_MEMBER_OF_UNION"
613                  , COFF::IMAGE_SYM_CLASS_MEMBER_OF_UNION)
614             .Case( "IMAGE_SYM_CLASS_UNION_TAG"
615                  , COFF::IMAGE_SYM_CLASS_UNION_TAG)
616             .Case( "IMAGE_SYM_CLASS_TYPE_DEFINITION"
617                  , COFF::IMAGE_SYM_CLASS_TYPE_DEFINITION)
618             .Case( "IMAGE_SYM_CLASS_UNDEFINED_STATIC"
619                  , COFF::IMAGE_SYM_CLASS_UNDEFINED_STATIC)
620             .Case( "IMAGE_SYM_CLASS_ENUM_TAG"
621                  , COFF::IMAGE_SYM_CLASS_ENUM_TAG)
622             .Case( "IMAGE_SYM_CLASS_MEMBER_OF_ENUM"
623                  , COFF::IMAGE_SYM_CLASS_MEMBER_OF_ENUM)
624             .Case( "IMAGE_SYM_CLASS_REGISTER_PARAM"
625                  , COFF::IMAGE_SYM_CLASS_REGISTER_PARAM)
626             .Case( "IMAGE_SYM_CLASS_BIT_FIELD"
627                  , COFF::IMAGE_SYM_CLASS_BIT_FIELD)
628             .Case( "IMAGE_SYM_CLASS_BLOCK"
629                  , COFF::IMAGE_SYM_CLASS_BLOCK)
630             .Case( "IMAGE_SYM_CLASS_FUNCTION"
631                  , COFF::IMAGE_SYM_CLASS_FUNCTION)
632             .Case( "IMAGE_SYM_CLASS_END_OF_STRUCT"
633                  , COFF::IMAGE_SYM_CLASS_END_OF_STRUCT)
634             .Case( "IMAGE_SYM_CLASS_FILE"
635                  , COFF::IMAGE_SYM_CLASS_FILE)
636             .Case( "IMAGE_SYM_CLASS_SECTION"
637                  , COFF::IMAGE_SYM_CLASS_SECTION)
638             .Case( "IMAGE_SYM_CLASS_WEAK_EXTERNAL"
639                  , COFF::IMAGE_SYM_CLASS_WEAK_EXTERNAL)
640             .Case( "IMAGE_SYM_CLASS_CLR_TOKEN"
641                  , COFF::IMAGE_SYM_CLASS_CLR_TOKEN)
642             .Default(COFF::SSC_Invalid);
643           if (Sym.Header.StorageClass == COFF::SSC_Invalid) {
644             YS.printError(Value, "Invalid value for StorageClass");
645             return false;
646           }
647         } else if (KeyValue == "SectionNumber") {
648           if (!getAs(Value, Sym.Header.SectionNumber)) {
649               YS.printError(Value, "Invalid value for SectionNumber");
650               return false;
651           }
652         } else if (KeyValue == "AuxillaryData") {
653           StringRef Data = Value->getValue(Storage);
654           if (!hexStringToByteArray(Data, Sym.AuxSymbols)) {
655             YS.printError(Value, "AuxillaryData must be a collection of pairs"
656                                  "of hex bytes");
657             return false;
658           }
659         } else
660           si->skip();
661       }
662       Symbols.push_back(Sym);
663     }
664     return true;
665   }
666
667   bool parse() {
668     yaml::Document &D = *YS.begin();
669     yaml::MappingNode *Root = dyn_cast<yaml::MappingNode>(D.getRoot());
670     if (!Root) {
671       YS.printError(D.getRoot(), "Root node must be a map");
672       return false;
673     }
674     for (yaml::MappingNode::iterator i = Root->begin(), e = Root->end();
675                                      i != e; ++i) {
676       yaml::ScalarNode *Key = dyn_cast<yaml::ScalarNode>(i->getKey());
677       if (!Key) {
678         YS.printError(i->getKey(), "Keys must be scalar values");
679         return false;
680       }
681       SmallString<32> Storage;
682       StringRef KeyValue = Key->getValue(Storage);
683       if (KeyValue == "header") {
684         if (!parseHeader(i->getValue()))
685           return false;
686       } else if (KeyValue == "sections") {
687         if (!parseSections(i->getValue()))
688           return false;
689       } else if (KeyValue == "symbols") {
690         if (!parseSymbols(i->getValue()))
691           return false;
692       }
693     }
694     return !YS.failed();
695   }
696
697   unsigned getStringIndex(StringRef Str) {
698     StringMap<unsigned>::iterator i = StringTableMap.find(Str);
699     if (i == StringTableMap.end()) {
700       unsigned Index = StringTable.size();
701       StringTable.append(Str.begin(), Str.end());
702       StringTable.push_back(0);
703       StringTableMap[Str] = Index;
704       return Index;
705     }
706     return i->second;
707   }
708
709   yaml::Stream &YS;
710   COFF::header Header;
711
712   struct Section {
713     COFF::section Header;
714     std::vector<uint8_t> Data;
715     std::vector<COFF::relocation> Relocations;
716   };
717
718   struct Symbol {
719     COFF::symbol Header;
720     std::vector<uint8_t> AuxSymbols;
721   };
722
723   std::vector<Section> Sections;
724   std::vector<Symbol> Symbols;
725   StringMap<unsigned> StringTableMap;
726   std::string StringTable;
727 };
728
729 // Take a CP and assign addresses and sizes to everything. Returns false if the
730 // layout is not valid to do.
731 static bool layoutCOFF(COFFParser &CP) {
732   uint32_t SectionTableStart = 0;
733   uint32_t SectionTableSize  = 0;
734
735   // The section table starts immediately after the header, including the
736   // optional header.
737   SectionTableStart = sizeof(COFF::header) + CP.Header.SizeOfOptionalHeader;
738   SectionTableSize = sizeof(COFF::section) * CP.Sections.size();
739
740   uint32_t CurrentSectionDataOffset = SectionTableStart + SectionTableSize;
741
742   // Assign each section data address consecutively.
743   for (std::vector<COFFParser::Section>::iterator i = CP.Sections.begin(),
744                                                   e = CP.Sections.end();
745                                                   i != e; ++i) {
746     if (!i->Data.empty()) {
747       i->Header.SizeOfRawData = i->Data.size();
748       i->Header.PointerToRawData = CurrentSectionDataOffset;
749       CurrentSectionDataOffset += i->Header.SizeOfRawData;
750       // TODO: Handle alignment.
751     } else {
752       i->Header.SizeOfRawData = 0;
753       i->Header.PointerToRawData = 0;
754     }
755   }
756
757   uint32_t SymbolTableStart = CurrentSectionDataOffset;
758
759   // Calculate number of symbols.
760   uint32_t NumberOfSymbols = 0;
761   for (std::vector<COFFParser::Symbol>::iterator i = CP.Symbols.begin(),
762                                                  e = CP.Symbols.end();
763                                                  i != e; ++i) {
764     if (i->AuxSymbols.size() % COFF::SymbolSize != 0) {
765       errs() << "AuxillaryData size not a multiple of symbol size!\n";
766       return false;
767     }
768     i->Header.NumberOfAuxSymbols = i->AuxSymbols.size() / COFF::SymbolSize;
769     NumberOfSymbols += 1 + i->Header.NumberOfAuxSymbols;
770   }
771
772   // Store all the allocated start addresses in the header.
773   CP.Header.NumberOfSections = CP.Sections.size();
774   CP.Header.NumberOfSymbols = NumberOfSymbols;
775   CP.Header.PointerToSymbolTable = SymbolTableStart;
776
777   *reinterpret_cast<support::ulittle32_t *>(&CP.StringTable[0])
778     = CP.StringTable.size();
779
780   return true;
781 }
782
783 template <typename value_type>
784 struct binary_le_impl {
785   value_type Value;
786   binary_le_impl(value_type V) : Value(V) {}
787 };
788
789 template <typename value_type>
790 raw_ostream &operator <<( raw_ostream &OS
791                         , const binary_le_impl<value_type> &BLE) {
792   char Buffer[sizeof(BLE.Value)];
793   support::endian::write_le<value_type, support::unaligned>(Buffer, BLE.Value);
794   OS.write(Buffer, sizeof(BLE.Value));
795   return OS;
796 }
797
798 template <typename value_type>
799 binary_le_impl<value_type> binary_le(value_type V) {
800   return binary_le_impl<value_type>(V);
801 }
802
803 void writeCOFF(COFFParser &CP, raw_ostream &OS) {
804   OS << binary_le(CP.Header.Machine)
805      << binary_le(CP.Header.NumberOfSections)
806      << binary_le(CP.Header.TimeDateStamp)
807      << binary_le(CP.Header.PointerToSymbolTable)
808      << binary_le(CP.Header.NumberOfSymbols)
809      << binary_le(CP.Header.SizeOfOptionalHeader)
810      << binary_le(CP.Header.Characteristics);
811
812   // Output section table.
813   for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(),
814                                                         e = CP.Sections.end();
815                                                         i != e; ++i) {
816     OS.write(i->Header.Name, COFF::NameSize);
817     OS << binary_le(i->Header.VirtualSize)
818        << binary_le(i->Header.VirtualAddress)
819        << binary_le(i->Header.SizeOfRawData)
820        << binary_le(i->Header.PointerToRawData)
821        << binary_le(i->Header.PointerToRelocations)
822        << binary_le(i->Header.PointerToLineNumbers)
823        << binary_le(i->Header.NumberOfRelocations)
824        << binary_le(i->Header.NumberOfLineNumbers)
825        << binary_le(i->Header.Characteristics);
826   }
827
828   // Output section data.
829   for (std::vector<COFFParser::Section>::const_iterator i = CP.Sections.begin(),
830                                                         e = CP.Sections.end();
831                                                         i != e; ++i) {
832     if (!i->Data.empty())
833       OS.write(reinterpret_cast<const char*>(&i->Data[0]), i->Data.size());
834   }
835
836   // Output symbol table.
837
838   for (std::vector<COFFParser::Symbol>::const_iterator i = CP.Symbols.begin(),
839                                                        e = CP.Symbols.end();
840                                                        i != e; ++i) {
841     OS.write(i->Header.Name, COFF::NameSize);
842     OS << binary_le(i->Header.Value)
843        << binary_le(i->Header.SectionNumber)
844        << binary_le(i->Header.Type)
845        << binary_le(i->Header.StorageClass)
846        << binary_le(i->Header.NumberOfAuxSymbols);
847     if (!i->AuxSymbols.empty())
848       OS.write( reinterpret_cast<const char*>(&i->AuxSymbols[0])
849               , i->AuxSymbols.size());
850   }
851
852   // Output string table.
853   OS.write(&CP.StringTable[0], CP.StringTable.size());
854 }
855
856 int main(int argc, char **argv) {
857   cl::ParseCommandLineOptions(argc, argv);
858   sys::PrintStackTraceOnErrorSignal();
859   PrettyStackTraceProgram X(argc, argv);
860   llvm_shutdown_obj Y;  // Call llvm_shutdown() on exit.
861
862   OwningPtr<MemoryBuffer> Buf;
863   if (MemoryBuffer::getFileOrSTDIN(Input, Buf))
864     return 1;
865
866   SourceMgr SM;
867   yaml::Stream S(Buf->getBuffer(), SM);
868   COFFParser CP(S);
869   if (!CP.parse()) {
870     errs() << "yaml2obj: Failed to parse YAML file!\n";
871     return 1;
872   }
873   if (!layoutCOFF(CP)) {
874     errs() << "yaml2obj: Failed to layout COFF file!\n";
875     return 1;
876   }
877   writeCOFF(CP, outs());
878 }