1 //===-- ObjectFileMachO.cpp -------------------------------------*- C++ -*-===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 
10 #include "llvm/ADT/StringRef.h"
11 #include "llvm/Support/MachO.h"
12 
13 #include "ObjectFileMachO.h"
14 
15 #include "lldb/lldb-private-log.h"
16 #include "lldb/Core/ArchSpec.h"
17 #include "lldb/Core/DataBuffer.h"
18 #include "lldb/Core/Debugger.h"
19 #include "lldb/Core/FileSpecList.h"
20 #include "lldb/Core/Log.h"
21 #include "lldb/Core/Module.h"
22 #include "lldb/Core/ModuleSpec.h"
23 #include "lldb/Core/PluginManager.h"
24 #include "lldb/Core/RangeMap.h"
25 #include "lldb/Core/Section.h"
26 #include "lldb/Core/StreamFile.h"
27 #include "lldb/Core/StreamString.h"
28 #include "lldb/Core/Timer.h"
29 #include "lldb/Core/UUID.h"
30 #include "lldb/Host/Host.h"
31 #include "lldb/Host/FileSpec.h"
32 #include "lldb/Symbol/ClangNamespaceDecl.h"
33 #include "lldb/Symbol/DWARFCallFrameInfo.h"
34 #include "lldb/Symbol/ObjectFile.h"
35 #include "lldb/Target/Platform.h"
36 #include "lldb/Target/Process.h"
37 #include "lldb/Target/Target.h"
38 #include "Plugins/Process/Utility/RegisterContextDarwin_arm.h"
39 #include "Plugins/Process/Utility/RegisterContextDarwin_i386.h"
40 #include "Plugins/Process/Utility/RegisterContextDarwin_x86_64.h"
41 
42 #if defined (__APPLE__) && defined (__arm__)
43 // GetLLDBSharedCacheUUID() needs to call dlsym()
44 #include <dlfcn.h>
45 #endif
46 
47 #ifndef __APPLE__
48 #include "Utility/UuidCompatibility.h"
49 #endif
50 
51 using namespace lldb;
52 using namespace lldb_private;
53 using namespace llvm::MachO;
54 
55 class RegisterContextDarwin_x86_64_Mach : public RegisterContextDarwin_x86_64
56 {
57 public:
58     RegisterContextDarwin_x86_64_Mach (lldb_private::Thread &thread, const DataExtractor &data) :
59         RegisterContextDarwin_x86_64 (thread, 0)
60     {
61         SetRegisterDataFrom_LC_THREAD (data);
62     }
63 
64     virtual void
65     InvalidateAllRegisters ()
66     {
67         // Do nothing... registers are always valid...
68     }
69 
70     void
71     SetRegisterDataFrom_LC_THREAD (const DataExtractor &data)
72     {
73         lldb::offset_t offset = 0;
74         SetError (GPRRegSet, Read, -1);
75         SetError (FPURegSet, Read, -1);
76         SetError (EXCRegSet, Read, -1);
77         bool done = false;
78 
79         while (!done)
80         {
81             int flavor = data.GetU32 (&offset);
82             if (flavor == 0)
83                 done = true;
84             else
85             {
86                 uint32_t i;
87                 uint32_t count = data.GetU32 (&offset);
88                 switch (flavor)
89                 {
90                     case GPRRegSet:
91                         for (i=0; i<count; ++i)
92                             (&gpr.rax)[i] = data.GetU64(&offset);
93                         SetError (GPRRegSet, Read, 0);
94                         done = true;
95 
96                         break;
97                     case FPURegSet:
98                         // TODO: fill in FPU regs....
99                         //SetError (FPURegSet, Read, -1);
100                         done = true;
101 
102                         break;
103                     case EXCRegSet:
104                         exc.trapno = data.GetU32(&offset);
105                         exc.err = data.GetU32(&offset);
106                         exc.faultvaddr = data.GetU64(&offset);
107                         SetError (EXCRegSet, Read, 0);
108                         done = true;
109                         break;
110                     case 7:
111                     case 8:
112                     case 9:
113                         // fancy flavors that encapsulate of the the above
114                         // falvors...
115                         break;
116 
117                     default:
118                         done = true;
119                         break;
120                 }
121             }
122         }
123     }
124 protected:
125     virtual int
126     DoReadGPR (lldb::tid_t tid, int flavor, GPR &gpr)
127     {
128         return 0;
129     }
130 
131     virtual int
132     DoReadFPU (lldb::tid_t tid, int flavor, FPU &fpu)
133     {
134         return 0;
135     }
136 
137     virtual int
138     DoReadEXC (lldb::tid_t tid, int flavor, EXC &exc)
139     {
140         return 0;
141     }
142 
143     virtual int
144     DoWriteGPR (lldb::tid_t tid, int flavor, const GPR &gpr)
145     {
146         return 0;
147     }
148 
149     virtual int
150     DoWriteFPU (lldb::tid_t tid, int flavor, const FPU &fpu)
151     {
152         return 0;
153     }
154 
155     virtual int
156     DoWriteEXC (lldb::tid_t tid, int flavor, const EXC &exc)
157     {
158         return 0;
159     }
160 };
161 
162 
163 class RegisterContextDarwin_i386_Mach : public RegisterContextDarwin_i386
164 {
165 public:
166     RegisterContextDarwin_i386_Mach (lldb_private::Thread &thread, const DataExtractor &data) :
167     RegisterContextDarwin_i386 (thread, 0)
168     {
169         SetRegisterDataFrom_LC_THREAD (data);
170     }
171 
172     virtual void
173     InvalidateAllRegisters ()
174     {
175         // Do nothing... registers are always valid...
176     }
177 
178     void
179     SetRegisterDataFrom_LC_THREAD (const DataExtractor &data)
180     {
181         lldb::offset_t offset = 0;
182         SetError (GPRRegSet, Read, -1);
183         SetError (FPURegSet, Read, -1);
184         SetError (EXCRegSet, Read, -1);
185         bool done = false;
186 
187         while (!done)
188         {
189             int flavor = data.GetU32 (&offset);
190             if (flavor == 0)
191                 done = true;
192             else
193             {
194                 uint32_t i;
195                 uint32_t count = data.GetU32 (&offset);
196                 switch (flavor)
197                 {
198                     case GPRRegSet:
199                         for (i=0; i<count; ++i)
200                             (&gpr.eax)[i] = data.GetU32(&offset);
201                         SetError (GPRRegSet, Read, 0);
202                         done = true;
203 
204                         break;
205                     case FPURegSet:
206                         // TODO: fill in FPU regs....
207                         //SetError (FPURegSet, Read, -1);
208                         done = true;
209 
210                         break;
211                     case EXCRegSet:
212                         exc.trapno = data.GetU32(&offset);
213                         exc.err = data.GetU32(&offset);
214                         exc.faultvaddr = data.GetU32(&offset);
215                         SetError (EXCRegSet, Read, 0);
216                         done = true;
217                         break;
218                     case 7:
219                     case 8:
220                     case 9:
221                         // fancy flavors that encapsulate of the the above
222                         // falvors...
223                         break;
224 
225                     default:
226                         done = true;
227                         break;
228                 }
229             }
230         }
231     }
232 protected:
233     virtual int
234     DoReadGPR (lldb::tid_t tid, int flavor, GPR &gpr)
235     {
236         return 0;
237     }
238 
239     virtual int
240     DoReadFPU (lldb::tid_t tid, int flavor, FPU &fpu)
241     {
242         return 0;
243     }
244 
245     virtual int
246     DoReadEXC (lldb::tid_t tid, int flavor, EXC &exc)
247     {
248         return 0;
249     }
250 
251     virtual int
252     DoWriteGPR (lldb::tid_t tid, int flavor, const GPR &gpr)
253     {
254         return 0;
255     }
256 
257     virtual int
258     DoWriteFPU (lldb::tid_t tid, int flavor, const FPU &fpu)
259     {
260         return 0;
261     }
262 
263     virtual int
264     DoWriteEXC (lldb::tid_t tid, int flavor, const EXC &exc)
265     {
266         return 0;
267     }
268 };
269 
270 class RegisterContextDarwin_arm_Mach : public RegisterContextDarwin_arm
271 {
272 public:
273     RegisterContextDarwin_arm_Mach (lldb_private::Thread &thread, const DataExtractor &data) :
274         RegisterContextDarwin_arm (thread, 0)
275     {
276         SetRegisterDataFrom_LC_THREAD (data);
277     }
278 
279     virtual void
280     InvalidateAllRegisters ()
281     {
282         // Do nothing... registers are always valid...
283     }
284 
285     void
286     SetRegisterDataFrom_LC_THREAD (const DataExtractor &data)
287     {
288         lldb::offset_t offset = 0;
289         SetError (GPRRegSet, Read, -1);
290         SetError (FPURegSet, Read, -1);
291         SetError (EXCRegSet, Read, -1);
292         bool done = false;
293 
294         while (!done)
295         {
296             int flavor = data.GetU32 (&offset);
297             uint32_t count = data.GetU32 (&offset);
298             lldb::offset_t next_thread_state = offset + (count * 4);
299             switch (flavor)
300             {
301                 case GPRRegSet:
302                     for (uint32_t i=0; i<count; ++i)
303                     {
304                         gpr.r[i] = data.GetU32(&offset);
305                     }
306 
307                     // Note that gpr.cpsr is also copied by the above loop; this loop technically extends
308                     // one element past the end of the gpr.r[] array.
309 
310                     SetError (GPRRegSet, Read, 0);
311                     offset = next_thread_state;
312                     break;
313 
314                 case FPURegSet:
315                     {
316                         uint8_t  *fpu_reg_buf = (uint8_t*) &fpu.floats.s[0];
317                         const int fpu_reg_buf_size = sizeof (fpu.floats);
318                         if (data.ExtractBytes (offset, fpu_reg_buf_size, eByteOrderLittle, fpu_reg_buf) == fpu_reg_buf_size)
319                         {
320                             offset += fpu_reg_buf_size;
321                             fpu.fpscr = data.GetU32(&offset);
322                             SetError (FPURegSet, Read, 0);
323                         }
324                         else
325                         {
326                             done = true;
327                         }
328                     }
329                     offset = next_thread_state;
330                     break;
331 
332                 case EXCRegSet:
333                     if (count == 3)
334                     {
335                         exc.exception = data.GetU32(&offset);
336                         exc.fsr = data.GetU32(&offset);
337                         exc.far = data.GetU32(&offset);
338                         SetError (EXCRegSet, Read, 0);
339                     }
340                     done = true;
341                     offset = next_thread_state;
342                     break;
343 
344                 // Unknown register set flavor, stop trying to parse.
345                 default:
346                     done = true;
347             }
348         }
349     }
350 protected:
351     virtual int
352     DoReadGPR (lldb::tid_t tid, int flavor, GPR &gpr)
353     {
354         return -1;
355     }
356 
357     virtual int
358     DoReadFPU (lldb::tid_t tid, int flavor, FPU &fpu)
359     {
360         return -1;
361     }
362 
363     virtual int
364     DoReadEXC (lldb::tid_t tid, int flavor, EXC &exc)
365     {
366         return -1;
367     }
368 
369     virtual int
370     DoReadDBG (lldb::tid_t tid, int flavor, DBG &dbg)
371     {
372         return -1;
373     }
374 
375     virtual int
376     DoWriteGPR (lldb::tid_t tid, int flavor, const GPR &gpr)
377     {
378         return 0;
379     }
380 
381     virtual int
382     DoWriteFPU (lldb::tid_t tid, int flavor, const FPU &fpu)
383     {
384         return 0;
385     }
386 
387     virtual int
388     DoWriteEXC (lldb::tid_t tid, int flavor, const EXC &exc)
389     {
390         return 0;
391     }
392 
393     virtual int
394     DoWriteDBG (lldb::tid_t tid, int flavor, const DBG &dbg)
395     {
396         return -1;
397     }
398 };
399 
400 static uint32_t
401 MachHeaderSizeFromMagic(uint32_t magic)
402 {
403     switch (magic)
404     {
405         case HeaderMagic32:
406         case HeaderMagic32Swapped:
407             return sizeof(struct mach_header);
408 
409         case HeaderMagic64:
410         case HeaderMagic64Swapped:
411             return sizeof(struct mach_header_64);
412             break;
413 
414         default:
415             break;
416     }
417     return 0;
418 }
419 
420 #define MACHO_NLIST_ARM_SYMBOL_IS_THUMB 0x0008
421 
422 void
423 ObjectFileMachO::Initialize()
424 {
425     PluginManager::RegisterPlugin (GetPluginNameStatic(),
426                                    GetPluginDescriptionStatic(),
427                                    CreateInstance,
428                                    CreateMemoryInstance,
429                                    GetModuleSpecifications);
430 }
431 
432 void
433 ObjectFileMachO::Terminate()
434 {
435     PluginManager::UnregisterPlugin (CreateInstance);
436 }
437 
438 
439 lldb_private::ConstString
440 ObjectFileMachO::GetPluginNameStatic()
441 {
442     static ConstString g_name("mach-o");
443     return g_name;
444 }
445 
446 const char *
447 ObjectFileMachO::GetPluginDescriptionStatic()
448 {
449     return "Mach-o object file reader (32 and 64 bit)";
450 }
451 
452 ObjectFile *
453 ObjectFileMachO::CreateInstance (const lldb::ModuleSP &module_sp,
454                                  DataBufferSP& data_sp,
455                                  lldb::offset_t data_offset,
456                                  const FileSpec* file,
457                                  lldb::offset_t file_offset,
458                                  lldb::offset_t length)
459 {
460     if (!data_sp)
461     {
462         data_sp = file->MemoryMapFileContents(file_offset, length);
463         data_offset = 0;
464     }
465 
466     if (ObjectFileMachO::MagicBytesMatch(data_sp, data_offset, length))
467     {
468         // Update the data to contain the entire file if it doesn't already
469         if (data_sp->GetByteSize() < length)
470         {
471             data_sp = file->MemoryMapFileContents(file_offset, length);
472             data_offset = 0;
473         }
474         std::unique_ptr<ObjectFile> objfile_ap(new ObjectFileMachO (module_sp, data_sp, data_offset, file, file_offset, length));
475         if (objfile_ap.get() && objfile_ap->ParseHeader())
476             return objfile_ap.release();
477     }
478     return NULL;
479 }
480 
481 ObjectFile *
482 ObjectFileMachO::CreateMemoryInstance (const lldb::ModuleSP &module_sp,
483                                        DataBufferSP& data_sp,
484                                        const ProcessSP &process_sp,
485                                        lldb::addr_t header_addr)
486 {
487     if (ObjectFileMachO::MagicBytesMatch(data_sp, 0, data_sp->GetByteSize()))
488     {
489         std::unique_ptr<ObjectFile> objfile_ap(new ObjectFileMachO (module_sp, data_sp, process_sp, header_addr));
490         if (objfile_ap.get() && objfile_ap->ParseHeader())
491             return objfile_ap.release();
492     }
493     return NULL;
494 }
495 
496 size_t
497 ObjectFileMachO::GetModuleSpecifications (const lldb_private::FileSpec& file,
498                                           lldb::DataBufferSP& data_sp,
499                                           lldb::offset_t data_offset,
500                                           lldb::offset_t file_offset,
501                                           lldb::offset_t length,
502                                           lldb_private::ModuleSpecList &specs)
503 {
504     const size_t initial_count = specs.GetSize();
505 
506     if (ObjectFileMachO::MagicBytesMatch(data_sp, 0, data_sp->GetByteSize()))
507     {
508         DataExtractor data;
509         data.SetData(data_sp);
510         llvm::MachO::mach_header header;
511         if (ParseHeader (data, &data_offset, header))
512         {
513             if (header.sizeofcmds >= data_sp->GetByteSize())
514             {
515                 data_sp = file.ReadFileContents(file_offset, header.sizeofcmds);
516                 data_offset = MachHeaderSizeFromMagic(header.magic) + file_offset;
517             }
518             if (data_sp)
519             {
520                 ModuleSpec spec;
521                 spec.GetFileSpec() = file;
522                 spec.GetArchitecture().SetArchitecture(eArchTypeMachO,
523                                                        header.cputype,
524                                                        header.cpusubtype);
525                 if (spec.GetArchitecture().IsValid())
526                 {
527                     GetUUID (header, data, data_offset, spec.GetUUID());
528                     specs.Append(spec);
529                 }
530             }
531         }
532     }
533     return specs.GetSize() - initial_count;
534 }
535 
536 
537 
538 const ConstString &
539 ObjectFileMachO::GetSegmentNameTEXT()
540 {
541     static ConstString g_segment_name_TEXT ("__TEXT");
542     return g_segment_name_TEXT;
543 }
544 
545 const ConstString &
546 ObjectFileMachO::GetSegmentNameDATA()
547 {
548     static ConstString g_segment_name_DATA ("__DATA");
549     return g_segment_name_DATA;
550 }
551 
552 const ConstString &
553 ObjectFileMachO::GetSegmentNameOBJC()
554 {
555     static ConstString g_segment_name_OBJC ("__OBJC");
556     return g_segment_name_OBJC;
557 }
558 
559 const ConstString &
560 ObjectFileMachO::GetSegmentNameLINKEDIT()
561 {
562     static ConstString g_section_name_LINKEDIT ("__LINKEDIT");
563     return g_section_name_LINKEDIT;
564 }
565 
566 const ConstString &
567 ObjectFileMachO::GetSectionNameEHFrame()
568 {
569     static ConstString g_section_name_eh_frame ("__eh_frame");
570     return g_section_name_eh_frame;
571 }
572 
573 bool
574 ObjectFileMachO::MagicBytesMatch (DataBufferSP& data_sp,
575                                   lldb::addr_t data_offset,
576                                   lldb::addr_t data_length)
577 {
578     DataExtractor data;
579     data.SetData (data_sp, data_offset, data_length);
580     lldb::offset_t offset = 0;
581     uint32_t magic = data.GetU32(&offset);
582     return MachHeaderSizeFromMagic(magic) != 0;
583 }
584 
585 
586 ObjectFileMachO::ObjectFileMachO(const lldb::ModuleSP &module_sp,
587                                  DataBufferSP& data_sp,
588                                  lldb::offset_t data_offset,
589                                  const FileSpec* file,
590                                  lldb::offset_t file_offset,
591                                  lldb::offset_t length) :
592     ObjectFile(module_sp, file, file_offset, length, data_sp, data_offset),
593     m_mach_segments(),
594     m_mach_sections(),
595     m_entry_point_address(),
596     m_thread_context_offsets(),
597     m_thread_context_offsets_valid(false)
598 {
599     ::memset (&m_header, 0, sizeof(m_header));
600     ::memset (&m_dysymtab, 0, sizeof(m_dysymtab));
601 }
602 
603 ObjectFileMachO::ObjectFileMachO (const lldb::ModuleSP &module_sp,
604                                   lldb::DataBufferSP& header_data_sp,
605                                   const lldb::ProcessSP &process_sp,
606                                   lldb::addr_t header_addr) :
607     ObjectFile(module_sp, process_sp, header_addr, header_data_sp),
608     m_mach_segments(),
609     m_mach_sections(),
610     m_entry_point_address(),
611     m_thread_context_offsets(),
612     m_thread_context_offsets_valid(false)
613 {
614     ::memset (&m_header, 0, sizeof(m_header));
615     ::memset (&m_dysymtab, 0, sizeof(m_dysymtab));
616 }
617 
618 ObjectFileMachO::~ObjectFileMachO()
619 {
620 }
621 
622 bool
623 ObjectFileMachO::ParseHeader (DataExtractor &data,
624                               lldb::offset_t *data_offset_ptr,
625                               llvm::MachO::mach_header &header)
626 {
627     data.SetByteOrder (lldb::endian::InlHostByteOrder());
628     // Leave magic in the original byte order
629     header.magic = data.GetU32(data_offset_ptr);
630     bool can_parse = false;
631     bool is_64_bit = false;
632     switch (header.magic)
633     {
634         case HeaderMagic32:
635             data.SetByteOrder (lldb::endian::InlHostByteOrder());
636             data.SetAddressByteSize(4);
637             can_parse = true;
638             break;
639 
640         case HeaderMagic64:
641             data.SetByteOrder (lldb::endian::InlHostByteOrder());
642             data.SetAddressByteSize(8);
643             can_parse = true;
644             is_64_bit = true;
645             break;
646 
647         case HeaderMagic32Swapped:
648             data.SetByteOrder(lldb::endian::InlHostByteOrder() == eByteOrderBig ? eByteOrderLittle : eByteOrderBig);
649             data.SetAddressByteSize(4);
650             can_parse = true;
651             break;
652 
653         case HeaderMagic64Swapped:
654             data.SetByteOrder(lldb::endian::InlHostByteOrder() == eByteOrderBig ? eByteOrderLittle : eByteOrderBig);
655             data.SetAddressByteSize(8);
656             is_64_bit = true;
657             can_parse = true;
658             break;
659 
660         default:
661             break;
662     }
663 
664     if (can_parse)
665     {
666         data.GetU32(data_offset_ptr, &header.cputype, 6);
667         if (is_64_bit)
668             *data_offset_ptr += 4;
669         return true;
670     }
671     else
672     {
673         memset(&header, 0, sizeof(header));
674     }
675     return false;
676 }
677 
678 bool
679 ObjectFileMachO::ParseHeader ()
680 {
681     ModuleSP module_sp(GetModule());
682     if (module_sp)
683     {
684         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
685         bool can_parse = false;
686         lldb::offset_t offset = 0;
687         m_data.SetByteOrder (lldb::endian::InlHostByteOrder());
688         // Leave magic in the original byte order
689         m_header.magic = m_data.GetU32(&offset);
690         switch (m_header.magic)
691         {
692         case HeaderMagic32:
693             m_data.SetByteOrder (lldb::endian::InlHostByteOrder());
694             m_data.SetAddressByteSize(4);
695             can_parse = true;
696             break;
697 
698         case HeaderMagic64:
699             m_data.SetByteOrder (lldb::endian::InlHostByteOrder());
700             m_data.SetAddressByteSize(8);
701             can_parse = true;
702             break;
703 
704         case HeaderMagic32Swapped:
705             m_data.SetByteOrder(lldb::endian::InlHostByteOrder() == eByteOrderBig ? eByteOrderLittle : eByteOrderBig);
706             m_data.SetAddressByteSize(4);
707             can_parse = true;
708             break;
709 
710         case HeaderMagic64Swapped:
711             m_data.SetByteOrder(lldb::endian::InlHostByteOrder() == eByteOrderBig ? eByteOrderLittle : eByteOrderBig);
712             m_data.SetAddressByteSize(8);
713             can_parse = true;
714             break;
715 
716         default:
717             break;
718         }
719 
720         if (can_parse)
721         {
722             m_data.GetU32(&offset, &m_header.cputype, 6);
723 
724             ArchSpec mach_arch(eArchTypeMachO, m_header.cputype, m_header.cpusubtype);
725 
726             // Check if the module has a required architecture
727             const ArchSpec &module_arch = module_sp->GetArchitecture();
728             if (module_arch.IsValid() && !module_arch.IsCompatibleMatch(mach_arch))
729                 return false;
730 
731             if (SetModulesArchitecture (mach_arch))
732             {
733                 const size_t header_and_lc_size = m_header.sizeofcmds + MachHeaderSizeFromMagic(m_header.magic);
734                 if (m_data.GetByteSize() < header_and_lc_size)
735                 {
736                     DataBufferSP data_sp;
737                     ProcessSP process_sp (m_process_wp.lock());
738                     if (process_sp)
739                     {
740                         data_sp = ReadMemory (process_sp, m_memory_addr, header_and_lc_size);
741                     }
742                     else
743                     {
744                         // Read in all only the load command data from the file on disk
745                         data_sp = m_file.ReadFileContents(m_file_offset, header_and_lc_size);
746                         if (data_sp->GetByteSize() != header_and_lc_size)
747                             return false;
748                     }
749                     if (data_sp)
750                         m_data.SetData (data_sp);
751                 }
752             }
753             return true;
754         }
755         else
756         {
757             memset(&m_header, 0, sizeof(struct mach_header));
758         }
759     }
760     return false;
761 }
762 
763 
764 ByteOrder
765 ObjectFileMachO::GetByteOrder () const
766 {
767     return m_data.GetByteOrder ();
768 }
769 
770 bool
771 ObjectFileMachO::IsExecutable() const
772 {
773     return m_header.filetype == HeaderFileTypeExecutable;
774 }
775 
776 uint32_t
777 ObjectFileMachO::GetAddressByteSize () const
778 {
779     return m_data.GetAddressByteSize ();
780 }
781 
782 AddressClass
783 ObjectFileMachO::GetAddressClass (lldb::addr_t file_addr)
784 {
785     Symtab *symtab = GetSymtab();
786     if (symtab)
787     {
788         Symbol *symbol = symtab->FindSymbolContainingFileAddress(file_addr);
789         if (symbol)
790         {
791             if (symbol->ValueIsAddress())
792             {
793                 SectionSP section_sp (symbol->GetAddress().GetSection());
794                 if (section_sp)
795                 {
796                     const SectionType section_type = section_sp->GetType();
797                     switch (section_type)
798                     {
799                     case eSectionTypeInvalid:               return eAddressClassUnknown;
800                     case eSectionTypeCode:
801                         if (m_header.cputype == llvm::MachO::CPUTypeARM)
802                         {
803                             // For ARM we have a bit in the n_desc field of the symbol
804                             // that tells us ARM/Thumb which is bit 0x0008.
805                             if (symbol->GetFlags() & MACHO_NLIST_ARM_SYMBOL_IS_THUMB)
806                                 return eAddressClassCodeAlternateISA;
807                         }
808                         return eAddressClassCode;
809 
810                     case eSectionTypeContainer:             return eAddressClassUnknown;
811                     case eSectionTypeData:
812                     case eSectionTypeDataCString:
813                     case eSectionTypeDataCStringPointers:
814                     case eSectionTypeDataSymbolAddress:
815                     case eSectionTypeData4:
816                     case eSectionTypeData8:
817                     case eSectionTypeData16:
818                     case eSectionTypeDataPointers:
819                     case eSectionTypeZeroFill:
820                     case eSectionTypeDataObjCMessageRefs:
821                     case eSectionTypeDataObjCCFStrings:
822                         return eAddressClassData;
823                     case eSectionTypeDebug:
824                     case eSectionTypeDWARFDebugAbbrev:
825                     case eSectionTypeDWARFDebugAranges:
826                     case eSectionTypeDWARFDebugFrame:
827                     case eSectionTypeDWARFDebugInfo:
828                     case eSectionTypeDWARFDebugLine:
829                     case eSectionTypeDWARFDebugLoc:
830                     case eSectionTypeDWARFDebugMacInfo:
831                     case eSectionTypeDWARFDebugPubNames:
832                     case eSectionTypeDWARFDebugPubTypes:
833                     case eSectionTypeDWARFDebugRanges:
834                     case eSectionTypeDWARFDebugStr:
835                     case eSectionTypeDWARFAppleNames:
836                     case eSectionTypeDWARFAppleTypes:
837                     case eSectionTypeDWARFAppleNamespaces:
838                     case eSectionTypeDWARFAppleObjC:
839                         return eAddressClassDebug;
840                     case eSectionTypeEHFrame:               return eAddressClassRuntime;
841                     case eSectionTypeOther:                 return eAddressClassUnknown;
842                     }
843                 }
844             }
845 
846             const SymbolType symbol_type = symbol->GetType();
847             switch (symbol_type)
848             {
849             case eSymbolTypeAny:            return eAddressClassUnknown;
850             case eSymbolTypeAbsolute:       return eAddressClassUnknown;
851 
852             case eSymbolTypeCode:
853             case eSymbolTypeTrampoline:
854             case eSymbolTypeResolver:
855                 if (m_header.cputype == llvm::MachO::CPUTypeARM)
856                 {
857                     // For ARM we have a bit in the n_desc field of the symbol
858                     // that tells us ARM/Thumb which is bit 0x0008.
859                     if (symbol->GetFlags() & MACHO_NLIST_ARM_SYMBOL_IS_THUMB)
860                         return eAddressClassCodeAlternateISA;
861                 }
862                 return eAddressClassCode;
863 
864             case eSymbolTypeData:           return eAddressClassData;
865             case eSymbolTypeRuntime:        return eAddressClassRuntime;
866             case eSymbolTypeException:      return eAddressClassRuntime;
867             case eSymbolTypeSourceFile:     return eAddressClassDebug;
868             case eSymbolTypeHeaderFile:     return eAddressClassDebug;
869             case eSymbolTypeObjectFile:     return eAddressClassDebug;
870             case eSymbolTypeCommonBlock:    return eAddressClassDebug;
871             case eSymbolTypeBlock:          return eAddressClassDebug;
872             case eSymbolTypeLocal:          return eAddressClassData;
873             case eSymbolTypeParam:          return eAddressClassData;
874             case eSymbolTypeVariable:       return eAddressClassData;
875             case eSymbolTypeVariableType:   return eAddressClassDebug;
876             case eSymbolTypeLineEntry:      return eAddressClassDebug;
877             case eSymbolTypeLineHeader:     return eAddressClassDebug;
878             case eSymbolTypeScopeBegin:     return eAddressClassDebug;
879             case eSymbolTypeScopeEnd:       return eAddressClassDebug;
880             case eSymbolTypeAdditional:     return eAddressClassUnknown;
881             case eSymbolTypeCompiler:       return eAddressClassDebug;
882             case eSymbolTypeInstrumentation:return eAddressClassDebug;
883             case eSymbolTypeUndefined:      return eAddressClassUnknown;
884             case eSymbolTypeObjCClass:      return eAddressClassRuntime;
885             case eSymbolTypeObjCMetaClass:  return eAddressClassRuntime;
886             case eSymbolTypeObjCIVar:       return eAddressClassRuntime;
887             }
888         }
889     }
890     return eAddressClassUnknown;
891 }
892 
893 Symtab *
894 ObjectFileMachO::GetSymtab()
895 {
896     ModuleSP module_sp(GetModule());
897     if (module_sp)
898     {
899         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
900         if (m_symtab_ap.get() == NULL)
901         {
902             m_symtab_ap.reset(new Symtab(this));
903             Mutex::Locker symtab_locker (m_symtab_ap->GetMutex());
904             ParseSymtab (true);
905             m_symtab_ap->Finalize ();
906         }
907     }
908     return m_symtab_ap.get();
909 }
910 
911 
912 SectionList *
913 ObjectFileMachO::GetSectionList()
914 {
915     ModuleSP module_sp(GetModule());
916     if (module_sp)
917     {
918         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
919         if (m_sections_ap.get() == NULL)
920         {
921             m_sections_ap.reset(new SectionList());
922             ParseSections();
923         }
924     }
925     return m_sections_ap.get();
926 }
927 
928 
929 size_t
930 ObjectFileMachO::ParseSections ()
931 {
932     lldb::user_id_t segID = 0;
933     lldb::user_id_t sectID = 0;
934     lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
935     uint32_t i;
936     const bool is_core = GetType() == eTypeCoreFile;
937     //bool dump_sections = false;
938     ModuleSP module_sp (GetModule());
939     // First look up any LC_ENCRYPTION_INFO load commands
940     typedef RangeArray<uint32_t, uint32_t, 8> EncryptedFileRanges;
941     EncryptedFileRanges encrypted_file_ranges;
942     encryption_info_command encryption_cmd;
943     for (i=0; i<m_header.ncmds; ++i)
944     {
945         const lldb::offset_t load_cmd_offset = offset;
946         if (m_data.GetU32(&offset, &encryption_cmd, 2) == NULL)
947             break;
948 
949         if (encryption_cmd.cmd == LoadCommandEncryptionInfo)
950         {
951             if (m_data.GetU32(&offset, &encryption_cmd.cryptoff, 3))
952             {
953                 if (encryption_cmd.cryptid != 0)
954                 {
955                     EncryptedFileRanges::Entry entry;
956                     entry.SetRangeBase(encryption_cmd.cryptoff);
957                     entry.SetByteSize(encryption_cmd.cryptsize);
958                     encrypted_file_ranges.Append(entry);
959                 }
960             }
961         }
962         offset = load_cmd_offset + encryption_cmd.cmdsize;
963     }
964 
965     offset = MachHeaderSizeFromMagic(m_header.magic);
966 
967     struct segment_command_64 load_cmd;
968     for (i=0; i<m_header.ncmds; ++i)
969     {
970         const lldb::offset_t load_cmd_offset = offset;
971         if (m_data.GetU32(&offset, &load_cmd, 2) == NULL)
972             break;
973 
974         if (load_cmd.cmd == LoadCommandSegment32 || load_cmd.cmd == LoadCommandSegment64)
975         {
976             if (m_data.GetU8(&offset, (uint8_t*)load_cmd.segname, 16))
977             {
978                 load_cmd.vmaddr = m_data.GetAddress(&offset);
979                 load_cmd.vmsize = m_data.GetAddress(&offset);
980                 load_cmd.fileoff = m_data.GetAddress(&offset);
981                 load_cmd.filesize = m_data.GetAddress(&offset);
982                 if (m_length != 0 && load_cmd.filesize != 0)
983                 {
984                     if (load_cmd.fileoff > m_length)
985                     {
986                         // We have a load command that says it extends past the end of hte file.  This is likely
987                         // a corrupt file.  We don't have any way to return an error condition here (this method
988                         // was likely invokved from something like ObjectFile::GetSectionList()) -- all we can do
989                         // is null out the SectionList vector and if a process has been set up, dump a message
990                         // to stdout.  The most common case here is core file debugging with a truncated file.
991                         const char *lc_segment_name = load_cmd.cmd == LoadCommandSegment64 ? "LC_SEGMENT_64" : "LC_SEGMENT";
992                         GetModule()->ReportError("is a corrupt mach-o file: load command %u %s has a fileoff (0x%" PRIx64 ") that extends beyond the end of the file (0x%" PRIx64 ")",
993                                                  i,
994                                                  lc_segment_name,
995                                                  load_cmd.fileoff,
996                                                  m_length);
997 
998                         load_cmd.fileoff = 0;
999                         load_cmd.filesize = 0;
1000                     }
1001 
1002                     if (load_cmd.fileoff + load_cmd.filesize > m_length)
1003                     {
1004                         // We have a load command that says it extends past the end of hte file.  This is likely
1005                         // a corrupt file.  We don't have any way to return an error condition here (this method
1006                         // was likely invokved from something like ObjectFile::GetSectionList()) -- all we can do
1007                         // is null out the SectionList vector and if a process has been set up, dump a message
1008                         // to stdout.  The most common case here is core file debugging with a truncated file.
1009                         const char *lc_segment_name = load_cmd.cmd == LoadCommandSegment64 ? "LC_SEGMENT_64" : "LC_SEGMENT";
1010                         GetModule()->ReportError("is a corrupt mach-o file: load command %u %s has a fileoff + filesize (0x%" PRIx64 ") that extends beyond the end of the file (0x%" PRIx64 "), the segment will be truncated",
1011                                                  i,
1012                                                  lc_segment_name,
1013                                                  load_cmd.fileoff + load_cmd.filesize,
1014                                                  m_length);
1015 
1016                         // Tuncase the length
1017                         load_cmd.filesize = m_length - load_cmd.fileoff;
1018                     }
1019                 }
1020                 if (m_data.GetU32(&offset, &load_cmd.maxprot, 4))
1021                 {
1022 
1023                     const bool segment_is_encrypted = (load_cmd.flags & SegmentCommandFlagBitProtectedVersion1) != 0;
1024 
1025                     // Keep a list of mach segments around in case we need to
1026                     // get at data that isn't stored in the abstracted Sections.
1027                     m_mach_segments.push_back (load_cmd);
1028 
1029                     ConstString segment_name (load_cmd.segname, std::min<size_t>(strlen(load_cmd.segname), sizeof(load_cmd.segname)));
1030                     // Use a segment ID of the segment index shifted left by 8 so they
1031                     // never conflict with any of the sections.
1032                     SectionSP segment_sp;
1033                     if (segment_name || is_core)
1034                     {
1035                         segment_sp.reset(new Section (module_sp,              // Module to which this section belongs
1036                                                       ++segID << 8,           // Section ID is the 1 based segment index shifted right by 8 bits as not to collide with any of the 256 section IDs that are possible
1037                                                       segment_name,           // Name of this section
1038                                                       eSectionTypeContainer,  // This section is a container of other sections.
1039                                                       load_cmd.vmaddr,        // File VM address == addresses as they are found in the object file
1040                                                       load_cmd.vmsize,        // VM size in bytes of this section
1041                                                       load_cmd.fileoff,       // Offset to the data for this section in the file
1042                                                       load_cmd.filesize,      // Size in bytes of this section as found in the the file
1043                                                       load_cmd.flags));       // Flags for this section
1044 
1045                         segment_sp->SetIsEncrypted (segment_is_encrypted);
1046                         m_sections_ap->AddSection(segment_sp);
1047                     }
1048 
1049                     struct section_64 sect64;
1050                     ::memset (&sect64, 0, sizeof(sect64));
1051                     // Push a section into our mach sections for the section at
1052                     // index zero (NListSectionNoSection) if we don't have any
1053                     // mach sections yet...
1054                     if (m_mach_sections.empty())
1055                         m_mach_sections.push_back(sect64);
1056                     uint32_t segment_sect_idx;
1057                     const lldb::user_id_t first_segment_sectID = sectID + 1;
1058 
1059 
1060                     const uint32_t num_u32s = load_cmd.cmd == LoadCommandSegment32 ? 7 : 8;
1061                     for (segment_sect_idx=0; segment_sect_idx<load_cmd.nsects; ++segment_sect_idx)
1062                     {
1063                         if (m_data.GetU8(&offset, (uint8_t*)sect64.sectname, sizeof(sect64.sectname)) == NULL)
1064                             break;
1065                         if (m_data.GetU8(&offset, (uint8_t*)sect64.segname, sizeof(sect64.segname)) == NULL)
1066                             break;
1067                         sect64.addr = m_data.GetAddress(&offset);
1068                         sect64.size = m_data.GetAddress(&offset);
1069 
1070                         if (m_data.GetU32(&offset, &sect64.offset, num_u32s) == NULL)
1071                             break;
1072 
1073                         // Keep a list of mach sections around in case we need to
1074                         // get at data that isn't stored in the abstracted Sections.
1075                         m_mach_sections.push_back (sect64);
1076 
1077                         ConstString section_name (sect64.sectname, std::min<size_t>(strlen(sect64.sectname), sizeof(sect64.sectname)));
1078                         if (!segment_name)
1079                         {
1080                             // We have a segment with no name so we need to conjure up
1081                             // segments that correspond to the section's segname if there
1082                             // isn't already such a section. If there is such a section,
1083                             // we resize the section so that it spans all sections.
1084                             // We also mark these sections as fake so address matches don't
1085                             // hit if they land in the gaps between the child sections.
1086                             segment_name.SetTrimmedCStringWithLength(sect64.segname, sizeof(sect64.segname));
1087                             segment_sp = m_sections_ap->FindSectionByName (segment_name);
1088                             if (segment_sp.get())
1089                             {
1090                                 Section *segment = segment_sp.get();
1091                                 // Grow the section size as needed.
1092                                 const lldb::addr_t sect64_min_addr = sect64.addr;
1093                                 const lldb::addr_t sect64_max_addr = sect64_min_addr + sect64.size;
1094                                 const lldb::addr_t curr_seg_byte_size = segment->GetByteSize();
1095                                 const lldb::addr_t curr_seg_min_addr = segment->GetFileAddress();
1096                                 const lldb::addr_t curr_seg_max_addr = curr_seg_min_addr + curr_seg_byte_size;
1097                                 if (sect64_min_addr >= curr_seg_min_addr)
1098                                 {
1099                                     const lldb::addr_t new_seg_byte_size = sect64_max_addr - curr_seg_min_addr;
1100                                     // Only grow the section size if needed
1101                                     if (new_seg_byte_size > curr_seg_byte_size)
1102                                         segment->SetByteSize (new_seg_byte_size);
1103                                 }
1104                                 else
1105                                 {
1106                                     // We need to change the base address of the segment and
1107                                     // adjust the child section offsets for all existing children.
1108                                     const lldb::addr_t slide_amount = sect64_min_addr - curr_seg_min_addr;
1109                                     segment->Slide(slide_amount, false);
1110                                     segment->GetChildren().Slide(-slide_amount, false);
1111                                     segment->SetByteSize (curr_seg_max_addr - sect64_min_addr);
1112                                 }
1113 
1114                                 // Grow the section size as needed.
1115                                 if (sect64.offset)
1116                                 {
1117                                     const lldb::addr_t segment_min_file_offset = segment->GetFileOffset();
1118                                     const lldb::addr_t segment_max_file_offset = segment_min_file_offset + segment->GetFileSize();
1119 
1120                                     const lldb::addr_t section_min_file_offset = sect64.offset;
1121                                     const lldb::addr_t section_max_file_offset = section_min_file_offset + sect64.size;
1122                                     const lldb::addr_t new_file_offset = std::min (section_min_file_offset, segment_min_file_offset);
1123                                     const lldb::addr_t new_file_size = std::max (section_max_file_offset, segment_max_file_offset) - new_file_offset;
1124                                     segment->SetFileOffset (new_file_offset);
1125                                     segment->SetFileSize (new_file_size);
1126                                 }
1127                             }
1128                             else
1129                             {
1130                                 // Create a fake section for the section's named segment
1131                                 segment_sp.reset(new Section (segment_sp,            // Parent section
1132                                                               module_sp,           // Module to which this section belongs
1133                                                               ++segID << 8,          // Section ID is the 1 based segment index shifted right by 8 bits as not to collide with any of the 256 section IDs that are possible
1134                                                               segment_name,          // Name of this section
1135                                                               eSectionTypeContainer, // This section is a container of other sections.
1136                                                               sect64.addr,           // File VM address == addresses as they are found in the object file
1137                                                               sect64.size,           // VM size in bytes of this section
1138                                                               sect64.offset,         // Offset to the data for this section in the file
1139                                                               sect64.offset ? sect64.size : 0,        // Size in bytes of this section as found in the the file
1140                                                               load_cmd.flags));      // Flags for this section
1141                                 segment_sp->SetIsFake(true);
1142                                 m_sections_ap->AddSection(segment_sp);
1143                                 segment_sp->SetIsEncrypted (segment_is_encrypted);
1144                             }
1145                         }
1146                         assert (segment_sp.get());
1147 
1148                         uint32_t mach_sect_type = sect64.flags & SectionFlagMaskSectionType;
1149                         static ConstString g_sect_name_objc_data ("__objc_data");
1150                         static ConstString g_sect_name_objc_msgrefs ("__objc_msgrefs");
1151                         static ConstString g_sect_name_objc_selrefs ("__objc_selrefs");
1152                         static ConstString g_sect_name_objc_classrefs ("__objc_classrefs");
1153                         static ConstString g_sect_name_objc_superrefs ("__objc_superrefs");
1154                         static ConstString g_sect_name_objc_const ("__objc_const");
1155                         static ConstString g_sect_name_objc_classlist ("__objc_classlist");
1156                         static ConstString g_sect_name_cfstring ("__cfstring");
1157 
1158                         static ConstString g_sect_name_dwarf_debug_abbrev ("__debug_abbrev");
1159                         static ConstString g_sect_name_dwarf_debug_aranges ("__debug_aranges");
1160                         static ConstString g_sect_name_dwarf_debug_frame ("__debug_frame");
1161                         static ConstString g_sect_name_dwarf_debug_info ("__debug_info");
1162                         static ConstString g_sect_name_dwarf_debug_line ("__debug_line");
1163                         static ConstString g_sect_name_dwarf_debug_loc ("__debug_loc");
1164                         static ConstString g_sect_name_dwarf_debug_macinfo ("__debug_macinfo");
1165                         static ConstString g_sect_name_dwarf_debug_pubnames ("__debug_pubnames");
1166                         static ConstString g_sect_name_dwarf_debug_pubtypes ("__debug_pubtypes");
1167                         static ConstString g_sect_name_dwarf_debug_ranges ("__debug_ranges");
1168                         static ConstString g_sect_name_dwarf_debug_str ("__debug_str");
1169                         static ConstString g_sect_name_dwarf_apple_names ("__apple_names");
1170                         static ConstString g_sect_name_dwarf_apple_types ("__apple_types");
1171                         static ConstString g_sect_name_dwarf_apple_namespaces ("__apple_namespac");
1172                         static ConstString g_sect_name_dwarf_apple_objc ("__apple_objc");
1173                         static ConstString g_sect_name_eh_frame ("__eh_frame");
1174                         static ConstString g_sect_name_DATA ("__DATA");
1175                         static ConstString g_sect_name_TEXT ("__TEXT");
1176 
1177                         SectionType sect_type = eSectionTypeOther;
1178 
1179                         if (section_name == g_sect_name_dwarf_debug_abbrev)
1180                             sect_type = eSectionTypeDWARFDebugAbbrev;
1181                         else if (section_name == g_sect_name_dwarf_debug_aranges)
1182                             sect_type = eSectionTypeDWARFDebugAranges;
1183                         else if (section_name == g_sect_name_dwarf_debug_frame)
1184                             sect_type = eSectionTypeDWARFDebugFrame;
1185                         else if (section_name == g_sect_name_dwarf_debug_info)
1186                             sect_type = eSectionTypeDWARFDebugInfo;
1187                         else if (section_name == g_sect_name_dwarf_debug_line)
1188                             sect_type = eSectionTypeDWARFDebugLine;
1189                         else if (section_name == g_sect_name_dwarf_debug_loc)
1190                             sect_type = eSectionTypeDWARFDebugLoc;
1191                         else if (section_name == g_sect_name_dwarf_debug_macinfo)
1192                             sect_type = eSectionTypeDWARFDebugMacInfo;
1193                         else if (section_name == g_sect_name_dwarf_debug_pubnames)
1194                             sect_type = eSectionTypeDWARFDebugPubNames;
1195                         else if (section_name == g_sect_name_dwarf_debug_pubtypes)
1196                             sect_type = eSectionTypeDWARFDebugPubTypes;
1197                         else if (section_name == g_sect_name_dwarf_debug_ranges)
1198                             sect_type = eSectionTypeDWARFDebugRanges;
1199                         else if (section_name == g_sect_name_dwarf_debug_str)
1200                             sect_type = eSectionTypeDWARFDebugStr;
1201                         else if (section_name == g_sect_name_dwarf_apple_names)
1202                             sect_type = eSectionTypeDWARFAppleNames;
1203                         else if (section_name == g_sect_name_dwarf_apple_types)
1204                             sect_type = eSectionTypeDWARFAppleTypes;
1205                         else if (section_name == g_sect_name_dwarf_apple_namespaces)
1206                             sect_type = eSectionTypeDWARFAppleNamespaces;
1207                         else if (section_name == g_sect_name_dwarf_apple_objc)
1208                             sect_type = eSectionTypeDWARFAppleObjC;
1209                         else if (section_name == g_sect_name_objc_selrefs)
1210                             sect_type = eSectionTypeDataCStringPointers;
1211                         else if (section_name == g_sect_name_objc_msgrefs)
1212                             sect_type = eSectionTypeDataObjCMessageRefs;
1213                         else if (section_name == g_sect_name_eh_frame)
1214                             sect_type = eSectionTypeEHFrame;
1215                         else if (section_name == g_sect_name_cfstring)
1216                             sect_type = eSectionTypeDataObjCCFStrings;
1217                         else if (section_name == g_sect_name_objc_data ||
1218                                  section_name == g_sect_name_objc_classrefs ||
1219                                  section_name == g_sect_name_objc_superrefs ||
1220                                  section_name == g_sect_name_objc_const ||
1221                                  section_name == g_sect_name_objc_classlist)
1222                         {
1223                             sect_type = eSectionTypeDataPointers;
1224                         }
1225 
1226                         if (sect_type == eSectionTypeOther)
1227                         {
1228                             switch (mach_sect_type)
1229                             {
1230                             // TODO: categorize sections by other flags for regular sections
1231                             case SectionTypeRegular:
1232                                 if (segment_sp->GetName() == g_sect_name_TEXT)
1233                                     sect_type = eSectionTypeCode;
1234                                 else if (segment_sp->GetName() == g_sect_name_DATA)
1235                                     sect_type = eSectionTypeData;
1236                                 else
1237                                     sect_type = eSectionTypeOther;
1238                                 break;
1239                             case SectionTypeZeroFill:                   sect_type = eSectionTypeZeroFill; break;
1240                             case SectionTypeCStringLiterals:            sect_type = eSectionTypeDataCString;    break; // section with only literal C strings
1241                             case SectionType4ByteLiterals:              sect_type = eSectionTypeData4;    break; // section with only 4 byte literals
1242                             case SectionType8ByteLiterals:              sect_type = eSectionTypeData8;    break; // section with only 8 byte literals
1243                             case SectionTypeLiteralPointers:            sect_type = eSectionTypeDataPointers;  break; // section with only pointers to literals
1244                             case SectionTypeNonLazySymbolPointers:      sect_type = eSectionTypeDataPointers;  break; // section with only non-lazy symbol pointers
1245                             case SectionTypeLazySymbolPointers:         sect_type = eSectionTypeDataPointers;  break; // section with only lazy symbol pointers
1246                             case SectionTypeSymbolStubs:                sect_type = eSectionTypeCode;  break; // section with only symbol stubs, byte size of stub in the reserved2 field
1247                             case SectionTypeModuleInitFunctionPointers: sect_type = eSectionTypeDataPointers;    break; // section with only function pointers for initialization
1248                             case SectionTypeModuleTermFunctionPointers: sect_type = eSectionTypeDataPointers; break; // section with only function pointers for termination
1249                             case SectionTypeCoalesced:                  sect_type = eSectionTypeOther; break;
1250                             case SectionTypeZeroFillLarge:              sect_type = eSectionTypeZeroFill; break;
1251                             case SectionTypeInterposing:                sect_type = eSectionTypeCode;  break; // section with only pairs of function pointers for interposing
1252                             case SectionType16ByteLiterals:             sect_type = eSectionTypeData16; break; // section with only 16 byte literals
1253                             case SectionTypeDTraceObjectFormat:         sect_type = eSectionTypeDebug; break;
1254                             case SectionTypeLazyDylibSymbolPointers:    sect_type = eSectionTypeDataPointers;  break;
1255                             default: break;
1256                             }
1257                         }
1258 
1259                         SectionSP section_sp(new Section (segment_sp,
1260                                                           module_sp,
1261                                                           ++sectID,
1262                                                           section_name,
1263                                                           sect_type,
1264                                                           sect64.addr - segment_sp->GetFileAddress(),
1265                                                           sect64.size,
1266                                                           sect64.offset,
1267                                                           sect64.offset == 0 ? 0 : sect64.size,
1268                                                           sect64.flags));
1269                         // Set the section to be encrypted to match the segment
1270 
1271                         bool section_is_encrypted = false;
1272                         if (!segment_is_encrypted && load_cmd.filesize != 0)
1273                             section_is_encrypted = encrypted_file_ranges.FindEntryThatContains(sect64.offset) != NULL;
1274 
1275                         section_sp->SetIsEncrypted (segment_is_encrypted || section_is_encrypted);
1276                         segment_sp->GetChildren().AddSection(section_sp);
1277 
1278                         if (segment_sp->IsFake())
1279                         {
1280                             segment_sp.reset();
1281                             segment_name.Clear();
1282                         }
1283                     }
1284                     if (segment_sp && m_header.filetype == HeaderFileTypeDSYM)
1285                     {
1286                         if (first_segment_sectID <= sectID)
1287                         {
1288                             lldb::user_id_t sect_uid;
1289                             for (sect_uid = first_segment_sectID; sect_uid <= sectID; ++sect_uid)
1290                             {
1291                                 SectionSP curr_section_sp(segment_sp->GetChildren().FindSectionByID (sect_uid));
1292                                 SectionSP next_section_sp;
1293                                 if (sect_uid + 1 <= sectID)
1294                                     next_section_sp = segment_sp->GetChildren().FindSectionByID (sect_uid+1);
1295 
1296                                 if (curr_section_sp.get())
1297                                 {
1298                                     if (curr_section_sp->GetByteSize() == 0)
1299                                     {
1300                                         if (next_section_sp.get() != NULL)
1301                                             curr_section_sp->SetByteSize ( next_section_sp->GetFileAddress() - curr_section_sp->GetFileAddress() );
1302                                         else
1303                                             curr_section_sp->SetByteSize ( load_cmd.vmsize );
1304                                     }
1305                                 }
1306                             }
1307                         }
1308                     }
1309                 }
1310             }
1311         }
1312         else if (load_cmd.cmd == LoadCommandDynamicSymtabInfo)
1313         {
1314             m_dysymtab.cmd = load_cmd.cmd;
1315             m_dysymtab.cmdsize = load_cmd.cmdsize;
1316             m_data.GetU32 (&offset, &m_dysymtab.ilocalsym, (sizeof(m_dysymtab) / sizeof(uint32_t)) - 2);
1317         }
1318 
1319         offset = load_cmd_offset + load_cmd.cmdsize;
1320     }
1321 //    if (dump_sections)
1322 //    {
1323 //        StreamFile s(stdout);
1324 //        m_sections_ap->Dump(&s, true);
1325 //    }
1326     return sectID;  // Return the number of sections we registered with the module
1327 }
1328 
1329 class MachSymtabSectionInfo
1330 {
1331 public:
1332 
1333     MachSymtabSectionInfo (SectionList *section_list) :
1334         m_section_list (section_list),
1335         m_section_infos()
1336     {
1337         // Get the number of sections down to a depth of 1 to include
1338         // all segments and their sections, but no other sections that
1339         // may be added for debug map or
1340         m_section_infos.resize(section_list->GetNumSections(1));
1341     }
1342 
1343 
1344     SectionSP
1345     GetSection (uint8_t n_sect, addr_t file_addr)
1346     {
1347         if (n_sect == 0)
1348             return SectionSP();
1349         if (n_sect < m_section_infos.size())
1350         {
1351             if (!m_section_infos[n_sect].section_sp)
1352             {
1353                 SectionSP section_sp (m_section_list->FindSectionByID (n_sect));
1354                 m_section_infos[n_sect].section_sp = section_sp;
1355                 if (section_sp)
1356                 {
1357                     m_section_infos[n_sect].vm_range.SetBaseAddress (section_sp->GetFileAddress());
1358                     m_section_infos[n_sect].vm_range.SetByteSize (section_sp->GetByteSize());
1359                 }
1360                 else
1361                 {
1362                     Host::SystemLog (Host::eSystemLogError, "error: unable to find section for section %u\n", n_sect);
1363                 }
1364             }
1365             if (m_section_infos[n_sect].vm_range.Contains(file_addr))
1366             {
1367                 // Symbol is in section.
1368                 return m_section_infos[n_sect].section_sp;
1369             }
1370             else if (m_section_infos[n_sect].vm_range.GetByteSize () == 0 &&
1371                      m_section_infos[n_sect].vm_range.GetBaseAddress() == file_addr)
1372             {
1373                 // Symbol is in section with zero size, but has the same start
1374                 // address as the section. This can happen with linker symbols
1375                 // (symbols that start with the letter 'l' or 'L'.
1376                 return m_section_infos[n_sect].section_sp;
1377             }
1378         }
1379         return m_section_list->FindSectionContainingFileAddress(file_addr);
1380     }
1381 
1382 protected:
1383     struct SectionInfo
1384     {
1385         SectionInfo () :
1386             vm_range(),
1387             section_sp ()
1388         {
1389         }
1390 
1391         VMRange vm_range;
1392         SectionSP section_sp;
1393     };
1394     SectionList *m_section_list;
1395     std::vector<SectionInfo> m_section_infos;
1396 };
1397 
1398 size_t
1399 ObjectFileMachO::ParseSymtab (bool minimize)
1400 {
1401     Timer scoped_timer(__PRETTY_FUNCTION__,
1402                        "ObjectFileMachO::ParseSymtab () module = %s",
1403                        m_file.GetFilename().AsCString(""));
1404     ModuleSP module_sp (GetModule());
1405     if (!module_sp)
1406         return 0;
1407 
1408     struct symtab_command symtab_load_command = { 0, 0, 0, 0, 0, 0 };
1409     struct linkedit_data_command function_starts_load_command = { 0, 0, 0, 0 };
1410     typedef AddressDataArray<lldb::addr_t, bool, 100> FunctionStarts;
1411     FunctionStarts function_starts;
1412     lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
1413     uint32_t i;
1414 
1415     Log *log(lldb_private::GetLogIfAllCategoriesSet (LIBLLDB_LOG_SYMBOLS));
1416 
1417     for (i=0; i<m_header.ncmds; ++i)
1418     {
1419         const lldb::offset_t cmd_offset = offset;
1420         // Read in the load command and load command size
1421         struct load_command lc;
1422         if (m_data.GetU32(&offset, &lc, 2) == NULL)
1423             break;
1424         // Watch for the symbol table load command
1425         switch (lc.cmd)
1426         {
1427         case LoadCommandSymtab:
1428             symtab_load_command.cmd = lc.cmd;
1429             symtab_load_command.cmdsize = lc.cmdsize;
1430             // Read in the rest of the symtab load command
1431             if (m_data.GetU32(&offset, &symtab_load_command.symoff, 4) == 0) // fill in symoff, nsyms, stroff, strsize fields
1432                 return 0;
1433             if (symtab_load_command.symoff == 0)
1434             {
1435                 if (log)
1436                     module_sp->LogMessage(log, "LC_SYMTAB.symoff == 0");
1437                 return 0;
1438             }
1439 
1440             if (symtab_load_command.stroff == 0)
1441             {
1442                 if (log)
1443                     module_sp->LogMessage(log, "LC_SYMTAB.stroff == 0");
1444                 return 0;
1445             }
1446 
1447             if (symtab_load_command.nsyms == 0)
1448             {
1449                 if (log)
1450                     module_sp->LogMessage(log, "LC_SYMTAB.nsyms == 0");
1451                 return 0;
1452             }
1453 
1454             if (symtab_load_command.strsize == 0)
1455             {
1456                 if (log)
1457                     module_sp->LogMessage(log, "LC_SYMTAB.strsize == 0");
1458                 return 0;
1459             }
1460             break;
1461 
1462         case LoadCommandFunctionStarts:
1463             function_starts_load_command.cmd = lc.cmd;
1464             function_starts_load_command.cmdsize = lc.cmdsize;
1465             if (m_data.GetU32(&offset, &function_starts_load_command.dataoff, 2) == NULL) // fill in symoff, nsyms, stroff, strsize fields
1466                 bzero (&function_starts_load_command, sizeof(function_starts_load_command));
1467             break;
1468 
1469         default:
1470             break;
1471         }
1472         offset = cmd_offset + lc.cmdsize;
1473     }
1474 
1475     if (symtab_load_command.cmd)
1476     {
1477         Symtab *symtab = m_symtab_ap.get();
1478         SectionList *section_list = GetSectionList();
1479         if (section_list == NULL)
1480             return 0;
1481 
1482         ProcessSP process_sp (m_process_wp.lock());
1483         Process *process = process_sp.get();
1484 
1485         const uint32_t addr_byte_size = m_data.GetAddressByteSize();
1486         const ByteOrder byte_order = m_data.GetByteOrder();
1487         bool bit_width_32 = addr_byte_size == 4;
1488         const size_t nlist_byte_size = bit_width_32 ? sizeof(struct nlist) : sizeof(struct nlist_64);
1489 
1490         DataExtractor nlist_data (NULL, 0, byte_order, addr_byte_size);
1491         DataExtractor strtab_data (NULL, 0, byte_order, addr_byte_size);
1492         DataExtractor function_starts_data (NULL, 0, byte_order, addr_byte_size);
1493         DataExtractor indirect_symbol_index_data (NULL, 0, byte_order, addr_byte_size);
1494 
1495         const addr_t nlist_data_byte_size = symtab_load_command.nsyms * nlist_byte_size;
1496         const addr_t strtab_data_byte_size = symtab_load_command.strsize;
1497         addr_t strtab_addr = LLDB_INVALID_ADDRESS;
1498         if (process)
1499         {
1500             Target &target = process->GetTarget();
1501             SectionSP linkedit_section_sp(section_list->FindSectionByName(GetSegmentNameLINKEDIT()));
1502             // Reading mach file from memory in a process or core file...
1503 
1504             if (linkedit_section_sp)
1505             {
1506                 const addr_t linkedit_load_addr = linkedit_section_sp->GetLoadBaseAddress(&target);
1507                 const addr_t linkedit_file_offset = linkedit_section_sp->GetFileOffset();
1508                 const addr_t symoff_addr = linkedit_load_addr + symtab_load_command.symoff - linkedit_file_offset;
1509                 strtab_addr = linkedit_load_addr + symtab_load_command.stroff - linkedit_file_offset;
1510 
1511                 bool data_was_read = false;
1512 
1513 #if defined (__APPLE__) && defined (__arm__)
1514                 if (m_header.flags & 0x80000000u)
1515                 {
1516                     // This mach-o memory file is in the dyld shared cache. If this
1517                     // program is not remote and this is iOS, then this process will
1518                     // share the same shared cache as the process we are debugging and
1519                     // we can read the entire __LINKEDIT from the address space in this
1520                     // process. This is a needed optimization that is used for local iOS
1521                     // debugging only since all shared libraries in the shared cache do
1522                     // not have corresponding files that exist in the file system of the
1523                     // device. They have been combined into a single file. This means we
1524                     // always have to load these files from memory. All of the symbol and
1525                     // string tables from all of the __LINKEDIT sections from the shared
1526                     // libraries in the shared cache have been merged into a single large
1527                     // symbol and string table. Reading all of this symbol and string table
1528                     // data across can slow down debug launch times, so we optimize this by
1529                     // reading the memory for the __LINKEDIT section from this process.
1530 
1531                     UUID lldb_shared_cache(GetLLDBSharedCacheUUID());
1532                     UUID process_shared_cache(GetProcessSharedCacheUUID(process));
1533                     bool use_lldb_cache = true;
1534                     if (lldb_shared_cache.IsValid() && process_shared_cache.IsValid() && lldb_shared_cache != process_shared_cache)
1535                     {
1536                             use_lldb_cache = false;
1537                             ModuleSP module_sp (GetModule());
1538                             if (module_sp)
1539                                 module_sp->ReportWarning ("shared cache in process does not match lldb's own shared cache, startup will be slow.");
1540 
1541                     }
1542 
1543                     PlatformSP platform_sp (target.GetPlatform());
1544                     if (platform_sp && platform_sp->IsHost() && use_lldb_cache)
1545                     {
1546                         data_was_read = true;
1547                         nlist_data.SetData((void *)symoff_addr, nlist_data_byte_size, eByteOrderLittle);
1548                         strtab_data.SetData((void *)strtab_addr, strtab_data_byte_size, eByteOrderLittle);
1549                         if (function_starts_load_command.cmd)
1550                         {
1551                             const addr_t func_start_addr = linkedit_load_addr + function_starts_load_command.dataoff - linkedit_file_offset;
1552                             function_starts_data.SetData ((void *)func_start_addr, function_starts_load_command.datasize, eByteOrderLittle);
1553                         }
1554                     }
1555                 }
1556 #endif
1557 
1558                 if (!data_was_read)
1559                 {
1560                     DataBufferSP nlist_data_sp (ReadMemory (process_sp, symoff_addr, nlist_data_byte_size));
1561                     if (nlist_data_sp)
1562                         nlist_data.SetData (nlist_data_sp, 0, nlist_data_sp->GetByteSize());
1563                     //DataBufferSP strtab_data_sp (ReadMemory (process_sp, strtab_addr, strtab_data_byte_size));
1564                     //if (strtab_data_sp)
1565                     //    strtab_data.SetData (strtab_data_sp, 0, strtab_data_sp->GetByteSize());
1566                     if (m_dysymtab.nindirectsyms != 0)
1567                     {
1568                         const addr_t indirect_syms_addr = linkedit_load_addr + m_dysymtab.indirectsymoff - linkedit_file_offset;
1569                         DataBufferSP indirect_syms_data_sp (ReadMemory (process_sp, indirect_syms_addr, m_dysymtab.nindirectsyms * 4));
1570                         if (indirect_syms_data_sp)
1571                             indirect_symbol_index_data.SetData (indirect_syms_data_sp, 0, indirect_syms_data_sp->GetByteSize());
1572                     }
1573                     if (function_starts_load_command.cmd)
1574                     {
1575                         const addr_t func_start_addr = linkedit_load_addr + function_starts_load_command.dataoff - linkedit_file_offset;
1576                         DataBufferSP func_start_data_sp (ReadMemory (process_sp, func_start_addr, function_starts_load_command.datasize));
1577                         if (func_start_data_sp)
1578                             function_starts_data.SetData (func_start_data_sp, 0, func_start_data_sp->GetByteSize());
1579                     }
1580                 }
1581             }
1582         }
1583         else
1584         {
1585             nlist_data.SetData (m_data,
1586                                 symtab_load_command.symoff,
1587                                 nlist_data_byte_size);
1588             strtab_data.SetData (m_data,
1589                                  symtab_load_command.stroff,
1590                                  strtab_data_byte_size);
1591             if (m_dysymtab.nindirectsyms != 0)
1592             {
1593                 indirect_symbol_index_data.SetData (m_data,
1594                                                     m_dysymtab.indirectsymoff,
1595                                                     m_dysymtab.nindirectsyms * 4);
1596             }
1597             if (function_starts_load_command.cmd)
1598             {
1599                 function_starts_data.SetData (m_data,
1600                                               function_starts_load_command.dataoff,
1601                                               function_starts_load_command.datasize);
1602             }
1603         }
1604 
1605         if (nlist_data.GetByteSize() == 0)
1606         {
1607             if (log)
1608                 module_sp->LogMessage(log, "failed to read nlist data");
1609             return 0;
1610         }
1611 
1612 
1613         const bool have_strtab_data = strtab_data.GetByteSize() > 0;
1614         if (!have_strtab_data)
1615         {
1616             if (process)
1617             {
1618                 if (strtab_addr == LLDB_INVALID_ADDRESS)
1619                 {
1620                     if (log)
1621                         module_sp->LogMessage(log, "failed to locate the strtab in memory");
1622                     return 0;
1623                 }
1624             }
1625             else
1626             {
1627                 if (log)
1628                     module_sp->LogMessage(log, "failed to read strtab data");
1629                 return 0;
1630             }
1631         }
1632 
1633         const ConstString &g_segment_name_TEXT = GetSegmentNameTEXT();
1634         const ConstString &g_segment_name_DATA = GetSegmentNameDATA();
1635         const ConstString &g_segment_name_OBJC = GetSegmentNameOBJC();
1636         const ConstString &g_section_name_eh_frame = GetSectionNameEHFrame();
1637         SectionSP text_section_sp(section_list->FindSectionByName(g_segment_name_TEXT));
1638         SectionSP data_section_sp(section_list->FindSectionByName(g_segment_name_DATA));
1639         SectionSP objc_section_sp(section_list->FindSectionByName(g_segment_name_OBJC));
1640         SectionSP eh_frame_section_sp;
1641         if (text_section_sp.get())
1642             eh_frame_section_sp = text_section_sp->GetChildren().FindSectionByName (g_section_name_eh_frame);
1643         else
1644             eh_frame_section_sp = section_list->FindSectionByName (g_section_name_eh_frame);
1645 
1646         const bool is_arm = (m_header.cputype == llvm::MachO::CPUTypeARM);
1647 
1648         // lldb works best if it knows the start addresss of all functions in a module.
1649         // Linker symbols or debug info are normally the best source of information for start addr / size but
1650         // they may be stripped in a released binary.
1651         // Two additional sources of information exist in Mach-O binaries:
1652         //    LC_FUNCTION_STARTS - a list of ULEB128 encoded offsets of each function's start address in the
1653         //                         binary, relative to the text section.
1654         //    eh_frame           - the eh_frame FDEs have the start addr & size of each function
1655         //  LC_FUNCTION_STARTS is the fastest source to read in, and is present on all modern binaries.
1656         //  Binaries built to run on older releases may need to use eh_frame information.
1657 
1658         if (text_section_sp && function_starts_data.GetByteSize())
1659         {
1660             FunctionStarts::Entry function_start_entry;
1661             function_start_entry.data = false;
1662             lldb::offset_t function_start_offset = 0;
1663             function_start_entry.addr = text_section_sp->GetFileAddress();
1664             uint64_t delta;
1665             while ((delta = function_starts_data.GetULEB128(&function_start_offset)) > 0)
1666             {
1667                 // Now append the current entry
1668                 function_start_entry.addr += delta;
1669                 function_starts.Append(function_start_entry);
1670             }
1671         }
1672         else
1673         {
1674             // If m_type is eTypeDebugInfo, then this is a dSYM - it will have the load command claiming an eh_frame
1675             // but it doesn't actually have the eh_frame content.  And if we have a dSYM, we don't need to do any
1676             // of this fill-in-the-missing-symbols works anyway - the debug info should give us all the functions in
1677             // the module.
1678             if (text_section_sp.get() && eh_frame_section_sp.get() && m_type != eTypeDebugInfo)
1679             {
1680                 DWARFCallFrameInfo eh_frame(*this, eh_frame_section_sp, eRegisterKindGCC, true);
1681                 DWARFCallFrameInfo::FunctionAddressAndSizeVector functions;
1682                 eh_frame.GetFunctionAddressAndSizeVector (functions);
1683                 addr_t text_base_addr = text_section_sp->GetFileAddress();
1684                 size_t count = functions.GetSize();
1685                 for (size_t i = 0; i < count; ++i)
1686                 {
1687                     const DWARFCallFrameInfo::FunctionAddressAndSizeVector::Entry *func = functions.GetEntryAtIndex (i);
1688                     if (func)
1689                     {
1690                         FunctionStarts::Entry function_start_entry;
1691                         function_start_entry.addr = func->base - text_base_addr;
1692                         function_starts.Append(function_start_entry);
1693                     }
1694                 }
1695             }
1696         }
1697 
1698         const size_t function_starts_count = function_starts.GetSize();
1699 
1700         const user_id_t TEXT_eh_frame_sectID = eh_frame_section_sp.get() ? eh_frame_section_sp->GetID() : NListSectionNoSection;
1701 
1702         lldb::offset_t nlist_data_offset = 0;
1703 
1704         uint32_t N_SO_index = UINT32_MAX;
1705 
1706         MachSymtabSectionInfo section_info (section_list);
1707         std::vector<uint32_t> N_FUN_indexes;
1708         std::vector<uint32_t> N_NSYM_indexes;
1709         std::vector<uint32_t> N_INCL_indexes;
1710         std::vector<uint32_t> N_BRAC_indexes;
1711         std::vector<uint32_t> N_COMM_indexes;
1712         typedef std::map <uint64_t, uint32_t> ValueToSymbolIndexMap;
1713         typedef std::map <uint32_t, uint32_t> NListIndexToSymbolIndexMap;
1714         typedef std::map <const char *, uint32_t> ConstNameToSymbolIndexMap;
1715         ValueToSymbolIndexMap N_FUN_addr_to_sym_idx;
1716         ValueToSymbolIndexMap N_STSYM_addr_to_sym_idx;
1717         ConstNameToSymbolIndexMap N_GSYM_name_to_sym_idx;
1718         // Any symbols that get merged into another will get an entry
1719         // in this map so we know
1720         NListIndexToSymbolIndexMap m_nlist_idx_to_sym_idx;
1721         uint32_t nlist_idx = 0;
1722         Symbol *symbol_ptr = NULL;
1723 
1724         uint32_t sym_idx = 0;
1725         Symbol *sym = NULL;
1726         size_t num_syms = 0;
1727         std::string memory_symbol_name;
1728         uint32_t unmapped_local_symbols_found = 0;
1729 
1730 #if defined (__APPLE__) && defined (__arm__)
1731 
1732         // Some recent builds of the dyld_shared_cache (hereafter: DSC) have been optimized by moving LOCAL
1733         // symbols out of the memory mapped portion of the DSC. The symbol information has all been retained,
1734         // but it isn't available in the normal nlist data. However, there *are* duplicate entries of *some*
1735         // LOCAL symbols in the normal nlist data. To handle this situation correctly, we must first attempt
1736         // to parse any DSC unmapped symbol information. If we find any, we set a flag that tells the normal
1737         // nlist parser to ignore all LOCAL symbols.
1738 
1739         if (m_header.flags & 0x80000000u)
1740         {
1741             // Before we can start mapping the DSC, we need to make certain the target process is actually
1742             // using the cache we can find.
1743 
1744             // Next we need to determine the correct path for the dyld shared cache.
1745 
1746             ArchSpec header_arch(eArchTypeMachO, m_header.cputype, m_header.cpusubtype);
1747             char dsc_path[PATH_MAX];
1748 
1749             snprintf(dsc_path, sizeof(dsc_path), "%s%s%s",
1750                      "/System/Library/Caches/com.apple.dyld/",  /* IPHONE_DYLD_SHARED_CACHE_DIR */
1751                      "dyld_shared_cache_",          /* DYLD_SHARED_CACHE_BASE_NAME */
1752                      header_arch.GetArchitectureName());
1753 
1754             FileSpec dsc_filespec(dsc_path, false);
1755 
1756             // We need definitions of two structures in the on-disk DSC, copy them here manually
1757             struct lldb_copy_dyld_cache_header_v0
1758             {
1759                 char        magic[16];            // e.g. "dyld_v0    i386", "dyld_v1   armv7", etc.
1760                 uint32_t    mappingOffset;        // file offset to first dyld_cache_mapping_info
1761                 uint32_t    mappingCount;         // number of dyld_cache_mapping_info entries
1762                 uint32_t    imagesOffset;
1763                 uint32_t    imagesCount;
1764                 uint64_t    dyldBaseAddress;
1765                 uint64_t    codeSignatureOffset;
1766                 uint64_t    codeSignatureSize;
1767                 uint64_t    slideInfoOffset;
1768                 uint64_t    slideInfoSize;
1769                 uint64_t    localSymbolsOffset;   // file offset of where local symbols are stored
1770                 uint64_t    localSymbolsSize;     // size of local symbols information
1771             };
1772             struct lldb_copy_dyld_cache_header_v1
1773             {
1774                 char        magic[16];            // e.g. "dyld_v0    i386", "dyld_v1   armv7", etc.
1775                 uint32_t    mappingOffset;        // file offset to first dyld_cache_mapping_info
1776                 uint32_t    mappingCount;         // number of dyld_cache_mapping_info entries
1777                 uint32_t    imagesOffset;
1778                 uint32_t    imagesCount;
1779                 uint64_t    dyldBaseAddress;
1780                 uint64_t    codeSignatureOffset;
1781                 uint64_t    codeSignatureSize;
1782                 uint64_t    slideInfoOffset;
1783                 uint64_t    slideInfoSize;
1784                 uint64_t    localSymbolsOffset;
1785                 uint64_t    localSymbolsSize;
1786                 uint8_t     uuid[16];             // v1 and above, also recorded in dyld_all_image_infos v13 and later
1787             };
1788 
1789             struct lldb_copy_dyld_cache_mapping_info
1790             {
1791                 uint64_t        address;
1792                 uint64_t        size;
1793                 uint64_t        fileOffset;
1794                 uint32_t        maxProt;
1795                 uint32_t        initProt;
1796             };
1797 
1798             struct lldb_copy_dyld_cache_local_symbols_info
1799             {
1800                 uint32_t        nlistOffset;
1801                 uint32_t        nlistCount;
1802                 uint32_t        stringsOffset;
1803                 uint32_t        stringsSize;
1804                 uint32_t        entriesOffset;
1805                 uint32_t        entriesCount;
1806             };
1807             struct lldb_copy_dyld_cache_local_symbols_entry
1808             {
1809                 uint32_t        dylibOffset;
1810                 uint32_t        nlistStartIndex;
1811                 uint32_t        nlistCount;
1812             };
1813 
1814             /* The dyld_cache_header has a pointer to the dyld_cache_local_symbols_info structure (localSymbolsOffset).
1815                The dyld_cache_local_symbols_info structure gives us three things:
1816                  1. The start and count of the nlist records in the dyld_shared_cache file
1817                  2. The start and size of the strings for these nlist records
1818                  3. The start and count of dyld_cache_local_symbols_entry entries
1819 
1820                There is one dyld_cache_local_symbols_entry per dylib/framework in the dyld shared cache.
1821                The "dylibOffset" field is the Mach-O header of this dylib/framework in the dyld shared cache.
1822                The dyld_cache_local_symbols_entry also lists the start of this dylib/framework's nlist records
1823                and the count of how many nlist records there are for this dylib/framework.
1824             */
1825 
1826             // Process the dsc header to find the unmapped symbols
1827             //
1828             // Save some VM space, do not map the entire cache in one shot.
1829 
1830             DataBufferSP dsc_data_sp;
1831             dsc_data_sp = dsc_filespec.MemoryMapFileContents(0, sizeof(struct lldb_copy_dyld_cache_header_v1));
1832 
1833             if (dsc_data_sp)
1834             {
1835                 DataExtractor dsc_header_data(dsc_data_sp, byte_order, addr_byte_size);
1836 
1837                 char version_str[17];
1838                 int version = -1;
1839                 lldb::offset_t offset = 0;
1840                 memcpy (version_str, dsc_header_data.GetData (&offset, 16), 16);
1841                 version_str[16] = '\0';
1842                 if (strncmp (version_str, "dyld_v", 6) == 0 && isdigit (version_str[6]))
1843                 {
1844                     int v;
1845                     if (::sscanf (version_str + 6, "%d", &v) == 1)
1846                     {
1847                         version = v;
1848                     }
1849                 }
1850 
1851                 UUID dsc_uuid;
1852                 if (version >= 1)
1853                 {
1854                     offset = offsetof (struct lldb_copy_dyld_cache_header_v1, uuid);
1855                     uint8_t uuid_bytes[sizeof (uuid_t)];
1856                     memcpy (uuid_bytes, dsc_header_data.GetData (&offset, sizeof (uuid_t)), sizeof (uuid_t));
1857                     dsc_uuid.SetBytes (uuid_bytes);
1858                 }
1859 
1860                 bool uuid_match = true;
1861                 if (dsc_uuid.IsValid() && process)
1862                 {
1863                     UUID shared_cache_uuid(GetProcessSharedCacheUUID(process));
1864 
1865                     if (shared_cache_uuid.IsValid() && dsc_uuid != shared_cache_uuid)
1866                     {
1867                         // The on-disk dyld_shared_cache file is not the same as the one in this
1868                         // process' memory, don't use it.
1869                         uuid_match = false;
1870                         ModuleSP module_sp (GetModule());
1871                         if (module_sp)
1872                             module_sp->ReportWarning ("process shared cache does not match on-disk dyld_shared_cache file, some symbol names will be missing.");
1873                     }
1874                 }
1875 
1876                 offset = offsetof (struct lldb_copy_dyld_cache_header_v1, mappingOffset);
1877 
1878                 uint32_t mappingOffset = dsc_header_data.GetU32(&offset);
1879 
1880                 // If the mappingOffset points to a location inside the header, we've
1881                 // opened an old dyld shared cache, and should not proceed further.
1882                 if (uuid_match && mappingOffset >= sizeof(struct lldb_copy_dyld_cache_header_v0))
1883                 {
1884 
1885                     DataBufferSP dsc_mapping_info_data_sp = dsc_filespec.MemoryMapFileContents(mappingOffset, sizeof (struct lldb_copy_dyld_cache_mapping_info));
1886                     DataExtractor dsc_mapping_info_data(dsc_mapping_info_data_sp, byte_order, addr_byte_size);
1887                     offset = 0;
1888 
1889                     // The File addresses (from the in-memory Mach-O load commands) for the shared libraries
1890                     // in the shared library cache need to be adjusted by an offset to match up with the
1891                     // dylibOffset identifying field in the dyld_cache_local_symbol_entry's.  This offset is
1892                     // recorded in mapping_offset_value.
1893                     const uint64_t mapping_offset_value = dsc_mapping_info_data.GetU64(&offset);
1894 
1895                     offset = offsetof (struct lldb_copy_dyld_cache_header_v1, localSymbolsOffset);
1896                     uint64_t localSymbolsOffset = dsc_header_data.GetU64(&offset);
1897                     uint64_t localSymbolsSize = dsc_header_data.GetU64(&offset);
1898 
1899                     if (localSymbolsOffset && localSymbolsSize)
1900                     {
1901                         // Map the local symbols
1902                         if (DataBufferSP dsc_local_symbols_data_sp = dsc_filespec.MemoryMapFileContents(localSymbolsOffset, localSymbolsSize))
1903                         {
1904                             DataExtractor dsc_local_symbols_data(dsc_local_symbols_data_sp, byte_order, addr_byte_size);
1905 
1906                             offset = 0;
1907 
1908                             // Read the local_symbols_infos struct in one shot
1909                             struct lldb_copy_dyld_cache_local_symbols_info local_symbols_info;
1910                             dsc_local_symbols_data.GetU32(&offset, &local_symbols_info.nlistOffset, 6);
1911 
1912                             SectionSP text_section_sp(section_list->FindSectionByName(GetSegmentNameTEXT()));
1913 
1914                             uint32_t header_file_offset = (text_section_sp->GetFileAddress() - mapping_offset_value);
1915 
1916                             offset = local_symbols_info.entriesOffset;
1917                             for (uint32_t entry_index = 0; entry_index < local_symbols_info.entriesCount; entry_index++)
1918                             {
1919                                 struct lldb_copy_dyld_cache_local_symbols_entry local_symbols_entry;
1920                                 local_symbols_entry.dylibOffset = dsc_local_symbols_data.GetU32(&offset);
1921                                 local_symbols_entry.nlistStartIndex = dsc_local_symbols_data.GetU32(&offset);
1922                                 local_symbols_entry.nlistCount = dsc_local_symbols_data.GetU32(&offset);
1923 
1924                                 if (header_file_offset == local_symbols_entry.dylibOffset)
1925                                 {
1926                                     unmapped_local_symbols_found = local_symbols_entry.nlistCount;
1927 
1928                                     // The normal nlist code cannot correctly size the Symbols array, we need to allocate it here.
1929                                     sym = symtab->Resize (symtab_load_command.nsyms + m_dysymtab.nindirectsyms + unmapped_local_symbols_found - m_dysymtab.nlocalsym);
1930                                     num_syms = symtab->GetNumSymbols();
1931 
1932                                     nlist_data_offset = local_symbols_info.nlistOffset + (nlist_byte_size * local_symbols_entry.nlistStartIndex);
1933                                     uint32_t string_table_offset = local_symbols_info.stringsOffset;
1934 
1935                                     for (uint32_t nlist_index = 0; nlist_index < local_symbols_entry.nlistCount; nlist_index++)
1936                                     {
1937                                         /////////////////////////////
1938                                         {
1939                                             struct nlist_64 nlist;
1940                                             if (!dsc_local_symbols_data.ValidOffsetForDataOfSize(nlist_data_offset, nlist_byte_size))
1941                                                 break;
1942 
1943                                             nlist.n_strx  = dsc_local_symbols_data.GetU32_unchecked(&nlist_data_offset);
1944                                             nlist.n_type  = dsc_local_symbols_data.GetU8_unchecked (&nlist_data_offset);
1945                                             nlist.n_sect  = dsc_local_symbols_data.GetU8_unchecked (&nlist_data_offset);
1946                                             nlist.n_desc  = dsc_local_symbols_data.GetU16_unchecked (&nlist_data_offset);
1947                                             nlist.n_value = dsc_local_symbols_data.GetAddress_unchecked (&nlist_data_offset);
1948 
1949                                             SymbolType type = eSymbolTypeInvalid;
1950                                             const char *symbol_name = dsc_local_symbols_data.PeekCStr(string_table_offset + nlist.n_strx);
1951 
1952                                             if (symbol_name == NULL)
1953                                             {
1954                                                 // No symbol should be NULL, even the symbols with no
1955                                                 // string values should have an offset zero which points
1956                                                 // to an empty C-string
1957                                                 Host::SystemLog (Host::eSystemLogError,
1958                                                                  "error: DSC unmapped local symbol[%u] has invalid string table offset 0x%x in %s, ignoring symbol\n",
1959                                                                  entry_index,
1960                                                                  nlist.n_strx,
1961                                                                  module_sp->GetFileSpec().GetPath().c_str());
1962                                                 continue;
1963                                             }
1964                                             if (symbol_name[0] == '\0')
1965                                                 symbol_name = NULL;
1966 
1967                                             const char *symbol_name_non_abi_mangled = NULL;
1968 
1969                                             SectionSP symbol_section;
1970                                             uint32_t symbol_byte_size = 0;
1971                                             bool add_nlist = true;
1972                                             bool is_debug = ((nlist.n_type & NlistMaskStab) != 0);
1973                                             bool demangled_is_synthesized = false;
1974                                             bool is_gsym = false;
1975 
1976                                             assert (sym_idx < num_syms);
1977 
1978                                             sym[sym_idx].SetDebug (is_debug);
1979 
1980                                             if (is_debug)
1981                                             {
1982                                                 switch (nlist.n_type)
1983                                                 {
1984                                                     case StabGlobalSymbol:
1985                                                         // N_GSYM -- global symbol: name,,NO_SECT,type,0
1986                                                         // Sometimes the N_GSYM value contains the address.
1987 
1988                                                         // FIXME: In the .o files, we have a GSYM and a debug symbol for all the ObjC data.  They
1989                                                         // have the same address, but we want to ensure that we always find only the real symbol,
1990                                                         // 'cause we don't currently correctly attribute the GSYM one to the ObjCClass/Ivar/MetaClass
1991                                                         // symbol type.  This is a temporary hack to make sure the ObjectiveC symbols get treated
1992                                                         // correctly.  To do this right, we should coalesce all the GSYM & global symbols that have the
1993                                                         // same address.
1994 
1995                                                         if (symbol_name && symbol_name[0] == '_' && symbol_name[1] ==  'O'
1996                                                             && (strncmp (symbol_name, "_OBJC_IVAR_$_", strlen ("_OBJC_IVAR_$_")) == 0
1997                                                                 || strncmp (symbol_name, "_OBJC_CLASS_$_", strlen ("_OBJC_CLASS_$_")) == 0
1998                                                                 || strncmp (symbol_name, "_OBJC_METACLASS_$_", strlen ("_OBJC_METACLASS_$_")) == 0))
1999                                                             add_nlist = false;
2000                                                         else
2001                                                         {
2002                                                             is_gsym = true;
2003                                                             sym[sym_idx].SetExternal(true);
2004                                                             if (nlist.n_value != 0)
2005                                                                 symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2006                                                             type = eSymbolTypeData;
2007                                                         }
2008                                                         break;
2009 
2010                                                     case StabFunctionName:
2011                                                         // N_FNAME -- procedure name (f77 kludge): name,,NO_SECT,0,0
2012                                                         type = eSymbolTypeCompiler;
2013                                                         break;
2014 
2015                                                     case StabFunction:
2016                                                         // N_FUN -- procedure: name,,n_sect,linenumber,address
2017                                                         if (symbol_name)
2018                                                         {
2019                                                             type = eSymbolTypeCode;
2020                                                             symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2021 
2022                                                             N_FUN_addr_to_sym_idx[nlist.n_value] = sym_idx;
2023                                                             // We use the current number of symbols in the symbol table in lieu of
2024                                                             // using nlist_idx in case we ever start trimming entries out
2025                                                             N_FUN_indexes.push_back(sym_idx);
2026                                                         }
2027                                                         else
2028                                                         {
2029                                                             type = eSymbolTypeCompiler;
2030 
2031                                                             if ( !N_FUN_indexes.empty() )
2032                                                             {
2033                                                                 // Copy the size of the function into the original STAB entry so we don't have
2034                                                                 // to hunt for it later
2035                                                                 symtab->SymbolAtIndex(N_FUN_indexes.back())->SetByteSize(nlist.n_value);
2036                                                                 N_FUN_indexes.pop_back();
2037                                                                 // We don't really need the end function STAB as it contains the size which
2038                                                                 // we already placed with the original symbol, so don't add it if we want a
2039                                                                 // minimal symbol table
2040                                                                 if (minimize)
2041                                                                     add_nlist = false;
2042                                                             }
2043                                                         }
2044                                                         break;
2045 
2046                                                     case StabStaticSymbol:
2047                                                         // N_STSYM -- static symbol: name,,n_sect,type,address
2048                                                         N_STSYM_addr_to_sym_idx[nlist.n_value] = sym_idx;
2049                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2050                                                         type = eSymbolTypeData;
2051                                                         break;
2052 
2053                                                     case StabLocalCommon:
2054                                                         // N_LCSYM -- .lcomm symbol: name,,n_sect,type,address
2055                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2056                                                         type = eSymbolTypeCommonBlock;
2057                                                         break;
2058 
2059                                                     case StabBeginSymbol:
2060                                                         // N_BNSYM
2061                                                         // We use the current number of symbols in the symbol table in lieu of
2062                                                         // using nlist_idx in case we ever start trimming entries out
2063                                                         if (minimize)
2064                                                         {
2065                                                             // Skip these if we want minimal symbol tables
2066                                                             add_nlist = false;
2067                                                         }
2068                                                         else
2069                                                         {
2070                                                             symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2071                                                             N_NSYM_indexes.push_back(sym_idx);
2072                                                             type = eSymbolTypeScopeBegin;
2073                                                         }
2074                                                         break;
2075 
2076                                                     case StabEndSymbol:
2077                                                         // N_ENSYM
2078                                                         // Set the size of the N_BNSYM to the terminating index of this N_ENSYM
2079                                                         // so that we can always skip the entire symbol if we need to navigate
2080                                                         // more quickly at the source level when parsing STABS
2081                                                         if (minimize)
2082                                                         {
2083                                                             // Skip these if we want minimal symbol tables
2084                                                             add_nlist = false;
2085                                                         }
2086                                                         else
2087                                                         {
2088                                                             if ( !N_NSYM_indexes.empty() )
2089                                                             {
2090                                                                 symbol_ptr = symtab->SymbolAtIndex(N_NSYM_indexes.back());
2091                                                                 symbol_ptr->SetByteSize(sym_idx + 1);
2092                                                                 symbol_ptr->SetSizeIsSibling(true);
2093                                                                 N_NSYM_indexes.pop_back();
2094                                                             }
2095                                                             type = eSymbolTypeScopeEnd;
2096                                                         }
2097                                                         break;
2098 
2099 
2100                                                     case StabSourceFileOptions:
2101                                                         // N_OPT - emitted with gcc2_compiled and in gcc source
2102                                                         type = eSymbolTypeCompiler;
2103                                                         break;
2104 
2105                                                     case StabRegisterSymbol:
2106                                                         // N_RSYM - register sym: name,,NO_SECT,type,register
2107                                                         type = eSymbolTypeVariable;
2108                                                         break;
2109 
2110                                                     case StabSourceLine:
2111                                                         // N_SLINE - src line: 0,,n_sect,linenumber,address
2112                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2113                                                         type = eSymbolTypeLineEntry;
2114                                                         break;
2115 
2116                                                     case StabStructureType:
2117                                                         // N_SSYM - structure elt: name,,NO_SECT,type,struct_offset
2118                                                         type = eSymbolTypeVariableType;
2119                                                         break;
2120 
2121                                                     case StabSourceFileName:
2122                                                         // N_SO - source file name
2123                                                         type = eSymbolTypeSourceFile;
2124                                                         if (symbol_name == NULL)
2125                                                         {
2126                                                             if (minimize)
2127                                                                 add_nlist = false;
2128                                                             if (N_SO_index != UINT32_MAX)
2129                                                             {
2130                                                                 // Set the size of the N_SO to the terminating index of this N_SO
2131                                                                 // so that we can always skip the entire N_SO if we need to navigate
2132                                                                 // more quickly at the source level when parsing STABS
2133                                                                 symbol_ptr = symtab->SymbolAtIndex(N_SO_index);
2134                                                                 symbol_ptr->SetByteSize(sym_idx + (minimize ? 0 : 1));
2135                                                                 symbol_ptr->SetSizeIsSibling(true);
2136                                                             }
2137                                                             N_NSYM_indexes.clear();
2138                                                             N_INCL_indexes.clear();
2139                                                             N_BRAC_indexes.clear();
2140                                                             N_COMM_indexes.clear();
2141                                                             N_FUN_indexes.clear();
2142                                                             N_SO_index = UINT32_MAX;
2143                                                         }
2144                                                         else
2145                                                         {
2146                                                             // We use the current number of symbols in the symbol table in lieu of
2147                                                             // using nlist_idx in case we ever start trimming entries out
2148                                                             const bool N_SO_has_full_path = symbol_name[0] == '/';
2149                                                             if (N_SO_has_full_path)
2150                                                             {
2151                                                                 if (minimize && (N_SO_index == sym_idx - 1) && ((sym_idx - 1) < num_syms))
2152                                                                 {
2153                                                                     // We have two consecutive N_SO entries where the first contains a directory
2154                                                                     // and the second contains a full path.
2155                                                                     sym[sym_idx - 1].GetMangled().SetValue(ConstString(symbol_name), false);
2156                                                                     m_nlist_idx_to_sym_idx[nlist_idx] = sym_idx - 1;
2157                                                                     add_nlist = false;
2158                                                                 }
2159                                                                 else
2160                                                                 {
2161                                                                     // This is the first entry in a N_SO that contains a directory or
2162                                                                     // a full path to the source file
2163                                                                     N_SO_index = sym_idx;
2164                                                                 }
2165                                                             }
2166                                                             else if (minimize && (N_SO_index == sym_idx - 1) && ((sym_idx - 1) < num_syms))
2167                                                             {
2168                                                                 // This is usually the second N_SO entry that contains just the filename,
2169                                                                 // so here we combine it with the first one if we are minimizing the symbol table
2170                                                                 const char *so_path = sym[sym_idx - 1].GetMangled().GetDemangledName().AsCString();
2171                                                                 if (so_path && so_path[0])
2172                                                                 {
2173                                                                     std::string full_so_path (so_path);
2174                                                                     const size_t double_slash_pos = full_so_path.find("//");
2175                                                                     if (double_slash_pos != std::string::npos)
2176                                                                     {
2177                                                                         // The linker has been generating bad N_SO entries with doubled up paths
2178                                                                         // in the format "%s%s" where the first stirng in the DW_AT_comp_dir,
2179                                                                         // and the second is the directory for the source file so you end up with
2180                                                                         // a path that looks like "/tmp/src//tmp/src/"
2181                                                                         FileSpec so_dir(so_path, false);
2182                                                                         if (!so_dir.Exists())
2183                                                                         {
2184                                                                             so_dir.SetFile(&full_so_path[double_slash_pos + 1], false);
2185                                                                             if (so_dir.Exists())
2186                                                                             {
2187                                                                                 // Trim off the incorrect path
2188                                                                                 full_so_path.erase(0, double_slash_pos + 1);
2189                                                                             }
2190                                                                         }
2191                                                                     }
2192                                                                     if (*full_so_path.rbegin() != '/')
2193                                                                         full_so_path += '/';
2194                                                                     full_so_path += symbol_name;
2195                                                                     sym[sym_idx - 1].GetMangled().SetValue(ConstString(full_so_path.c_str()), false);
2196                                                                     add_nlist = false;
2197                                                                     m_nlist_idx_to_sym_idx[nlist_idx] = sym_idx - 1;
2198                                                                 }
2199                                                             }
2200                                                             else
2201                                                             {
2202                                                                 // This could be a relative path to a N_SO
2203                                                                 N_SO_index = sym_idx;
2204                                                             }
2205                                                         }
2206                                                         break;
2207 
2208                                                     case StabObjectFileName:
2209                                                         // N_OSO - object file name: name,,0,0,st_mtime
2210                                                         type = eSymbolTypeObjectFile;
2211                                                         break;
2212 
2213                                                     case StabLocalSymbol:
2214                                                         // N_LSYM - local sym: name,,NO_SECT,type,offset
2215                                                         type = eSymbolTypeLocal;
2216                                                         break;
2217 
2218                                                         //----------------------------------------------------------------------
2219                                                         // INCL scopes
2220                                                         //----------------------------------------------------------------------
2221                                                     case StabBeginIncludeFileName:
2222                                                         // N_BINCL - include file beginning: name,,NO_SECT,0,sum
2223                                                         // We use the current number of symbols in the symbol table in lieu of
2224                                                         // using nlist_idx in case we ever start trimming entries out
2225                                                         N_INCL_indexes.push_back(sym_idx);
2226                                                         type = eSymbolTypeScopeBegin;
2227                                                         break;
2228 
2229                                                     case StabEndIncludeFile:
2230                                                         // N_EINCL - include file end: name,,NO_SECT,0,0
2231                                                         // Set the size of the N_BINCL to the terminating index of this N_EINCL
2232                                                         // so that we can always skip the entire symbol if we need to navigate
2233                                                         // more quickly at the source level when parsing STABS
2234                                                         if ( !N_INCL_indexes.empty() )
2235                                                         {
2236                                                             symbol_ptr = symtab->SymbolAtIndex(N_INCL_indexes.back());
2237                                                             symbol_ptr->SetByteSize(sym_idx + 1);
2238                                                             symbol_ptr->SetSizeIsSibling(true);
2239                                                             N_INCL_indexes.pop_back();
2240                                                         }
2241                                                         type = eSymbolTypeScopeEnd;
2242                                                         break;
2243 
2244                                                     case StabIncludeFileName:
2245                                                         // N_SOL - #included file name: name,,n_sect,0,address
2246                                                         type = eSymbolTypeHeaderFile;
2247 
2248                                                         // We currently don't use the header files on darwin
2249                                                         if (minimize)
2250                                                             add_nlist = false;
2251                                                         break;
2252 
2253                                                     case StabCompilerParameters:
2254                                                         // N_PARAMS - compiler parameters: name,,NO_SECT,0,0
2255                                                         type = eSymbolTypeCompiler;
2256                                                         break;
2257 
2258                                                     case StabCompilerVersion:
2259                                                         // N_VERSION - compiler version: name,,NO_SECT,0,0
2260                                                         type = eSymbolTypeCompiler;
2261                                                         break;
2262 
2263                                                     case StabCompilerOptLevel:
2264                                                         // N_OLEVEL - compiler -O level: name,,NO_SECT,0,0
2265                                                         type = eSymbolTypeCompiler;
2266                                                         break;
2267 
2268                                                     case StabParameter:
2269                                                         // N_PSYM - parameter: name,,NO_SECT,type,offset
2270                                                         type = eSymbolTypeVariable;
2271                                                         break;
2272 
2273                                                     case StabAlternateEntry:
2274                                                         // N_ENTRY - alternate entry: name,,n_sect,linenumber,address
2275                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2276                                                         type = eSymbolTypeLineEntry;
2277                                                         break;
2278 
2279                                                         //----------------------------------------------------------------------
2280                                                         // Left and Right Braces
2281                                                         //----------------------------------------------------------------------
2282                                                     case StabLeftBracket:
2283                                                         // N_LBRAC - left bracket: 0,,NO_SECT,nesting level,address
2284                                                         // We use the current number of symbols in the symbol table in lieu of
2285                                                         // using nlist_idx in case we ever start trimming entries out
2286                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2287                                                         N_BRAC_indexes.push_back(sym_idx);
2288                                                         type = eSymbolTypeScopeBegin;
2289                                                         break;
2290 
2291                                                     case StabRightBracket:
2292                                                         // N_RBRAC - right bracket: 0,,NO_SECT,nesting level,address
2293                                                         // Set the size of the N_LBRAC to the terminating index of this N_RBRAC
2294                                                         // so that we can always skip the entire symbol if we need to navigate
2295                                                         // more quickly at the source level when parsing STABS
2296                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2297                                                         if ( !N_BRAC_indexes.empty() )
2298                                                         {
2299                                                             symbol_ptr = symtab->SymbolAtIndex(N_BRAC_indexes.back());
2300                                                             symbol_ptr->SetByteSize(sym_idx + 1);
2301                                                             symbol_ptr->SetSizeIsSibling(true);
2302                                                             N_BRAC_indexes.pop_back();
2303                                                         }
2304                                                         type = eSymbolTypeScopeEnd;
2305                                                         break;
2306 
2307                                                     case StabDeletedIncludeFile:
2308                                                         // N_EXCL - deleted include file: name,,NO_SECT,0,sum
2309                                                         type = eSymbolTypeHeaderFile;
2310                                                         break;
2311 
2312                                                         //----------------------------------------------------------------------
2313                                                         // COMM scopes
2314                                                         //----------------------------------------------------------------------
2315                                                     case StabBeginCommon:
2316                                                         // N_BCOMM - begin common: name,,NO_SECT,0,0
2317                                                         // We use the current number of symbols in the symbol table in lieu of
2318                                                         // using nlist_idx in case we ever start trimming entries out
2319                                                         type = eSymbolTypeScopeBegin;
2320                                                         N_COMM_indexes.push_back(sym_idx);
2321                                                         break;
2322 
2323                                                     case StabEndCommonLocal:
2324                                                         // N_ECOML - end common (local name): 0,,n_sect,0,address
2325                                                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2326                                                         // Fall through
2327 
2328                                                     case StabEndCommon:
2329                                                         // N_ECOMM - end common: name,,n_sect,0,0
2330                                                         // Set the size of the N_BCOMM to the terminating index of this N_ECOMM/N_ECOML
2331                                                         // so that we can always skip the entire symbol if we need to navigate
2332                                                         // more quickly at the source level when parsing STABS
2333                                                         if ( !N_COMM_indexes.empty() )
2334                                                         {
2335                                                             symbol_ptr = symtab->SymbolAtIndex(N_COMM_indexes.back());
2336                                                             symbol_ptr->SetByteSize(sym_idx + 1);
2337                                                             symbol_ptr->SetSizeIsSibling(true);
2338                                                             N_COMM_indexes.pop_back();
2339                                                         }
2340                                                         type = eSymbolTypeScopeEnd;
2341                                                         break;
2342 
2343                                                     case StabLength:
2344                                                         // N_LENG - second stab entry with length information
2345                                                         type = eSymbolTypeAdditional;
2346                                                         break;
2347 
2348                                                     default: break;
2349                                                 }
2350                                             }
2351                                             else
2352                                             {
2353                                                 //uint8_t n_pext    = NlistMaskPrivateExternal & nlist.n_type;
2354                                                 uint8_t n_type  = NlistMaskType & nlist.n_type;
2355                                                 sym[sym_idx].SetExternal((NlistMaskExternal & nlist.n_type) != 0);
2356 
2357                                                 switch (n_type)
2358                                                 {
2359                                                     case NListTypeIndirect:         // N_INDR - Fall through
2360                                                     case NListTypePreboundUndefined:// N_PBUD - Fall through
2361                                                     case NListTypeUndefined:        // N_UNDF
2362                                                         type = eSymbolTypeUndefined;
2363                                                         break;
2364 
2365                                                     case NListTypeAbsolute:         // N_ABS
2366                                                         type = eSymbolTypeAbsolute;
2367                                                         break;
2368 
2369                                                     case NListTypeSection:          // N_SECT
2370                                                         {
2371                                                             symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2372 
2373                                                             if (symbol_section == NULL)
2374                                                             {
2375                                                                 // TODO: warn about this?
2376                                                                 add_nlist = false;
2377                                                                 break;
2378                                                             }
2379 
2380                                                             if (TEXT_eh_frame_sectID == nlist.n_sect)
2381                                                             {
2382                                                                 type = eSymbolTypeException;
2383                                                             }
2384                                                             else
2385                                                             {
2386                                                                 uint32_t section_type = symbol_section->Get() & SectionFlagMaskSectionType;
2387 
2388                                                                 switch (section_type)
2389                                                                 {
2390                                                                     case SectionTypeRegular:                     break; // regular section
2391                                                                                                                         //case SectionTypeZeroFill:                 type = eSymbolTypeData;    break; // zero fill on demand section
2392                                                                     case SectionTypeCStringLiterals:            type = eSymbolTypeData;    break; // section with only literal C strings
2393                                                                     case SectionType4ByteLiterals:              type = eSymbolTypeData;    break; // section with only 4 byte literals
2394                                                                     case SectionType8ByteLiterals:              type = eSymbolTypeData;    break; // section with only 8 byte literals
2395                                                                     case SectionTypeLiteralPointers:            type = eSymbolTypeTrampoline; break; // section with only pointers to literals
2396                                                                     case SectionTypeNonLazySymbolPointers:      type = eSymbolTypeTrampoline; break; // section with only non-lazy symbol pointers
2397                                                                     case SectionTypeLazySymbolPointers:         type = eSymbolTypeTrampoline; break; // section with only lazy symbol pointers
2398                                                                     case SectionTypeSymbolStubs:                type = eSymbolTypeTrampoline; break; // section with only symbol stubs, byte size of stub in the reserved2 field
2399                                                                     case SectionTypeModuleInitFunctionPointers: type = eSymbolTypeCode;    break; // section with only function pointers for initialization
2400                                                                     case SectionTypeModuleTermFunctionPointers: type = eSymbolTypeCode;    break; // section with only function pointers for termination
2401                                                                                                                                                   //case SectionTypeCoalesced:                type = eSymbolType;    break; // section contains symbols that are to be coalesced
2402                                                                                                                                                   //case SectionTypeZeroFillLarge:            type = eSymbolTypeData;    break; // zero fill on demand section (that can be larger than 4 gigabytes)
2403                                                                     case SectionTypeInterposing:                type = eSymbolTypeTrampoline;  break; // section with only pairs of function pointers for interposing
2404                                                                     case SectionType16ByteLiterals:             type = eSymbolTypeData;    break; // section with only 16 byte literals
2405                                                                     case SectionTypeDTraceObjectFormat:         type = eSymbolTypeInstrumentation; break;
2406                                                                     case SectionTypeLazyDylibSymbolPointers:    type = eSymbolTypeTrampoline; break;
2407                                                                     default: break;
2408                                                                 }
2409 
2410                                                                 if (type == eSymbolTypeInvalid)
2411                                                                 {
2412                                                                     const char *symbol_sect_name = symbol_section->GetName().AsCString();
2413                                                                     if (symbol_section->IsDescendant (text_section_sp.get()))
2414                                                                     {
2415                                                                         if (symbol_section->IsClear(SectionAttrUserPureInstructions |
2416                                                                                                     SectionAttrUserSelfModifyingCode |
2417                                                                                                     SectionAttrSytemSomeInstructions))
2418                                                                             type = eSymbolTypeData;
2419                                                                         else
2420                                                                             type = eSymbolTypeCode;
2421                                                                     }
2422                                                                     else if (symbol_section->IsDescendant(data_section_sp.get()))
2423                                                                     {
2424                                                                         if (symbol_sect_name && ::strstr (symbol_sect_name, "__objc") == symbol_sect_name)
2425                                                                         {
2426                                                                             type = eSymbolTypeRuntime;
2427 
2428                                                                             if (symbol_name &&
2429                                                                                 symbol_name[0] == '_' &&
2430                                                                                 symbol_name[1] == 'O' &&
2431                                                                                 symbol_name[2] == 'B')
2432                                                                             {
2433                                                                                 llvm::StringRef symbol_name_ref(symbol_name);
2434                                                                                 static const llvm::StringRef g_objc_v2_prefix_class ("_OBJC_CLASS_$_");
2435                                                                                 static const llvm::StringRef g_objc_v2_prefix_metaclass ("_OBJC_METACLASS_$_");
2436                                                                                 static const llvm::StringRef g_objc_v2_prefix_ivar ("_OBJC_IVAR_$_");
2437                                                                                 if (symbol_name_ref.startswith(g_objc_v2_prefix_class))
2438                                                                                 {
2439                                                                                     symbol_name_non_abi_mangled = symbol_name + 1;
2440                                                                                     symbol_name = symbol_name + g_objc_v2_prefix_class.size();
2441                                                                                     type = eSymbolTypeObjCClass;
2442                                                                                     demangled_is_synthesized = true;
2443                                                                                 }
2444                                                                                 else if (symbol_name_ref.startswith(g_objc_v2_prefix_metaclass))
2445                                                                                 {
2446                                                                                     symbol_name_non_abi_mangled = symbol_name + 1;
2447                                                                                     symbol_name = symbol_name + g_objc_v2_prefix_metaclass.size();
2448                                                                                     type = eSymbolTypeObjCMetaClass;
2449                                                                                     demangled_is_synthesized = true;
2450                                                                                 }
2451                                                                                 else if (symbol_name_ref.startswith(g_objc_v2_prefix_ivar))
2452                                                                                 {
2453                                                                                     symbol_name_non_abi_mangled = symbol_name + 1;
2454                                                                                     symbol_name = symbol_name + g_objc_v2_prefix_ivar.size();
2455                                                                                     type = eSymbolTypeObjCIVar;
2456                                                                                     demangled_is_synthesized = true;
2457                                                                                 }
2458                                                                             }
2459                                                                         }
2460                                                                         else if (symbol_sect_name && ::strstr (symbol_sect_name, "__gcc_except_tab") == symbol_sect_name)
2461                                                                         {
2462                                                                             type = eSymbolTypeException;
2463                                                                         }
2464                                                                         else
2465                                                                         {
2466                                                                             type = eSymbolTypeData;
2467                                                                         }
2468                                                                     }
2469                                                                     else if (symbol_sect_name && ::strstr (symbol_sect_name, "__IMPORT") == symbol_sect_name)
2470                                                                     {
2471                                                                         type = eSymbolTypeTrampoline;
2472                                                                     }
2473                                                                     else if (symbol_section->IsDescendant(objc_section_sp.get()))
2474                                                                     {
2475                                                                         type = eSymbolTypeRuntime;
2476                                                                         if (symbol_name && symbol_name[0] == '.')
2477                                                                         {
2478                                                                             llvm::StringRef symbol_name_ref(symbol_name);
2479                                                                             static const llvm::StringRef g_objc_v1_prefix_class (".objc_class_name_");
2480                                                                             if (symbol_name_ref.startswith(g_objc_v1_prefix_class))
2481                                                                             {
2482                                                                                 symbol_name_non_abi_mangled = symbol_name;
2483                                                                                 symbol_name = symbol_name + g_objc_v1_prefix_class.size();
2484                                                                                 type = eSymbolTypeObjCClass;
2485                                                                                 demangled_is_synthesized = true;
2486                                                                             }
2487                                                                         }
2488                                                                     }
2489                                                                 }
2490                                                             }
2491                                                         }
2492                                                         break;
2493                                                 }
2494                                             }
2495 
2496                                             if (add_nlist)
2497                                             {
2498                                                 uint64_t symbol_value = nlist.n_value;
2499                                                 bool symbol_name_is_mangled = false;
2500 
2501                                                 if (symbol_name_non_abi_mangled)
2502                                                 {
2503                                                     sym[sym_idx].GetMangled().SetMangledName (ConstString(symbol_name_non_abi_mangled));
2504                                                     sym[sym_idx].GetMangled().SetDemangledName (ConstString(symbol_name));
2505                                                 }
2506                                                 else
2507                                                 {
2508                                                     if (symbol_name && symbol_name[0] == '_')
2509                                                     {
2510                                                         symbol_name_is_mangled = symbol_name[1] == '_';
2511                                                         symbol_name++;  // Skip the leading underscore
2512                                                     }
2513 
2514                                                     if (symbol_name)
2515                                                     {
2516                                                         ConstString const_symbol_name(symbol_name);
2517                                                         if (is_gsym)
2518                                                             N_GSYM_name_to_sym_idx[const_symbol_name.GetCString()] = sym_idx;
2519                                                         sym[sym_idx].GetMangled().SetValue(const_symbol_name, symbol_name_is_mangled);
2520                                                     }
2521                                                 }
2522                                                 if (symbol_section)
2523                                                 {
2524                                                     const addr_t section_file_addr = symbol_section->GetFileAddress();
2525                                                     if (symbol_byte_size == 0 && function_starts_count > 0)
2526                                                     {
2527                                                         addr_t symbol_lookup_file_addr = nlist.n_value;
2528                                                         // Do an exact address match for non-ARM addresses, else get the closest since
2529                                                         // the symbol might be a thumb symbol which has an address with bit zero set
2530                                                         FunctionStarts::Entry *func_start_entry = function_starts.FindEntry (symbol_lookup_file_addr, !is_arm);
2531                                                         if (is_arm && func_start_entry)
2532                                                         {
2533                                                             // Verify that the function start address is the symbol address (ARM)
2534                                                             // or the symbol address + 1 (thumb)
2535                                                             if (func_start_entry->addr != symbol_lookup_file_addr &&
2536                                                                 func_start_entry->addr != (symbol_lookup_file_addr + 1))
2537                                                             {
2538                                                                 // Not the right entry, NULL it out...
2539                                                                 func_start_entry = NULL;
2540                                                             }
2541                                                         }
2542                                                         if (func_start_entry)
2543                                                         {
2544                                                             func_start_entry->data = true;
2545 
2546                                                             addr_t symbol_file_addr = func_start_entry->addr;
2547                                                             uint32_t symbol_flags = 0;
2548                                                             if (is_arm)
2549                                                             {
2550                                                                 if (symbol_file_addr & 1)
2551                                                                     symbol_flags = MACHO_NLIST_ARM_SYMBOL_IS_THUMB;
2552                                                                 symbol_file_addr &= 0xfffffffffffffffeull;
2553                                                             }
2554 
2555                                                             const FunctionStarts::Entry *next_func_start_entry = function_starts.FindNextEntry (func_start_entry);
2556                                                             const addr_t section_end_file_addr = section_file_addr + symbol_section->GetByteSize();
2557                                                             if (next_func_start_entry)
2558                                                             {
2559                                                                 addr_t next_symbol_file_addr = next_func_start_entry->addr;
2560                                                                 // Be sure the clear the Thumb address bit when we calculate the size
2561                                                                 // from the current and next address
2562                                                                 if (is_arm)
2563                                                                     next_symbol_file_addr &= 0xfffffffffffffffeull;
2564                                                                 symbol_byte_size = std::min<lldb::addr_t>(next_symbol_file_addr - symbol_file_addr, section_end_file_addr - symbol_file_addr);
2565                                                             }
2566                                                             else
2567                                                             {
2568                                                                 symbol_byte_size = section_end_file_addr - symbol_file_addr;
2569                                                             }
2570                                                         }
2571                                                     }
2572                                                     symbol_value -= section_file_addr;
2573                                                 }
2574 
2575                                                 if (is_debug == false)
2576                                                 {
2577                                                     if (type == eSymbolTypeCode)
2578                                                     {
2579                                                         // See if we can find a N_FUN entry for any code symbols.
2580                                                         // If we do find a match, and the name matches, then we
2581                                                         // can merge the two into just the function symbol to avoid
2582                                                         // duplicate entries in the symbol table
2583                                                         ValueToSymbolIndexMap::const_iterator pos = N_FUN_addr_to_sym_idx.find (nlist.n_value);
2584                                                         if (pos != N_FUN_addr_to_sym_idx.end())
2585                                                         {
2586                                                             if ((symbol_name_is_mangled == true && sym[sym_idx].GetMangled().GetMangledName() == sym[pos->second].GetMangled().GetMangledName()) ||
2587                                                                 (symbol_name_is_mangled == false && sym[sym_idx].GetMangled().GetDemangledName() == sym[pos->second].GetMangled().GetDemangledName()))
2588                                                             {
2589                                                                 m_nlist_idx_to_sym_idx[nlist_idx] = pos->second;
2590                                                                 // We just need the flags from the linker symbol, so put these flags
2591                                                                 // into the N_FUN flags to avoid duplicate symbols in the symbol table
2592                                                                 sym[pos->second].SetFlags (nlist.n_type << 16 | nlist.n_desc);
2593                                                                 sym[sym_idx].Clear();
2594                                                                 continue;
2595                                                             }
2596                                                         }
2597                                                     }
2598                                                     else if (type == eSymbolTypeData)
2599                                                     {
2600                                                         // See if we can find a N_STSYM entry for any data symbols.
2601                                                         // If we do find a match, and the name matches, then we
2602                                                         // can merge the two into just the Static symbol to avoid
2603                                                         // duplicate entries in the symbol table
2604                                                         ValueToSymbolIndexMap::const_iterator pos = N_STSYM_addr_to_sym_idx.find (nlist.n_value);
2605                                                         if (pos != N_STSYM_addr_to_sym_idx.end())
2606                                                         {
2607                                                             if ((symbol_name_is_mangled == true && sym[sym_idx].GetMangled().GetMangledName() == sym[pos->second].GetMangled().GetMangledName()) ||
2608                                                                 (symbol_name_is_mangled == false && sym[sym_idx].GetMangled().GetDemangledName() == sym[pos->second].GetMangled().GetDemangledName()))
2609                                                             {
2610                                                                 m_nlist_idx_to_sym_idx[nlist_idx] = pos->second;
2611                                                                 // We just need the flags from the linker symbol, so put these flags
2612                                                                 // into the N_STSYM flags to avoid duplicate symbols in the symbol table
2613                                                                 sym[pos->second].SetFlags (nlist.n_type << 16 | nlist.n_desc);
2614                                                                 sym[sym_idx].Clear();
2615                                                                 continue;
2616                                                             }
2617                                                         }
2618                                                         else
2619                                                         {
2620                                                             // Combine N_GSYM stab entries with the non stab symbol
2621                                                             ConstNameToSymbolIndexMap::const_iterator pos = N_GSYM_name_to_sym_idx.find(sym[sym_idx].GetMangled().GetMangledName().GetCString());
2622                                                             if (pos != N_GSYM_name_to_sym_idx.end())
2623                                                             {
2624                                                                 const uint32_t GSYM_sym_idx = pos->second;
2625                                                                 m_nlist_idx_to_sym_idx[nlist_idx] = GSYM_sym_idx;
2626                                                                 // Copy the address, because often the N_GSYM address has an invalid address of zero
2627                                                                 // when the global is a common symbol
2628                                                                 sym[GSYM_sym_idx].GetAddress().SetSection (symbol_section);
2629                                                                 sym[GSYM_sym_idx].GetAddress().SetOffset (symbol_value);
2630                                                                 // We just need the flags from the linker symbol, so put these flags
2631                                                                 // into the N_STSYM flags to avoid duplicate symbols in the symbol table
2632                                                                 sym[GSYM_sym_idx].SetFlags (nlist.n_type << 16 | nlist.n_desc);
2633                                                                 sym[sym_idx].Clear();
2634                                                                 continue;
2635                                                             }
2636                                                         }
2637                                                     }
2638                                                 }
2639 
2640                                                 sym[sym_idx].SetID (nlist_idx);
2641                                                 sym[sym_idx].SetType (type);
2642                                                 sym[sym_idx].GetAddress().SetSection (symbol_section);
2643                                                 sym[sym_idx].GetAddress().SetOffset (symbol_value);
2644                                                 sym[sym_idx].SetFlags (nlist.n_type << 16 | nlist.n_desc);
2645 
2646                                                 if (symbol_byte_size > 0)
2647                                                     sym[sym_idx].SetByteSize(symbol_byte_size);
2648 
2649                                                 if (demangled_is_synthesized)
2650                                                     sym[sym_idx].SetDemangledNameIsSynthesized(true);
2651                                                 ++sym_idx;
2652                                             }
2653                                             else
2654                                             {
2655                                                 sym[sym_idx].Clear();
2656                                             }
2657 
2658                                         }
2659                                         /////////////////////////////
2660                                     }
2661                                     break; // No more entries to consider
2662                                 }
2663                             }
2664                         }
2665                     }
2666                 }
2667             }
2668         }
2669 
2670         // Must reset this in case it was mutated above!
2671         nlist_data_offset = 0;
2672 #endif
2673 
2674         // If the sym array was not created while parsing the DSC unmapped
2675         // symbols, create it now.
2676         if (sym == NULL)
2677         {
2678             sym = symtab->Resize (symtab_load_command.nsyms + m_dysymtab.nindirectsyms);
2679             num_syms = symtab->GetNumSymbols();
2680         }
2681 
2682         if (unmapped_local_symbols_found)
2683         {
2684             assert(m_dysymtab.ilocalsym == 0);
2685             nlist_data_offset += (m_dysymtab.nlocalsym * nlist_byte_size);
2686             nlist_idx = m_dysymtab.nlocalsym;
2687         }
2688         else
2689         {
2690             nlist_idx = 0;
2691         }
2692 
2693         for (; nlist_idx < symtab_load_command.nsyms; ++nlist_idx)
2694         {
2695             struct nlist_64 nlist;
2696             if (!nlist_data.ValidOffsetForDataOfSize(nlist_data_offset, nlist_byte_size))
2697                 break;
2698 
2699             nlist.n_strx  = nlist_data.GetU32_unchecked(&nlist_data_offset);
2700             nlist.n_type  = nlist_data.GetU8_unchecked (&nlist_data_offset);
2701             nlist.n_sect  = nlist_data.GetU8_unchecked (&nlist_data_offset);
2702             nlist.n_desc  = nlist_data.GetU16_unchecked (&nlist_data_offset);
2703             nlist.n_value = nlist_data.GetAddress_unchecked (&nlist_data_offset);
2704 
2705             SymbolType type = eSymbolTypeInvalid;
2706             const char *symbol_name = NULL;
2707 
2708             if (have_strtab_data)
2709             {
2710                 symbol_name = strtab_data.PeekCStr(nlist.n_strx);
2711 
2712                 if (symbol_name == NULL)
2713                 {
2714                     // No symbol should be NULL, even the symbols with no
2715                     // string values should have an offset zero which points
2716                     // to an empty C-string
2717                     Host::SystemLog (Host::eSystemLogError,
2718                                      "error: symbol[%u] has invalid string table offset 0x%x in %s, ignoring symbol\n",
2719                                      nlist_idx,
2720                                      nlist.n_strx,
2721                                      module_sp->GetFileSpec().GetPath().c_str());
2722                     continue;
2723                 }
2724                 if (symbol_name[0] == '\0')
2725                     symbol_name = NULL;
2726             }
2727             else
2728             {
2729                 const addr_t str_addr = strtab_addr + nlist.n_strx;
2730                 Error str_error;
2731                 if (process->ReadCStringFromMemory(str_addr, memory_symbol_name, str_error))
2732                     symbol_name = memory_symbol_name.c_str();
2733             }
2734             const char *symbol_name_non_abi_mangled = NULL;
2735 
2736             SectionSP symbol_section;
2737             lldb::addr_t symbol_byte_size = 0;
2738             bool add_nlist = true;
2739             bool is_gsym = false;
2740             bool is_debug = ((nlist.n_type & NlistMaskStab) != 0);
2741             bool demangled_is_synthesized = false;
2742 
2743             assert (sym_idx < num_syms);
2744 
2745             sym[sym_idx].SetDebug (is_debug);
2746 
2747             if (is_debug)
2748             {
2749                 switch (nlist.n_type)
2750                 {
2751                 case StabGlobalSymbol:
2752                     // N_GSYM -- global symbol: name,,NO_SECT,type,0
2753                     // Sometimes the N_GSYM value contains the address.
2754 
2755                     // FIXME: In the .o files, we have a GSYM and a debug symbol for all the ObjC data.  They
2756                     // have the same address, but we want to ensure that we always find only the real symbol,
2757                     // 'cause we don't currently correctly attribute the GSYM one to the ObjCClass/Ivar/MetaClass
2758                     // symbol type.  This is a temporary hack to make sure the ObjectiveC symbols get treated
2759                     // correctly.  To do this right, we should coalesce all the GSYM & global symbols that have the
2760                     // same address.
2761 
2762                     if (symbol_name && symbol_name[0] == '_' && symbol_name[1] ==  'O'
2763                         && (strncmp (symbol_name, "_OBJC_IVAR_$_", strlen ("_OBJC_IVAR_$_")) == 0
2764                             || strncmp (symbol_name, "_OBJC_CLASS_$_", strlen ("_OBJC_CLASS_$_")) == 0
2765                             || strncmp (symbol_name, "_OBJC_METACLASS_$_", strlen ("_OBJC_METACLASS_$_")) == 0))
2766                         add_nlist = false;
2767                     else
2768                     {
2769                         is_gsym = true;
2770                         sym[sym_idx].SetExternal(true);
2771                         if (nlist.n_value != 0)
2772                             symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2773                         type = eSymbolTypeData;
2774                     }
2775                     break;
2776 
2777                 case StabFunctionName:
2778                     // N_FNAME -- procedure name (f77 kludge): name,,NO_SECT,0,0
2779                     type = eSymbolTypeCompiler;
2780                     break;
2781 
2782                 case StabFunction:
2783                     // N_FUN -- procedure: name,,n_sect,linenumber,address
2784                     if (symbol_name)
2785                     {
2786                         type = eSymbolTypeCode;
2787                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2788 
2789                         N_FUN_addr_to_sym_idx[nlist.n_value] = sym_idx;
2790                         // We use the current number of symbols in the symbol table in lieu of
2791                         // using nlist_idx in case we ever start trimming entries out
2792                         N_FUN_indexes.push_back(sym_idx);
2793                     }
2794                     else
2795                     {
2796                         type = eSymbolTypeCompiler;
2797 
2798                         if ( !N_FUN_indexes.empty() )
2799                         {
2800                             // Copy the size of the function into the original STAB entry so we don't have
2801                             // to hunt for it later
2802                             symtab->SymbolAtIndex(N_FUN_indexes.back())->SetByteSize(nlist.n_value);
2803                             N_FUN_indexes.pop_back();
2804                             // We don't really need the end function STAB as it contains the size which
2805                             // we already placed with the original symbol, so don't add it if we want a
2806                             // minimal symbol table
2807                             if (minimize)
2808                                 add_nlist = false;
2809                         }
2810                     }
2811                     break;
2812 
2813                 case StabStaticSymbol:
2814                     // N_STSYM -- static symbol: name,,n_sect,type,address
2815                     N_STSYM_addr_to_sym_idx[nlist.n_value] = sym_idx;
2816                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2817                     type = eSymbolTypeData;
2818                     break;
2819 
2820                 case StabLocalCommon:
2821                     // N_LCSYM -- .lcomm symbol: name,,n_sect,type,address
2822                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2823                     type = eSymbolTypeCommonBlock;
2824                     break;
2825 
2826                 case StabBeginSymbol:
2827                     // N_BNSYM
2828                     // We use the current number of symbols in the symbol table in lieu of
2829                     // using nlist_idx in case we ever start trimming entries out
2830                     if (minimize)
2831                     {
2832                         // Skip these if we want minimal symbol tables
2833                         add_nlist = false;
2834                     }
2835                     else
2836                     {
2837                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2838                         N_NSYM_indexes.push_back(sym_idx);
2839                         type = eSymbolTypeScopeBegin;
2840                     }
2841                     break;
2842 
2843                 case StabEndSymbol:
2844                     // N_ENSYM
2845                     // Set the size of the N_BNSYM to the terminating index of this N_ENSYM
2846                     // so that we can always skip the entire symbol if we need to navigate
2847                     // more quickly at the source level when parsing STABS
2848                     if (minimize)
2849                     {
2850                         // Skip these if we want minimal symbol tables
2851                         add_nlist = false;
2852                     }
2853                     else
2854                     {
2855                         if ( !N_NSYM_indexes.empty() )
2856                         {
2857                             symbol_ptr = symtab->SymbolAtIndex(N_NSYM_indexes.back());
2858                             symbol_ptr->SetByteSize(sym_idx + 1);
2859                             symbol_ptr->SetSizeIsSibling(true);
2860                             N_NSYM_indexes.pop_back();
2861                         }
2862                         type = eSymbolTypeScopeEnd;
2863                     }
2864                     break;
2865 
2866 
2867                 case StabSourceFileOptions:
2868                     // N_OPT - emitted with gcc2_compiled and in gcc source
2869                     type = eSymbolTypeCompiler;
2870                     break;
2871 
2872                 case StabRegisterSymbol:
2873                     // N_RSYM - register sym: name,,NO_SECT,type,register
2874                     type = eSymbolTypeVariable;
2875                     break;
2876 
2877                 case StabSourceLine:
2878                     // N_SLINE - src line: 0,,n_sect,linenumber,address
2879                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
2880                     type = eSymbolTypeLineEntry;
2881                     break;
2882 
2883                 case StabStructureType:
2884                     // N_SSYM - structure elt: name,,NO_SECT,type,struct_offset
2885                     type = eSymbolTypeVariableType;
2886                     break;
2887 
2888                 case StabSourceFileName:
2889                     // N_SO - source file name
2890                     type = eSymbolTypeSourceFile;
2891                     if (symbol_name == NULL)
2892                     {
2893                         if (minimize)
2894                             add_nlist = false;
2895                         if (N_SO_index != UINT32_MAX)
2896                         {
2897                             // Set the size of the N_SO to the terminating index of this N_SO
2898                             // so that we can always skip the entire N_SO if we need to navigate
2899                             // more quickly at the source level when parsing STABS
2900                             symbol_ptr = symtab->SymbolAtIndex(N_SO_index);
2901                             symbol_ptr->SetByteSize(sym_idx + (minimize ? 0 : 1));
2902                             symbol_ptr->SetSizeIsSibling(true);
2903                         }
2904                         N_NSYM_indexes.clear();
2905                         N_INCL_indexes.clear();
2906                         N_BRAC_indexes.clear();
2907                         N_COMM_indexes.clear();
2908                         N_FUN_indexes.clear();
2909                         N_SO_index = UINT32_MAX;
2910                     }
2911                     else
2912                     {
2913                         // We use the current number of symbols in the symbol table in lieu of
2914                         // using nlist_idx in case we ever start trimming entries out
2915                         const bool N_SO_has_full_path = symbol_name[0] == '/';
2916                         if (N_SO_has_full_path)
2917                         {
2918                             if (minimize && (N_SO_index == sym_idx - 1) && ((sym_idx - 1) < num_syms))
2919                             {
2920                                 // We have two consecutive N_SO entries where the first contains a directory
2921                                 // and the second contains a full path.
2922                                 sym[sym_idx - 1].GetMangled().SetValue(ConstString(symbol_name), false);
2923                                 m_nlist_idx_to_sym_idx[nlist_idx] = sym_idx - 1;
2924                                 add_nlist = false;
2925                             }
2926                             else
2927                             {
2928                                 // This is the first entry in a N_SO that contains a directory or
2929                                 // a full path to the source file
2930                                 N_SO_index = sym_idx;
2931                             }
2932                         }
2933                         else if (minimize && (N_SO_index == sym_idx - 1) && ((sym_idx - 1) < num_syms))
2934                         {
2935                             // This is usually the second N_SO entry that contains just the filename,
2936                             // so here we combine it with the first one if we are minimizing the symbol table
2937                             const char *so_path = sym[sym_idx - 1].GetMangled().GetDemangledName().AsCString();
2938                             if (so_path && so_path[0])
2939                             {
2940                                 std::string full_so_path (so_path);
2941                                 const size_t double_slash_pos = full_so_path.find("//");
2942                                 if (double_slash_pos != std::string::npos)
2943                                 {
2944                                     // The linker has been generating bad N_SO entries with doubled up paths
2945                                     // in the format "%s%s" where the first stirng in the DW_AT_comp_dir,
2946                                     // and the second is the directory for the source file so you end up with
2947                                     // a path that looks like "/tmp/src//tmp/src/"
2948                                     FileSpec so_dir(so_path, false);
2949                                     if (!so_dir.Exists())
2950                                     {
2951                                         so_dir.SetFile(&full_so_path[double_slash_pos + 1], false);
2952                                         if (so_dir.Exists())
2953                                         {
2954                                             // Trim off the incorrect path
2955                                             full_so_path.erase(0, double_slash_pos + 1);
2956                                         }
2957                                     }
2958                                 }
2959                                 if (*full_so_path.rbegin() != '/')
2960                                     full_so_path += '/';
2961                                 full_so_path += symbol_name;
2962                                 sym[sym_idx - 1].GetMangled().SetValue(ConstString(full_so_path.c_str()), false);
2963                                 add_nlist = false;
2964                                 m_nlist_idx_to_sym_idx[nlist_idx] = sym_idx - 1;
2965                             }
2966                         }
2967                         else
2968                         {
2969                             // This could be a relative path to a N_SO
2970                             N_SO_index = sym_idx;
2971                         }
2972                     }
2973 
2974                     break;
2975 
2976                 case StabObjectFileName:
2977                     // N_OSO - object file name: name,,0,0,st_mtime
2978                     type = eSymbolTypeObjectFile;
2979                     break;
2980 
2981                 case StabLocalSymbol:
2982                     // N_LSYM - local sym: name,,NO_SECT,type,offset
2983                     type = eSymbolTypeLocal;
2984                     break;
2985 
2986                 //----------------------------------------------------------------------
2987                 // INCL scopes
2988                 //----------------------------------------------------------------------
2989                 case StabBeginIncludeFileName:
2990                     // N_BINCL - include file beginning: name,,NO_SECT,0,sum
2991                     // We use the current number of symbols in the symbol table in lieu of
2992                     // using nlist_idx in case we ever start trimming entries out
2993                     N_INCL_indexes.push_back(sym_idx);
2994                     type = eSymbolTypeScopeBegin;
2995                     break;
2996 
2997                 case StabEndIncludeFile:
2998                     // N_EINCL - include file end: name,,NO_SECT,0,0
2999                     // Set the size of the N_BINCL to the terminating index of this N_EINCL
3000                     // so that we can always skip the entire symbol if we need to navigate
3001                     // more quickly at the source level when parsing STABS
3002                     if ( !N_INCL_indexes.empty() )
3003                     {
3004                         symbol_ptr = symtab->SymbolAtIndex(N_INCL_indexes.back());
3005                         symbol_ptr->SetByteSize(sym_idx + 1);
3006                         symbol_ptr->SetSizeIsSibling(true);
3007                         N_INCL_indexes.pop_back();
3008                     }
3009                     type = eSymbolTypeScopeEnd;
3010                     break;
3011 
3012                 case StabIncludeFileName:
3013                     // N_SOL - #included file name: name,,n_sect,0,address
3014                     type = eSymbolTypeHeaderFile;
3015 
3016                     // We currently don't use the header files on darwin
3017                     if (minimize)
3018                         add_nlist = false;
3019                     break;
3020 
3021                 case StabCompilerParameters:
3022                     // N_PARAMS - compiler parameters: name,,NO_SECT,0,0
3023                     type = eSymbolTypeCompiler;
3024                     break;
3025 
3026                 case StabCompilerVersion:
3027                     // N_VERSION - compiler version: name,,NO_SECT,0,0
3028                     type = eSymbolTypeCompiler;
3029                     break;
3030 
3031                 case StabCompilerOptLevel:
3032                     // N_OLEVEL - compiler -O level: name,,NO_SECT,0,0
3033                     type = eSymbolTypeCompiler;
3034                     break;
3035 
3036                 case StabParameter:
3037                     // N_PSYM - parameter: name,,NO_SECT,type,offset
3038                     type = eSymbolTypeVariable;
3039                     break;
3040 
3041                 case StabAlternateEntry:
3042                     // N_ENTRY - alternate entry: name,,n_sect,linenumber,address
3043                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
3044                     type = eSymbolTypeLineEntry;
3045                     break;
3046 
3047                 //----------------------------------------------------------------------
3048                 // Left and Right Braces
3049                 //----------------------------------------------------------------------
3050                 case StabLeftBracket:
3051                     // N_LBRAC - left bracket: 0,,NO_SECT,nesting level,address
3052                     // We use the current number of symbols in the symbol table in lieu of
3053                     // using nlist_idx in case we ever start trimming entries out
3054                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
3055                     N_BRAC_indexes.push_back(sym_idx);
3056                     type = eSymbolTypeScopeBegin;
3057                     break;
3058 
3059                 case StabRightBracket:
3060                     // N_RBRAC - right bracket: 0,,NO_SECT,nesting level,address
3061                     // Set the size of the N_LBRAC to the terminating index of this N_RBRAC
3062                     // so that we can always skip the entire symbol if we need to navigate
3063                     // more quickly at the source level when parsing STABS
3064                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
3065                     if ( !N_BRAC_indexes.empty() )
3066                     {
3067                         symbol_ptr = symtab->SymbolAtIndex(N_BRAC_indexes.back());
3068                         symbol_ptr->SetByteSize(sym_idx + 1);
3069                         symbol_ptr->SetSizeIsSibling(true);
3070                         N_BRAC_indexes.pop_back();
3071                     }
3072                     type = eSymbolTypeScopeEnd;
3073                     break;
3074 
3075                 case StabDeletedIncludeFile:
3076                     // N_EXCL - deleted include file: name,,NO_SECT,0,sum
3077                     type = eSymbolTypeHeaderFile;
3078                     break;
3079 
3080                 //----------------------------------------------------------------------
3081                 // COMM scopes
3082                 //----------------------------------------------------------------------
3083                 case StabBeginCommon:
3084                     // N_BCOMM - begin common: name,,NO_SECT,0,0
3085                     // We use the current number of symbols in the symbol table in lieu of
3086                     // using nlist_idx in case we ever start trimming entries out
3087                     type = eSymbolTypeScopeBegin;
3088                     N_COMM_indexes.push_back(sym_idx);
3089                     break;
3090 
3091                 case StabEndCommonLocal:
3092                     // N_ECOML - end common (local name): 0,,n_sect,0,address
3093                     symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
3094                     // Fall through
3095 
3096                 case StabEndCommon:
3097                     // N_ECOMM - end common: name,,n_sect,0,0
3098                     // Set the size of the N_BCOMM to the terminating index of this N_ECOMM/N_ECOML
3099                     // so that we can always skip the entire symbol if we need to navigate
3100                     // more quickly at the source level when parsing STABS
3101                     if ( !N_COMM_indexes.empty() )
3102                     {
3103                         symbol_ptr = symtab->SymbolAtIndex(N_COMM_indexes.back());
3104                         symbol_ptr->SetByteSize(sym_idx + 1);
3105                         symbol_ptr->SetSizeIsSibling(true);
3106                         N_COMM_indexes.pop_back();
3107                     }
3108                     type = eSymbolTypeScopeEnd;
3109                     break;
3110 
3111                 case StabLength:
3112                     // N_LENG - second stab entry with length information
3113                     type = eSymbolTypeAdditional;
3114                     break;
3115 
3116                 default: break;
3117                 }
3118             }
3119             else
3120             {
3121                 //uint8_t n_pext    = NlistMaskPrivateExternal & nlist.n_type;
3122                 uint8_t n_type  = NlistMaskType & nlist.n_type;
3123                 sym[sym_idx].SetExternal((NlistMaskExternal & nlist.n_type) != 0);
3124 
3125                 switch (n_type)
3126                 {
3127                 case NListTypeIndirect:         // N_INDR - Fall through
3128                 case NListTypePreboundUndefined:// N_PBUD - Fall through
3129                 case NListTypeUndefined:        // N_UNDF
3130                     type = eSymbolTypeUndefined;
3131                     break;
3132 
3133                 case NListTypeAbsolute:         // N_ABS
3134                     type = eSymbolTypeAbsolute;
3135                     break;
3136 
3137                 case NListTypeSection:          // N_SECT
3138                     {
3139                         symbol_section = section_info.GetSection (nlist.n_sect, nlist.n_value);
3140 
3141                         if (!symbol_section)
3142                         {
3143                             // TODO: warn about this?
3144                             add_nlist = false;
3145                             break;
3146                         }
3147 
3148                         if (TEXT_eh_frame_sectID == nlist.n_sect)
3149                         {
3150                             type = eSymbolTypeException;
3151                         }
3152                         else
3153                         {
3154                             uint32_t section_type = symbol_section->Get() & SectionFlagMaskSectionType;
3155 
3156                             switch (section_type)
3157                             {
3158                             case SectionTypeRegular:                     break; // regular section
3159                             //case SectionTypeZeroFill:                 type = eSymbolTypeData;    break; // zero fill on demand section
3160                             case SectionTypeCStringLiterals:            type = eSymbolTypeData;    break; // section with only literal C strings
3161                             case SectionType4ByteLiterals:              type = eSymbolTypeData;    break; // section with only 4 byte literals
3162                             case SectionType8ByteLiterals:              type = eSymbolTypeData;    break; // section with only 8 byte literals
3163                             case SectionTypeLiteralPointers:            type = eSymbolTypeTrampoline; break; // section with only pointers to literals
3164                             case SectionTypeNonLazySymbolPointers:      type = eSymbolTypeTrampoline; break; // section with only non-lazy symbol pointers
3165                             case SectionTypeLazySymbolPointers:         type = eSymbolTypeTrampoline; break; // section with only lazy symbol pointers
3166                             case SectionTypeSymbolStubs:                type = eSymbolTypeTrampoline; break; // section with only symbol stubs, byte size of stub in the reserved2 field
3167                             case SectionTypeModuleInitFunctionPointers: type = eSymbolTypeCode;    break; // section with only function pointers for initialization
3168                             case SectionTypeModuleTermFunctionPointers: type = eSymbolTypeCode;    break; // section with only function pointers for termination
3169                             //case SectionTypeCoalesced:                type = eSymbolType;    break; // section contains symbols that are to be coalesced
3170                             //case SectionTypeZeroFillLarge:            type = eSymbolTypeData;    break; // zero fill on demand section (that can be larger than 4 gigabytes)
3171                             case SectionTypeInterposing:                type = eSymbolTypeTrampoline;  break; // section with only pairs of function pointers for interposing
3172                             case SectionType16ByteLiterals:             type = eSymbolTypeData;    break; // section with only 16 byte literals
3173                             case SectionTypeDTraceObjectFormat:         type = eSymbolTypeInstrumentation; break;
3174                             case SectionTypeLazyDylibSymbolPointers:    type = eSymbolTypeTrampoline; break;
3175                             default: break;
3176                             }
3177 
3178                             if (type == eSymbolTypeInvalid)
3179                             {
3180                                 const char *symbol_sect_name = symbol_section->GetName().AsCString();
3181                                 if (symbol_section->IsDescendant (text_section_sp.get()))
3182                                 {
3183                                     if (symbol_section->IsClear(SectionAttrUserPureInstructions |
3184                                                                 SectionAttrUserSelfModifyingCode |
3185                                                                 SectionAttrSytemSomeInstructions))
3186                                         type = eSymbolTypeData;
3187                                     else
3188                                         type = eSymbolTypeCode;
3189                                 }
3190                                 else
3191                                 if (symbol_section->IsDescendant(data_section_sp.get()))
3192                                 {
3193                                     if (symbol_sect_name && ::strstr (symbol_sect_name, "__objc") == symbol_sect_name)
3194                                     {
3195                                         type = eSymbolTypeRuntime;
3196 
3197                                         if (symbol_name &&
3198                                             symbol_name[0] == '_' &&
3199                                             symbol_name[1] == 'O' &&
3200                                             symbol_name[2] == 'B')
3201                                         {
3202                                             llvm::StringRef symbol_name_ref(symbol_name);
3203                                             static const llvm::StringRef g_objc_v2_prefix_class ("_OBJC_CLASS_$_");
3204                                             static const llvm::StringRef g_objc_v2_prefix_metaclass ("_OBJC_METACLASS_$_");
3205                                             static const llvm::StringRef g_objc_v2_prefix_ivar ("_OBJC_IVAR_$_");
3206                                             if (symbol_name_ref.startswith(g_objc_v2_prefix_class))
3207                                             {
3208                                                 symbol_name_non_abi_mangled = symbol_name + 1;
3209                                                 symbol_name = symbol_name + g_objc_v2_prefix_class.size();
3210                                                 type = eSymbolTypeObjCClass;
3211                                                 demangled_is_synthesized = true;
3212                                             }
3213                                             else if (symbol_name_ref.startswith(g_objc_v2_prefix_metaclass))
3214                                             {
3215                                                 symbol_name_non_abi_mangled = symbol_name + 1;
3216                                                 symbol_name = symbol_name + g_objc_v2_prefix_metaclass.size();
3217                                                 type = eSymbolTypeObjCMetaClass;
3218                                                 demangled_is_synthesized = true;
3219                                             }
3220                                             else if (symbol_name_ref.startswith(g_objc_v2_prefix_ivar))
3221                                             {
3222                                                 symbol_name_non_abi_mangled = symbol_name + 1;
3223                                                 symbol_name = symbol_name + g_objc_v2_prefix_ivar.size();
3224                                                 type = eSymbolTypeObjCIVar;
3225                                                 demangled_is_synthesized = true;
3226                                             }
3227                                         }
3228                                     }
3229                                     else
3230                                     if (symbol_sect_name && ::strstr (symbol_sect_name, "__gcc_except_tab") == symbol_sect_name)
3231                                     {
3232                                         type = eSymbolTypeException;
3233                                     }
3234                                     else
3235                                     {
3236                                         type = eSymbolTypeData;
3237                                     }
3238                                 }
3239                                 else
3240                                 if (symbol_sect_name && ::strstr (symbol_sect_name, "__IMPORT") == symbol_sect_name)
3241                                 {
3242                                     type = eSymbolTypeTrampoline;
3243                                 }
3244                                 else
3245                                 if (symbol_section->IsDescendant(objc_section_sp.get()))
3246                                 {
3247                                     type = eSymbolTypeRuntime;
3248                                     if (symbol_name && symbol_name[0] == '.')
3249                                     {
3250                                         llvm::StringRef symbol_name_ref(symbol_name);
3251                                         static const llvm::StringRef g_objc_v1_prefix_class (".objc_class_name_");
3252                                         if (symbol_name_ref.startswith(g_objc_v1_prefix_class))
3253                                         {
3254                                             symbol_name_non_abi_mangled = symbol_name;
3255                                             symbol_name = symbol_name + g_objc_v1_prefix_class.size();
3256                                             type = eSymbolTypeObjCClass;
3257                                             demangled_is_synthesized = true;
3258                                         }
3259                                     }
3260                                 }
3261                             }
3262                         }
3263                     }
3264                     break;
3265                 }
3266             }
3267 
3268             if (add_nlist)
3269             {
3270                 uint64_t symbol_value = nlist.n_value;
3271                 bool symbol_name_is_mangled = false;
3272 
3273                 if (symbol_name_non_abi_mangled)
3274                 {
3275                     sym[sym_idx].GetMangled().SetMangledName (ConstString(symbol_name_non_abi_mangled));
3276                     sym[sym_idx].GetMangled().SetDemangledName (ConstString(symbol_name));
3277                 }
3278                 else
3279                 {
3280                     if (symbol_name && symbol_name[0] == '_')
3281                     {
3282                         symbol_name_is_mangled = symbol_name[1] == '_';
3283                         symbol_name++;  // Skip the leading underscore
3284                     }
3285 
3286                     if (symbol_name)
3287                     {
3288                         ConstString const_symbol_name(symbol_name);
3289                         if (is_gsym)
3290                             N_GSYM_name_to_sym_idx[const_symbol_name.GetCString()] = sym_idx;
3291                         sym[sym_idx].GetMangled().SetValue(const_symbol_name, symbol_name_is_mangled);
3292                     }
3293                 }
3294                 if (symbol_section)
3295                 {
3296                     const addr_t section_file_addr = symbol_section->GetFileAddress();
3297                     if (symbol_byte_size == 0 && function_starts_count > 0)
3298                     {
3299                         addr_t symbol_lookup_file_addr = nlist.n_value;
3300                         // Do an exact address match for non-ARM addresses, else get the closest since
3301                         // the symbol might be a thumb symbol which has an address with bit zero set
3302                         FunctionStarts::Entry *func_start_entry = function_starts.FindEntry (symbol_lookup_file_addr, !is_arm);
3303                         if (is_arm && func_start_entry)
3304                         {
3305                             // Verify that the function start address is the symbol address (ARM)
3306                             // or the symbol address + 1 (thumb)
3307                             if (func_start_entry->addr != symbol_lookup_file_addr &&
3308                                 func_start_entry->addr != (symbol_lookup_file_addr + 1))
3309                             {
3310                                 // Not the right entry, NULL it out...
3311                                 func_start_entry = NULL;
3312                             }
3313                         }
3314                         if (func_start_entry)
3315                         {
3316                             func_start_entry->data = true;
3317 
3318                             addr_t symbol_file_addr = func_start_entry->addr;
3319                             if (is_arm)
3320                                 symbol_file_addr &= 0xfffffffffffffffeull;
3321 
3322                             const FunctionStarts::Entry *next_func_start_entry = function_starts.FindNextEntry (func_start_entry);
3323                             const addr_t section_end_file_addr = section_file_addr + symbol_section->GetByteSize();
3324                             if (next_func_start_entry)
3325                             {
3326                                 addr_t next_symbol_file_addr = next_func_start_entry->addr;
3327                                 // Be sure the clear the Thumb address bit when we calculate the size
3328                                 // from the current and next address
3329                                 if (is_arm)
3330                                     next_symbol_file_addr &= 0xfffffffffffffffeull;
3331                                 symbol_byte_size = std::min<lldb::addr_t>(next_symbol_file_addr - symbol_file_addr, section_end_file_addr - symbol_file_addr);
3332                             }
3333                             else
3334                             {
3335                                 symbol_byte_size = section_end_file_addr - symbol_file_addr;
3336                             }
3337                         }
3338                     }
3339                     symbol_value -= section_file_addr;
3340                 }
3341 
3342                 if (is_debug == false)
3343                 {
3344                     if (type == eSymbolTypeCode)
3345                     {
3346                         // See if we can find a N_FUN entry for any code symbols.
3347                         // If we do find a match, and the name matches, then we
3348                         // can merge the two into just the function symbol to avoid
3349                         // duplicate entries in the symbol table
3350                         ValueToSymbolIndexMap::const_iterator pos = N_FUN_addr_to_sym_idx.find (nlist.n_value);
3351                         if (pos != N_FUN_addr_to_sym_idx.end())
3352                         {
3353                             if ((symbol_name_is_mangled == true && sym[sym_idx].GetMangled().GetMangledName() == sym[pos->second].GetMangled().GetMangledName()) ||
3354                                 (symbol_name_is_mangled == false && sym[sym_idx].GetMangled().GetDemangledName() == sym[pos->second].GetMangled().GetDemangledName()))
3355                             {
3356                                 m_nlist_idx_to_sym_idx[nlist_idx] = pos->second;
3357                                 // We just need the flags from the linker symbol, so put these flags
3358                                 // into the N_FUN flags to avoid duplicate symbols in the symbol table
3359                                 sym[pos->second].SetFlags (nlist.n_type << 16 | nlist.n_desc);
3360                                 sym[sym_idx].Clear();
3361                                 continue;
3362                             }
3363                         }
3364                     }
3365                     else if (type == eSymbolTypeData)
3366                     {
3367                         // See if we can find a N_STSYM entry for any data symbols.
3368                         // If we do find a match, and the name matches, then we
3369                         // can merge the two into just the Static symbol to avoid
3370                         // duplicate entries in the symbol table
3371                         ValueToSymbolIndexMap::const_iterator pos = N_STSYM_addr_to_sym_idx.find (nlist.n_value);
3372                         if (pos != N_STSYM_addr_to_sym_idx.end())
3373                         {
3374                             if ((symbol_name_is_mangled == true && sym[sym_idx].GetMangled().GetMangledName() == sym[pos->second].GetMangled().GetMangledName()) ||
3375                                 (symbol_name_is_mangled == false && sym[sym_idx].GetMangled().GetDemangledName() == sym[pos->second].GetMangled().GetDemangledName()))
3376                             {
3377                                 m_nlist_idx_to_sym_idx[nlist_idx] = pos->second;
3378                                 // We just need the flags from the linker symbol, so put these flags
3379                                 // into the N_STSYM flags to avoid duplicate symbols in the symbol table
3380                                 sym[pos->second].SetFlags (nlist.n_type << 16 | nlist.n_desc);
3381                                 sym[sym_idx].Clear();
3382                                 continue;
3383                             }
3384                         }
3385                         else
3386                         {
3387                             // Combine N_GSYM stab entries with the non stab symbol
3388                             ConstNameToSymbolIndexMap::const_iterator pos = N_GSYM_name_to_sym_idx.find(sym[sym_idx].GetMangled().GetMangledName().GetCString());
3389                             if (pos != N_GSYM_name_to_sym_idx.end())
3390                             {
3391                                 const uint32_t GSYM_sym_idx = pos->second;
3392                                 m_nlist_idx_to_sym_idx[nlist_idx] = GSYM_sym_idx;
3393                                 // Copy the address, because often the N_GSYM address has an invalid address of zero
3394                                 // when the global is a common symbol
3395                                 sym[GSYM_sym_idx].GetAddress().SetSection (symbol_section);
3396                                 sym[GSYM_sym_idx].GetAddress().SetOffset (symbol_value);
3397                                 // We just need the flags from the linker symbol, so put these flags
3398                                 // into the N_STSYM flags to avoid duplicate symbols in the symbol table
3399                                 sym[GSYM_sym_idx].SetFlags (nlist.n_type << 16 | nlist.n_desc);
3400                                 sym[sym_idx].Clear();
3401                                 continue;
3402                             }
3403                         }
3404                     }
3405                 }
3406 
3407                 sym[sym_idx].SetID (nlist_idx);
3408                 sym[sym_idx].SetType (type);
3409                 sym[sym_idx].GetAddress().SetSection (symbol_section);
3410                 sym[sym_idx].GetAddress().SetOffset (symbol_value);
3411                 sym[sym_idx].SetFlags (nlist.n_type << 16 | nlist.n_desc);
3412 
3413                 if (symbol_byte_size > 0)
3414                     sym[sym_idx].SetByteSize(symbol_byte_size);
3415 
3416                 if (demangled_is_synthesized)
3417                     sym[sym_idx].SetDemangledNameIsSynthesized(true);
3418 
3419                 ++sym_idx;
3420             }
3421             else
3422             {
3423                 sym[sym_idx].Clear();
3424             }
3425 
3426         }
3427 
3428         // STAB N_GSYM entries end up having a symbol type eSymbolTypeGlobal and when the symbol value
3429         // is zero, the address of the global ends up being in a non-STAB entry. Try and fix up all
3430         // such entries by figuring out what the address for the global is by looking up this non-STAB
3431         // entry and copying the value into the debug symbol's value to save us the hassle in the
3432         // debug symbol parser.
3433 
3434         Symbol *global_symbol = NULL;
3435         for (nlist_idx = 0;
3436              nlist_idx < symtab_load_command.nsyms && (global_symbol = symtab->FindSymbolWithType (eSymbolTypeData, Symtab::eDebugYes, Symtab::eVisibilityAny, nlist_idx)) != NULL;
3437              nlist_idx++)
3438         {
3439             if (global_symbol->GetAddress().GetFileAddress() == 0)
3440             {
3441                 std::vector<uint32_t> indexes;
3442                 if (symtab->AppendSymbolIndexesWithName (global_symbol->GetMangled().GetName(), indexes) > 0)
3443                 {
3444                     std::vector<uint32_t>::const_iterator pos;
3445                     std::vector<uint32_t>::const_iterator end = indexes.end();
3446                     for (pos = indexes.begin(); pos != end; ++pos)
3447                     {
3448                         symbol_ptr = symtab->SymbolAtIndex(*pos);
3449                         if (symbol_ptr != global_symbol && symbol_ptr->IsDebug() == false)
3450                         {
3451                             global_symbol->GetAddress() = symbol_ptr->GetAddress();
3452                             break;
3453                         }
3454                     }
3455                 }
3456             }
3457         }
3458 
3459         uint32_t synthetic_sym_id = symtab_load_command.nsyms;
3460 
3461         if (function_starts_count > 0)
3462         {
3463             char synthetic_function_symbol[PATH_MAX];
3464             uint32_t num_synthetic_function_symbols = 0;
3465             for (i=0; i<function_starts_count; ++i)
3466             {
3467                 if (function_starts.GetEntryRef (i).data == false)
3468                     ++num_synthetic_function_symbols;
3469             }
3470 
3471             if (num_synthetic_function_symbols > 0)
3472             {
3473                 if (num_syms < sym_idx + num_synthetic_function_symbols)
3474                 {
3475                     num_syms = sym_idx + num_synthetic_function_symbols;
3476                     sym = symtab->Resize (num_syms);
3477                 }
3478                 uint32_t synthetic_function_symbol_idx = 0;
3479                 for (i=0; i<function_starts_count; ++i)
3480                 {
3481                     const FunctionStarts::Entry *func_start_entry = function_starts.GetEntryAtIndex (i);
3482                     if (func_start_entry->data == false)
3483                     {
3484                         addr_t symbol_file_addr = func_start_entry->addr;
3485                         uint32_t symbol_flags = 0;
3486                         if (is_arm)
3487                         {
3488                             if (symbol_file_addr & 1)
3489                                 symbol_flags = MACHO_NLIST_ARM_SYMBOL_IS_THUMB;
3490                             symbol_file_addr &= 0xfffffffffffffffeull;
3491                         }
3492                         Address symbol_addr;
3493                         if (module_sp->ResolveFileAddress (symbol_file_addr, symbol_addr))
3494                         {
3495                             SectionSP symbol_section (symbol_addr.GetSection());
3496                             uint32_t symbol_byte_size = 0;
3497                             if (symbol_section)
3498                             {
3499                                 const addr_t section_file_addr = symbol_section->GetFileAddress();
3500                                 const FunctionStarts::Entry *next_func_start_entry = function_starts.FindNextEntry (func_start_entry);
3501                                 const addr_t section_end_file_addr = section_file_addr + symbol_section->GetByteSize();
3502                                 if (next_func_start_entry)
3503                                 {
3504                                     addr_t next_symbol_file_addr = next_func_start_entry->addr;
3505                                     if (is_arm)
3506                                         next_symbol_file_addr &= 0xfffffffffffffffeull;
3507                                     symbol_byte_size = std::min<lldb::addr_t>(next_symbol_file_addr - symbol_file_addr, section_end_file_addr - symbol_file_addr);
3508                                 }
3509                                 else
3510                                 {
3511                                     symbol_byte_size = section_end_file_addr - symbol_file_addr;
3512                                 }
3513                                 snprintf (synthetic_function_symbol,
3514                                           sizeof(synthetic_function_symbol),
3515                                           "___lldb_unnamed_function%u$$%s",
3516                                           ++synthetic_function_symbol_idx,
3517                                           module_sp->GetFileSpec().GetFilename().GetCString());
3518                                 sym[sym_idx].SetID (synthetic_sym_id++);
3519                                 sym[sym_idx].GetMangled().SetDemangledName(ConstString(synthetic_function_symbol));
3520                                 sym[sym_idx].SetType (eSymbolTypeCode);
3521                                 sym[sym_idx].SetIsSynthetic (true);
3522                                 sym[sym_idx].GetAddress() = symbol_addr;
3523                                 if (symbol_flags)
3524                                     sym[sym_idx].SetFlags (symbol_flags);
3525                                 if (symbol_byte_size)
3526                                     sym[sym_idx].SetByteSize (symbol_byte_size);
3527                                 ++sym_idx;
3528                             }
3529                         }
3530                     }
3531                 }
3532             }
3533         }
3534 
3535         // Trim our symbols down to just what we ended up with after
3536         // removing any symbols.
3537         if (sym_idx < num_syms)
3538         {
3539             num_syms = sym_idx;
3540             sym = symtab->Resize (num_syms);
3541         }
3542 
3543         // Now synthesize indirect symbols
3544         if (m_dysymtab.nindirectsyms != 0)
3545         {
3546             if (indirect_symbol_index_data.GetByteSize())
3547             {
3548                 NListIndexToSymbolIndexMap::const_iterator end_index_pos = m_nlist_idx_to_sym_idx.end();
3549 
3550                 for (uint32_t sect_idx = 1; sect_idx < m_mach_sections.size(); ++sect_idx)
3551                 {
3552                     if ((m_mach_sections[sect_idx].flags & SectionFlagMaskSectionType) == SectionTypeSymbolStubs)
3553                     {
3554                         uint32_t symbol_stub_byte_size = m_mach_sections[sect_idx].reserved2;
3555                         if (symbol_stub_byte_size == 0)
3556                             continue;
3557 
3558                         const uint32_t num_symbol_stubs = m_mach_sections[sect_idx].size / symbol_stub_byte_size;
3559 
3560                         if (num_symbol_stubs == 0)
3561                             continue;
3562 
3563                         const uint32_t symbol_stub_index_offset = m_mach_sections[sect_idx].reserved1;
3564                         for (uint32_t stub_idx = 0; stub_idx < num_symbol_stubs; ++stub_idx)
3565                         {
3566                             const uint32_t symbol_stub_index = symbol_stub_index_offset + stub_idx;
3567                             const lldb::addr_t symbol_stub_addr = m_mach_sections[sect_idx].addr + (stub_idx * symbol_stub_byte_size);
3568                             lldb::offset_t symbol_stub_offset = symbol_stub_index * 4;
3569                             if (indirect_symbol_index_data.ValidOffsetForDataOfSize(symbol_stub_offset, 4))
3570                             {
3571                                 const uint32_t stub_sym_id = indirect_symbol_index_data.GetU32 (&symbol_stub_offset);
3572                                 if (stub_sym_id & (IndirectSymbolAbsolute | IndirectSymbolLocal))
3573                                     continue;
3574 
3575                                 NListIndexToSymbolIndexMap::const_iterator index_pos = m_nlist_idx_to_sym_idx.find (stub_sym_id);
3576                                 Symbol *stub_symbol = NULL;
3577                                 if (index_pos != end_index_pos)
3578                                 {
3579                                     // We have a remapping from the original nlist index to
3580                                     // a current symbol index, so just look this up by index
3581                                     stub_symbol = symtab->SymbolAtIndex (index_pos->second);
3582                                 }
3583                                 else
3584                                 {
3585                                     // We need to lookup a symbol using the original nlist
3586                                     // symbol index since this index is coming from the
3587                                     // S_SYMBOL_STUBS
3588                                     stub_symbol = symtab->FindSymbolByID (stub_sym_id);
3589                                 }
3590 
3591                                 if (stub_symbol)
3592                                 {
3593                                     Address so_addr(symbol_stub_addr, section_list);
3594 
3595                                     if (stub_symbol->GetType() == eSymbolTypeUndefined)
3596                                     {
3597                                         // Change the external symbol into a trampoline that makes sense
3598                                         // These symbols were N_UNDF N_EXT, and are useless to us, so we
3599                                         // can re-use them so we don't have to make up a synthetic symbol
3600                                         // for no good reason.
3601                                         stub_symbol->SetType (eSymbolTypeTrampoline);
3602                                         stub_symbol->SetExternal (false);
3603                                         stub_symbol->GetAddress() = so_addr;
3604                                         stub_symbol->SetByteSize (symbol_stub_byte_size);
3605                                     }
3606                                     else
3607                                     {
3608                                         // Make a synthetic symbol to describe the trampoline stub
3609                                         Mangled stub_symbol_mangled_name(stub_symbol->GetMangled());
3610                                         if (sym_idx >= num_syms)
3611                                         {
3612                                             sym = symtab->Resize (++num_syms);
3613                                             stub_symbol = NULL;  // this pointer no longer valid
3614                                         }
3615                                         sym[sym_idx].SetID (synthetic_sym_id++);
3616                                         sym[sym_idx].GetMangled() = stub_symbol_mangled_name;
3617                                         sym[sym_idx].SetType (eSymbolTypeTrampoline);
3618                                         sym[sym_idx].SetIsSynthetic (true);
3619                                         sym[sym_idx].GetAddress() = so_addr;
3620                                         sym[sym_idx].SetByteSize (symbol_stub_byte_size);
3621                                         ++sym_idx;
3622                                     }
3623                                 }
3624                                 else
3625                                 {
3626                                     if (log)
3627                                         log->Warning ("symbol stub referencing symbol table symbol %u that isn't in our minimal symbol table, fix this!!!", stub_sym_id);
3628                                 }
3629                             }
3630                         }
3631                     }
3632                 }
3633             }
3634         }
3635         return symtab->GetNumSymbols();
3636     }
3637     return 0;
3638 }
3639 
3640 
3641 void
3642 ObjectFileMachO::Dump (Stream *s)
3643 {
3644     ModuleSP module_sp(GetModule());
3645     if (module_sp)
3646     {
3647         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3648         s->Printf("%p: ", this);
3649         s->Indent();
3650         if (m_header.magic == HeaderMagic64 || m_header.magic == HeaderMagic64Swapped)
3651             s->PutCString("ObjectFileMachO64");
3652         else
3653             s->PutCString("ObjectFileMachO32");
3654 
3655         ArchSpec header_arch(eArchTypeMachO, m_header.cputype, m_header.cpusubtype);
3656 
3657         *s << ", file = '" << m_file << "', arch = " << header_arch.GetArchitectureName() << "\n";
3658 
3659         if (m_sections_ap.get())
3660             m_sections_ap->Dump(s, NULL, true, UINT32_MAX);
3661 
3662         if (m_symtab_ap.get())
3663             m_symtab_ap->Dump(s, NULL, eSortOrderNone);
3664     }
3665 }
3666 
3667 bool
3668 ObjectFileMachO::GetUUID (const llvm::MachO::mach_header &header,
3669                           const lldb_private::DataExtractor &data,
3670                           lldb::offset_t lc_offset,
3671                           lldb_private::UUID& uuid)
3672 {
3673     uint32_t i;
3674     struct uuid_command load_cmd;
3675 
3676     lldb::offset_t offset = lc_offset;
3677     for (i=0; i<header.ncmds; ++i)
3678     {
3679         const lldb::offset_t cmd_offset = offset;
3680         if (data.GetU32(&offset, &load_cmd, 2) == NULL)
3681             break;
3682 
3683         if (load_cmd.cmd == LoadCommandUUID)
3684         {
3685             const uint8_t *uuid_bytes = data.PeekData(offset, 16);
3686 
3687             if (uuid_bytes)
3688             {
3689                 // OpenCL on Mac OS X uses the same UUID for each of its object files.
3690                 // We pretend these object files have no UUID to prevent crashing.
3691 
3692                 const uint8_t opencl_uuid[] = { 0x8c, 0x8e, 0xb3, 0x9b,
3693                     0x3b, 0xa8,
3694                     0x4b, 0x16,
3695                     0xb6, 0xa4,
3696                     0x27, 0x63, 0xbb, 0x14, 0xf0, 0x0d };
3697 
3698                 if (!memcmp(uuid_bytes, opencl_uuid, 16))
3699                     return false;
3700 
3701                 uuid.SetBytes (uuid_bytes);
3702                 return true;
3703             }
3704             return false;
3705         }
3706         offset = cmd_offset + load_cmd.cmdsize;
3707     }
3708     return false;
3709 }
3710 
3711 bool
3712 ObjectFileMachO::GetUUID (lldb_private::UUID* uuid)
3713 {
3714     ModuleSP module_sp(GetModule());
3715     if (module_sp)
3716     {
3717         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3718         lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
3719         return GetUUID (m_header, m_data, offset, *uuid);
3720     }
3721     return false;
3722 }
3723 
3724 
3725 uint32_t
3726 ObjectFileMachO::GetDependentModules (FileSpecList& files)
3727 {
3728     uint32_t count = 0;
3729     ModuleSP module_sp(GetModule());
3730     if (module_sp)
3731     {
3732         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3733         struct load_command load_cmd;
3734         lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
3735         const bool resolve_path = false; // Don't resolve the dependend file paths since they may not reside on this system
3736         uint32_t i;
3737         for (i=0; i<m_header.ncmds; ++i)
3738         {
3739             const uint32_t cmd_offset = offset;
3740             if (m_data.GetU32(&offset, &load_cmd, 2) == NULL)
3741                 break;
3742 
3743             switch (load_cmd.cmd)
3744             {
3745             case LoadCommandDylibLoad:
3746             case LoadCommandDylibLoadWeak:
3747             case LoadCommandDylibReexport:
3748             case LoadCommandDynamicLinkerLoad:
3749             case LoadCommandFixedVMShlibLoad:
3750             case LoadCommandDylibLoadUpward:
3751                 {
3752                     uint32_t name_offset = cmd_offset + m_data.GetU32(&offset);
3753                     const char *path = m_data.PeekCStr(name_offset);
3754                     // Skip any path that starts with '@' since these are usually:
3755                     // @executable_path/.../file
3756                     // @rpath/.../file
3757                     if (path && path[0] != '@')
3758                     {
3759                         FileSpec file_spec(path, resolve_path);
3760                         if (files.AppendIfUnique(file_spec))
3761                             count++;
3762                     }
3763                 }
3764                 break;
3765 
3766             default:
3767                 break;
3768             }
3769             offset = cmd_offset + load_cmd.cmdsize;
3770         }
3771     }
3772     return count;
3773 }
3774 
3775 lldb_private::Address
3776 ObjectFileMachO::GetEntryPointAddress ()
3777 {
3778     // If the object file is not an executable it can't hold the entry point.  m_entry_point_address
3779     // is initialized to an invalid address, so we can just return that.
3780     // If m_entry_point_address is valid it means we've found it already, so return the cached value.
3781 
3782     if (!IsExecutable() || m_entry_point_address.IsValid())
3783         return m_entry_point_address;
3784 
3785     // Otherwise, look for the UnixThread or Thread command.  The data for the Thread command is given in
3786     // /usr/include/mach-o.h, but it is basically:
3787     //
3788     //  uint32_t flavor  - this is the flavor argument you would pass to thread_get_state
3789     //  uint32_t count   - this is the count of longs in the thread state data
3790     //  struct XXX_thread_state state - this is the structure from <machine/thread_status.h> corresponding to the flavor.
3791     //  <repeat this trio>
3792     //
3793     // So we just keep reading the various register flavors till we find the GPR one, then read the PC out of there.
3794     // FIXME: We will need to have a "RegisterContext data provider" class at some point that can get all the registers
3795     // out of data in this form & attach them to a given thread.  That should underlie the MacOS X User process plugin,
3796     // and we'll also need it for the MacOS X Core File process plugin.  When we have that we can also use it here.
3797     //
3798     // For now we hard-code the offsets and flavors we need:
3799     //
3800     //
3801 
3802     ModuleSP module_sp(GetModule());
3803     if (module_sp)
3804     {
3805         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3806         struct load_command load_cmd;
3807         lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
3808         uint32_t i;
3809         lldb::addr_t start_address = LLDB_INVALID_ADDRESS;
3810         bool done = false;
3811 
3812         for (i=0; i<m_header.ncmds; ++i)
3813         {
3814             const lldb::offset_t cmd_offset = offset;
3815             if (m_data.GetU32(&offset, &load_cmd, 2) == NULL)
3816                 break;
3817 
3818             switch (load_cmd.cmd)
3819             {
3820             case LoadCommandUnixThread:
3821             case LoadCommandThread:
3822                 {
3823                     while (offset < cmd_offset + load_cmd.cmdsize)
3824                     {
3825                         uint32_t flavor = m_data.GetU32(&offset);
3826                         uint32_t count = m_data.GetU32(&offset);
3827                         if (count == 0)
3828                         {
3829                             // We've gotten off somehow, log and exit;
3830                             return m_entry_point_address;
3831                         }
3832 
3833                         switch (m_header.cputype)
3834                         {
3835                         case llvm::MachO::CPUTypeARM:
3836                            if (flavor == 1) // ARM_THREAD_STATE from mach/arm/thread_status.h
3837                            {
3838                                offset += 60;  // This is the offset of pc in the GPR thread state data structure.
3839                                start_address = m_data.GetU32(&offset);
3840                                done = true;
3841                             }
3842                         break;
3843                         case llvm::MachO::CPUTypeI386:
3844                            if (flavor == 1) // x86_THREAD_STATE32 from mach/i386/thread_status.h
3845                            {
3846                                offset += 40;  // This is the offset of eip in the GPR thread state data structure.
3847                                start_address = m_data.GetU32(&offset);
3848                                done = true;
3849                             }
3850                         break;
3851                         case llvm::MachO::CPUTypeX86_64:
3852                            if (flavor == 4) // x86_THREAD_STATE64 from mach/i386/thread_status.h
3853                            {
3854                                offset += 16 * 8;  // This is the offset of rip in the GPR thread state data structure.
3855                                start_address = m_data.GetU64(&offset);
3856                                done = true;
3857                             }
3858                         break;
3859                         default:
3860                             return m_entry_point_address;
3861                         }
3862                         // Haven't found the GPR flavor yet, skip over the data for this flavor:
3863                         if (done)
3864                             break;
3865                         offset += count * 4;
3866                     }
3867                 }
3868                 break;
3869             case LoadCommandMain:
3870                 {
3871                     ConstString text_segment_name ("__TEXT");
3872                     uint64_t entryoffset = m_data.GetU64(&offset);
3873                     SectionSP text_segment_sp = GetSectionList()->FindSectionByName(text_segment_name);
3874                     if (text_segment_sp)
3875                     {
3876                         done = true;
3877                         start_address = text_segment_sp->GetFileAddress() + entryoffset;
3878                     }
3879                 }
3880 
3881             default:
3882                 break;
3883             }
3884             if (done)
3885                 break;
3886 
3887             // Go to the next load command:
3888             offset = cmd_offset + load_cmd.cmdsize;
3889         }
3890 
3891         if (start_address != LLDB_INVALID_ADDRESS)
3892         {
3893             // We got the start address from the load commands, so now resolve that address in the sections
3894             // of this ObjectFile:
3895             if (!m_entry_point_address.ResolveAddressUsingFileSections (start_address, GetSectionList()))
3896             {
3897                 m_entry_point_address.Clear();
3898             }
3899         }
3900         else
3901         {
3902             // We couldn't read the UnixThread load command - maybe it wasn't there.  As a fallback look for the
3903             // "start" symbol in the main executable.
3904 
3905             ModuleSP module_sp (GetModule());
3906 
3907             if (module_sp)
3908             {
3909                 SymbolContextList contexts;
3910                 SymbolContext context;
3911                 if (module_sp->FindSymbolsWithNameAndType(ConstString ("start"), eSymbolTypeCode, contexts))
3912                 {
3913                     if (contexts.GetContextAtIndex(0, context))
3914                         m_entry_point_address = context.symbol->GetAddress();
3915                 }
3916             }
3917         }
3918     }
3919 
3920     return m_entry_point_address;
3921 
3922 }
3923 
3924 lldb_private::Address
3925 ObjectFileMachO::GetHeaderAddress ()
3926 {
3927     lldb_private::Address header_addr;
3928     SectionList *section_list = GetSectionList();
3929     if (section_list)
3930     {
3931         SectionSP text_segment_sp (section_list->FindSectionByName (GetSegmentNameTEXT()));
3932         if (text_segment_sp)
3933         {
3934             header_addr.SetSection (text_segment_sp);
3935             header_addr.SetOffset (0);
3936         }
3937     }
3938     return header_addr;
3939 }
3940 
3941 uint32_t
3942 ObjectFileMachO::GetNumThreadContexts ()
3943 {
3944     ModuleSP module_sp(GetModule());
3945     if (module_sp)
3946     {
3947         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3948         if (!m_thread_context_offsets_valid)
3949         {
3950             m_thread_context_offsets_valid = true;
3951             lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
3952             FileRangeArray::Entry file_range;
3953             thread_command thread_cmd;
3954             for (uint32_t i=0; i<m_header.ncmds; ++i)
3955             {
3956                 const uint32_t cmd_offset = offset;
3957                 if (m_data.GetU32(&offset, &thread_cmd, 2) == NULL)
3958                     break;
3959 
3960                 if (thread_cmd.cmd == LoadCommandThread)
3961                 {
3962                     file_range.SetRangeBase (offset);
3963                     file_range.SetByteSize (thread_cmd.cmdsize - 8);
3964                     m_thread_context_offsets.Append (file_range);
3965                 }
3966                 offset = cmd_offset + thread_cmd.cmdsize;
3967             }
3968         }
3969     }
3970     return m_thread_context_offsets.GetSize();
3971 }
3972 
3973 lldb::RegisterContextSP
3974 ObjectFileMachO::GetThreadContextAtIndex (uint32_t idx, lldb_private::Thread &thread)
3975 {
3976     lldb::RegisterContextSP reg_ctx_sp;
3977 
3978     ModuleSP module_sp(GetModule());
3979     if (module_sp)
3980     {
3981         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
3982         if (!m_thread_context_offsets_valid)
3983             GetNumThreadContexts ();
3984 
3985         const FileRangeArray::Entry *thread_context_file_range = m_thread_context_offsets.GetEntryAtIndex (idx);
3986         if (thread_context_file_range)
3987         {
3988 
3989             DataExtractor data (m_data,
3990                                 thread_context_file_range->GetRangeBase(),
3991                                 thread_context_file_range->GetByteSize());
3992 
3993             switch (m_header.cputype)
3994             {
3995                 case llvm::MachO::CPUTypeARM:
3996                     reg_ctx_sp.reset (new RegisterContextDarwin_arm_Mach (thread, data));
3997                     break;
3998 
3999                 case llvm::MachO::CPUTypeI386:
4000                     reg_ctx_sp.reset (new RegisterContextDarwin_i386_Mach (thread, data));
4001                     break;
4002 
4003                 case llvm::MachO::CPUTypeX86_64:
4004                     reg_ctx_sp.reset (new RegisterContextDarwin_x86_64_Mach (thread, data));
4005                     break;
4006             }
4007         }
4008     }
4009     return reg_ctx_sp;
4010 }
4011 
4012 
4013 ObjectFile::Type
4014 ObjectFileMachO::CalculateType()
4015 {
4016     switch (m_header.filetype)
4017     {
4018         case HeaderFileTypeObject:                                          // 0x1u MH_OBJECT
4019             if (GetAddressByteSize () == 4)
4020             {
4021                 // 32 bit kexts are just object files, but they do have a valid
4022                 // UUID load command.
4023                 UUID uuid;
4024                 if (GetUUID(&uuid))
4025                 {
4026                     // this checking for the UUID load command is not enough
4027                     // we could eventually look for the symbol named
4028                     // "OSKextGetCurrentIdentifier" as this is required of kexts
4029                     if (m_strata == eStrataInvalid)
4030                         m_strata = eStrataKernel;
4031                     return eTypeSharedLibrary;
4032                 }
4033             }
4034             return eTypeObjectFile;
4035 
4036         case HeaderFileTypeExecutable:          return eTypeExecutable;     // 0x2u MH_EXECUTE
4037         case HeaderFileTypeFixedVMShlib:        return eTypeSharedLibrary;  // 0x3u MH_FVMLIB
4038         case HeaderFileTypeCore:                return eTypeCoreFile;       // 0x4u MH_CORE
4039         case HeaderFileTypePreloadedExecutable: return eTypeSharedLibrary;  // 0x5u MH_PRELOAD
4040         case HeaderFileTypeDynamicShlib:        return eTypeSharedLibrary;  // 0x6u MH_DYLIB
4041         case HeaderFileTypeDynamicLinkEditor:   return eTypeDynamicLinker;  // 0x7u MH_DYLINKER
4042         case HeaderFileTypeBundle:              return eTypeSharedLibrary;  // 0x8u MH_BUNDLE
4043         case HeaderFileTypeDynamicShlibStub:    return eTypeStubLibrary;    // 0x9u MH_DYLIB_STUB
4044         case HeaderFileTypeDSYM:                return eTypeDebugInfo;      // 0xAu MH_DSYM
4045         case HeaderFileTypeKextBundle:          return eTypeSharedLibrary;  // 0xBu MH_KEXT_BUNDLE
4046         default:
4047             break;
4048     }
4049     return eTypeUnknown;
4050 }
4051 
4052 ObjectFile::Strata
4053 ObjectFileMachO::CalculateStrata()
4054 {
4055     switch (m_header.filetype)
4056     {
4057         case HeaderFileTypeObject:      // 0x1u MH_OBJECT
4058             {
4059                 // 32 bit kexts are just object files, but they do have a valid
4060                 // UUID load command.
4061                 UUID uuid;
4062                 if (GetUUID(&uuid))
4063                 {
4064                     // this checking for the UUID load command is not enough
4065                     // we could eventually look for the symbol named
4066                     // "OSKextGetCurrentIdentifier" as this is required of kexts
4067                     if (m_type == eTypeInvalid)
4068                         m_type = eTypeSharedLibrary;
4069 
4070                     return eStrataKernel;
4071                 }
4072             }
4073             return eStrataUnknown;
4074 
4075         case HeaderFileTypeExecutable:                                     // 0x2u MH_EXECUTE
4076             // Check for the MH_DYLDLINK bit in the flags
4077             if (m_header.flags & HeaderFlagBitIsDynamicLinkObject)
4078             {
4079                 return eStrataUser;
4080             }
4081             else
4082             {
4083                 SectionList *section_list = GetSectionList();
4084                 if (section_list)
4085                 {
4086                     static ConstString g_kld_section_name ("__KLD");
4087                     if (section_list->FindSectionByName(g_kld_section_name))
4088                         return eStrataKernel;
4089                 }
4090             }
4091             return eStrataRawImage;
4092 
4093         case HeaderFileTypeFixedVMShlib:        return eStrataUser;         // 0x3u MH_FVMLIB
4094         case HeaderFileTypeCore:                return eStrataUnknown;      // 0x4u MH_CORE
4095         case HeaderFileTypePreloadedExecutable: return eStrataRawImage;     // 0x5u MH_PRELOAD
4096         case HeaderFileTypeDynamicShlib:        return eStrataUser;         // 0x6u MH_DYLIB
4097         case HeaderFileTypeDynamicLinkEditor:   return eStrataUser;         // 0x7u MH_DYLINKER
4098         case HeaderFileTypeBundle:              return eStrataUser;         // 0x8u MH_BUNDLE
4099         case HeaderFileTypeDynamicShlibStub:    return eStrataUser;         // 0x9u MH_DYLIB_STUB
4100         case HeaderFileTypeDSYM:                return eStrataUnknown;      // 0xAu MH_DSYM
4101         case HeaderFileTypeKextBundle:          return eStrataKernel;       // 0xBu MH_KEXT_BUNDLE
4102         default:
4103             break;
4104     }
4105     return eStrataUnknown;
4106 }
4107 
4108 
4109 uint32_t
4110 ObjectFileMachO::GetVersion (uint32_t *versions, uint32_t num_versions)
4111 {
4112     ModuleSP module_sp(GetModule());
4113     if (module_sp)
4114     {
4115         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
4116         struct dylib_command load_cmd;
4117         lldb::offset_t offset = MachHeaderSizeFromMagic(m_header.magic);
4118         uint32_t version_cmd = 0;
4119         uint64_t version = 0;
4120         uint32_t i;
4121         for (i=0; i<m_header.ncmds; ++i)
4122         {
4123             const lldb::offset_t cmd_offset = offset;
4124             if (m_data.GetU32(&offset, &load_cmd, 2) == NULL)
4125                 break;
4126 
4127             if (load_cmd.cmd == LoadCommandDylibIdent)
4128             {
4129                 if (version_cmd == 0)
4130                 {
4131                     version_cmd = load_cmd.cmd;
4132                     if (m_data.GetU32(&offset, &load_cmd.dylib, 4) == NULL)
4133                         break;
4134                     version = load_cmd.dylib.current_version;
4135                 }
4136                 break; // Break for now unless there is another more complete version
4137                        // number load command in the future.
4138             }
4139             offset = cmd_offset + load_cmd.cmdsize;
4140         }
4141 
4142         if (version_cmd == LoadCommandDylibIdent)
4143         {
4144             if (versions != NULL && num_versions > 0)
4145             {
4146                 if (num_versions > 0)
4147                     versions[0] = (version & 0xFFFF0000ull) >> 16;
4148                 if (num_versions > 1)
4149                     versions[1] = (version & 0x0000FF00ull) >> 8;
4150                 if (num_versions > 2)
4151                     versions[2] = (version & 0x000000FFull);
4152                 // Fill in an remaining version numbers with invalid values
4153                 for (i=3; i<num_versions; ++i)
4154                     versions[i] = UINT32_MAX;
4155             }
4156             // The LC_ID_DYLIB load command has a version with 3 version numbers
4157             // in it, so always return 3
4158             return 3;
4159         }
4160     }
4161     return false;
4162 }
4163 
4164 bool
4165 ObjectFileMachO::GetArchitecture (ArchSpec &arch)
4166 {
4167     ModuleSP module_sp(GetModule());
4168     if (module_sp)
4169     {
4170         lldb_private::Mutex::Locker locker(module_sp->GetMutex());
4171         arch.SetArchitecture (eArchTypeMachO, m_header.cputype, m_header.cpusubtype);
4172 
4173         // Files with type MH_PRELOAD are currently used in cases where the image
4174         // debugs at the addresses in the file itself. Below we set the OS to
4175         // unknown to make sure we use the DynamicLoaderStatic()...
4176         if (m_header.filetype == HeaderFileTypePreloadedExecutable)
4177         {
4178             arch.GetTriple().setOS (llvm::Triple::UnknownOS);
4179         }
4180         return true;
4181     }
4182     return false;
4183 }
4184 
4185 
4186 UUID
4187 ObjectFileMachO::GetProcessSharedCacheUUID (Process *process)
4188 {
4189     UUID uuid;
4190     if (process)
4191     {
4192         addr_t all_image_infos = process->GetImageInfoAddress();
4193 
4194         // The address returned by GetImageInfoAddress may be the address of dyld (don't want)
4195         // or it may be the address of the dyld_all_image_infos structure (want).  The first four
4196         // bytes will be either the version field (all_image_infos) or a Mach-O file magic constant.
4197         // Version 13 and higher of dyld_all_image_infos is required to get the sharedCacheUUID field.
4198 
4199         Error err;
4200         uint32_t version_or_magic = process->ReadUnsignedIntegerFromMemory (all_image_infos, 4, -1, err);
4201         if (version_or_magic != -1
4202             && version_or_magic != HeaderMagic32
4203             && version_or_magic != HeaderMagic32Swapped
4204             && version_or_magic != HeaderMagic64
4205             && version_or_magic != HeaderMagic64Swapped
4206             && version_or_magic >= 13)
4207         {
4208             addr_t sharedCacheUUID_address = LLDB_INVALID_ADDRESS;
4209             int wordsize = process->GetAddressByteSize();
4210             if (wordsize == 8)
4211             {
4212                 sharedCacheUUID_address = all_image_infos + 160;  // sharedCacheUUID <mach-o/dyld_images.h>
4213             }
4214             if (wordsize == 4)
4215             {
4216                 sharedCacheUUID_address = all_image_infos + 84;   // sharedCacheUUID <mach-o/dyld_images.h>
4217             }
4218             if (sharedCacheUUID_address != LLDB_INVALID_ADDRESS)
4219             {
4220                 uuid_t shared_cache_uuid;
4221                 if (process->ReadMemory (sharedCacheUUID_address, shared_cache_uuid, sizeof (uuid_t), err) == sizeof (uuid_t))
4222                 {
4223                     uuid.SetBytes (shared_cache_uuid);
4224                 }
4225             }
4226         }
4227     }
4228     return uuid;
4229 }
4230 
4231 UUID
4232 ObjectFileMachO::GetLLDBSharedCacheUUID ()
4233 {
4234     UUID uuid;
4235 #if defined (__APPLE__) && defined (__arm__)
4236     uint8_t *(*dyld_get_all_image_infos)(void);
4237     dyld_get_all_image_infos = (uint8_t*(*)()) dlsym (RTLD_DEFAULT, "_dyld_get_all_image_infos");
4238     if (dyld_get_all_image_infos)
4239     {
4240         uint8_t *dyld_all_image_infos_address = dyld_get_all_image_infos();
4241         if (dyld_all_image_infos_address)
4242         {
4243             uint32_t *version = (uint32_t*) dyld_all_image_infos_address;              // version <mach-o/dyld_images.h>
4244             if (*version >= 13)
4245             {
4246                 uuid_t *sharedCacheUUID_address = (uuid_t*) ((uint8_t*) dyld_all_image_infos_address + 84);  // sharedCacheUUID <mach-o/dyld_images.h>
4247                 uuid.SetBytes (sharedCacheUUID_address);
4248             }
4249         }
4250     }
4251 #endif
4252     return uuid;
4253 }
4254 
4255 
4256 //------------------------------------------------------------------
4257 // PluginInterface protocol
4258 //------------------------------------------------------------------
4259 lldb_private::ConstString
4260 ObjectFileMachO::GetPluginName()
4261 {
4262     return GetPluginNameStatic();
4263 }
4264 
4265 uint32_t
4266 ObjectFileMachO::GetPluginVersion()
4267 {
4268     return 1;
4269 }
4270 
4271