EhFrame.cpp revision 360660
1//===- EhFrame.cpp -------------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// .eh_frame section contains information on how to unwind the stack when
// an exception is thrown. The section consists of a sequence of CIE and FDE
11// records. The linker needs to merge CIEs and associate FDEs to CIEs.
12// That means the linker has to understand the format of the section.
13//
14// This file contains a few utility functions to read .eh_frame contents.
15//
16//===----------------------------------------------------------------------===//
17
18#include "EhFrame.h"
19#include "Config.h"
20#include "InputSection.h"
21#include "Relocations.h"
22#include "Target.h"
23#include "lld/Common/ErrorHandler.h"
24#include "lld/Common/Strings.h"
25#include "llvm/BinaryFormat/Dwarf.h"
26#include "llvm/Object/ELF.h"
27
28using namespace llvm;
29using namespace llvm::ELF;
30using namespace llvm::dwarf;
31using namespace llvm::object;
32
33using namespace lld;
34using namespace lld::elf;
35
36namespace {
37class EhReader {
38public:
39  EhReader(InputSectionBase *s, ArrayRef<uint8_t> d) : isec(s), d(d) {}
40  size_t readEhRecordSize();
41  uint8_t getFdeEncoding();
42
43private:
44  template <class P> void failOn(const P *loc, const Twine &msg) {
45    fatal("corrupted .eh_frame: " + msg + "\n>>> defined in " +
46          isec->getObjMsg((const uint8_t *)loc - isec->data().data()));
47  }
48
49  uint8_t readByte();
50  void skipBytes(size_t count);
51  StringRef readString();
52  void skipLeb128();
53  void skipAugP();
54
55  InputSectionBase *isec;
56  ArrayRef<uint8_t> d;
57};
58}
59
60size_t elf::readEhRecordSize(InputSectionBase *s, size_t off) {
61  return EhReader(s, s->data().slice(off)).readEhRecordSize();
62}
63
64// .eh_frame section is a sequence of records. Each record starts with
65// a 4 byte length field. This function reads the length.
66size_t EhReader::readEhRecordSize() {
67  if (d.size() < 4)
68    failOn(d.data(), "CIE/FDE too small");
69
70  // First 4 bytes of CIE/FDE is the size of the record.
71  // If it is 0xFFFFFFFF, the next 8 bytes contain the size instead,
72  // but we do not support that format yet.
73  uint64_t v = read32(d.data());
74  if (v == UINT32_MAX)
75    failOn(d.data(), "CIE/FDE too large");
76  uint64_t size = v + 4;
77  if (size > d.size())
78    failOn(d.data(), "CIE/FDE ends past the end of the section");
79  return size;
80}
81
82// Read a byte and advance D by one byte.
83uint8_t EhReader::readByte() {
84  if (d.empty())
85    failOn(d.data(), "unexpected end of CIE");
86  uint8_t b = d.front();
87  d = d.slice(1);
88  return b;
89}
90
91void EhReader::skipBytes(size_t count) {
92  if (d.size() < count)
93    failOn(d.data(), "CIE is too small");
94  d = d.slice(count);
95}
96
97// Read a null-terminated string.
98StringRef EhReader::readString() {
99  const uint8_t *end = llvm::find(d, '\0');
100  if (end == d.end())
101    failOn(d.data(), "corrupted CIE (failed to read string)");
102  StringRef s = toStringRef(d.slice(0, end - d.begin()));
103  d = d.slice(s.size() + 1);
104  return s;
105}
106
107// Skip an integer encoded in the LEB128 format.
108// Actual number is not of interest because only the runtime needs it.
109// But we need to be at least able to skip it so that we can read
110// the field that follows a LEB128 number.
111void EhReader::skipLeb128() {
112  const uint8_t *errPos = d.data();
113  while (!d.empty()) {
114    uint8_t val = d.front();
115    d = d.slice(1);
116    if ((val & 0x80) == 0)
117      return;
118  }
119  failOn(errPos, "corrupted CIE (failed to read LEB128)");
120}
121
122static size_t getAugPSize(unsigned enc) {
123  switch (enc & 0x0f) {
124  case DW_EH_PE_absptr:
125  case DW_EH_PE_signed:
126    return config->wordsize;
127  case DW_EH_PE_udata2:
128  case DW_EH_PE_sdata2:
129    return 2;
130  case DW_EH_PE_udata4:
131  case DW_EH_PE_sdata4:
132    return 4;
133  case DW_EH_PE_udata8:
134  case DW_EH_PE_sdata8:
135    return 8;
136  }
137  return 0;
138}
139
140void EhReader::skipAugP() {
141  uint8_t enc = readByte();
142  if ((enc & 0xf0) == DW_EH_PE_aligned)
143    failOn(d.data() - 1, "DW_EH_PE_aligned encoding is not supported");
144  size_t size = getAugPSize(enc);
145  if (size == 0)
146    failOn(d.data() - 1, "unknown FDE encoding");
147  if (size >= d.size())
148    failOn(d.data() - 1, "corrupted CIE");
149  d = d.slice(size);
150}
151
152uint8_t elf::getFdeEncoding(EhSectionPiece *p) {
153  return EhReader(p->sec, p->data()).getFdeEncoding();
154}
155
156uint8_t EhReader::getFdeEncoding() {
157  skipBytes(8);
158  int version = readByte();
159  if (version != 1 && version != 3)
160    failOn(d.data() - 1,
161           "FDE version 1 or 3 expected, but got " + Twine(version));
162
163  StringRef aug = readString();
164
165  // Skip code and data alignment factors.
166  skipLeb128();
167  skipLeb128();
168
169  // Skip the return address register. In CIE version 1 this is a single
170  // byte. In CIE version 3 this is an unsigned LEB128.
171  if (version == 1)
172    readByte();
173  else
174    skipLeb128();
175
176  // We only care about an 'R' value, but other records may precede an 'R'
177  // record. Unfortunately records are not in TLV (type-length-value) format,
178  // so we need to teach the linker how to skip records for each type.
179  for (char c : aug) {
180    if (c == 'R')
181      return readByte();
182    if (c == 'z') {
183      skipLeb128();
184      continue;
185    }
186    if (c == 'P') {
187      skipAugP();
188      continue;
189    }
190    if (c == 'L') {
191      readByte();
192      continue;
193    }
194    failOn(aug.data(), "unknown .eh_frame augmentation string: " + aug);
195  }
196  return DW_EH_PE_absptr;
197}
198