|
1 // Copyright (c) 2010 Google Inc. All Rights Reserved. |
|
2 // |
|
3 // Redistribution and use in source and binary forms, with or without |
|
4 // modification, are permitted provided that the following conditions are |
|
5 // met: |
|
6 // |
|
7 // * Redistributions of source code must retain the above copyright |
|
8 // notice, this list of conditions and the following disclaimer. |
|
9 // * Redistributions in binary form must reproduce the above |
|
10 // copyright notice, this list of conditions and the following disclaimer |
|
11 // in the documentation and/or other materials provided with the |
|
12 // distribution. |
|
13 // * Neither the name of Google Inc. nor the names of its |
|
14 // contributors may be used to endorse or promote products derived from |
|
15 // this software without specific prior written permission. |
|
16 // |
|
17 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS |
|
18 // "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT |
|
19 // LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR |
|
20 // A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT |
|
21 // OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, |
|
22 // SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT |
|
23 // LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, |
|
24 // DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY |
|
25 // THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
|
26 // (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
|
27 // OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
28 |
|
29 #include <assert.h> |
|
30 #include <stdlib.h> |
|
31 |
|
32 #include "common/dwarf/bytereader-inl.h" |
|
33 #include "common/dwarf/bytereader.h" |
|
34 |
|
35 namespace dwarf2reader { |
|
36 |
|
37 ByteReader::ByteReader(enum Endianness endian) |
|
38 :offset_reader_(NULL), address_reader_(NULL), endian_(endian), |
|
39 address_size_(0), offset_size_(0), |
|
40 have_section_base_(), have_text_base_(), have_data_base_(), |
|
41 have_function_base_() { } |
|
42 |
|
43 ByteReader::~ByteReader() { } |
|
44 |
|
45 void ByteReader::SetOffsetSize(uint8 size) { |
|
46 offset_size_ = size; |
|
47 assert(size == 4 || size == 8); |
|
48 if (size == 4) { |
|
49 this->offset_reader_ = &ByteReader::ReadFourBytes; |
|
50 } else { |
|
51 this->offset_reader_ = &ByteReader::ReadEightBytes; |
|
52 } |
|
53 } |
|
54 |
|
55 void ByteReader::SetAddressSize(uint8 size) { |
|
56 address_size_ = size; |
|
57 assert(size == 4 || size == 8); |
|
58 if (size == 4) { |
|
59 this->address_reader_ = &ByteReader::ReadFourBytes; |
|
60 } else { |
|
61 this->address_reader_ = &ByteReader::ReadEightBytes; |
|
62 } |
|
63 } |
|
64 |
|
65 uint64 ByteReader::ReadInitialLength(const char* start, size_t* len) { |
|
66 const uint64 initial_length = ReadFourBytes(start); |
|
67 start += 4; |
|
68 |
|
69 // In DWARF2/3, if the initial length is all 1 bits, then the offset |
|
70 // size is 8 and we need to read the next 8 bytes for the real length. |
|
71 if (initial_length == 0xffffffff) { |
|
72 SetOffsetSize(8); |
|
73 *len = 12; |
|
74 return ReadOffset(start); |
|
75 } else { |
|
76 SetOffsetSize(4); |
|
77 *len = 4; |
|
78 } |
|
79 return initial_length; |
|
80 } |
|
81 |
|
82 bool ByteReader::ValidEncoding(DwarfPointerEncoding encoding) const { |
|
83 if (encoding == DW_EH_PE_omit) return true; |
|
84 if (encoding == DW_EH_PE_aligned) return true; |
|
85 if ((encoding & 0x7) > DW_EH_PE_udata8) |
|
86 return false; |
|
87 if ((encoding & 0x70) > DW_EH_PE_funcrel) |
|
88 return false; |
|
89 return true; |
|
90 } |
|
91 |
|
92 bool ByteReader::UsableEncoding(DwarfPointerEncoding encoding) const { |
|
93 switch (encoding & 0x70) { |
|
94 case DW_EH_PE_absptr: return true; |
|
95 case DW_EH_PE_pcrel: return have_section_base_; |
|
96 case DW_EH_PE_textrel: return have_text_base_; |
|
97 case DW_EH_PE_datarel: return have_data_base_; |
|
98 case DW_EH_PE_funcrel: return have_function_base_; |
|
99 default: return false; |
|
100 } |
|
101 } |
|
102 |
|
103 uint64 ByteReader::ReadEncodedPointer(const char *buffer, |
|
104 DwarfPointerEncoding encoding, |
|
105 size_t *len) const { |
|
106 // UsableEncoding doesn't approve of DW_EH_PE_omit, so we shouldn't |
|
107 // see it here. |
|
108 assert(encoding != DW_EH_PE_omit); |
|
109 |
|
110 // The Linux Standards Base 4.0 does not make this clear, but the |
|
111 // GNU tools (gcc/unwind-pe.h; readelf/dwarf.c; gdb/dwarf2-frame.c) |
|
112 // agree that aligned pointers are always absolute, machine-sized, |
|
113 // machine-signed pointers. |
|
114 if (encoding == DW_EH_PE_aligned) { |
|
115 assert(have_section_base_); |
|
116 |
|
117 // We don't need to align BUFFER in *our* address space. Rather, we |
|
118 // need to find the next position in our buffer that would be aligned |
|
119 // when the .eh_frame section the buffer contains is loaded into the |
|
120 // program's memory. So align assuming that buffer_base_ gets loaded at |
|
121 // address section_base_, where section_base_ itself may or may not be |
|
122 // aligned. |
|
123 |
|
124 // First, find the offset to START from the closest prior aligned |
|
125 // address. |
|
126 uint64 skew = section_base_ & (AddressSize() - 1); |
|
127 // Now find the offset from that aligned address to buffer. |
|
128 uint64 offset = skew + (buffer - buffer_base_); |
|
129 // Round up to the next boundary. |
|
130 uint64 aligned = (offset + AddressSize() - 1) & -AddressSize(); |
|
131 // Convert back to a pointer. |
|
132 const char *aligned_buffer = buffer_base_ + (aligned - skew); |
|
133 // Finally, store the length and actually fetch the pointer. |
|
134 *len = aligned_buffer - buffer + AddressSize(); |
|
135 return ReadAddress(aligned_buffer); |
|
136 } |
|
137 |
|
138 // Extract the value first, ignoring whether it's a pointer or an |
|
139 // offset relative to some base. |
|
140 uint64 offset; |
|
141 switch (encoding & 0x0f) { |
|
142 case DW_EH_PE_absptr: |
|
143 // DW_EH_PE_absptr is weird, as it is used as a meaningful value for |
|
144 // both the high and low nybble of encoding bytes. When it appears in |
|
145 // the high nybble, it means that the pointer is absolute, not an |
|
146 // offset from some base address. When it appears in the low nybble, |
|
147 // as here, it means that the pointer is stored as a normal |
|
148 // machine-sized and machine-signed address. A low nybble of |
|
149 // DW_EH_PE_absptr does not imply that the pointer is absolute; it is |
|
150 // correct for us to treat the value as an offset from a base address |
|
151 // if the upper nybble is not DW_EH_PE_absptr. |
|
152 offset = ReadAddress(buffer); |
|
153 *len = AddressSize(); |
|
154 break; |
|
155 |
|
156 case DW_EH_PE_uleb128: |
|
157 offset = ReadUnsignedLEB128(buffer, len); |
|
158 break; |
|
159 |
|
160 case DW_EH_PE_udata2: |
|
161 offset = ReadTwoBytes(buffer); |
|
162 *len = 2; |
|
163 break; |
|
164 |
|
165 case DW_EH_PE_udata4: |
|
166 offset = ReadFourBytes(buffer); |
|
167 *len = 4; |
|
168 break; |
|
169 |
|
170 case DW_EH_PE_udata8: |
|
171 offset = ReadEightBytes(buffer); |
|
172 *len = 8; |
|
173 break; |
|
174 |
|
175 case DW_EH_PE_sleb128: |
|
176 offset = ReadSignedLEB128(buffer, len); |
|
177 break; |
|
178 |
|
179 case DW_EH_PE_sdata2: |
|
180 offset = ReadTwoBytes(buffer); |
|
181 // Sign-extend from 16 bits. |
|
182 offset = (offset ^ 0x8000) - 0x8000; |
|
183 *len = 2; |
|
184 break; |
|
185 |
|
186 case DW_EH_PE_sdata4: |
|
187 offset = ReadFourBytes(buffer); |
|
188 // Sign-extend from 32 bits. |
|
189 offset = (offset ^ 0x80000000ULL) - 0x80000000ULL; |
|
190 *len = 4; |
|
191 break; |
|
192 |
|
193 case DW_EH_PE_sdata8: |
|
194 // No need to sign-extend; this is the full width of our type. |
|
195 offset = ReadEightBytes(buffer); |
|
196 *len = 8; |
|
197 break; |
|
198 |
|
199 default: |
|
200 abort(); |
|
201 } |
|
202 |
|
203 // Find the appropriate base address. |
|
204 uint64 base; |
|
205 switch (encoding & 0x70) { |
|
206 case DW_EH_PE_absptr: |
|
207 base = 0; |
|
208 break; |
|
209 |
|
210 case DW_EH_PE_pcrel: |
|
211 assert(have_section_base_); |
|
212 base = section_base_ + (buffer - buffer_base_); |
|
213 break; |
|
214 |
|
215 case DW_EH_PE_textrel: |
|
216 assert(have_text_base_); |
|
217 base = text_base_; |
|
218 break; |
|
219 |
|
220 case DW_EH_PE_datarel: |
|
221 assert(have_data_base_); |
|
222 base = data_base_; |
|
223 break; |
|
224 |
|
225 case DW_EH_PE_funcrel: |
|
226 assert(have_function_base_); |
|
227 base = function_base_; |
|
228 break; |
|
229 |
|
230 default: |
|
231 abort(); |
|
232 } |
|
233 |
|
234 uint64 pointer = base + offset; |
|
235 |
|
236 // Remove inappropriate upper bits. |
|
237 if (AddressSize() == 4) |
|
238 pointer = pointer & 0xffffffff; |
|
239 else |
|
240 assert(AddressSize() == sizeof(uint64)); |
|
241 |
|
242 return pointer; |
|
243 } |
|
244 |
|
245 } // namespace dwarf2reader |