blob: 9ef3ad3789c17d17eb043cb6f33d2dec6d3e0402 [file] [log] [blame]
b.liue9582032025-04-17 19:18:16 +08001/*
2 * parse_vdso.c: Linux reference vDSO parser
3 * Written by Andrew Lutomirski, 2011-2014.
4 *
5 * This code is meant to be linked in to various programs that run on Linux.
6 * As such, it is available with as few restrictions as possible. This file
7 * is licensed under the Creative Commons Zero License, version 1.0,
8 * available at http://creativecommons.org/publicdomain/zero/1.0/legalcode
9 *
10 * The vDSO is a regular ELF DSO that the kernel maps into user space when
11 * it starts a program. It works equally well in statically and dynamically
12 * linked binaries.
13 *
14 * This code is tested on x86. In principle it should work on any
15 * architecture that has a vDSO.
16 */
17
18#include <stdbool.h>
19#include <stdint.h>
20#include <string.h>
21#include <limits.h>
22#include <elf.h>
23
24/*
25 * To use this vDSO parser, first call one of the vdso_init_* functions.
26 * If you've already parsed auxv, then pass the value of AT_SYSINFO_EHDR
27 * to vdso_init_from_sysinfo_ehdr. Otherwise pass auxv to vdso_init_from_auxv.
28 * Then call vdso_sym for each symbol you want. For example, to look up
29 * gettimeofday on x86_64, use:
30 *
31 * <some pointer> = vdso_sym("LINUX_2.6", "gettimeofday");
32 * or
33 * <some pointer> = vdso_sym("LINUX_2.6", "__vdso_gettimeofday");
34 *
35 * vdso_sym will return 0 if the symbol doesn't exist or if the init function
36 * failed or was not called. vdso_sym is a little slow, so its return value
37 * should be cached.
38 *
39 * vdso_sym is threadsafe; the init functions are not.
40 *
41 * These are the prototypes:
42 */
43extern void vdso_init_from_auxv(void *auxv);
44extern void vdso_init_from_sysinfo_ehdr(uintptr_t base);
45extern void *vdso_sym(const char *version, const char *name);
46
47
48/* And here's the code. */
49#ifndef ELF_BITS
50# if ULONG_MAX > 0xffffffffUL
51# define ELF_BITS 64
52# else
53# define ELF_BITS 32
54# endif
55#endif
56
57#define ELF_BITS_XFORM2(bits, x) Elf##bits##_##x
58#define ELF_BITS_XFORM(bits, x) ELF_BITS_XFORM2(bits, x)
59#define ELF(x) ELF_BITS_XFORM(ELF_BITS, x)
60
61static struct vdso_info
62{
63 bool valid;
64
65 /* Load information */
66 uintptr_t load_addr;
67 uintptr_t load_offset; /* load_addr - recorded vaddr */
68
69 /* Symbol table */
70 ELF(Sym) *symtab;
71 const char *symstrings;
72 ELF(Word) *bucket, *chain;
73 ELF(Word) nbucket, nchain;
74
75 /* Version table */
76 ELF(Versym) *versym;
77 ELF(Verdef) *verdef;
78} vdso_info;
79
80/*
81 * Straight from the ELF specification...and then tweaked slightly, in order to
82 * avoid a few clang warnings.
83 */
84static unsigned long elf_hash(const char *name)
85{
86 unsigned long h = 0, g;
87 const unsigned char *uch_name = (const unsigned char *)name;
88
89 while (*uch_name)
90 {
91 h = (h << 4) + *uch_name++;
92 g = h & 0xf0000000;
93 if (g)
94 h ^= g >> 24;
95 h &= ~g;
96 }
97 return h;
98}
99
100void vdso_init_from_sysinfo_ehdr(uintptr_t base)
101{
102 size_t i;
103 bool found_vaddr = false;
104
105 vdso_info.valid = false;
106
107 vdso_info.load_addr = base;
108
109 ELF(Ehdr) *hdr = (ELF(Ehdr)*)base;
110 if (hdr->e_ident[EI_CLASS] !=
111 (ELF_BITS == 32 ? ELFCLASS32 : ELFCLASS64)) {
112 return; /* Wrong ELF class -- check ELF_BITS */
113 }
114
115 ELF(Phdr) *pt = (ELF(Phdr)*)(vdso_info.load_addr + hdr->e_phoff);
116 ELF(Dyn) *dyn = 0;
117
118 /*
119 * We need two things from the segment table: the load offset
120 * and the dynamic table.
121 */
122 for (i = 0; i < hdr->e_phnum; i++)
123 {
124 if (pt[i].p_type == PT_LOAD && !found_vaddr) {
125 found_vaddr = true;
126 vdso_info.load_offset = base
127 + (uintptr_t)pt[i].p_offset
128 - (uintptr_t)pt[i].p_vaddr;
129 } else if (pt[i].p_type == PT_DYNAMIC) {
130 dyn = (ELF(Dyn)*)(base + pt[i].p_offset);
131 }
132 }
133
134 if (!found_vaddr || !dyn)
135 return; /* Failed */
136
137 /*
138 * Fish out the useful bits of the dynamic table.
139 */
140 ELF(Word) *hash = 0;
141 vdso_info.symstrings = 0;
142 vdso_info.symtab = 0;
143 vdso_info.versym = 0;
144 vdso_info.verdef = 0;
145 for (i = 0; dyn[i].d_tag != DT_NULL; i++) {
146 switch (dyn[i].d_tag) {
147 case DT_STRTAB:
148 vdso_info.symstrings = (const char *)
149 ((uintptr_t)dyn[i].d_un.d_ptr
150 + vdso_info.load_offset);
151 break;
152 case DT_SYMTAB:
153 vdso_info.symtab = (ELF(Sym) *)
154 ((uintptr_t)dyn[i].d_un.d_ptr
155 + vdso_info.load_offset);
156 break;
157 case DT_HASH:
158 hash = (ELF(Word) *)
159 ((uintptr_t)dyn[i].d_un.d_ptr
160 + vdso_info.load_offset);
161 break;
162 case DT_VERSYM:
163 vdso_info.versym = (ELF(Versym) *)
164 ((uintptr_t)dyn[i].d_un.d_ptr
165 + vdso_info.load_offset);
166 break;
167 case DT_VERDEF:
168 vdso_info.verdef = (ELF(Verdef) *)
169 ((uintptr_t)dyn[i].d_un.d_ptr
170 + vdso_info.load_offset);
171 break;
172 }
173 }
174 if (!vdso_info.symstrings || !vdso_info.symtab || !hash)
175 return; /* Failed */
176
177 if (!vdso_info.verdef)
178 vdso_info.versym = 0;
179
180 /* Parse the hash table header. */
181 vdso_info.nbucket = hash[0];
182 vdso_info.nchain = hash[1];
183 vdso_info.bucket = &hash[2];
184 vdso_info.chain = &hash[vdso_info.nbucket + 2];
185
186 /* That's all we need. */
187 vdso_info.valid = true;
188}
189
190static bool vdso_match_version(ELF(Versym) ver,
191 const char *name, ELF(Word) hash)
192{
193 /*
194 * This is a helper function to check if the version indexed by
195 * ver matches name (which hashes to hash).
196 *
197 * The version definition table is a mess, and I don't know how
198 * to do this in better than linear time without allocating memory
199 * to build an index. I also don't know why the table has
200 * variable size entries in the first place.
201 *
202 * For added fun, I can't find a comprehensible specification of how
203 * to parse all the weird flags in the table.
204 *
205 * So I just parse the whole table every time.
206 */
207
208 /* First step: find the version definition */
209 ver &= 0x7fff; /* Apparently bit 15 means "hidden" */
210 ELF(Verdef) *def = vdso_info.verdef;
211 while(true) {
212 if ((def->vd_flags & VER_FLG_BASE) == 0
213 && (def->vd_ndx & 0x7fff) == ver)
214 break;
215
216 if (def->vd_next == 0)
217 return false; /* No definition. */
218
219 def = (ELF(Verdef) *)((char *)def + def->vd_next);
220 }
221
222 /* Now figure out whether it matches. */
223 ELF(Verdaux) *aux = (ELF(Verdaux)*)((char *)def + def->vd_aux);
224 return def->vd_hash == hash
225 && !strcmp(name, vdso_info.symstrings + aux->vda_name);
226}
227
228void *vdso_sym(const char *version, const char *name)
229{
230 unsigned long ver_hash;
231 if (!vdso_info.valid)
232 return 0;
233
234 ver_hash = elf_hash(version);
235 ELF(Word) chain = vdso_info.bucket[elf_hash(name) % vdso_info.nbucket];
236
237 for (; chain != STN_UNDEF; chain = vdso_info.chain[chain]) {
238 ELF(Sym) *sym = &vdso_info.symtab[chain];
239
240 /* Check for a defined global or weak function w/ right name. */
241 if (ELF64_ST_TYPE(sym->st_info) != STT_FUNC)
242 continue;
243 if (ELF64_ST_BIND(sym->st_info) != STB_GLOBAL &&
244 ELF64_ST_BIND(sym->st_info) != STB_WEAK)
245 continue;
246 if (sym->st_shndx == SHN_UNDEF)
247 continue;
248 if (strcmp(name, vdso_info.symstrings + sym->st_name))
249 continue;
250
251 /* Check symbol version. */
252 if (vdso_info.versym
253 && !vdso_match_version(vdso_info.versym[chain],
254 version, ver_hash))
255 continue;
256
257 return (void *)(vdso_info.load_offset + sym->st_value);
258 }
259
260 return 0;
261}
262
263void vdso_init_from_auxv(void *auxv)
264{
265 ELF(auxv_t) *elf_auxv = auxv;
266 for (int i = 0; elf_auxv[i].a_type != AT_NULL; i++)
267 {
268 if (elf_auxv[i].a_type == AT_SYSINFO_EHDR) {
269 vdso_init_from_sysinfo_ehdr(elf_auxv[i].a_un.a_val);
270 return;
271 }
272 }
273
274 vdso_info.valid = false;
275}