elfcore.c revision 102944
1/*-
2 * Copyright (c) 1998 John D. Polstra
3 * All rights reserved.
4 *
5 * Redistribution and use in source and binary forms, with or without
6 * modification, are permitted provided that the following conditions
7 * are met:
8 * 1. Redistributions of source code must retain the above copyright
9 *    notice, this list of conditions and the following disclaimer.
10 * 2. Redistributions in binary form must reproduce the above copyright
11 *    notice, this list of conditions and the following disclaimer in the
12 *    documentation and/or other materials provided with the distribution.
13 *
14 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24 * SUCH DAMAGE.
25 */
26
27#include <sys/cdefs.h>
28__FBSDID("$FreeBSD: head/usr.bin/gcore/elfcore.c 102944 2002-09-04 23:29:10Z dwmalone $");
29
30#include <sys/param.h>
31#include <sys/procfs.h>
32#include <machine/elf.h>
33#include <vm/vm_param.h>
34#include <vm/vm.h>
35#include <vm/pmap.h>
36#include <vm/vm_map.h>
37#include <err.h>
38#include <errno.h>
39#include <fcntl.h>
40#include <stdio.h>
41#include <stdlib.h>
42#include <string.h>
43#include <unistd.h>
44
45#include "extern.h"
46
47/*
48 * Code for generating ELF core dumps.
49 */
50
51typedef void (*segment_callback)(vm_map_entry_t, void *);
52
53/* Closure for cb_put_phdr(). */
54struct phdr_closure {
55	Elf_Phdr *phdr;		/* Program header to fill in */
56	Elf_Off offset;		/* Offset of segment in core file */
57};
58
/*
 * Running totals accumulated by cb_size_segment() as it is called for
 * each entry of the memory map.
 */
struct sseg_closure {
	/* Number of segments visited so far. */
	int count;
	/* Sum of the sizes (end - start) of the segments visited so far. */
	size_t size;
};
64
65static void cb_put_phdr(vm_map_entry_t, void *);
66static void cb_size_segment(vm_map_entry_t, void *);
67static void each_writable_segment(vm_map_entry_t, segment_callback,
68    void *closure);
69static void elf_corehdr(int fd, pid_t, vm_map_entry_t, int numsegs,
70    void *hdr, size_t hdrsize);
71static void elf_puthdr(vm_map_entry_t, void *, size_t *,
72    const prstatus_t *, const prfpregset_t *, const prpsinfo_t *, int numsegs);
73static void elf_putnote(void *dst, size_t *off, const char *name, int type,
74    const void *desc, size_t descsz);
75static void freemap(vm_map_entry_t);
76static void readhdrinfo(pid_t, prstatus_t *, prfpregset_t *, prpsinfo_t *);
77static vm_map_entry_t readmap(pid_t);
78
79/*
80 * Write an ELF coredump for the given pid to the given fd.
81 */
82void
83elf_coredump(int fd, pid_t pid)
84{
85	vm_map_entry_t map;
86	struct sseg_closure seginfo;
87	void *hdr;
88	size_t hdrsize;
89	char memname[64];
90	int memfd;
91	Elf_Phdr *php;
92	int i;
93
94	/* Get the program's memory map. */
95	map = readmap(pid);
96
97	/* Size the program segments. */
98	seginfo.count = 0;
99	seginfo.size = 0;
100	each_writable_segment(map, cb_size_segment, &seginfo);
101
102	/*
103	 * Calculate the size of the core file header area by making
104	 * a dry run of generating it.  Nothing is written, but the
105	 * size is calculated.
106	 */
107	hdrsize = 0;
108	elf_puthdr(map, (void *)NULL, &hdrsize,
109	    (const prstatus_t *)NULL, (const prfpregset_t *)NULL,
110	    (const prpsinfo_t *)NULL, seginfo.count);
111
112	/*
113	 * Allocate memory for building the header, fill it up,
114	 * and write it out.
115	 */
116	hdr = malloc(hdrsize);
117	if ((hdr = malloc(hdrsize)) == NULL)
118		errx(1, "out of memory");
119	elf_corehdr(fd, pid, map, seginfo.count, hdr, hdrsize);
120
121	/* Write the contents of all of the writable segments. */
122	snprintf(memname, sizeof memname, "/proc/%d/mem", pid);
123	if ((memfd = open(memname, O_RDONLY)) == -1)
124		err(1, "cannot open %s", memname);
125
126	php = (Elf_Phdr *)((char *)hdr + sizeof(Elf_Ehdr)) + 1;
127	for (i = 0;  i < seginfo.count;  i++) {
128		uintmax_t nleft = php->p_filesz;
129
130		lseek(memfd, (off_t)php->p_vaddr, SEEK_SET);
131		while (nleft > 0) {
132			char buf[8*1024];
133			size_t nwant;
134			ssize_t ngot;
135
136			if (nleft > sizeof(buf))
137				nwant = sizeof buf;
138			else
139				nwant = nleft;
140			ngot = read(memfd, buf, nwant);
141			if (ngot == -1)
142				err(1, "read from %s", memname);
143			if ((size_t)ngot < nwant)
144				errx(1, "short read from %s:"
145				    " wanted %d, got %d", memname,
146				    nwant, ngot);
147			ngot = write(fd, buf, nwant);
148			if (ngot == -1)
149				err(1, "write of segment %d failed", i);
150			if ((size_t)ngot != nwant)
151				errx(1, "short write");
152			nleft -= nwant;
153		}
154		php++;
155	}
156	close(memfd);
157	free(hdr);
158	freemap(map);
159}
160
161/*
162 * A callback for each_writable_segment() to write out the segment's
163 * program header entry.
164 */
165static void
166cb_put_phdr(vm_map_entry_t entry, void *closure)
167{
168	struct phdr_closure *phc = (struct phdr_closure *)closure;
169	Elf_Phdr *phdr = phc->phdr;
170
171	phc->offset = round_page(phc->offset);
172
173	phdr->p_type = PT_LOAD;
174	phdr->p_offset = phc->offset;
175	phdr->p_vaddr = entry->start;
176	phdr->p_paddr = 0;
177	phdr->p_filesz = phdr->p_memsz = entry->end - entry->start;
178	phdr->p_align = PAGE_SIZE;
179	phdr->p_flags = 0;
180	if (entry->protection & VM_PROT_READ)
181		phdr->p_flags |= PF_R;
182	if (entry->protection & VM_PROT_WRITE)
183		phdr->p_flags |= PF_W;
184	if (entry->protection & VM_PROT_EXECUTE)
185		phdr->p_flags |= PF_X;
186
187	phc->offset += phdr->p_filesz;
188	phc->phdr++;
189}
190
191/*
192 * A callback for each_writable_segment() to gather information about
193 * the number of segments and their total size.
194 */
195static void
196cb_size_segment(vm_map_entry_t entry, void *closure)
197{
198	struct sseg_closure *ssc = (struct sseg_closure *)closure;
199
200	ssc->count++;
201	ssc->size += entry->end - entry->start;
202}
203
204/*
205 * For each segment in the given memory map, call the given function
206 * with a pointer to the map entry and some arbitrary caller-supplied
207 * data.
208 */
209static void
210each_writable_segment(vm_map_entry_t map, segment_callback func, void *closure)
211{
212	vm_map_entry_t entry;
213
214	for (entry = map;  entry != NULL;  entry = entry->next)
215		(*func)(entry, closure);
216}
217
218/*
219 * Write the core file header to the file, including padding up to
220 * the page boundary.
221 */
222static void
223elf_corehdr(int fd, pid_t pid, vm_map_entry_t map, int numsegs, void *hdr,
224    size_t hdrsize)
225{
226	size_t off;
227	prstatus_t status;
228	prfpregset_t fpregset;
229	prpsinfo_t psinfo;
230
231	/* Gather the information for the header. */
232	readhdrinfo(pid, &status, &fpregset, &psinfo);
233
234	/* Fill in the header. */
235	memset(hdr, 0, hdrsize);
236	off = 0;
237	elf_puthdr(map, hdr, &off, &status, &fpregset, &psinfo, numsegs);
238
239	/* Write it to the core file. */
240	if (write(fd, hdr, hdrsize) == -1)
241		err(1, "write");
242}
243
244/*
245 * Generate the ELF coredump header into the buffer at "dst".  "dst" may
246 * be NULL, in which case the header is sized but not actually generated.
247 */
248static void
249elf_puthdr(vm_map_entry_t map, void *dst, size_t *off, const prstatus_t *status,
250    const prfpregset_t *fpregset, const prpsinfo_t *psinfo, int numsegs)
251{
252	size_t ehoff;
253	size_t phoff;
254	size_t noteoff;
255	size_t notesz;
256
257	ehoff = *off;
258	*off += sizeof(Elf_Ehdr);
259
260	phoff = *off;
261	*off += (numsegs + 1) * sizeof(Elf_Phdr);
262
263	noteoff = *off;
264	elf_putnote(dst, off, "FreeBSD", NT_PRSTATUS, status,
265	    sizeof *status);
266	elf_putnote(dst, off, "FreeBSD", NT_FPREGSET, fpregset,
267	    sizeof *fpregset);
268	elf_putnote(dst, off, "FreeBSD", NT_PRPSINFO, psinfo,
269	    sizeof *psinfo);
270	notesz = *off - noteoff;
271
272	/* Align up to a page boundary for the program segments. */
273	*off = round_page(*off);
274
275	if (dst != NULL) {
276		Elf_Ehdr *ehdr;
277		Elf_Phdr *phdr;
278		struct phdr_closure phc;
279
280		/*
281		 * Fill in the ELF header.
282		 */
283		ehdr = (Elf_Ehdr *)((char *)dst + ehoff);
284		ehdr->e_ident[EI_MAG0] = ELFMAG0;
285		ehdr->e_ident[EI_MAG1] = ELFMAG1;
286		ehdr->e_ident[EI_MAG2] = ELFMAG2;
287		ehdr->e_ident[EI_MAG3] = ELFMAG3;
288		ehdr->e_ident[EI_CLASS] = ELF_CLASS;
289		ehdr->e_ident[EI_DATA] = ELF_DATA;
290		ehdr->e_ident[EI_VERSION] = EV_CURRENT;
291		ehdr->e_ident[EI_OSABI] = ELFOSABI_FREEBSD;
292		ehdr->e_ident[EI_ABIVERSION] = 0;
293		ehdr->e_ident[EI_PAD] = 0;
294		ehdr->e_type = ET_CORE;
295		ehdr->e_machine = ELF_ARCH;
296		ehdr->e_version = EV_CURRENT;
297		ehdr->e_entry = 0;
298		ehdr->e_phoff = phoff;
299		ehdr->e_flags = 0;
300		ehdr->e_ehsize = sizeof(Elf_Ehdr);
301		ehdr->e_phentsize = sizeof(Elf_Phdr);
302		ehdr->e_phnum = numsegs + 1;
303		ehdr->e_shentsize = sizeof(Elf_Shdr);
304		ehdr->e_shnum = 0;
305		ehdr->e_shstrndx = SHN_UNDEF;
306
307		/*
308		 * Fill in the program header entries.
309		 */
310		phdr = (Elf_Phdr *)((char *)dst + phoff);
311
312		/* The note segment. */
313		phdr->p_type = PT_NOTE;
314		phdr->p_offset = noteoff;
315		phdr->p_vaddr = 0;
316		phdr->p_paddr = 0;
317		phdr->p_filesz = notesz;
318		phdr->p_memsz = 0;
319		phdr->p_flags = 0;
320		phdr->p_align = 0;
321		phdr++;
322
323		/* All the writable segments from the program. */
324		phc.phdr = phdr;
325		phc.offset = *off;
326		each_writable_segment(map, cb_put_phdr, &phc);
327	}
328}
329
330/*
331 * Emit one note section to "dst", or just size it if "dst" is NULL.
332 */
333static void
334elf_putnote(void *dst, size_t *off, const char *name, int type,
335    const void *desc, size_t descsz)
336{
337	Elf_Note note;
338
339	note.n_namesz = strlen(name) + 1;
340	note.n_descsz = descsz;
341	note.n_type = type;
342	if (dst != NULL)
343		bcopy(&note, (char *)dst + *off, sizeof note);
344	*off += sizeof note;
345	if (dst != NULL)
346		bcopy(name, (char *)dst + *off, note.n_namesz);
347	*off += roundup2(note.n_namesz, sizeof(Elf_Size));
348	if (dst != NULL)
349		bcopy(desc, (char *)dst + *off, note.n_descsz);
350	*off += roundup2(note.n_descsz, sizeof(Elf_Size));
351}
352
353/*
354 * Free the memory map.
355 */
356static void
357freemap(vm_map_entry_t map)
358{
359	while (map != NULL) {
360		vm_map_entry_t next = map->next;
361		free(map);
362		map = next;
363	}
364}
365
366/*
367 * Read the process information necessary to fill in the core file's header.
368 */
369static void
370readhdrinfo(pid_t pid, prstatus_t *status, prfpregset_t *fpregset,
371    prpsinfo_t *psinfo)
372{
373	char name[64];
374	char line[256];
375	int fd;
376	int i;
377	int n;
378
379	memset(status, 0, sizeof *status);
380	status->pr_version = PRSTATUS_VERSION;
381	status->pr_statussz = sizeof(prstatus_t);
382	status->pr_gregsetsz = sizeof(gregset_t);
383	status->pr_fpregsetsz = sizeof(fpregset_t);
384	status->pr_osreldate = __FreeBSD_version;
385	status->pr_pid = pid;
386
387	memset(fpregset, 0, sizeof *fpregset);
388
389	memset(psinfo, 0, sizeof *psinfo);
390	psinfo->pr_version = PRPSINFO_VERSION;
391	psinfo->pr_psinfosz = sizeof(prpsinfo_t);
392
393	/* Read the general registers. */
394	snprintf(name, sizeof name, "/proc/%d/regs", pid);
395	if ((fd = open(name, O_RDONLY)) == -1)
396		err(1, "cannot open %s", name);
397	if ((n = read(fd, &status->pr_reg, sizeof status->pr_reg)) == -1)
398		err(1, "read error from %s", name);
399	if ((size_t)n < sizeof(status->pr_reg))
400		errx(1, "short read from %s: wanted %u, got %d", name,
401		    sizeof status->pr_reg, n);
402	close(fd);
403
404	/* Read the floating point registers. */
405	snprintf(name, sizeof name, "/proc/%d/fpregs", pid);
406	if ((fd = open(name, O_RDONLY)) == -1)
407		err(1, "cannot open %s", name);
408	if ((n = read(fd, fpregset, sizeof *fpregset)) == -1)
409		err(1, "read error from %s", name);
410	if ((size_t)n < sizeof(*fpregset))
411		errx(1, "short read from %s: wanted %u, got %d", name,
412		    sizeof *fpregset, n);
413	close(fd);
414
415	/* Read and parse the process status. */
416	snprintf(name, sizeof name, "/proc/%d/status", pid);
417	if ((fd = open(name, O_RDONLY)) == -1)
418		err(1, "cannot open %s", name);
419	if ((n = read(fd, line, sizeof line - 1)) == -1)
420		err(1, "read error from %s", name);
421	if (n > MAXCOMLEN)
422		n = MAXCOMLEN;
423	for (i = 0;  i < n && line[i] != ' ';  i++)
424		psinfo->pr_fname[i] = line[i];
425	strncpy(psinfo->pr_psargs, psinfo->pr_fname, PRARGSZ);
426	close(fd);
427}
428
429/*
430 * Read the process's memory map using procfs, and return a list of
431 * VM map entries.  Only the non-device read/writable segments are
432 * returned.  The map entries in the list aren't fully filled in; only
433 * the items we need are present.
434 */
435static vm_map_entry_t
436readmap(pid_t pid)
437{
438	char mapname[64];
439	int mapfd;
440	ssize_t mapsize;
441	size_t bufsize;
442	char *mapbuf;
443	int pos;
444	vm_map_entry_t map;
445	vm_map_entry_t *linkp;
446
447	snprintf(mapname, sizeof mapname, "/proc/%d/map", pid);
448	if ((mapfd = open(mapname, O_RDONLY)) == -1)
449		err(1, "cannot open %s", mapname);
450
451	/*
452	 * Procfs requires (for consistency) that the entire memory map
453	 * be read with a single read() call.  Start with a reasonably sized
454	 * buffer, and double it until it is big enough.
455	 */
456	bufsize = 8 * 1024;
457	mapbuf = NULL;
458	for ( ; ; ) {
459		if ((mapbuf = realloc(mapbuf, bufsize + 1)) == NULL)
460			errx(1, "out of memory");
461		mapsize = read(mapfd, mapbuf, bufsize);
462		if (mapsize != -1 || errno != EFBIG)
463			break;
464		bufsize *= 2;
465		/* This lseek shouldn't be necessary, but it is. */
466		lseek(mapfd, (off_t)0, SEEK_SET);
467	}
468	if (mapsize == -1)
469		err(1, "read error from %s", mapname);
470	if (mapsize == 0)
471		errx(1, "empty map file %s", mapname);
472	mapbuf[mapsize] = 0;
473	close(mapfd);
474
475	pos = 0;
476	map = NULL;
477	linkp = &map;
478	while (pos < mapsize) {
479		vm_map_entry_t ent;
480		vm_offset_t start;
481		vm_offset_t end;
482		char prot[4];
483		char type[16];
484		int n;
485		int len;
486
487		len = 0;
488		n = sscanf(mapbuf + pos, "%x %x %*d %*d %*x %3[-rwx]"
489		    " %*d %*d %*x %*s %*s %16s%*[\n]%n",
490		    &start, &end, prot, type, &len);
491		if (n != 4)
492			errx(1, "ill-formed line in %s", mapname);
493		pos += len;
494
495		/* Ignore segments of the wrong kind, and unwritable ones */
496		if (strncmp(prot, "rw", 2) != 0 ||
497		    (strcmp(type, "default") != 0 &&
498		    strcmp(type, "vnode") != 0 &&
499		    strcmp(type, "swap") != 0))
500			continue;
501
502		if ((ent = (vm_map_entry_t)calloc(1, sizeof *ent)) == NULL)
503			errx(1, "out of memory");
504		ent->start = start;
505		ent->end = end;
506		ent->protection = VM_PROT_READ | VM_PROT_WRITE;
507		if (prot[2] == 'x')
508		    ent->protection |= VM_PROT_EXECUTE;
509
510		*linkp = ent;
511		linkp = &ent->next;
512	}
513	free(mapbuf);
514	return map;
515}
516