mirror of
https://github.com/checkpoint-restore/criu
synced 2025-08-31 06:15:24 +00:00
Make fdinfo_entry carry only the minimal info describing a file descriptor -- the fd value itself, the fd type (regular file, exe link, cwd, filemap and it will be pipes, sockets, inotifies, etc.) and the describing file ID. The mentioned ID will identify the type-d object, e.g. for regfiles this ID is already generated with file-ids.c code. The other part of this structure describes a regfile (i.e. a file opened with open syscall). I put this new entry at the end of the fdinfo_entry just to make the patching simpler. Soon this entry will be dumped into its own file. Signed-off-by: Pavel Emelyanov <xemul@parallels.com>
1522 lines
31 KiB
C
1522 lines
31 KiB
C
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <stdarg.h>
|
|
#include <signal.h>
|
|
#include <limits.h>
|
|
#include <unistd.h>
|
|
#include <errno.h>
|
|
#include <string.h>
|
|
#include <parasite.h>
|
|
|
|
#include <fcntl.h>
|
|
|
|
#include <sys/types.h>
|
|
#include <sys/stat.h>
|
|
#include <sys/vfs.h>
|
|
|
|
#include <sys/sendfile.h>
|
|
|
|
#include <linux/major.h>
|
|
|
|
#include "types.h"
|
|
#include "list.h"
|
|
#include "file-ids.h"
|
|
|
|
#include "compiler.h"
|
|
#include "crtools.h"
|
|
#include "syscall.h"
|
|
#include "ptrace.h"
|
|
#include "util.h"
|
|
#include "sockets.h"
|
|
#include "namespaces.h"
|
|
#include "image.h"
|
|
#include "proc_parse.h"
|
|
#include "parasite-syscall.h"
|
|
|
|
#ifndef CONFIG_X86_64
|
|
# error No x86-32 support yet
|
|
#endif
|
|
|
|
static char big_buffer[PATH_MAX];
|
|
static char loc_buf[PAGE_SIZE];
|
|
|
|
void free_pstree(struct list_head *pstree_list)
|
|
{
|
|
struct pstree_item *item, *p;
|
|
|
|
list_for_each_entry_safe(item, p, pstree_list, list) {
|
|
xfree(item->children);
|
|
xfree(item->threads);
|
|
xfree(item);
|
|
}
|
|
|
|
INIT_LIST_HEAD(pstree_list);
|
|
}
|
|
|
|
void free_mappings(struct list_head *vma_area_list)
|
|
{
|
|
struct vma_area *vma_area, *p;
|
|
|
|
list_for_each_entry_safe(vma_area, p, vma_area_list, list) {
|
|
if (vma_area->vm_file_fd > 0)
|
|
close(vma_area->vm_file_fd);
|
|
free(vma_area);
|
|
}
|
|
|
|
INIT_LIST_HEAD(vma_area_list);
|
|
}
|
|
|
|
static int collect_mappings(pid_t pid, struct list_head *vma_area_list)
|
|
{
|
|
int ret = -1;
|
|
|
|
pr_info("\n");
|
|
pr_info("Collecting mappings (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
ret = parse_maps(pid, vma_area_list, true);
|
|
if (ret < 0)
|
|
goto err;
|
|
|
|
pr_info_vma_list(vma_area_list);
|
|
|
|
pr_info("----------------------------------------\n");
|
|
ret = 0;
|
|
|
|
err:
|
|
return ret;
|
|
}
|
|
|
|
struct fd_parms {
|
|
unsigned long fd_name;
|
|
unsigned long pos;
|
|
unsigned int flags;
|
|
unsigned int type;
|
|
|
|
u32 id;
|
|
pid_t pid;
|
|
};
|
|
|
|
static int dump_one_reg_file(const struct fd_parms *p, int lfd,
|
|
const struct cr_fdset *cr_fdset,
|
|
bool do_close_lfd)
|
|
{
|
|
struct fdinfo_entry e;
|
|
char fd_str[128];
|
|
int len;
|
|
int ret = -1;
|
|
|
|
snprintf(fd_str, sizeof(fd_str), "/proc/self/fd/%d", lfd);
|
|
len = readlink(fd_str, big_buffer, sizeof(big_buffer) - 1);
|
|
if (len < 0) {
|
|
pr_perror("Can't readlink %s", fd_str);
|
|
goto err;
|
|
}
|
|
|
|
big_buffer[len] = '\0';
|
|
pr_info("Dumping path for %lx fd via self %d [%s]\n",
|
|
p->fd_name, lfd, big_buffer);
|
|
|
|
if (do_close_lfd)
|
|
close(lfd);
|
|
|
|
e.type = p->type;
|
|
e.addr = p->fd_name;
|
|
e.id = p->id;
|
|
|
|
ret = fd_id_generate(p->pid, &e);
|
|
if (ret < 0)
|
|
goto err;
|
|
|
|
e.rfe.len = len;
|
|
e.rfe.flags = p->flags;
|
|
e.rfe.pos = p->pos;
|
|
e.rfe.id = e.id;
|
|
|
|
pr_info("fdinfo: type: %2x len: %2x flags: %4x pos: %8lx addr: %16lx\n",
|
|
p->type, len, p->flags, p->pos, p->fd_name);
|
|
|
|
if (write_img(cr_fdset->fds[CR_FD_FDINFO], &e))
|
|
goto err;
|
|
if (write_img_buf(cr_fdset->fds[CR_FD_FDINFO], big_buffer, e.rfe.len))
|
|
goto err;
|
|
|
|
ret = 0;
|
|
err:
|
|
return ret;
|
|
}
|
|
|
|
static int dump_task_special_files(pid_t pid, const struct cr_fdset *cr_fdset)
|
|
{
|
|
struct fd_parms params;
|
|
int fd, ret;
|
|
|
|
/* Dump /proc/pid/cwd */
|
|
params = (struct fd_parms) {
|
|
.id = FD_ID_INVALID,
|
|
.pid = FD_PID_INVALID,
|
|
.type = FDINFO_CWD,
|
|
};
|
|
|
|
fd = open_proc(pid, "cwd");
|
|
if (fd < 0)
|
|
return -1;
|
|
ret = dump_one_reg_file(¶ms, fd, cr_fdset, 1);
|
|
if (ret)
|
|
return ret;
|
|
|
|
/* Dump /proc/pid/exe */
|
|
params = (struct fd_parms) {
|
|
.id = FD_ID_INVALID,
|
|
.pid = FD_PID_INVALID,
|
|
.type = FDINFO_EXE,
|
|
};
|
|
|
|
fd = open_proc(pid, "exe");
|
|
if (fd < 0)
|
|
return -1;
|
|
ret = dump_one_reg_file(¶ms, fd, cr_fdset, 1);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int dump_pipe_and_data(int lfd, struct pipe_entry *e,
|
|
const struct cr_fdset *cr_fdset)
|
|
{
|
|
int fd_pipes;
|
|
int steal_pipe[2];
|
|
int pipe_size;
|
|
int has_bytes;
|
|
int ret = -1;
|
|
|
|
fd_pipes = cr_fdset->fds[CR_FD_PIPES];
|
|
|
|
pr_info("Dumping data from pipe %x\n", e->pipeid);
|
|
if (pipe(steal_pipe) < 0) {
|
|
pr_perror("Can't create pipe for stealing data");
|
|
goto err;
|
|
}
|
|
|
|
pipe_size = fcntl(lfd, F_GETPIPE_SZ);
|
|
if (pipe_size < 0) {
|
|
pr_err("Can't obtain piped data size\n");
|
|
goto err;
|
|
}
|
|
|
|
has_bytes = tee(lfd, steal_pipe[1], pipe_size, SPLICE_F_NONBLOCK);
|
|
if (has_bytes < 0) {
|
|
if (errno != EAGAIN) {
|
|
pr_perror("Can't pick pipe data");
|
|
goto err_close;
|
|
} else
|
|
has_bytes = 0;
|
|
}
|
|
|
|
e->bytes = has_bytes;
|
|
if (write_img(fd_pipes, e))
|
|
goto err_close;
|
|
|
|
if (has_bytes) {
|
|
ret = splice(steal_pipe[0], NULL, fd_pipes,
|
|
NULL, has_bytes, 0);
|
|
if (ret < 0) {
|
|
pr_perror("Can't push pipe data");
|
|
goto err_close;
|
|
}
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
err_close:
|
|
close(steal_pipe[0]);
|
|
close(steal_pipe[1]);
|
|
|
|
err:
|
|
return ret;
|
|
}
|
|
|
|
static int dump_one_pipe(const struct fd_parms *p, unsigned int id, int lfd,
|
|
const struct cr_fdset *cr_fdset)
|
|
{
|
|
struct pipe_entry e;
|
|
int ret = -1;
|
|
struct statfs stfs_buf;
|
|
|
|
if (fstatfs(lfd, &stfs_buf) < 0) {
|
|
pr_perror("Can't fstatfs on %ld", p->fd_name);
|
|
return -1;
|
|
}
|
|
|
|
if (stfs_buf.f_type != PIPEFS_MAGIC) {
|
|
pr_err("Dumping of FIFO's is not supported: %ld\n", p->fd_name);
|
|
return -1;
|
|
}
|
|
|
|
pr_info("Dumping pipe %ld/%x flags %x\n", p->fd_name, id, p->flags);
|
|
|
|
e.fd = p->fd_name;
|
|
e.pipeid = id;
|
|
e.flags = p->flags;
|
|
|
|
if (p->flags & O_WRONLY) {
|
|
e.bytes = 0;
|
|
ret = write_img(cr_fdset->fds[CR_FD_PIPES], &e);
|
|
} else
|
|
ret = dump_pipe_and_data(lfd, &e, cr_fdset);
|
|
|
|
err:
|
|
if (!ret)
|
|
pr_info("Dumped pipe: fd: %8x pipeid: %8x flags: %8x bytes: %8x\n",
|
|
e.fd, e.pipeid, e.flags, e.bytes);
|
|
else
|
|
pr_err("Dumping pipe %ld/%x flags %x\n", p->fd_name, id, p->flags);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int read_fd_params(pid_t pid, const char *fd, struct fd_parms *p)
|
|
{
|
|
FILE *file;
|
|
int ret;
|
|
|
|
file = fopen_proc(pid, "fdinfo/%s", fd);
|
|
if (!file)
|
|
return -1;
|
|
|
|
p->fd_name = atoi(fd);
|
|
ret = fscanf(file, "pos:\t%li\nflags:\t%o\n", &p->pos, &p->flags);
|
|
fclose(file);
|
|
|
|
if (ret != 2) {
|
|
pr_err("Bad format of fdinfo file (%d items, want 2)\n", ret);
|
|
return -1;
|
|
}
|
|
|
|
pr_info("%d fdinfo %s: pos: %16lx flags: %16o\n",
|
|
pid, fd, p->pos, p->flags);
|
|
|
|
p->pid = pid;
|
|
p->id = FD_ID_INVALID;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int dump_one_fd(pid_t pid, int pid_fd_dir, const char *d_name,
|
|
const struct cr_fdset *cr_fdset,
|
|
struct sk_queue *sk_queue)
|
|
{
|
|
struct stat fd_stat;
|
|
int err = -1;
|
|
struct fd_parms p;
|
|
int lfd;
|
|
|
|
if (read_fd_params(pid, d_name, &p))
|
|
return -1;
|
|
|
|
lfd = openat(pid_fd_dir, d_name, O_RDONLY);
|
|
if (lfd < 0) {
|
|
err = try_dump_socket(pid, p.fd_name, cr_fdset, sk_queue);
|
|
if (err != 1)
|
|
return err;
|
|
|
|
pr_perror("Failed to open %d/%ld", pid_fd_dir, p.fd_name);
|
|
return -1;
|
|
}
|
|
|
|
if (fstat(lfd, &fd_stat) < 0) {
|
|
pr_perror("Can't get stat on %ld", p.fd_name);
|
|
goto out_close;
|
|
}
|
|
|
|
if (S_ISCHR(fd_stat.st_mode) &&
|
|
(major(fd_stat.st_rdev) == TTY_MAJOR ||
|
|
major(fd_stat.st_rdev) == UNIX98_PTY_SLAVE_MAJOR)) {
|
|
/* skip only standard destriptors */
|
|
if (p.fd_name < 3) {
|
|
err = 0;
|
|
pr_info("... Skipping tty ... %d/%ld\n",
|
|
pid_fd_dir, p.fd_name);
|
|
goto out_close;
|
|
}
|
|
goto err;
|
|
}
|
|
|
|
if (S_ISREG(fd_stat.st_mode) ||
|
|
S_ISDIR(fd_stat.st_mode) ||
|
|
(S_ISCHR(fd_stat.st_mode) && major(fd_stat.st_rdev) == MEM_MAJOR)) {
|
|
|
|
p.id = MAKE_FD_GENID(fd_stat.st_dev, fd_stat.st_ino, p.pos);
|
|
p.type = FDINFO_REG;
|
|
|
|
return dump_one_reg_file(&p, lfd, cr_fdset, 1);
|
|
}
|
|
|
|
if (S_ISFIFO(fd_stat.st_mode))
|
|
return dump_one_pipe(&p, fd_stat.st_ino, lfd, cr_fdset);
|
|
|
|
err:
|
|
pr_err("Can't dump file %ld of that type [%x]\n", p.fd_name, fd_stat.st_mode);
|
|
|
|
out_close:
|
|
close_safe(&lfd);
|
|
return err;
|
|
}
|
|
|
|
static int dump_task_files(pid_t pid, const struct cr_fdset *cr_fdset,
|
|
struct sk_queue *sk_queue)
|
|
{
|
|
struct dirent *de;
|
|
unsigned long pos;
|
|
unsigned int flags;
|
|
DIR *fd_dir;
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping opened files (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
/*
|
|
* Dump special files at the beginning. We might need
|
|
* to re-read them in restorer, so better to make it
|
|
* fast.
|
|
*/
|
|
if (dump_task_special_files(pid, cr_fdset)) {
|
|
pr_err("Can't dump special files\n");
|
|
return -1;
|
|
}
|
|
|
|
fd_dir = opendir_proc(pid, "fd");
|
|
if (!fd_dir)
|
|
return -1;
|
|
|
|
while ((de = readdir(fd_dir))) {
|
|
if (!strcmp(de->d_name, "."))
|
|
continue;
|
|
if (!strcmp(de->d_name, ".."))
|
|
continue;
|
|
if (dump_one_fd(pid, dirfd(fd_dir), de->d_name, cr_fdset,
|
|
sk_queue))
|
|
return -1;
|
|
}
|
|
|
|
pr_info("----------------------------------------\n");
|
|
|
|
closedir(fd_dir);
|
|
return 0;
|
|
}
|
|
|
|
struct shmem_info
|
|
{
|
|
unsigned long size;
|
|
unsigned long shmid;
|
|
unsigned long start;
|
|
unsigned long end;
|
|
int pid;
|
|
};
|
|
|
|
static int nr_shmems;
|
|
static struct shmem_info *shmems;
|
|
|
|
#define SHMEMS_SIZE 4096
|
|
|
|
static struct shmem_info* shmem_find(unsigned long shmid)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < nr_shmems; i++)
|
|
if (shmems[i].shmid == shmid)
|
|
return &shmems[i];
|
|
|
|
return NULL;
|
|
}
|
|
|
|
static int add_shmem_area(pid_t pid, struct vma_entry *vma)
|
|
{
|
|
struct shmem_info *si;
|
|
unsigned long size = vma->pgoff + (vma->end - vma->start);
|
|
|
|
si = shmem_find(vma->shmid);
|
|
if (si) {
|
|
if (si->size < size)
|
|
si->size = size;
|
|
return 0;
|
|
}
|
|
|
|
nr_shmems++;
|
|
if (nr_shmems * sizeof(*si) == SHMEMS_SIZE) {
|
|
pr_err("OOM storing shmems\n");
|
|
return -1;
|
|
}
|
|
|
|
si = &shmems[nr_shmems - 1];
|
|
si->size = size;
|
|
si->pid = pid;
|
|
si->start = vma->start;
|
|
si->end = vma->end;
|
|
si->shmid = vma->shmid;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int dump_filemap(pid_t pid, struct vma_entry *vma, int file_fd,
|
|
const struct cr_fdset *fdset)
|
|
{
|
|
struct fd_parms p = {
|
|
.fd_name = vma->start,
|
|
.id = FD_ID_INVALID,
|
|
.pid = pid,
|
|
.type = FDINFO_MAP,
|
|
};
|
|
|
|
if ((vma->prot & PROT_WRITE) && vma_entry_is(vma, VMA_FILE_SHARED))
|
|
p.flags = O_RDWR;
|
|
else
|
|
p.flags = O_RDONLY;
|
|
|
|
return dump_one_reg_file(&p, file_fd, fdset, 0);
|
|
}
|
|
|
|
static int dump_task_mappings(pid_t pid, const struct list_head *vma_area_list,
|
|
const struct cr_fdset *cr_fdset)
|
|
{
|
|
struct vma_area *vma_area;
|
|
int ret = -1, fd = cr_fdset->fds[CR_FD_VMAS];
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping mappings (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
list_for_each_entry(vma_area, vma_area_list, list) {
|
|
struct vma_entry *vma = &vma_area->vma;
|
|
|
|
ret = write_img(fd, vma);
|
|
if (ret < 0)
|
|
goto err;
|
|
|
|
if (!vma_entry_is(vma, VMA_AREA_REGULAR))
|
|
continue;
|
|
if (vma_entry_is(vma, VMA_AREA_SYSVIPC))
|
|
continue;
|
|
|
|
pr_info_vma(vma_area);
|
|
|
|
if (vma_entry_is(vma, VMA_ANON_SHARED))
|
|
ret = add_shmem_area(pid, vma);
|
|
else if (vma_entry_is(vma, VMA_FILE_PRIVATE) ||
|
|
vma_entry_is(vma, VMA_FILE_SHARED))
|
|
ret = dump_filemap(pid, vma, vma_area->vm_file_fd, cr_fdset);
|
|
else
|
|
ret = 0;
|
|
|
|
if (ret)
|
|
goto err;
|
|
}
|
|
|
|
ret = 0;
|
|
pr_info("----------------------------------------\n");
|
|
err:
|
|
return ret;
|
|
}
|
|
|
|
static int dump_task_creds(pid_t pid, const struct parasite_dump_misc *misc,
|
|
const struct cr_fdset *fds)
|
|
{
|
|
int ret, i;
|
|
struct proc_status_creds cr;
|
|
struct creds_entry ce;
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping creds for %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
ret = parse_pid_status(pid, &cr);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
ce.uid = cr.uids[0];
|
|
ce.gid = cr.gids[0];
|
|
ce.euid = cr.uids[1];
|
|
ce.egid = cr.gids[1];
|
|
ce.suid = cr.uids[2];
|
|
ce.sgid = cr.gids[2];
|
|
ce.fsuid = cr.uids[3];
|
|
ce.fsgid = cr.gids[3];
|
|
|
|
BUILD_BUG_ON(CR_CAP_SIZE != PROC_CAP_SIZE);
|
|
|
|
for (i = 0; i < CR_CAP_SIZE; i++) {
|
|
ce.cap_inh[i] = cr.cap_inh[i];
|
|
ce.cap_prm[i] = cr.cap_prm[i];
|
|
ce.cap_eff[i] = cr.cap_eff[i];
|
|
ce.cap_bnd[i] = cr.cap_bnd[i];
|
|
}
|
|
|
|
ce.secbits = misc->secbits;
|
|
|
|
ret = write_img(fds->fds[CR_FD_CREDS], &ce);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
return 0;
|
|
}
|
|
|
|
#define assign_reg(dst, src, e) dst.e = (__typeof__(dst.e))src.e
|
|
#define assign_array(dst, src, e) memcpy(&dst.e, &src.e, sizeof(dst.e))
|
|
|
|
static int get_task_auxv(pid_t pid, struct core_entry *core)
|
|
{
|
|
int fd = open_proc(pid, "auxv");
|
|
int ret, i;
|
|
|
|
if (fd < 0)
|
|
return -1;
|
|
|
|
for (i = 0; i < AT_VECTOR_SIZE; i++) {
|
|
ret = read(fd, &core->tc.mm_saved_auxv[i],
|
|
sizeof(core->tc.mm_saved_auxv[0]));
|
|
if (ret == 0)
|
|
break;
|
|
else if (ret != sizeof(core->tc.mm_saved_auxv[0])) {
|
|
ret = -1;
|
|
pr_perror("Error readind %d's auxv[%d]",
|
|
pid, i);
|
|
goto err;
|
|
}
|
|
}
|
|
|
|
ret = 0;
|
|
|
|
err:
|
|
close_safe(&fd);
|
|
return ret;
|
|
}
|
|
|
|
static int get_task_personality(pid_t pid, u32 *personality)
|
|
{
|
|
FILE *file = NULL;
|
|
int ret = -1;
|
|
|
|
file = fopen_proc(pid, "personality");
|
|
if (!file)
|
|
goto err;
|
|
|
|
if (!fgets(loc_buf, sizeof(loc_buf), file)) {
|
|
perror("Can't read task personality");
|
|
goto err;
|
|
}
|
|
|
|
*personality = atoi(loc_buf);
|
|
ret = 0;
|
|
|
|
err:
|
|
if (file)
|
|
fclose(file);
|
|
return ret;
|
|
}
|
|
|
|
static int get_task_regs(pid_t pid, struct core_entry *core, const struct parasite_ctl *ctl)
|
|
{
|
|
user_fpregs_struct_t fpregs = {-1};
|
|
user_regs_struct_t regs = {-1};
|
|
int ret = -1;
|
|
|
|
if (ctl)
|
|
regs = ctl->regs_orig;
|
|
else {
|
|
if (ptrace(PTRACE_GETREGS, pid, NULL, ®s)) {
|
|
pr_err("Can't obtain GP registers for %d\n", pid);
|
|
goto err;
|
|
}
|
|
}
|
|
|
|
if (ptrace(PTRACE_GETFPREGS, pid, NULL, &fpregs)) {
|
|
pr_err("Can't obtain FPU registers for %d\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
/* Did we come from a system call? */
|
|
if ((int)regs.orig_ax >= 0) {
|
|
/* Restart the system call */
|
|
switch ((long)(int)regs.ax) {
|
|
case -ERESTARTNOHAND:
|
|
case -ERESTARTSYS:
|
|
case -ERESTARTNOINTR:
|
|
regs.ax = regs.orig_ax;
|
|
regs.ip -= 2;
|
|
break;
|
|
case -ERESTART_RESTARTBLOCK:
|
|
regs.ax = __NR_restart_syscall;
|
|
regs.ip -= 2;
|
|
break;
|
|
}
|
|
}
|
|
|
|
assign_reg(core->arch.gpregs, regs, r15);
|
|
assign_reg(core->arch.gpregs, regs, r14);
|
|
assign_reg(core->arch.gpregs, regs, r13);
|
|
assign_reg(core->arch.gpregs, regs, r12);
|
|
assign_reg(core->arch.gpregs, regs, bp);
|
|
assign_reg(core->arch.gpregs, regs, bx);
|
|
assign_reg(core->arch.gpregs, regs, r11);
|
|
assign_reg(core->arch.gpregs, regs, r10);
|
|
assign_reg(core->arch.gpregs, regs, r9);
|
|
assign_reg(core->arch.gpregs, regs, r8);
|
|
assign_reg(core->arch.gpregs, regs, ax);
|
|
assign_reg(core->arch.gpregs, regs, cx);
|
|
assign_reg(core->arch.gpregs, regs, dx);
|
|
assign_reg(core->arch.gpregs, regs, si);
|
|
assign_reg(core->arch.gpregs, regs, di);
|
|
assign_reg(core->arch.gpregs, regs, orig_ax);
|
|
assign_reg(core->arch.gpregs, regs, ip);
|
|
assign_reg(core->arch.gpregs, regs, cs);
|
|
assign_reg(core->arch.gpregs, regs, flags);
|
|
assign_reg(core->arch.gpregs, regs, sp);
|
|
assign_reg(core->arch.gpregs, regs, ss);
|
|
assign_reg(core->arch.gpregs, regs, fs_base);
|
|
assign_reg(core->arch.gpregs, regs, gs_base);
|
|
assign_reg(core->arch.gpregs, regs, ds);
|
|
assign_reg(core->arch.gpregs, regs, es);
|
|
assign_reg(core->arch.gpregs, regs, fs);
|
|
assign_reg(core->arch.gpregs, regs, gs);
|
|
|
|
assign_reg(core->arch.fpregs, fpregs, cwd);
|
|
assign_reg(core->arch.fpregs, fpregs, swd);
|
|
assign_reg(core->arch.fpregs, fpregs, twd);
|
|
assign_reg(core->arch.fpregs, fpregs, fop);
|
|
assign_reg(core->arch.fpregs, fpregs, rip);
|
|
assign_reg(core->arch.fpregs, fpregs, rdp);
|
|
assign_reg(core->arch.fpregs, fpregs, mxcsr);
|
|
assign_reg(core->arch.fpregs, fpregs, mxcsr_mask);
|
|
|
|
assign_array(core->arch.fpregs, fpregs, st_space);
|
|
assign_array(core->arch.fpregs, fpregs, xmm_space);
|
|
assign_array(core->arch.fpregs, fpregs, padding);
|
|
|
|
ret = 0;
|
|
|
|
err:
|
|
return ret;
|
|
}
|
|
|
|
static int dump_task_core(struct core_entry *core, const struct cr_fdset *fdset)
|
|
{
|
|
int fd_core = fdset->fds[CR_FD_CORE];
|
|
int ret;
|
|
|
|
lseek(fd_core, MAGIC_OFFSET, SEEK_SET);
|
|
|
|
pr_info("Dumping header ... ");
|
|
|
|
core->header.version = HEADER_VERSION;
|
|
core->header.arch = HEADER_ARCH_X86_64;
|
|
core->header.flags = 0;
|
|
|
|
ret = write_img(fd_core, core);
|
|
|
|
free(core);
|
|
return ret;
|
|
}
|
|
|
|
static int dump_task_core_all(pid_t pid, const struct proc_pid_stat *stat,
|
|
const struct parasite_dump_misc *misc, const struct parasite_ctl *ctl,
|
|
const struct cr_fdset *cr_fdset)
|
|
{
|
|
struct core_entry *core = xzalloc(sizeof(*core));
|
|
int ret = -1;
|
|
unsigned long brk;
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping core (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
if (!core)
|
|
goto err;
|
|
|
|
pr_info("Dumping GP/FPU registers ... ");
|
|
ret = get_task_regs(pid, core, ctl);
|
|
if (ret)
|
|
goto err_free;
|
|
pr_info("OK\n");
|
|
|
|
pr_info("Obtainting personality ... ");
|
|
ret = get_task_personality(pid, &core->tc.personality);
|
|
if (ret)
|
|
goto err_free;
|
|
pr_info("OK\n");
|
|
|
|
strncpy((char *)core->tc.comm, stat->comm, TASK_COMM_LEN);
|
|
core->tc.flags = stat->flags;
|
|
core->tc.mm_start_code = stat->start_code;
|
|
core->tc.mm_end_code = stat->end_code;
|
|
core->tc.mm_start_data = stat->start_data;
|
|
core->tc.mm_end_data = stat->end_data;
|
|
core->tc.mm_start_stack = stat->start_stack;
|
|
core->tc.mm_start_brk = stat->start_brk;
|
|
|
|
core->tc.mm_arg_start = stat->arg_start;
|
|
core->tc.mm_arg_end = stat->arg_end;
|
|
core->tc.mm_env_start = stat->env_start;
|
|
core->tc.mm_env_end = stat->env_end;
|
|
|
|
core->tc.mm_brk = misc->brk;
|
|
|
|
BUILD_BUG_ON(sizeof(core->tc.blk_sigset) != sizeof(k_rtsigset_t));
|
|
memcpy(&core->tc.blk_sigset, &misc->blocked, sizeof(k_rtsigset_t));
|
|
|
|
pr_info("Obtainting task auvx ... ");
|
|
ret = get_task_auxv(pid, core);
|
|
if (ret)
|
|
goto err_free;
|
|
pr_info("OK\n");
|
|
|
|
core->tc.task_state = TASK_ALIVE;
|
|
core->tc.exit_code = 0;
|
|
|
|
return dump_task_core(core, cr_fdset);
|
|
|
|
err_free:
|
|
free(core);
|
|
err:
|
|
pr_info("----------------------------------------\n");
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int parse_threads(const struct pstree_item *item, u32 **_t, int *_n)
|
|
{
|
|
struct dirent *de;
|
|
DIR *dir;
|
|
u32 *t = NULL;
|
|
int nr = 1;
|
|
|
|
dir = opendir_proc(item->pid, "task");
|
|
if (!dir)
|
|
return -1;
|
|
|
|
while ((de = readdir(dir))) {
|
|
u32 *tmp;
|
|
|
|
/* We expect numbers only here */
|
|
if (de->d_name[0] == '.')
|
|
continue;
|
|
|
|
tmp = xrealloc(t, nr * sizeof(u32));
|
|
if (!tmp) {
|
|
xfree(t);
|
|
return -1;
|
|
}
|
|
t = tmp;
|
|
t[nr - 1] = atoi(de->d_name);
|
|
nr++;
|
|
}
|
|
|
|
closedir(dir);
|
|
|
|
*_t = t;
|
|
*_n = nr - 1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int get_threads(struct pstree_item *item)
|
|
{
|
|
return parse_threads(item, &item->threads, &item->nr_threads);
|
|
}
|
|
|
|
static int check_threads(const struct pstree_item *item)
|
|
{
|
|
u32 *t;
|
|
int nr, ret;
|
|
|
|
ret = parse_threads(item, &t, &nr);
|
|
if (ret)
|
|
return ret;
|
|
|
|
ret = ((nr == item->nr_threads) && !memcmp(t, item->threads, nr));
|
|
xfree(t);
|
|
|
|
if (!ret) {
|
|
pr_info("Threads set has changed while suspending\n");
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int parse_children(const struct pstree_item *item, u32 **_c, int *_n)
|
|
{
|
|
FILE *file;
|
|
char *tok;
|
|
u32 *ch = NULL;
|
|
int nr = 1, i;
|
|
|
|
for (i = 0; i < item->nr_threads; i++) {
|
|
|
|
file = fopen_proc(item->pid, "task/%d/children", item->threads[i]);
|
|
if (!file)
|
|
goto err;
|
|
|
|
if (!(fgets(loc_buf, sizeof(loc_buf), file)))
|
|
loc_buf[0] = 0;
|
|
|
|
fclose(file);
|
|
|
|
tok = strtok(loc_buf, " \n");
|
|
while (tok) {
|
|
u32 *tmp = xrealloc(ch, nr * sizeof(u32));
|
|
if (!tmp)
|
|
goto err;
|
|
ch = tmp;
|
|
ch[nr - 1] = atoi(tok);
|
|
nr++;
|
|
tok = strtok(NULL, " \n");
|
|
}
|
|
|
|
}
|
|
|
|
*_c = ch;
|
|
*_n = nr - 1;
|
|
|
|
return 0;
|
|
|
|
err:
|
|
xfree(ch);
|
|
return -1;
|
|
}
|
|
|
|
static int get_children(struct pstree_item *item)
|
|
{
|
|
return parse_children(item, &item->children, &item->nr_children);
|
|
}
|
|
|
|
static void unseize_task_and_threads(const struct pstree_item *item, int st)
|
|
{
|
|
int i;
|
|
|
|
for (i = 0; i < item->nr_threads; i++)
|
|
unseize_task(item->threads[i], st); /* item->pid will be here */
|
|
}
|
|
|
|
static void pstree_switch_state(const struct list_head *list,
|
|
const struct cr_options *opts)
|
|
{
|
|
struct pstree_item *item;
|
|
|
|
list_for_each_entry(item, list, list) {
|
|
unseize_task_and_threads(item, opts->final_state);
|
|
if (opts->leader_only)
|
|
break;
|
|
}
|
|
}
|
|
|
|
static int seize_threads(const struct pstree_item *item)
|
|
{
|
|
int i = 0, ret;
|
|
|
|
if ((item->state == TASK_DEAD) && (item->nr_threads > 1)) {
|
|
pr_err("Zombies with threads are not supported\n");
|
|
goto err;
|
|
}
|
|
|
|
for (i = 0; i < item->nr_threads; i++) {
|
|
if (item->pid == item->threads[i])
|
|
continue;
|
|
|
|
pr_info("\tSeizing %d's %d thread\n", item->pid, item->threads[i]);
|
|
ret = seize_task(item->threads[i], item->ppid);
|
|
if (ret < 0)
|
|
goto err;
|
|
|
|
if (ret == TASK_DEAD) {
|
|
pr_err("Zombie thread not supported\n");
|
|
goto err;
|
|
}
|
|
|
|
if (ret == TASK_STOPPED) {
|
|
pr_err("Stopped threads not supported\n");
|
|
goto err;
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
|
|
err:
|
|
for (i--; i >= 0; i--) {
|
|
if (item->pid == item->threads[i])
|
|
continue;
|
|
|
|
unseize_task(item->threads[i], TASK_ALIVE);
|
|
}
|
|
|
|
return -1;
|
|
}
|
|
|
|
static int collect_threads(struct pstree_item *item)
|
|
{
|
|
int ret;
|
|
|
|
ret = get_threads(item);
|
|
if (!ret)
|
|
ret = seize_threads(item);
|
|
if (!ret)
|
|
ret = check_threads(item);
|
|
|
|
return ret;
|
|
}
|
|
|
|
static struct pstree_item *collect_task(pid_t pid, pid_t ppid, struct list_head *list)
|
|
{
|
|
int ret;
|
|
struct pstree_item *item;
|
|
|
|
item = xzalloc(sizeof(*item));
|
|
if (!item)
|
|
goto err;
|
|
|
|
ret = seize_task(pid, ppid);
|
|
if (ret < 0)
|
|
goto err_free;
|
|
|
|
pr_info("Seized task %d, state %d\n", pid, ret);
|
|
item->pid = pid;
|
|
item->ppid = ppid;
|
|
item->state = ret;
|
|
|
|
ret = collect_threads(item);
|
|
if (ret < 0)
|
|
goto err_close;
|
|
|
|
ret = get_children(item);
|
|
if (ret < 0)
|
|
goto err_close;
|
|
|
|
if ((item->state == TASK_DEAD) && (item->nr_children > 0)) {
|
|
pr_err("Zombie with children?! O_o Run, run, run!\n");
|
|
goto err_close;
|
|
}
|
|
|
|
close_pid_proc();
|
|
list_add_tail(&item->list, list);
|
|
pr_info("Collected %d in %d state\n", item->pid, item->state);
|
|
return item;
|
|
|
|
err_close:
|
|
close_pid_proc();
|
|
unseize_task(pid, item->state);
|
|
err_free:
|
|
xfree(item->children);
|
|
xfree(item->threads);
|
|
xfree(item);
|
|
err:
|
|
return NULL;
|
|
}
|
|
|
|
static int check_subtree(const struct pstree_item *item)
|
|
{
|
|
u32 *ch;
|
|
int nr, ret;
|
|
|
|
ret = parse_children(item, &ch, &nr);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
ret = ((nr == item->nr_children) && !memcmp(ch, item->children, nr));
|
|
xfree(ch);
|
|
|
|
if (!ret) {
|
|
pr_info("Children set has changed while suspending\n");
|
|
return -1;
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int collect_subtree(pid_t pid, pid_t ppid, struct list_head *pstree_list,
|
|
int leader_only)
|
|
{
|
|
struct pstree_item *item;
|
|
int i;
|
|
|
|
pr_info("Collecting tasks starting from %d\n", pid);
|
|
item = collect_task(pid, ppid, pstree_list);
|
|
if (item == NULL)
|
|
return -1;
|
|
|
|
if (leader_only)
|
|
return 0;
|
|
|
|
for (i = 0; i < item->nr_children; i++)
|
|
if (collect_subtree(item->children[i], item->pid, pstree_list, 0) < 0)
|
|
return -1;
|
|
|
|
if (check_subtree(item))
|
|
return -1;
|
|
|
|
return 0;
|
|
}
|
|
|
|
static int dump_pstree(pid_t pid, const struct list_head *pstree_list);
|
|
|
|
static int collect_dump_pstree(pid_t pid, struct list_head *pstree_list,
|
|
const struct cr_options *opts)
|
|
{
|
|
int ret, attempts = 5;
|
|
|
|
while (1) {
|
|
struct pstree_item *item;
|
|
|
|
ret = collect_subtree(pid, -1, pstree_list, opts->leader_only);
|
|
if (ret == 0) {
|
|
/*
|
|
* Some tasks could have been reparented to
|
|
* namespaces' reaper. Check this.
|
|
*/
|
|
if (opts->namespaces_flags & CLONE_NEWPID) {
|
|
item = list_first_entry(pstree_list,
|
|
struct pstree_item, list);
|
|
BUG_ON(item->pid != 1);
|
|
|
|
if (check_subtree(item))
|
|
goto try_again;
|
|
}
|
|
|
|
break;
|
|
}
|
|
|
|
if (list_empty(pstree_list))
|
|
/*
|
|
* No items at all -- no need in re-scanning it again
|
|
*/
|
|
break;
|
|
|
|
/*
|
|
* Old tasks can die and new ones can appear while we
|
|
* try to seize the swarm. It's much simpler (and reliable)
|
|
* just to restart the collection from the beginning
|
|
* rather than trying to chase them.
|
|
*/
|
|
try_again:
|
|
if (attempts == 0)
|
|
break;
|
|
|
|
attempts--;
|
|
pr_info("Trying to suspend tasks again\n");
|
|
|
|
while (!list_empty(pstree_list)) {
|
|
item = list_first_entry(pstree_list,
|
|
struct pstree_item, list);
|
|
list_del(&item->list);
|
|
|
|
unseize_task_and_threads(item, TASK_ALIVE);
|
|
|
|
xfree(item->children);
|
|
xfree(item->threads);
|
|
xfree(item);
|
|
}
|
|
}
|
|
|
|
if (ret)
|
|
return ret;
|
|
|
|
return dump_pstree(pid, pstree_list);
|
|
}
|
|
|
|
static int dump_pstree(pid_t pid, const struct list_head *pstree_list)
|
|
{
|
|
const struct pstree_item *item;
|
|
struct pstree_entry e;
|
|
unsigned long i;
|
|
int ret = -1;
|
|
int pstree_fd;
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping pstree (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
pstree_fd = open_image(CR_FD_PSTREE, O_RDWR | O_CREAT | O_EXCL, pid);
|
|
if (pstree_fd < 0)
|
|
return -1;
|
|
|
|
list_for_each_entry(item, pstree_list, list) {
|
|
|
|
pr_info("Process: %d (%d children)\n",
|
|
item->pid, item->nr_children);
|
|
|
|
e.pid = item->pid;
|
|
e.nr_children = item->nr_children;
|
|
e.nr_threads = item->nr_threads;
|
|
|
|
if (write_img(pstree_fd, &e))
|
|
goto err;
|
|
|
|
if (write_img_buf(pstree_fd, item->children,
|
|
item->nr_children * sizeof(u32)))
|
|
goto err;
|
|
|
|
if (write_img_buf(pstree_fd, item->threads,
|
|
item->nr_threads * sizeof(u32)))
|
|
goto err;
|
|
}
|
|
ret = 0;
|
|
|
|
err:
|
|
pr_info("----------------------------------------\n");
|
|
close(pstree_fd);
|
|
return ret;
|
|
}
|
|
|
|
static int dump_task_thread(struct parasite_ctl *parasite_ctl,
|
|
pid_t pid, const struct cr_fdset *cr_fdset)
|
|
{
|
|
struct core_entry *core = xzalloc(sizeof(*core));
|
|
int ret = -1;
|
|
unsigned int *taddr;
|
|
|
|
pr_info("\n");
|
|
pr_info("Dumping core for thread (pid: %d)\n", pid);
|
|
pr_info("----------------------------------------\n");
|
|
|
|
if (!core)
|
|
goto err;
|
|
|
|
pr_info("Dumping GP/FPU registers ... ");
|
|
ret = get_task_regs(pid, core, NULL);
|
|
if (ret)
|
|
goto err_free;
|
|
|
|
ret = parasite_dump_tid_addr_seized(parasite_ctl, pid, &taddr);
|
|
if (ret) {
|
|
pr_err("Can't dump tid address for pid %d", pid);
|
|
goto err;
|
|
}
|
|
|
|
pr_info("%d: tid_address=%p\n", pid, taddr);
|
|
core->clear_tid_address = (u64) taddr;
|
|
|
|
pr_info("OK\n");
|
|
|
|
core->tc.task_state = TASK_ALIVE;
|
|
core->tc.exit_code = 0;
|
|
|
|
return dump_task_core(core, cr_fdset);
|
|
|
|
err_free:
|
|
free(core);
|
|
err:
|
|
pr_info("----------------------------------------\n");
|
|
|
|
return ret;
|
|
}
|
|
|
|
static int dump_one_zombie(const struct pstree_item *item,
|
|
const struct proc_pid_stat *pps,
|
|
struct cr_fdset *cr_fdset)
|
|
{
|
|
struct core_entry *core;
|
|
int ret;
|
|
|
|
cr_fdset = cr_dump_fdset_open(item->pid, CR_FD_DESC_CORE, cr_fdset);
|
|
if (cr_fdset == NULL)
|
|
return -1;
|
|
|
|
core = xzalloc(sizeof(*core));
|
|
if (core == NULL)
|
|
return -1;
|
|
|
|
core->tc.task_state = TASK_DEAD;
|
|
core->tc.exit_code = pps->exit_code;
|
|
|
|
return dump_task_core(core, cr_fdset);
|
|
}
|
|
|
|
static struct proc_pid_stat pps_buf;
|
|
|
|
static int dump_task_threads(struct parasite_ctl *parasite_ctl,
|
|
const struct pstree_item *item)
|
|
{
|
|
int i;
|
|
struct cr_fdset *cr_fdset_thread = NULL;
|
|
|
|
if (item->nr_threads == 1)
|
|
return 0;
|
|
|
|
for (i = 0; i < item->nr_threads; i++) {
|
|
/* Leader is already dumped */
|
|
if (item->pid == item->threads[i])
|
|
continue;
|
|
|
|
cr_fdset_thread = cr_dump_fdset_open(item->threads[i], CR_FD_DESC_CORE, NULL);
|
|
if (!cr_fdset_thread)
|
|
goto err;
|
|
|
|
if (dump_task_thread(parasite_ctl,
|
|
item->threads[i], cr_fdset_thread))
|
|
goto err;
|
|
|
|
close_cr_fdset(&cr_fdset_thread);
|
|
}
|
|
|
|
return 0;
|
|
|
|
err:
|
|
close_cr_fdset(&cr_fdset_thread);
|
|
return -1;
|
|
}
|
|
|
|
static int dump_one_task(const struct pstree_item *item, struct cr_fdset *cr_fdset)
|
|
{
|
|
pid_t pid = item->pid;
|
|
LIST_HEAD(vma_area_list);
|
|
struct parasite_ctl *parasite_ctl;
|
|
int ret = -1;
|
|
struct parasite_dump_misc misc;
|
|
struct sk_queue sk_queue = { };
|
|
|
|
pr_info("========================================\n");
|
|
pr_info("Dumping task (pid: %d)\n", pid);
|
|
pr_info("========================================\n");
|
|
|
|
if (item->state == TASK_STOPPED) {
|
|
pr_err("Stopped tasks are not supported\n");
|
|
goto err_free;
|
|
}
|
|
|
|
pr_info("Obtainting task stat ... ");
|
|
ret = parse_pid_stat(pid, &pps_buf);
|
|
if (ret < 0)
|
|
goto err;
|
|
|
|
if (item->state == TASK_DEAD)
|
|
return dump_one_zombie(item, &pps_buf, cr_fdset);
|
|
|
|
ret = -1;
|
|
if (!cr_dump_fdset_open(item->pid, CR_FD_DESC_TASK, cr_fdset))
|
|
goto err;
|
|
|
|
ret = collect_mappings(pid, &vma_area_list);
|
|
if (ret) {
|
|
pr_err("Collect mappings (pid: %d) failed with %d\n", pid, ret);
|
|
goto err;
|
|
}
|
|
|
|
ret = dump_task_files(pid, cr_fdset, &sk_queue);
|
|
if (ret) {
|
|
pr_err("Dump files (pid: %d) failed with %d\n", pid, ret);
|
|
goto err;
|
|
}
|
|
|
|
parasite_ctl = parasite_infect_seized(pid, &vma_area_list);
|
|
if (!parasite_ctl) {
|
|
pr_err("Can't infect (pid: %d) with parasite\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_dump_pages_seized(parasite_ctl, &vma_area_list, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Can't dump pages (pid: %d) with parasite\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_dump_sigacts_seized(parasite_ctl, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Can't dump sigactions (pid: %d) with parasite\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_dump_itimers_seized(parasite_ctl, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Can't dump itimers (pid: %d)\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_dump_misc_seized(parasite_ctl, &misc);
|
|
if (ret) {
|
|
pr_err("Can't dump misc (pid: %d)\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = dump_task_core_all(pid, &pps_buf, &misc, parasite_ctl, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Dump core (pid: %d) failed with %d\n", pid, ret);
|
|
goto err;
|
|
}
|
|
|
|
ret = dump_task_threads(parasite_ctl, item);
|
|
if (ret) {
|
|
pr_err("Can't dump threads\n");
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_dump_socket_info(parasite_ctl, cr_fdset, &sk_queue);
|
|
if (ret) {
|
|
pr_err("Can't dump socket info (pid: %d)\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = parasite_cure_seized(parasite_ctl);
|
|
if (ret) {
|
|
pr_err("Can't cure (pid: %d) from parasite\n", pid);
|
|
goto err;
|
|
}
|
|
|
|
ret = dump_task_mappings(pid, &vma_area_list, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Dump mappings (pid: %d) failed with %d\n", pid, ret);
|
|
goto err;
|
|
}
|
|
|
|
ret = dump_task_creds(pid, &misc, cr_fdset);
|
|
if (ret) {
|
|
pr_err("Dump creds (pid: %d) failed with %d\n", pid, ret);
|
|
goto err;
|
|
}
|
|
err:
|
|
close_pid_proc();
|
|
err_free:
|
|
free_mappings(&vma_area_list);
|
|
return ret;
|
|
}
|
|
|
|
static int cr_dump_shmem(void)
|
|
{
|
|
int err, fd;
|
|
struct cr_fdset *cr_fdset = NULL;
|
|
unsigned char *map = NULL;
|
|
void *addr = NULL;
|
|
struct shmem_info *si;
|
|
unsigned long pfn, nrpages;
|
|
|
|
for (si = shmems; si < &shmems[nr_shmems]; si++) {
|
|
pr_info("Dumping shared memory %lx\n", si->shmid);
|
|
|
|
nrpages = (si->size + PAGE_SIZE -1) / PAGE_SIZE;
|
|
map = xmalloc(nrpages * sizeof(*map));
|
|
if (!map)
|
|
goto err;
|
|
|
|
fd = open_proc(si->pid, "map_files/%lx-%lx", si->start, si->end);
|
|
if (fd < 0)
|
|
goto err;
|
|
|
|
addr = mmap(NULL, si->size, PROT_READ, MAP_SHARED, fd, 0);
|
|
close(fd);
|
|
if (addr == MAP_FAILED) {
|
|
pr_err("Can't map shmem %lx (%lx-%lx)\n",
|
|
si->shmid, si->start, si->end);
|
|
goto err;
|
|
}
|
|
|
|
err = mincore(addr, si->size, map);
|
|
if (err)
|
|
goto err_unmap;
|
|
|
|
fd = open_image(CR_FD_SHMEM_PAGES, O_WRONLY | O_CREAT, si->shmid);
|
|
if (fd < 0)
|
|
goto err_unmap;
|
|
|
|
for (pfn = 0; pfn < nrpages; pfn++) {
|
|
u64 offset = pfn * PAGE_SIZE;
|
|
|
|
if (!(map[pfn] & PAGE_RSS))
|
|
continue;
|
|
|
|
if (write_img_buf(fd, &offset, sizeof(offset)))
|
|
break;
|
|
if (write_img_buf(fd, addr + offset, PAGE_SIZE))
|
|
break;
|
|
}
|
|
|
|
if (pfn != nrpages)
|
|
goto err_close;
|
|
|
|
err = write_img(fd, &zero_page_entry);
|
|
if (err < 0)
|
|
goto err_close;
|
|
|
|
close(fd);
|
|
munmap(addr, si->size);
|
|
xfree(map);
|
|
}
|
|
|
|
return 0;
|
|
|
|
err_close:
|
|
close(fd);
|
|
err_unmap:
|
|
munmap(addr, si->size);
|
|
err:
|
|
xfree(map);
|
|
return -1;
|
|
}
|
|
|
|
int cr_dump_tasks(pid_t pid, const struct cr_options *opts)
|
|
{
|
|
LIST_HEAD(pstree_list);
|
|
struct pstree_item *item;
|
|
int i, ret = -1;
|
|
|
|
pr_info("========================================\n");
|
|
if (!opts->leader_only)
|
|
pr_info("Dumping process group (pid: %d)\n", pid);
|
|
else
|
|
pr_info("Dumping process (pid: %d)\n", pid);
|
|
pr_info("========================================\n");
|
|
|
|
if (collect_dump_pstree(pid, &pstree_list, opts))
|
|
goto err;
|
|
|
|
if (opts->namespaces_flags) {
|
|
if (dump_namespaces(pid, opts->namespaces_flags) < 0)
|
|
goto err;
|
|
}
|
|
|
|
/*
|
|
* Ignore collection errors by now since we may not want
|
|
* to dump the missed sockets. But later, when we will start
|
|
* dumping containers, we'll better fail here, rather than
|
|
* in the dump stage
|
|
*/
|
|
|
|
collect_sockets();
|
|
|
|
nr_shmems = 0;
|
|
shmems = xmalloc(SHMEMS_SIZE);
|
|
if (!shmems)
|
|
goto err;
|
|
|
|
list_for_each_entry(item, &pstree_list, list) {
|
|
struct cr_fdset *cr_fdset = NULL;
|
|
|
|
cr_fdset = cr_dump_fdset_open(item->pid, CR_FD_DESC_NONE, NULL);
|
|
if (!cr_fdset)
|
|
goto err;
|
|
|
|
/*
|
|
* Prepare for socket queues in advance. They are not per-task,
|
|
* but per-someother-task which makes restore tricky. Thus save
|
|
* them in "global" image.
|
|
* That's why we open the file with tree leader's pid for any
|
|
* of it's children.
|
|
*/
|
|
if (!cr_dump_fdset_open(pid, CR_FD_DESC_USE(CR_FD_SK_QUEUES), cr_fdset))
|
|
goto err;
|
|
|
|
if (dump_one_task(item, cr_fdset))
|
|
goto err;
|
|
|
|
close_cr_fdset(&cr_fdset);
|
|
|
|
if (opts->leader_only)
|
|
break;
|
|
}
|
|
|
|
ret = cr_dump_shmem();
|
|
xfree(shmems);
|
|
|
|
fd_id_show_tree();
|
|
err:
|
|
pstree_switch_state(&pstree_list, opts);
|
|
free_pstree(&pstree_list);
|
|
|
|
return ret;
|
|
}
|