#include #include #include #include "image.h" #include "cr_options.h" #include "servicefd.h" #include "page-read.h" #include "protobuf.h" #include "protobuf/pagemap.pb-c.h" #ifndef SEEK_DATA #define SEEK_DATA 3 #define SEEK_HOLE 4 #endif static int get_page_vaddr(struct page_read *pr, struct iovec *iov) { int ret; u64 img_va; ret = read_img_eof(pr->fd_pg, &img_va); if (ret <= 0) return ret; iov->iov_base = (void *)decode_pointer(img_va); iov->iov_len = PAGE_SIZE; return 1; } static int read_page(struct page_read *pr, unsigned long vaddr, void *buf) { int ret; ret = read(pr->fd_pg, buf, PAGE_SIZE); if (ret != PAGE_SIZE) { pr_err("Can't read mapping page %d\n", ret); return -1; } return 1; } void pagemap2iovec(PagemapEntry *pe, struct iovec *iov) { iov->iov_base = decode_pointer(pe->vaddr); iov->iov_len = pe->nr_pages * PAGE_SIZE; } static int get_pagemap(struct page_read *pr, struct iovec *iov) { int ret; PagemapEntry *pe; ret = pb_read_one_eof(pr->fd, &pe, PB_PAGEMAP); if (ret <= 0) return ret; pagemap2iovec(pe, iov); pr->pe = pe; pr->cvaddr = (unsigned long)iov->iov_base; if (pe->in_parent && !pr->parent) { pr_err("No parent for snapshot pagemap\n"); return -1; } return 1; } static void put_pagemap(struct page_read *pr) { pagemap_entry__free_unpacked(pr->pe, NULL); } static int read_pagemap_page(struct page_read *pr, unsigned long vaddr, void *buf); static void skip_pagemap_pages(struct page_read *pr, unsigned long len) { if (!len) return; pr_debug("\tpr%u Skip %lx bytes from page-dump\n", pr->id, len); if (!pr->pe->in_parent) lseek(pr->fd_pg, len, SEEK_CUR); pr->cvaddr += len; } int seek_pagemap_page(struct page_read *pr, unsigned long vaddr, bool warn) { int ret; struct iovec iov; if (pr->pe) pagemap2iovec(pr->pe, &iov); else goto new_pagemap; while (1) { unsigned long iov_end; if (vaddr < pr->cvaddr) { if (warn) pr_err("Missing %lu in parent pagemap, current iov: base=%lx,len=%zu\n", vaddr, (unsigned long)iov.iov_base, iov.iov_len); return 0; } iov_end = (unsigned long)iov.iov_base + iov.iov_len; if (iov_end <= vaddr) { skip_pagemap_pages(pr, iov_end - pr->cvaddr); put_pagemap(pr); new_pagemap: ret = get_pagemap(pr, &iov); if (ret <= 0) return ret; continue; } skip_pagemap_pages(pr, vaddr - pr->cvaddr); return 1; } } static int read_pagemap_page(struct page_read *pr, unsigned long vaddr, void *buf) { int ret; if (pr->pe->in_parent) { pr_debug("\tpr%u Read page %lx from parent\n", pr->id, vaddr); ret = seek_pagemap_page(pr->parent, vaddr, true); if (ret <= 0) return -1; ret = read_pagemap_page(pr->parent, vaddr, buf); if (ret == -1) return ret; } else { off_t current_vaddr = lseek(pr->fd_pg, 0, SEEK_CUR); pr_debug("\tpr%u Read page %lx from self %lx/%"PRIx64"\n", pr->id, vaddr, pr->cvaddr, current_vaddr); ret = read(pr->fd_pg, buf, PAGE_SIZE); if (ret != PAGE_SIZE) { pr_perror("Can't read mapping page %d", ret); return -1; } if (opts.auto_dedup) { ret = punch_hole(pr, current_vaddr, (unsigned int)PAGE_SIZE, false); if (ret == -1) { return -1; } } } pr->cvaddr += PAGE_SIZE; return 1; } static void close_page_read(struct page_read *pr) { int ret; if (pr->bunch.iov_len > 0) { ret = punch_hole(pr, 0, 0, true); if (ret == -1) return; pr->bunch.iov_len = 0; } if (pr->parent) { close_page_read(pr->parent); xfree(pr->parent); } close(pr->fd_pg); close(pr->fd); } static int try_open_parent(int dfd, int pid, struct page_read *pr, int flags) { int pfd; struct page_read *parent = NULL; pfd = openat(dfd, CR_PARENT_LINK, O_RDONLY); if (pfd < 0 && errno == ENOENT) goto out; parent = xmalloc(sizeof(*parent)); if (!parent) goto err_cl; if (open_page_read_at(pfd, pid, parent, flags, false)) { if (errno != ENOENT) goto err_free; xfree(parent); parent = NULL; } close(pfd); out: pr->parent = parent; return 0; err_free: xfree(parent); err_cl: close(pfd); return -1; } int open_page_read_at(int dfd, int pid, struct page_read *pr, int flags, bool shmem) { pr->pe = NULL; pr->bunch.iov_len = 0; pr->bunch.iov_base = NULL; pr->fd = open_image_at(dfd, shmem ? CR_FD_SHMEM_PAGEMAP : CR_FD_PAGEMAP, O_RSTR, (long)pid); if (pr->fd < 0) { pr->fd_pg = open_image_at(dfd, shmem ? CR_FD_SHM_PAGES_OLD : CR_FD_PAGES_OLD, flags, pid); if (pr->fd_pg < 0) return -1; pr->parent = NULL; pr->get_pagemap = get_page_vaddr; pr->put_pagemap = NULL; pr->read_page = read_page; } else { static unsigned ids = 1; if (!shmem && try_open_parent(dfd, pid, pr, flags)) { close(pr->fd); return -1; } pr->fd_pg = open_pages_image_at(dfd, flags, pr->fd); if (pr->fd_pg < 0) { close_page_read(pr); return -1; } pr->get_pagemap = get_pagemap; pr->put_pagemap = put_pagemap; pr->read_page = read_pagemap_page; pr->id = ids++; pr_debug("Opened page read %u (parent %u)\n", pr->id, pr->parent ? pr->parent->id : 0); } pr->close = close_page_read; return 0; } int open_page_read(int pid, struct page_read *pr, int flags, bool shmem) { return open_page_read_at(get_service_fd(IMG_FD_OFF), pid, pr, flags, shmem); }