/* * Copyright © 2011 Intel Corporation * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS * IN THE SOFTWARE. * * Authors: * Chris Wilson * */ #include #include "igt.h" #include #include #include #include #include #include #include #include #include #include #include #include #include #include "drm.h" #include "i915/gem_create.h" #include "igt_vgem.h" #define MiB(x) ((x) * 1024 * 1024) typedef void *(*mmap_fn_t)(int, uint32_t, uint64_t, uint64_t, unsigned int); static void *wrap_gem_mmap__gtt(int i915, uint32_t handle, uint64_t offset, uint64_t length, unsigned int prot) { return gem_mmap__gtt(i915, handle, length, prot); } static void pread_self(int i915) { int start = gem_has_mappable_ggtt(i915) ? 0 : 1; static const mmap_fn_t mmap_fn[] = { wrap_gem_mmap__gtt, gem_mmap__cpu, gem_mmap__wc, NULL }; for (const mmap_fn_t *fn = mmap_fn + start; *fn; fn++) { uint32_t handle = gem_create(i915, MiB(4)); void *ptr = (*fn)(i915, handle, 0, MiB(4), PROT_WRITE); gem_read(i915, handle, 0, ptr + MiB(3), MiB(1)); gem_read(i915, handle, MiB(3), ptr, MiB(1)); gem_read(i915, handle, MiB(1), ptr + MiB(1), MiB(2)); munmap(ptr, MiB(4)); gem_close(i915, handle); } } static int userfaultfd(int flags) { return syscall(SYS_userfaultfd, flags); } struct ufd_thread { uint32_t *page; int i915; int vgem; int err; }; static uint32_t dmabuf_create_handle(int i915, int vgem) { struct vgem_bo scratch; uint32_t handle; int dmabuf; scratch.width = 64; scratch.height = 64; scratch.bpp = 32; vgem_create(vgem, &scratch); dmabuf = prime_handle_to_fd(vgem, scratch.handle); handle = prime_fd_to_handle(i915, dmabuf); close(dmabuf); return handle; } static void *ufd_thread(void *arg) { struct ufd_thread *t = arg; uint32_t handle = dmabuf_create_handle(t->i915, t->vgem); t->err = __gem_read(t->i915, handle, 0, t->page, 1); gem_close(t->i915, handle); return NULL; } static void write_value(const char *path, int value) { char buf[80]; int fd, len; len = sprintf(buf, "%d", value); if (len < 0) return; fd = open(path, O_WRONLY); if (fd != -1) { write(fd, buf, len); close(fd); } } static void unlimited_processes(unsigned int limit) { struct rlimit rlim; write_value("/proc/sys/kernel/threads-max", 150000); write_value("/proc/sys/vm/max_map_count", 500000); write_value("/proc/sys/kernel/pid_max", 200000); if (getrlimit(RLIMIT_NPROC, &rlim)) return; rlim.rlim_cur = limit; rlim.rlim_max = limit; setrlimit(RLIMIT_NPROC, &rlim); } static void test_exhaustion(int i915) { struct uffdio_api api = { .api = UFFD_API }; struct uffdio_register reg; struct uffdio_copy copy; struct ufd_thread t = { .i915 = i915, .vgem = drm_open_driver(DRIVER_VGEM), }; pthread_t *thread = NULL; struct uffd_msg msg; unsigned long count; char buf[4096]; int ufd; unlimited_processes(1024 * 1024); ufd = userfaultfd(0); igt_require_f(ufd != -1, "kernel support for userfaultfd\n"); igt_require_f(ioctl(ufd, UFFDIO_API, &api) == 0 && api.api == UFFD_API, "userfaultfd API v%lld:%lld\n", UFFD_API, api.api); t.page = mmap(NULL, 4096, PROT_WRITE, MAP_SHARED | MAP_ANON, 0, 0); igt_assert(t.page != MAP_FAILED); /* Register our fault handler for t.page */ memset(®, 0, sizeof(reg)); reg.mode = UFFDIO_REGISTER_MODE_MISSING; reg.range.start = to_user_pointer(t.page); reg.range.len = 4096; do_ioctl(ufd, UFFDIO_REGISTER, ®); count = 0; while (!READ_ONCE(t.err)) { if (is_power_of_two(count)) { unsigned long sz = count ? 2 * count : 1; thread = realloc(thread, sz * sizeof(*thread)); igt_assert(thread); } if (pthread_create(&thread[count], NULL, ufd_thread, &t)) break; if (count == 0) { /* Wait for the first userfault */ igt_assert_eq(read(ufd, &msg, sizeof(msg)), sizeof(msg)); igt_assert_eq(msg.event, UFFD_EVENT_PAGEFAULT); igt_assert(from_user_pointer(msg.arg.pagefault.address) == t.page); } count++; } igt_assert(count); if (t.err) igt_warn("err:%d after %lu threads\n", t.err, count); /* Service the fault; releasing the stuck ioctls */ memset(©, 0, sizeof(copy)); copy.dst = msg.arg.pagefault.address; copy.src = to_user_pointer(memset(buf, 0xc5, sizeof(buf))); copy.len = 4096; do_ioctl(ufd, UFFDIO_COPY, ©); while (count--) pthread_join(thread[count], NULL); free(thread); munmap(t.page, 4096); close(ufd); close(t.vgem); } #define OBJECT_SIZE 16384 #define KGRN "\x1B[32m" #define KRED "\x1B[31m" #define KNRM "\x1B[0m" static void do_gem_read(int fd, uint32_t handle, void *buf, int len, int loops) { while (loops--) gem_read(fd, handle, 0, buf, len); } static double elapsed(const struct timeval *start, const struct timeval *end, int loop) { return (1e6*(end->tv_sec - start->tv_sec) + (end->tv_usec - start->tv_usec))/loop; } static const char *bytes_per_sec(char *buf, double v) { const char *order[] = { "", "KiB", "MiB", "GiB", "TiB", NULL, }, **o = order; while (v > 1000 && o[1]) { v /= 1000; o++; } sprintf(buf, "%.1f%s/s", v, *o); return buf; } uint32_t *src, dst; int fd, count; int object_size = 0; static int opt_handler(int opt, int opt_index, void *data) { switch (opt) { case 's': object_size = atoi(optarg); break; default: return IGT_OPT_HANDLER_ERROR; } return IGT_OPT_HANDLER_SUCCESS; } const char *help_str = " -s\tObject size in bytes\n"; igt_main_args("s:", NULL, help_str, opt_handler, NULL) { double usecs; char buf[100]; const char* bps; const struct { int level; const char *name; } cache[] = { { 0, "uncached" }, { 1, "snoop" }, { 2, "display" }, { -1 }, }, *c; if (object_size == 0) object_size = OBJECT_SIZE; object_size = (object_size + 3) & -4; igt_fixture { fd = drm_open_driver(DRIVER_INTEL); gem_require_pread_pwrite(fd); dst = gem_create(fd, object_size); src = malloc(object_size); } igt_subtest("bench") { for (count = 1; count <= 1<<17; count <<= 1) { struct timeval start, end; gettimeofday(&start, NULL); do_gem_read(fd, dst, src, object_size, count); gettimeofday(&end, NULL); usecs = elapsed(&start, &end, count); bps = bytes_per_sec(buf, object_size/usecs*1e6); igt_info("Time to pread %d bytes x %6d: %7.3fµs, %s\n", object_size, count, usecs, bps); fflush(stdout); } } igt_subtest("self") pread_self(fd); igt_subtest("exhaustion") test_exhaustion(fd); for (c = cache; c->level != -1; c++) { igt_subtest(c->name) { gem_set_caching(fd, dst, c->level); for (count = 1; count <= 1<<17; count <<= 1) { struct timeval start, end; gettimeofday(&start, NULL); do_gem_read(fd, dst, src, object_size, count); gettimeofday(&end, NULL); usecs = elapsed(&start, &end, count); bps = bytes_per_sec(buf, object_size/usecs*1e6); igt_info("Time to %s pread %d bytes x %6d: %7.3fµs, %s\n", c->name, object_size, count, usecs, bps); fflush(stdout); } } } igt_fixture { free(src); gem_close(fd, dst); close(fd); } }