/* * Copyright (c) 2012 Intel Corporation * * Permission is hereby granted, free of charge, to any person obtaining a * copy of this software and associated documentation files (the "Software"), * to deal in the Software without restriction, including without limitation * the rights to use, copy, modify, merge, publish, distribute, sublicense, * and/or sell copies of the Software, and to permit persons to whom the * Software is furnished to do so, subject to the following conditions: * * The above copyright notice and this permission notice (including the next * paragraph) shall be included in all copies or substantial portions of the * Software. * * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS * IN THE SOFTWARE. * * Authors: * Mika Kuoppala * */ /* * This test runs blitcopy -> rendercopy with multiple buffers over wrap * boundary. Note: Driver can only handle UINT32_MAX/2-1 increments to seqno. */ #include #include #include #include #include #include #include #include #include #include #include "i915_drm.h" #include "intel_bufmgr.h" #include "intel_batchbuffer.h" #include "intel_gpu_tools.h" #include "rendercopy.h" #define SAFETY_REGION 0x1f static int devid; static uint32_t last_seqno = 0; static uint32_t last_seqno_write = 0; static struct intel_batchbuffer *batch_blt; static struct intel_batchbuffer *batch_3d; struct option_struct { int rounds; int background; char cmd[1024]; int verbose; int timeout; int dontwrap; int prewrap_space; int random; int buffers; }; static struct option_struct options; static void init_buffer(drm_intel_bufmgr *bufmgr, struct scratch_buf *buf, drm_intel_bo *bo, int width, int height) { /* buf->bo = drm_intel_bo_alloc(bufmgr, "", size, 4096); */ buf->bo = bo; buf->size = width * height * 4; assert(buf->bo); buf->tiling = I915_TILING_NONE; buf->data = buf->cpu_mapping = NULL; buf->num_tiles = width * height * 4; buf->stride = width * 4; } static void set_bo(drm_intel_bo *bo, uint32_t val, int width, int height) { int size = width * height; uint32_t *vaddr; drm_intel_gem_bo_start_gtt_access(bo, true); vaddr = bo->virtual; while (size--) *vaddr++ = val; } static int cmp_bo(drm_intel_bo *bo, uint32_t val, int width, int height) { int size = width * height; uint32_t *vaddr; drm_intel_gem_bo_start_gtt_access(bo, false); vaddr = bo->virtual; while (size--) { if (*vaddr++ != val) { printf("%d: 0x%x differs from assumed 0x%x\n", width * height - size, *vaddr-1, val); return -1; } } return 0; } static drm_intel_bo * create_bo(drm_intel_bufmgr *bufmgr, uint32_t val, int width, int height) { drm_intel_bo *bo; bo = drm_intel_bo_alloc(bufmgr, "bo", width * height * 4, 0); assert(bo); /* gtt map doesn't have a write parameter, so just keep the mapping * around (to avoid the set_domain with the gtt write domain set) and * manually tell the kernel when we start access the gtt. */ drm_intel_gem_bo_map_gtt(bo); set_bo(bo, val, width, height); return bo; } static void release_bo(drm_intel_bo *bo) { drm_intel_gem_bo_unmap_gtt(bo); drm_intel_bo_unreference(bo); } static void render_copyfunc(struct scratch_buf *src, struct scratch_buf *dst, int width, int height) { const int src_x = 0, src_y = 0, dst_x = 0, dst_y = 0; render_copyfunc_t rendercopy = get_render_copyfunc(devid); static int warned = 0; if (rendercopy) { rendercopy(batch_3d, src, src_x, src_y, width, height, dst, dst_x, dst_y); intel_batchbuffer_flush(batch_3d); } else { if (!warned) { printf("No render copy found for this gen, " "test is shallow!\n"); warned = 1; } intel_copy_bo(batch_blt, dst->bo, src->bo, width, height); intel_batchbuffer_flush(batch_blt); } } static void exchange_uint(void *array, unsigned i, unsigned j) { unsigned *i_arr = array; unsigned i_tmp; i_tmp = i_arr[i]; i_arr[i] = i_arr[j]; i_arr[j] = i_tmp; } static int run_sync_test(int num_buffers, bool verify) { drm_intel_bufmgr *bufmgr; int max; drm_intel_bo *src[128], *dst1[128], *dst2[128]; int width = 128, height = 128; int fd; int i; int r = -1; int failed = 0; unsigned int *p_dst1, *p_dst2; struct scratch_buf s_src[128], s_dst[128]; fd = drm_open_any(); assert(fd >= 0); gem_quiescent_gpu(fd); devid = intel_get_drm_devid(fd); max = gem_aperture_size (fd) / (1024 * 1024) / 2; if (num_buffers > max) num_buffers = max; bufmgr = drm_intel_bufmgr_gem_init(fd, 4096); drm_intel_bufmgr_gem_enable_reuse(bufmgr); batch_blt = intel_batchbuffer_alloc(bufmgr, intel_get_drm_devid(fd)); assert(batch_blt); batch_3d = intel_batchbuffer_alloc(bufmgr, intel_get_drm_devid(fd)); assert(batch_3d); p_dst1 = malloc(num_buffers * sizeof(unsigned int)); if (p_dst1 == NULL) return -ENOMEM; p_dst2 = malloc(num_buffers * sizeof(unsigned int)); if (p_dst2 == NULL) return -ENOMEM; for (i = 0; i < num_buffers; i++) { p_dst1[i] = p_dst2[i] = i; src[i] = create_bo(bufmgr, i, width, height); dst1[i] = create_bo(bufmgr, ~i, width, height); dst2[i] = create_bo(bufmgr, ~i, width, height); init_buffer(bufmgr, &s_src[i], src[i], width, height); init_buffer(bufmgr, &s_dst[i], dst1[i], width, height); } drmtest_permute_array(p_dst1, num_buffers, exchange_uint); drmtest_permute_array(p_dst2, num_buffers, exchange_uint); for (i = 0; i < num_buffers; i++) render_copyfunc(&s_src[i], &s_dst[p_dst1[i]], width, height); /* Only sync between buffers if this is actual test run and * not a seqno filler */ if (verify) { for (i = 0; i < num_buffers; i++) intel_copy_bo(batch_blt, dst2[p_dst2[i]], dst1[p_dst1[i]], width, height); for (i = 0; i < num_buffers; i++) { r = cmp_bo(dst2[p_dst2[i]], i, width, height); if (r) { printf("buffer %d differs, seqno_before_test 0x%x, " " approximated seqno on test fail 0x%x\n", i, last_seqno_write, last_seqno_write + i * 2); failed = -1; } } } for (i = 0; i < num_buffers; i++) { release_bo(src[i]); release_bo(dst1[i]); release_bo(dst2[i]); } intel_batchbuffer_free(batch_3d); intel_batchbuffer_free(batch_blt); drm_intel_bufmgr_destroy(bufmgr); free(p_dst1); free(p_dst2); gem_quiescent_gpu(fd); close(fd); return failed; } static int run_cmd(char *s) { int pid; int r = -1; int status = 0; wordexp_t wexp; int i; r = wordexp(s, &wexp, 0); if (r != 0) { printf("can't parse %s\n", s); return r; } for(i = 0; i < wexp.we_wordc; i++) printf("argv[%d] = %s\n", i, wexp.we_wordv[i]); pid = fork(); if (pid == 0) { char path[PATH_MAX]; char full_path[PATH_MAX]; if (getcwd(path, PATH_MAX) == NULL) perror("getcwd"); assert(snprintf(full_path, PATH_MAX, "%s/%s", path, wexp.we_wordv[0]) > 0); /* if (!options.verbose) { close(STDOUT_FILENO); close(STDERR_FILENO); } */ r = execv(full_path, wexp.we_wordv); if (r == -1) perror("execv failed"); } else { int waitcount = options.timeout; while(waitcount-- > 0) { r = waitpid(pid, &status, WNOHANG); if (r == pid) { if(WIFEXITED(status)) { if (WEXITSTATUS(status)) fprintf(stderr, "child returned with %d\n", WEXITSTATUS(status)); return WEXITSTATUS(status); } } else if (r != 0) { perror("waitpid"); return -errno; } sleep(1); } kill(pid, SIGKILL); return -ETIMEDOUT; } return r; } static const char *debug_fs_entry = "/sys/kernel/debug/dri/0/i915_next_seqno"; static int read_seqno(uint32_t *seqno) { int fh; char buf[32]; int r; char *p; unsigned long int tmp; fh = open(debug_fs_entry, O_RDWR); if (fh == -1) { perror("open"); fprintf(stderr, "no %s found, too old kernel?\n", debug_fs_entry); return -errno; } r = read(fh, buf, sizeof(buf) - 1); if (r < 0) { perror("read"); close(fh); return -errno; } close(fh); buf[r] = 0; p = strstr(buf, "0x"); if (!p) p = buf; tmp = strtoul(p, NULL, 0); if (tmp == ULONG_MAX) { perror("strtoul"); return -errno; } *seqno = tmp; if (options.verbose) printf("seqno read : 0x%x\n", *seqno); return 0; } static int write_seqno(uint32_t seqno) { int fh; char buf[32]; int r; fh = open(debug_fs_entry, O_RDWR); if (fh == -1) { perror("open"); return -errno; } assert(snprintf(buf, sizeof(buf), "0x%x", seqno) > 0); r = write(fh, buf, strnlen(buf, sizeof(buf))); if (r < 0) return r; assert(r == strnlen(buf, sizeof(buf))); close(fh); if (options.verbose) printf("seqno write: 0x%x\n", seqno); last_seqno_write = seqno; return 0; } static uint32_t calc_prewrap_val(void) { const int pval = options.prewrap_space; if (options.random == 0) return pval; return random() % pval; } static int seqno_near_boundary(uint32_t seqno) { if (seqno > UINT32_MAX - options.prewrap_space || seqno < options.prewrap_space) return 1; if (seqno < UINT32_MAX/2 + SAFETY_REGION && seqno > UINT32_MAX/2 - SAFETY_REGION) return 1; return 0; } static int run_once(void) { int r; uint32_t seqno_before = 0; uint32_t seqno_after = 0; uint32_t seqno; const uint32_t pw_val = calc_prewrap_val(); r = read_seqno(&seqno_before); assert(r == 0); seqno = last_seqno = seqno_before; /* Skip seqno write if close to boundary */ if (!seqno_near_boundary(seqno)) { if (seqno > UINT32_MAX/2 + 1) seqno = UINT32_MAX - pw_val; else seqno = UINT32_MAX/2 - SAFETY_REGION; if (!options.dontwrap) { r = write_seqno(seqno); if (r < 0) { fprintf(stderr, "write_seqno 0x%x returned %d\n", seqno, r); /* We might fail if we are at background and * some operations were done between seqno * read and this write */ if (!options.background) return r; } } } if (!options.background) { /* Only run tests if we are across the half way of seqno space. * If we are not, run something which just increments seqnos */ if (seqno >= UINT32_MAX/2 + 1) { if (strnlen(options.cmd, sizeof(options.cmd)) > 0) { r = run_cmd(options.cmd); } else { r = run_sync_test(options.buffers, true); } } else { r = run_sync_test(options.buffers, false); } if (r != 0) { fprintf(stderr, "test returned %d\n", r); return -1; } } else { /* Let's wait in background for seqno to increment */ sleep(2); } r = read_seqno(&seqno_after); assert(r == 0); if (seqno_before > seqno_after) { if (options.verbose) printf("before 0x%x, after 0x%x , diff %d\n", seqno_before, seqno_after, seqno_after - seqno_before); return 1; } return 0; } static void print_usage(const char *s) { printf("%s: [OPTION]...\n", s); printf(" where options are:\n"); printf(" -b --background run in background inducing wraps\n"); printf(" -c --cmd=cmdstring use cmdstring to cross wrap\n"); printf(" -n --rounds=num run num times across wrap boundary, 0 == forever\n"); printf(" -t --timeout=sec set timeout to wait for testrun to sec seconds\n"); printf(" -d --dontwrap don't wrap just run the test\n"); printf(" -p --prewrap=n set seqno to WRAP - n for each testrun\n"); printf(" -r --norandom dont randomize prewrap space\n"); printf(" -i --buffers number of buffers to copy\n"); exit(-1); } static void parse_options(int argc, char **argv) { int c; int option_index = 0; static struct option long_options[] = { {"cmd", required_argument, 0, 'c'}, {"rounds", required_argument, 0, 'n'}, {"background", no_argument, 0, 'b'}, {"timeout", required_argument, 0, 't'}, {"dontwrap", no_argument, 0, 'd'}, {"verbose", no_argument, 0, 'v'}, {"prewrap", required_argument, 0, 'p'}, {"norandom", no_argument, 0, 'r'}, {"buffers", required_argument, 0, 'i'}, }; strcpy(options.cmd, ""); options.rounds = 50; options.background = 0; options.dontwrap = 0; options.timeout = 20; options.verbose = 0; options.random = 1; options.prewrap_space = 30; options.buffers = 20; while((c = getopt_long(argc, argv, "c:n:bvt:dp:ri:", long_options, &option_index)) != -1) { switch(c) { case 'b': options.background = 1; printf("running in background inducing wraps\n"); break; case 'd': options.dontwrap = 1; printf("won't wrap after testruns\n"); break; case 'n': options.rounds = atoi(optarg); printf("running %d rounds\n", options.rounds); break; case 'c': strncpy(options.cmd, optarg, sizeof(options.cmd) - 1); options.cmd[sizeof(options.cmd) - 1] = 0; printf("cmd set to %s\n", options.cmd); break; case 'i': options.buffers = atoi(optarg); printf("buffers %d\n", options.buffers); break; case 't': options.timeout = atoi(optarg); if (options.timeout == 0) options.timeout = 10; printf("setting timeout to %d seconds\n", options.timeout); break; case 'v': options.verbose = 1; break; case 'r': options.random = 0; break; case 'p': options.prewrap_space = atoi(optarg); if (options.prewrap_space == 0) options.prewrap_space = 1; printf("prewrap set to %d (0x%x)\n", options.prewrap_space, UINT32_MAX - options.prewrap_space); break; default: printf("unkown command options\n"); print_usage(argv[0]); break; } } if (optind < argc) { printf("unkown command options\n"); print_usage(argv[0]); } } int main(int argc, char **argv) { int wcount = 0; int r = -1; parse_options(argc, argv); srandom(time(NULL)); while(options.rounds == 0 || wcount < options.rounds) { r = run_once(); if (r < 0) { if (options.verbose) fprintf(stderr, "run once returned %d\n", r); return r; } if (options.dontwrap) wcount++; else wcount += r; if (options.verbose) { printf("%s done: %d\n", options.dontwrap ? "tests" : "wraps", wcount); fflush(stdout); } } if (options.rounds == wcount) { if (options.verbose) printf("done %d wraps successfully\n", wcount); return 0; } return r; }