/* gem_exec_nop.c */
/*
 * Copyright © 2011 Intel Corporation
 *
 * Permission is hereby granted, free of charge, to any person obtaining a
 * copy of this software and associated documentation files (the "Software"),
 * to deal in the Software without restriction, including without limitation
 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
 * and/or sell copies of the Software, and to permit persons to whom the
 * Software is furnished to do so, subject to the following conditions:
 *
 * The above copyright notice and this permission notice (including the next
 * paragraph) shall be included in all copies or substantial portions of the
 * Software.
 *
 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
 * IN THE SOFTWARE.
 *
 * Authors:
 *    Chris Wilson <chris@chris-wilson.co.uk>
 *
 */

#include <unistd.h>
#include <stdlib.h>
#include <stdint.h>
#include <stdio.h>
#include <string.h>
#include <fcntl.h>
#include <inttypes.h>
#include <errno.h>
#include <sys/mman.h>
#include <sys/stat.h>
#include <sys/ioctl.h>
#include <sys/time.h>
#include <time.h>

#include "drm.h"
#include "ioctl_wrappers.h"
#include "drmtest.h"
#include "intel_io.h"
#include "intel_reg.h"
#include "igt_stats.h"

/*
 * Execbuf flag bits defined locally.
 * NOTE(review): presumably these mirror the i915 uapi flags of the same
 * name so the file builds against older headers -- confirm.
 */
#define LOCAL_I915_EXEC_NO_RELOC (1<<11)
#define LOCAL_I915_EXEC_HANDLE_LUT (1<<12)

#define LOCAL_I915_EXEC_BSD_SHIFT      (13)
#define LOCAL_I915_EXEC_BSD_MASK       (3 << LOCAL_I915_EXEC_BSD_SHIFT)

/* Every execbuf flag bit that takes part in engine selection. */
#define ENGINE_FLAGS  (I915_EXEC_RING_MASK | LOCAL_I915_EXEC_BSD_MASK)

/* Benchmark mode bits passed to loop() in its flags argument. */
#define SYNC 0x1	/* gem_sync() on the batch after every timed submission */
#define WRITE 0x2	/* mark the scratch object with EXEC_OBJECT_WRITE */
#define READ_ALL 0x4	/* submit on every probed engine before each timed submission */

/*
 * Return the time from *start to *end in seconds, as a double.
 *
 * The whole-second and nanosecond differences are taken separately, so the
 * result is correct even when end->tv_nsec is smaller than start->tv_nsec.
 */
static double elapsed(const struct timespec *start,
		      const struct timespec *end)
{
	return (end->tv_sec - start->tv_sec) + 1e-9*(end->tv_nsec - start->tv_nsec);
}

static uint32_t batch(int fd)
{
68
	const uint32_t bbe = MI_BATCH_BUFFER_END;
69
	uint32_t handle = gem_create(fd, 4096);
70
	gem_write(fd, handle, 0, &bbe, sizeof(bbe));
71 72 73
	return handle;
}

74
static int loop(unsigned ring, int reps, int ncpus, unsigned flags)
75 76
{
	struct drm_i915_gem_execbuffer2 execbuf;
77 78 79
	struct drm_i915_gem_exec_object2 obj[2];
	unsigned all_engines[16];
	unsigned all_nengine;
80 81
	unsigned engines[16];
	unsigned nengine;
82
	double *shared;
83
	int fd;
84

85 86
	shared = mmap(0, 4096, PROT_WRITE, MAP_SHARED | MAP_ANON, -1, 0);

87
	fd = drm_open_driver(DRIVER_INTEL);
88

89 90 91 92 93
	memset(obj, 0, sizeof(obj));
	obj[0].handle = gem_create(fd, 4096);
	if (flags & WRITE)
		obj[0].flags = EXEC_OBJECT_WRITE;
	obj[1].handle = batch(fd);
94 95

	memset(&execbuf, 0, sizeof(execbuf));
96 97
	execbuf.buffers_ptr = (uintptr_t)obj;
	execbuf.buffer_count = 2;
98 99 100
	execbuf.flags |= LOCAL_I915_EXEC_HANDLE_LUT;
	execbuf.flags |= LOCAL_I915_EXEC_NO_RELOC;
	if (__gem_execbuf(fd, &execbuf)) {
101
		execbuf.flags = 0;
102 103 104 105
		if (__gem_execbuf(fd, &execbuf))
			return 77;
	}

106 107 108 109
	if (flags & WRITE && !(execbuf.flags & LOCAL_I915_EXEC_HANDLE_LUT))
		return 77;

	all_nengine = 0;
110
	for (unsigned r = 1; r < 16; r++) {
111
		execbuf.flags &= ~ENGINE_FLAGS;
112
		execbuf.flags |= r;
113
		if (__gem_execbuf(fd, &execbuf) == 0)
114
			all_engines[all_nengine++] = r;
115 116
	}

117
	if (ring == -1) {
118 119 120 121 122 123
		nengine = all_nengine;
		memcpy(engines, all_engines, all_nengine*sizeof(engines[0]));
	} else {
		nengine = 1;
		engines[0] = ring;
	}
124

125
	while (reps--) {
126
		memset(shared, 0, 4096);
127

128
		gem_set_domain(fd, obj[1].handle, I915_GEM_DOMAIN_GTT, 0);
129 130
		sleep(1); /* wait for the hw to go back to sleep */

131 132 133 134
		igt_fork(child, ncpus) {
			struct timespec start, end;
			unsigned count = 0;

135 136
			obj[0].handle = gem_create(fd, 4096);
			obj[1].handle = batch(fd);
137

138 139 140
			clock_gettime(CLOCK_MONOTONIC, &start);
			do {
				for (int inner = 0; inner < 1024; inner++) {
141 142 143 144 145 146 147 148 149 150
					if (flags & READ_ALL) {
						obj[0].flags = 0;
						for (int n = 0; n < all_nengine; n++) {
							execbuf.flags &= ~ENGINE_FLAGS;
							execbuf.flags |= all_engines[n];
							gem_execbuf(fd, &execbuf);
						}
						if (flags & WRITE)
							obj[0].flags = EXEC_OBJECT_WRITE;
					}
151 152 153 154
					execbuf.flags &= ~ENGINE_FLAGS;
					execbuf.flags |= engines[count++ % nengine];
					gem_execbuf(fd, &execbuf);
					if (flags & SYNC)
155
						gem_sync(fd, obj[1].handle);
156 157 158 159 160
				}

				clock_gettime(CLOCK_MONOTONIC, &end);
			} while (elapsed(&start, &end) < 2.);

161
			gem_sync(fd, obj[1].handle);
162
			clock_gettime(CLOCK_MONOTONIC, &end);
163
			shared[child] = 1e6*elapsed(&start, &end) / count;
164

165 166
			gem_close(fd, obj[1].handle);
			gem_close(fd, obj[0].handle);
167 168
		}
		igt_waitchildren();
169

170 171 172 173
		for (int child = 0; child < ncpus; child++)
			shared[ncpus] += shared[child];
		printf("%7.3f\n", shared[ncpus] / ncpus);

174
		obj[0].flags = 0;
175 176 177 178 179
		for (int n = 0; n < nengine; n++) {
			execbuf.flags &= ~ENGINE_FLAGS;
			execbuf.flags |= engines[n];
			gem_execbuf(fd, &execbuf);
		}
180 181
		if (flags & WRITE)
			obj[0].flags = EXEC_OBJECT_WRITE;
182 183 184 185 186 187 188
	}
	return 0;
}

int main(int argc, char **argv)
{
	unsigned ring = I915_EXEC_RENDER;
189 190
	unsigned flags = 0;
	int reps = 1;
191
	int ncpus = 1;
192 193
	int c;

194
	while ((c = getopt (argc, argv, "e:r:sf")) != -1) {
195 196 197 198 199 200 201 202 203 204
		switch (c) {
		case 'e':
			if (strcmp(optarg, "rcs") == 0)
				ring = I915_EXEC_RENDER;
			else if (strcmp(optarg, "vcs") == 0)
				ring = I915_EXEC_BSD;
			else if (strcmp(optarg, "bcs") == 0)
				ring = I915_EXEC_BLT;
			else if (strcmp(optarg, "vecs") == 0)
				ring = I915_EXEC_VEBOX;
205 206
			else if (strcmp(optarg, "all") == 0)
				ring = -1;
207 208 209 210 211 212 213 214 215 216
			else
				ring = atoi(optarg);
			break;

		case 'r':
			reps = atoi(optarg);
			if (reps < 1)
				reps = 1;
			break;

217 218 219 220
		case 'f':
			ncpus = sysconf(_SC_NPROCESSORS_ONLN);
			break;

221 222 223 224
		case 's':
			flags |= SYNC;
			break;

225 226 227 228 229 230 231 232
		case 'W':
			flags |= WRITE;
			break;

		case 'A':
			flags |= READ_ALL;
			break;

233 234 235 236 237
		default:
			break;
		}
	}

238
	return loop(ring, reps, ncpus, flags);
239
}