mirror of
https://github.com/tiagovignatti/intel-gpu-tools.git
synced 2025-06-07 16:06:25 +00:00
Apply the new API to all call sites within the test suite using the following semantic patch: // Semantic patch for replacing drm_open_any* with arch-specific drm_open_driver* calls @@ identifier i =~ "\bdrm_open_any\b"; @@ - i() + drm_open_driver(DRIVER_INTEL) @@ identifier i =~ "\bdrm_open_any_master\b"; @@ - i() + drm_open_driver_master(DRIVER_INTEL) @@ identifier i =~ "\bdrm_open_any_render\b"; @@ - i() + drm_open_driver_render(DRIVER_INTEL) @@ identifier i =~ "\b__drm_open_any\b"; @@ - i() + __drm_open_driver(DRIVER_INTEL) Signed-off-by: Micah Fedke <micah.fedke@collabora.co.uk> Signed-off-by: Thomas Wood <thomas.wood@intel.com>
253 lines
6.7 KiB
C
253 lines
6.7 KiB
C
/*
|
|
* Copyright © 2011 Intel Corporation
|
|
*
|
|
* Permission is hereby granted, free of charge, to any person obtaining a
|
|
* copy of this software and associated documentation files (the "Software"),
|
|
* to deal in the Software without restriction, including without limitation
|
|
* the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
|
* and/or sell copies of the Software, and to permit persons to whom the
|
|
* Software is furnished to do so, subject to the following conditions:
|
|
*
|
|
* The above copyright notice and this permission notice (including the next
|
|
* paragraph) shall be included in all copies or substantial portions of the
|
|
* Software.
|
|
*
|
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
|
|
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
|
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
|
* THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
|
|
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
|
|
* FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
|
* IN THE SOFTWARE.
|
|
*
|
|
* Authors:
|
|
* Chris Wilson <chris@chris-wilson.co.uk>
|
|
*
|
|
*/
|
|
|
|
#include <unistd.h>
|
|
#include <stdlib.h>
|
|
#include <stdint.h>
|
|
#include <stdio.h>
|
|
#include <string.h>
|
|
#include <fcntl.h>
|
|
#include <inttypes.h>
|
|
#include <errno.h>
|
|
#include <sys/stat.h>
|
|
#include <sys/ioctl.h>
|
|
#include <sys/time.h>
|
|
#include <time.h>
|
|
|
|
#include "drm.h"
|
|
#include "ioctl_wrappers.h"
|
|
#include "drmtest.h"
|
|
#include "intel_io.h"
|
|
#include "igt_stats.h"
|
|
|
|
enum {
|
|
ADD_BO = 0,
|
|
DEL_BO,
|
|
EXEC,
|
|
};
|
|
|
|
struct trace_add_bo {
|
|
uint32_t handle;
|
|
uint64_t size;
|
|
} __attribute__((packed));
|
|
|
|
struct trace_del_bo {
|
|
uint32_t handle;
|
|
} __attribute__((packed));
|
|
|
|
struct trace_exec {
|
|
uint32_t object_count;
|
|
uint64_t flags;
|
|
} __attribute__((packed));
|
|
struct trace_exec_object {
|
|
uint32_t handle;
|
|
uint32_t relocation_count;
|
|
uint64_t alignment;
|
|
uint64_t flags;
|
|
uint64_t rsvd1;
|
|
uint64_t rsvd2;
|
|
} __attribute__((packed));
|
|
struct trace_exec_relocation {
|
|
uint32_t target_handle;
|
|
uint32_t delta;
|
|
uint64_t offset;
|
|
uint32_t read_domains;
|
|
uint32_t write_domain;
|
|
} __attribute__((packed));
|
|
|
|
static double elapsed(const struct timespec *start, const struct timespec *end)
|
|
{
|
|
return 1e3*(end->tv_sec - start->tv_sec) + 1e-6*(end->tv_nsec - start->tv_nsec);
|
|
}
|
|
|
|
static void replay(const char *filename)
|
|
{
|
|
struct timespec t_start, t_end;
|
|
struct drm_i915_gem_execbuffer2 eb = {};
|
|
struct bo {
|
|
uint32_t handle;
|
|
uint64_t offset;
|
|
|
|
struct drm_i915_gem_relocation_entry *relocs;
|
|
uint32_t max_relocs;
|
|
} *bo = NULL, **offsets = NULL;
|
|
int num_bo = 0;
|
|
struct drm_i915_gem_exec_object2 *exec_objects = NULL;
|
|
int max_objects = 0;
|
|
struct stat st;
|
|
uint8_t *ptr, *end;
|
|
int fd;
|
|
|
|
fd = open(filename, O_RDONLY);
|
|
if (fd < 0)
|
|
return;
|
|
|
|
if (fstat(fd, &st) < 0)
|
|
return;
|
|
|
|
ptr = mmap(0, st.st_size, PROT_READ, MAP_SHARED, fd, 0);
|
|
close(fd);
|
|
|
|
if (ptr == MAP_FAILED)
|
|
return;
|
|
|
|
madvise(ptr, st.st_size, MADV_SEQUENTIAL);
|
|
|
|
end = ptr + st.st_size;
|
|
fd = drm_open_driver(DRIVER_INTEL);
|
|
|
|
clock_gettime(CLOCK_MONOTONIC, &t_start);
|
|
do {
|
|
switch (*ptr++) {
|
|
case ADD_BO: {
|
|
uint32_t bb = 0xa << 23;
|
|
struct trace_add_bo *t = (void *)ptr;
|
|
ptr = (void *)(t + 1);
|
|
|
|
if (t->handle >= num_bo) {
|
|
int new_bo = (t->handle + 4096) & -4096;
|
|
bo = realloc(bo, sizeof(*bo)*new_bo);
|
|
memset(bo + num_bo, 0, sizeof(*bo)*(new_bo - num_bo));
|
|
num_bo = new_bo;
|
|
}
|
|
|
|
bo[t->handle].handle = gem_create(fd, t->size);
|
|
gem_write(fd, bo[t->handle].handle, 0, &bb, sizeof(bb));
|
|
break;
|
|
}
|
|
case DEL_BO: {
|
|
struct trace_del_bo *t = (void *)ptr;
|
|
ptr = (void *)(t + 1);
|
|
|
|
gem_close(fd, bo[t->handle].handle);
|
|
bo[t->handle].handle = 0;
|
|
|
|
free(bo[t->handle].relocs);
|
|
bo[t->handle].relocs = NULL;
|
|
bo[t->handle].max_relocs = 0;
|
|
break;
|
|
}
|
|
case EXEC: {
|
|
struct trace_exec *t = (void *)ptr;
|
|
uint32_t i, j;
|
|
ptr = (void *)(t + 1);
|
|
|
|
eb.buffer_count = t->object_count;
|
|
eb.flags = t->flags & ~I915_EXEC_RING_MASK;
|
|
|
|
if (eb.buffer_count > max_objects) {
|
|
free(exec_objects);
|
|
free(offsets);
|
|
|
|
max_objects = ALIGN(eb.buffer_count, 4096);
|
|
|
|
exec_objects = malloc(max_objects*sizeof(*exec_objects));
|
|
offsets = malloc(max_objects*sizeof(*offsets));
|
|
|
|
eb.buffers_ptr = (uintptr_t)exec_objects;
|
|
}
|
|
|
|
for (i = 0; i < eb.buffer_count; i++) {
|
|
struct drm_i915_gem_relocation_entry *relocs;
|
|
struct trace_exec_object *to = (void *)ptr;
|
|
ptr = (void *)(to + 1);
|
|
|
|
offsets[i] = &bo[to->handle];
|
|
|
|
exec_objects[i].handle = bo[to->handle].handle;
|
|
exec_objects[i].offset = bo[to->handle].offset;
|
|
exec_objects[i].alignment = to->alignment;
|
|
exec_objects[i].flags = to->flags;
|
|
exec_objects[i].rsvd1 = to->rsvd1;
|
|
exec_objects[i].rsvd2 = to->rsvd2;
|
|
|
|
exec_objects[i].relocation_count = to->relocation_count;
|
|
if (!to->relocation_count)
|
|
continue;
|
|
|
|
if (to->relocation_count > bo[to->handle].max_relocs) {
|
|
free(bo[to->handle].relocs);
|
|
|
|
bo[to->handle].max_relocs = ALIGN(to->relocation_count, 128);
|
|
bo[to->handle].relocs = malloc(sizeof(*bo[to->handle].relocs)*bo[to->handle].max_relocs);
|
|
}
|
|
relocs = bo[to->handle].relocs;
|
|
exec_objects[i].relocs_ptr = (uintptr_t)relocs;
|
|
|
|
for (j = 0; j < to->relocation_count; j++) {
|
|
struct trace_exec_relocation *tr = (void *)ptr;
|
|
ptr = (void *)(tr + 1);
|
|
|
|
if (eb.flags & I915_EXEC_HANDLE_LUT) {
|
|
uint32_t handle;
|
|
|
|
relocs[j].target_handle = tr->target_handle;
|
|
|
|
handle = exec_objects[tr->target_handle].handle;
|
|
relocs[j].presumed_offset = bo[handle].offset;
|
|
} else {
|
|
relocs[j].target_handle = bo[tr->target_handle].handle;
|
|
relocs[j].presumed_offset = bo[tr->target_handle].offset;
|
|
}
|
|
relocs[j].delta = tr->delta;
|
|
relocs[j].offset = tr->offset;
|
|
relocs[j].read_domains = tr->read_domains;
|
|
relocs[j].write_domain = tr->write_domain;
|
|
}
|
|
}
|
|
|
|
gem_execbuf(fd, &eb);
|
|
|
|
for (i = 0; i < eb.buffer_count; i++)
|
|
offsets[i]->offset = exec_objects[i].offset;
|
|
|
|
break;
|
|
}
|
|
}
|
|
} while (ptr < end);
|
|
clock_gettime(CLOCK_MONOTONIC, &t_end);
|
|
close(fd);
|
|
munmap(end-st.st_size, st.st_size);
|
|
|
|
for (fd = 0; fd < num_bo; fd++)
|
|
free(bo[fd].relocs);
|
|
free(bo);
|
|
free(offsets);
|
|
|
|
printf("%s: %.3f\n", filename, elapsed(&t_start, &t_end));
|
|
}
|
|
|
|
int main(int argc, char **argv)
|
|
{
|
|
int i;
|
|
|
|
for (i = 1; i < argc; i++)
|
|
replay(argv[i]);
|
|
|
|
return 0;
|
|
}
|