benchmarks/gem_latency: Measure effect of using RealTime priority

Allow the producers to be set with maximum RT priority to verify that the waiters are not exhibiting priorty-inversion. Signed-off-by: Chris Wilson <chris@chris-wilson.co.uk>
2025-07-26 03:07:24 +00:00 · 2015-12-20 14:55:42 +00:00 · 2015-12-20 14:55:42 +00:00 · a91ee853b1
commit a91ee853b1
parent 27e093dd1f
1 changed files with 37 additions and 19 deletions
--- a/benchmarks/gem_latency.c
+++ b/benchmarks/gem_latency.c
@ -52,7 +52,7 @@ static volatile uint32_t *timestamp_reg;
 struct consumer {
 	pthread_t thread;

-	int wait;
+	int go;

 	igt_stats_t latency;
 	struct producer *producer;
@ -81,7 +81,7 @@ struct producer {
 	int wait;
 	int complete;
 	int done;
-	igt_stats_t latency, throughput;
+	igt_stats_t latency, dispatch;

 	int nop;
 	int nconsumers;
@ -281,19 +281,17 @@ static void *producer(void *arg)
 		gem_execbuf(fd, &p->latency_dispatch.execbuf);

 		/* Wake all the associated clients to wait upon our batch */
-		pthread_mutex_lock(&p->lock);
 		p->wait = p->nconsumers;
 		for (n = 0; n < p->nconsumers; n++)
-			p->consumers[n].wait = 1;
+			p->consumers[n].go = 1;
 		pthread_cond_broadcast(&p->c_cond);
-		pthread_mutex_unlock(&p->lock);

 		/* Wait for this batch to finish and record how long we waited,
 		 * and how long it took for the batch to be submitted
 		 * (including the nop delays).
 		 */
 		measure_latency(p, &p->latency);
-		igt_stats_push(&p->throughput, *p->last_timestamp - start);
+		igt_stats_push(&p->dispatch, *p->last_timestamp - start);

 		/* Tidy up all the extra threads before we submit again. */
 		pthread_mutex_lock(&p->lock);
@ -308,7 +306,7 @@ static void *producer(void *arg)
 	p->wait = p->nconsumers;
 	p->done = true;
 	for (n = 0; n < p->nconsumers; n++)
-		p->consumers[n].wait = 1;
+		p->consumers[n].go = 1;
 	pthread_cond_broadcast(&p->c_cond);
 	pthread_mutex_unlock(&p->lock);

@ -328,9 +326,9 @@ static void *consumer(void *arg)
 		pthread_mutex_lock(&p->lock);
 		if (--p->wait == 0)
 			pthread_cond_signal(&p->p_cond);
-		while (!c->wait)
+		while (!c->go)
 			pthread_cond_wait(&p->c_cond, &p->lock);
-		c->wait = 0;
+		c->go = 0;
 		pthread_mutex_unlock(&p->lock);
 		if (p->done)
 			return NULL;
@ -350,6 +348,7 @@ static double l_estimate(igt_stats_t *stats)
 }

 #define CONTEXT 1
+#define REALTIME 2
 static int run(int seconds,
 	       int nproducers,
 	       int nconsumers,
@ -357,8 +356,9 @@ static int run(int seconds,
 	       int workload,
 	       unsigned flags)
 {
+	pthread_attr_t attr;
 	struct producer *p;
-	igt_stats_t latency, throughput;
+	igt_stats_t platency, latency, dispatch;
 	uint32_t nop_batch;
 	uint32_t workload_batch;
 	uint32_t scratch;
@ -406,7 +406,7 @@ static int run(int seconds,
 		pthread_cond_init(&p[n].c_cond, NULL);

 		igt_stats_init(&p[n].latency);
-		igt_stats_init(&p[n].throughput);
+		igt_stats_init(&p[n].dispatch);
 		p[n].wait = nconsumers;
 		p[n].nop = nop;
 		p[n].nconsumers = nconsumers;
@ -423,14 +423,22 @@ static int run(int seconds,
 		pthread_mutex_unlock(&p->lock);
 	}

+	pthread_attr_init(&attr);
+	if (flags & REALTIME) {
+		struct sched_param param = { .sched_priority = 99 };
+		pthread_attr_setinheritsched(&attr, PTHREAD_EXPLICIT_SCHED);
+		pthread_attr_setschedpolicy(&attr, SCHED_FIFO);
+		pthread_attr_setschedparam(&attr, &param);
+	}
 	for (n = 0; n < nproducers; n++)
-		pthread_create(&p[n].thread, NULL, producer, &p[n]);
+		pthread_create(&p[n].thread, &attr, producer, &p[n]);

 	sleep(seconds);
 	done = true;

 	nrun = complete = 0;
-	igt_stats_init_with_size(&throughput, nproducers);
+	igt_stats_init_with_size(&dispatch, nproducers);
+	igt_stats_init_with_size(&platency, nproducers);
 	igt_stats_init_with_size(&latency, nconsumers*nproducers);
 	for (n = 0; n < nproducers; n++) {
 		pthread_join(p[n].thread, NULL);
@ -441,7 +449,8 @@ static int run(int seconds,
 		nrun++;
 		complete += p[n].complete;
 		igt_stats_push_float(&latency, l_estimate(&p[n].latency));
-		igt_stats_push_float(&throughput, l_estimate(&p[n].throughput));
+		igt_stats_push_float(&platency, l_estimate(&p[n].latency));
+		igt_stats_push_float(&dispatch, l_estimate(&p[n].dispatch));

 		for (m = 0; m < nconsumers; m++) {
 			pthread_join(p[n].consumers[m].thread, NULL);
@ -451,16 +460,20 @@ static int run(int seconds,

 	switch ((flags >> 8) & 0xf) {
 	default:
-		printf("%d/%d: %7.3fus %7.3fus\n", complete, nrun,
-		       CYCLES_TO_US(l_estimate(&throughput)),
-		       CYCLES_TO_US(l_estimate(&latency)));
+		printf("%d/%d: %7.3fus %7.3fus %7.3fus\n", complete, nrun,
+		       CYCLES_TO_US(l_estimate(&dispatch)),
+		       CYCLES_TO_US(l_estimate(&latency)),
+		       CYCLES_TO_US(l_estimate(&platency)));
 		break;
 	case 1:
-		printf("%f\n", CYCLES_TO_US(l_estimate(&throughput)));
+		printf("%f\n", CYCLES_TO_US(l_estimate(&dispatch)));
 		break;
 	case 2:
 		printf("%f\n", CYCLES_TO_US(l_estimate(&latency)));
 		break;
+	case 3:
+		printf("%f\n", CYCLES_TO_US(l_estimate(&platency)));
+		break;
 	}

 	return 0;
@ -476,7 +489,7 @@ int main(int argc, char **argv)
 	unsigned flags = 0;
 	int c;

-	while ((c = getopt(argc, argv, "p:c:n:w:t:f:s")) != -1) {
+	while ((c = getopt(argc, argv, "p:c:n:w:t:f:sR")) != -1) {
 		switch (c) {
 		case 'p':
 			/* How many threads generate work? */
@ -530,6 +543,11 @@ int main(int argc, char **argv)
 			flags |= CONTEXT;
 			break;

+		case 'R':
+			/* Run the producers at RealTime priority */
+			flags |= REALTIME;
+			break;
+
 		default:
 			break;
 		}