281 lines
7.2 KiB
C
281 lines
7.2 KiB
C
/******************************************************************************
|
|
*
|
|
* Copyright © International Business Machines Corp., 2007, 2008, 2009
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License as published by
|
|
* the Free Software Foundation; either version 2 of the License, or
|
|
* (at your option) any later version.
|
|
*
|
|
* This program is distributed in the hope that it will be useful,
|
|
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
|
|
* the GNU General Public License for more details.
|
|
*
|
|
* You should have received a copy of the GNU General Public License
|
|
* along with this program; if not, write to the Free Software
|
|
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
*
|
|
* NAME
|
|
* pi_perf.c
|
|
*
|
|
* DESCRIPTION
|
|
* Create a scenario with one high, one low and several
* medium priority threads. The low priority thread holds a PI lock and
* the high priority thread later tries to grab it. The test measures the
* maximum amount of time the high priority thread has to wait before it
* gets the lock. This time should be bounded by the duration for which
* the low priority thread holds the lock.
|
|
*
|
|
* USAGE:
|
|
* Use run_auto.sh script in current directory to build and run test.
|
|
* Use "-j" to enable jvm simulator.
|
|
*
|
|
* AUTHOR
|
|
* Author: Sripathi Kodi <sripathik@in.ibm.com>
|
|
*
|
|
* HISTORY
|
|
* 2007-Nov-20: Initial version by Sripathi Kodi <sripathik@in.ibm.com>
|
|
* 2009-Jul-03: Pass criteria corrected by Sripathi Kodi
|
|
* <sripathik@in.ibm.com>
|
|
*
|
|
*****************************************************************************/
|
|
|
|
#include <stdio.h>
|
|
#include <stdlib.h>
|
|
#include <limits.h>
|
|
#include <unistd.h>
|
|
#include <string.h>
|
|
#include <math.h>
|
|
#include <librttest.h>
|
|
#include <libstats.h>
|
|
|
|
#define LOWPRIO 30
|
|
#define HIGHPRIO 40
|
|
#define BUSYPRIO 35
|
|
|
|
#define DEF_LOW_WORK_MS 6
|
|
#define DEF_HIGH_WORK_MS 1
|
|
#define DEF_BUSY_WORK_MS 6
|
|
#define DEF_ITERATIONS 100
|
|
|
|
#define HIST_BUCKETS 100
|
|
#define THRESHOLD 200 /* microseconds */
|
|
|
|
pthread_barrier_t bar1, bar2;
|
|
pthread_mutex_t lock;
|
|
|
|
static int end = 0;
|
|
|
|
static unsigned int iterations = DEF_ITERATIONS;
|
|
static unsigned int low_work_time = DEF_LOW_WORK_MS;
|
|
static unsigned int high_work_time = DEF_HIGH_WORK_MS;
|
|
static unsigned int busy_work_time;
|
|
static int num_busy = -1;
|
|
|
|
nsec_t low_unlock, max_pi_delay;
|
|
|
|
stats_container_t low_dat, cpu_delay_dat;
|
|
stats_container_t cpu_delay_hist;
|
|
stats_quantiles_t cpu_delay_quantiles;
|
|
stats_record_t rec;
|
|
|
|
void usage(void)
|
|
{
|
|
rt_help();
|
|
printf("pi_perf_test specific options:\n");
|
|
printf
|
|
(" -nNUMBER Number of busy threads. Default = number of cpus\n");
|
|
printf(" -iNUMBER Number of iterations. Default = %d\n",
|
|
DEF_ITERATIONS);
|
|
printf(" -tPERIOD Duration of work. Number of ms.\n");
|
|
}
|
|
|
|
int parse_args(int c, char *v)
|
|
{
|
|
int handled = 1;
|
|
switch (c) {
|
|
case 'h':
|
|
usage();
|
|
exit(0);
|
|
case 'i':
|
|
iterations = atoi(v);
|
|
break;
|
|
case 'n':
|
|
num_busy = atoi(v);
|
|
break;
|
|
case 'w':
|
|
low_work_time = atoi(v);
|
|
break;
|
|
default:
|
|
handled = 0;
|
|
break;
|
|
}
|
|
return handled;
|
|
}
|
|
|
|
void *busy_thread(void *arg)
|
|
{
|
|
struct thread *thr = (struct thread *)arg;
|
|
|
|
printf("Busy %ld started\n", (long)thr->arg);
|
|
|
|
while (!end) {
|
|
/* Wait for all threads to reach barrier wait */
|
|
pthread_barrier_wait(&bar1);
|
|
busy_work_ms(busy_work_time);
|
|
/* Wait for all threads to finish this iteration */
|
|
pthread_barrier_wait(&bar2);
|
|
}
|
|
return NULL;
|
|
}
|
|
|
|
void *low_prio_thread(void *arg)
|
|
{
|
|
nsec_t low_start, low_hold;
|
|
unsigned int i;
|
|
|
|
stats_container_init(&low_dat, iterations);
|
|
|
|
printf("Low prio thread started\n");
|
|
|
|
for (i = 0; i < iterations; i++) {
|
|
pthread_mutex_lock(&lock);
|
|
/* Wait for all threads to reach barrier wait.
|
|
Since we already own the mutex, high prio
|
|
thread will boost our priority.
|
|
*/
|
|
pthread_barrier_wait(&bar1);
|
|
|
|
low_start = rt_gettime();
|
|
busy_work_ms(low_work_time);
|
|
low_unlock = rt_gettime();
|
|
low_hold = low_unlock - low_start;
|
|
|
|
pthread_mutex_unlock(&lock);
|
|
|
|
rec.x = i;
|
|
rec.y = low_hold / NS_PER_US;
|
|
stats_container_append(&low_dat, rec);
|
|
|
|
if (i == iterations - 1)
|
|
end = 1;
|
|
|
|
/* Wait for all threads to finish this iteration */
|
|
pthread_barrier_wait(&bar2);
|
|
}
|
|
|
|
return NULL;
|
|
}
|
|
|
|
void *high_prio_thread(void *arg)
|
|
{
|
|
nsec_t high_start, high_end, high_get_lock;
|
|
unsigned int i;
|
|
|
|
stats_container_init(&cpu_delay_dat, iterations);
|
|
stats_container_init(&cpu_delay_hist, HIST_BUCKETS);
|
|
stats_quantiles_init(&cpu_delay_quantiles, (int)log10(iterations));
|
|
|
|
printf("High prio thread started\n");
|
|
|
|
for (i = 0; i < iterations; i++) {
|
|
/* Wait for all threads to reach barrier wait. When
|
|
woken up, low prio thread will own the mutex
|
|
*/
|
|
pthread_barrier_wait(&bar1);
|
|
|
|
high_start = rt_gettime();
|
|
pthread_mutex_lock(&lock);
|
|
high_end = rt_gettime();
|
|
high_get_lock = high_end - low_unlock;
|
|
|
|
busy_work_ms(high_work_time);
|
|
pthread_mutex_unlock(&lock);
|
|
|
|
rec.x = i;
|
|
rec.y = high_get_lock / NS_PER_US;
|
|
stats_container_append(&cpu_delay_dat, rec);
|
|
|
|
/* Wait for all threads to finish this iteration */
|
|
pthread_barrier_wait(&bar2);
|
|
}
|
|
|
|
stats_hist(&cpu_delay_hist, &cpu_delay_dat);
|
|
stats_container_save("samples", "pi_perf Latency Scatter Plot",
|
|
"Iteration", "Latency (us)", &cpu_delay_dat,
|
|
"points");
|
|
stats_container_save("hist", "pi_perf Latency Histogram",
|
|
"Latency (us)", "Samples", &cpu_delay_hist,
|
|
"steps");
|
|
|
|
printf
|
|
("Time taken for high prio thread to get the lock once released by low prio thread\n");
|
|
printf("Min delay = %ld us\n", stats_min(&cpu_delay_dat));
|
|
printf("Max delay = %ld us\n", stats_max(&cpu_delay_dat));
|
|
printf("Average delay = %4.2f us\n", stats_avg(&cpu_delay_dat));
|
|
printf("Standard Deviation = %4.2f us\n", stats_stddev(&cpu_delay_dat));
|
|
printf("Quantiles:\n");
|
|
stats_quantiles_calc(&cpu_delay_dat, &cpu_delay_quantiles);
|
|
stats_quantiles_print(&cpu_delay_quantiles);
|
|
|
|
max_pi_delay = stats_max(&cpu_delay_dat);
|
|
|
|
return NULL;
|
|
}
|
|
|
|
int main(int argc, char *argv[])
|
|
{
|
|
long i;
|
|
int ret;
|
|
setup();
|
|
|
|
pass_criteria = THRESHOLD;
|
|
rt_init("hi:n:w:", parse_args, argc, argv);
|
|
|
|
if (iterations < 100) {
|
|
printf("Number of iterations cannot be less than 100\n");
|
|
exit(1);
|
|
}
|
|
|
|
busy_work_time = low_work_time;
|
|
if (num_busy == -1) {
|
|
/* Number of busy threads = No. of CPUs */
|
|
num_busy = sysconf(_SC_NPROCESSORS_ONLN);
|
|
}
|
|
|
|
if ((ret = pthread_barrier_init(&bar1, NULL, (num_busy + 2)))) {
|
|
printf("pthread_barrier_init failed: %s\n", strerror(ret));
|
|
exit(ret);
|
|
}
|
|
if ((ret = pthread_barrier_init(&bar2, NULL, (num_busy + 2)))) {
|
|
printf("pthread_barrier_init failed: %s\n", strerror(ret));
|
|
exit(ret);
|
|
}
|
|
|
|
init_pi_mutex(&lock);
|
|
|
|
if ((ret = create_fifo_thread(low_prio_thread, NULL, LOWPRIO)) < 0)
|
|
exit(ret);
|
|
if ((ret =
|
|
create_fifo_thread(high_prio_thread, NULL, HIGHPRIO)) < 0)
|
|
exit(ret);
|
|
|
|
for (i = 0; i < num_busy; i++) {
|
|
if ((ret =
|
|
create_fifo_thread(busy_thread, (void *)i, BUSYPRIO)) < 0)
|
|
exit(ret);
|
|
}
|
|
|
|
join_threads();
|
|
printf("Criteria: High prio lock wait time < "
|
|
"(Low prio lock held time + %d us)\n", (int)pass_criteria);
|
|
|
|
ret = 0;
|
|
if (max_pi_delay > pass_criteria)
|
|
ret = 1;
|
|
|
|
printf("Result: %s\n", ret ? "FAIL" : "PASS");
|
|
return ret;
|
|
}
|