Merge branch 'gh/staging' into temp

Conflicts: Makefile bin/rt_launch.c bin/rtspin.c src/task.c
author: Glenn Elliott <gelliott@cs.unc.edu> 2013-03-13 15:33:57 -0400
committer: Glenn Elliott <gelliott@cs.unc.edu> 2013-03-13 15:33:57 -0400
commit: 944a78c21028da69fb53c0aec3e9dfdb048d47e4 (patch)
tree: bdbc77b3c0ff1337670a7e5d0f9d438388c1a866
parent: f338b34ea0fb6136ea3895a07161ece030c4b998 (diff)
parent: 1ff4fc699f01f0ad1359fad48b00c9d3be1b28b4 (diff)
24 files changed, 1447 insertions, 326 deletions
diff --git a/Makefile b/Makefile
index 8886ff9..3489de6 100644
--- a/Makefile
+++ b/Makefile
@@ -19,7 +19,7 @@ LITMUS_KERNEL ?= ../litmus-rt
 # Internal configuration.
 # compiler flags
-flags-debug    = -Wall -Wdeclaration-after-statement -g
+flags-debug    = -O2 -Wall -Werror -g -Wdeclaration-after-statement
 flags-api      = -D_XOPEN_SOURCE=600 -D_GNU_SOURCE
 flags-misc     = -fasynchronous-unwind-tables -fnon-call-exceptions
@@ -72,7 +72,8 @@ AR  := ${CROSS_COMPILE}${AR}
 all     = lib ${rt-apps}
 rt-apps = cycles base_task rt_launch rtspin release_ts measure_syscall \
-          base_mt_task runtests nested locktest ikglptest dgl aux_threads normal_task
+          base_mt_task uncache runtests \
+          nested locktest ikglptest dgl aux_threads normal_task
 .PHONY: all lib clean dump-config TAGS tags cscope help
@@ -237,6 +238,9 @@ lib-normal_task = -lrt -pthread -lm
 obj-dgl = dgl.o common.o
 lib-dgl = -lrt -pthread
+obj-uncache = uncache.o
+lib-uncache = -lrt
 obj-release_ts = release_ts.o
 obj-measure_syscall = null_call.o
diff --git a/bin/base_mt_task.c b/bin/base_mt_task.c
index 8090cc3..1d72143 100644
--- a/bin/base_mt_task.c
+++ b/bin/base_mt_task.c
@@ -1,4 +1,4 @@
-/* based_mt_task.c -- A basic multi-threaded real-time task skeleton. 
+/* based_mt_task.c -- A basic multi-threaded real-time task skeleton.
 *
 * This (by itself useless) task demos how to setup a multi-threaded LITMUS^RT
 * real-time task. Familiarity with the single threaded example (base_task.c)
@@ -28,10 +28,10 @@
 #define NS_PER_MS         1e6
-/* Let's create 10 threads in the example, 
+/* Let's create 10 threads in the example,
 * for a total utilization of 1.
 */
-#define NUM_THREADS      10 
+#define NUM_THREADS      10
 /* The information passed to each thread. Could be anything. */
 struct thread_context {
@@ -43,7 +43,7 @@ struct thread_context {
 */
 void* rt_thread(void *tcontext);
-/* Declare the periodically invoked job. 
+/* Declare the periodically invoked job.
 * Returns 1 -> task should exit.
 *         0 -> task should continue.
 */
@@ -62,7 +62,7 @@ int job(void);
        } while (0)
-/* Basic setup is the same as in the single-threaded example. However, 
+/* Basic setup is the same as in the single-threaded example. However,
 * we do some thread initiliazation first before invoking the job.
 */
 int main(int argc, char** argv)
@@ -71,7 +71,7 @@ int main(int argc, char** argv)
        struct thread_context ctx[NUM_THREADS];
        pthread_t             task[NUM_THREADS];
-        /* The task is in background mode upon startup. */              
+        /* The task is in background mode upon startup. */
        /*****
@@ -79,7 +79,7 @@ int main(int argc, char** argv)
         */
-       
        /*****
         * 2) Work environment (e.g., global data structures, file data, etc.) would
         *    be setup here.
@@ -94,7 +94,7 @@ int main(int argc, char** argv)
        init_litmus();
-        /***** 
+        /*****
         * 4) Launch threads.
         */
        for (i = 0; i < NUM_THREADS; i++) {
@@ -102,15 +102,15 @@ int main(int argc, char** argv)
                pthread_create(task + i, NULL, rt_thread, (void *) (ctx + i));
        }
-        
        /*****
         * 5) Wait for RT threads to terminate.
         */
        for (i = 0; i < NUM_THREADS; i++)
                pthread_join(task[i], NULL);
-        
-        /***** 
+        /*****
         * 6) Clean up, maybe print results and stats, and exit.
         */
        return 0;
@@ -166,7 +166,7 @@ void* rt_thread(void *tcontext)
         */
        CALL( task_mode(LITMUS_RT_TASK) );
-        /* The task is now executing as a real-time task if the call didn't fail. 
+        /* The task is now executing as a real-time task if the call didn't fail.
         */
@@ -178,11 +178,11 @@ void* rt_thread(void *tcontext)
                /* Wait until the next job is released. */
                sleep_next_period();
                /* Invoke job. */
-                do_exit = job();                
+                do_exit = job();
        } while (!do_exit);
-        
        /*****
         * 4) Transition to background mode.
         */
@@ -194,7 +194,7 @@ void* rt_thread(void *tcontext)
-int job(void) 
+int job(void)
 {
        /* Do real-time calculation. */
diff --git a/bin/base_task.c b/bin/base_task.c
index df0c5a2..2b0a49c 100644
--- a/bin/base_task.c
+++ b/bin/base_task.c
@@ -1,6 +1,6 @@
-/* based_task.c -- A basic real-time task skeleton. 
+/* based_task.c -- A basic real-time task skeleton.
 *
- * This (by itself useless) task demos how to setup a 
+ * This (by itself useless) task demos how to setup a
 * single-threaded LITMUS^RT real-time task.
 */
@@ -20,7 +20,7 @@
 */
 #include "litmus.h"
-/* Next, we define period and execution cost to be constant. 
+/* Next, we define period and execution cost to be constant.
 * These are only constants for convenience in this example, they can be
 * determined at run time, e.g., from command line parameters.
 *
@@ -44,13 +44,13 @@
        } while (0)
-/* Declare the periodically invoked job. 
+/* Declare the periodically invoked job.
 * Returns 1 -> task should exit.
 *         0 -> task should continue.
 */
 int job(void);
-/* typically, main() does a couple of things: 
+/* typically, main() does a couple of things:
 *      1) parse command line parameters, etc.
 *      2) Setup work environment.
 *      3) Setup real-time parameters.
@@ -60,7 +60,7 @@ int job(void);
 *      7) Clean up and exit.
 *
 * The following main() function provides the basic skeleton of a single-threaded
- * LITMUS^RT real-time task. In a real program, all the return values should be 
+ * LITMUS^RT real-time task. In a real program, all the return values should be
 * checked for errors.
 */
 int main(int argc, char** argv)
@@ -100,9 +100,9 @@ int main(int argc, char** argv)
        /*****
-         * 3) Setup real-time parameters. 
+         * 3) Setup real-time parameters.
-         *    In this example, we create a sporadic task that does not specify a 
+         *    In this example, we create a sporadic task that does not specify a
-         *    target partition (and thus is intended to run under global scheduling). 
+         *    target partition (and thus is intended to run under global scheduling).
         *    If this were to execute under a partitioned scheduler, it would be assigned
         *    to the first partition (since partitioning is performed offline).
         */
@@ -124,7 +124,7 @@ int main(int argc, char** argv)
         */
        CALL( task_mode(LITMUS_RT_TASK) );
-        /* The task is now executing as a real-time task if the call didn't fail. 
+        /* The task is now executing as a real-time task if the call didn't fail.
         */
@@ -136,11 +136,11 @@ int main(int argc, char** argv)
                /* Wait until the next job is released. */
                sleep_next_period();
                /* Invoke job. */
-                do_exit = job();                
+                do_exit = job();
        } while (!do_exit);
-        
        /*****
         * 6) Transition to background mode.
         */
@@ -148,14 +148,14 @@ int main(int argc, char** argv)
-        /***** 
+        /*****
         * 7) Clean up, maybe print results and stats, and exit.
         */
        return 0;
 }
-int job(void) 
+int job(void)
 {
        /* Do real-time calculation. */
diff --git a/bin/null_call.c b/bin/null_call.c
index d714e77..bab8e73 100644
--- a/bin/null_call.c
+++ b/bin/null_call.c
@@ -16,7 +16,7 @@ static void time_null_call(void)
        t2 = get_cycles();
        if (ret != 0)
                perror("null_call");
-        printf("%10" CYCLES_FMT ", " 
+        printf("%10" CYCLES_FMT ", "
               "%10" CYCLES_FMT ", "
               "%10" CYCLES_FMT ", "
               "%10" CYCLES_FMT ", "
@@ -38,7 +38,7 @@ int main(int argc, char **argv)
 {
        double delay;
        struct timespec sleep_time;
-        
        if (argc == 2) {
                delay = atof(argv[1]);
                sleep_time = sec2timespec(delay);
diff --git a/bin/release_ts.c b/bin/release_ts.c
index 7752097..f745c52 100644
--- a/bin/release_ts.c
+++ b/bin/release_ts.c
@@ -31,35 +31,14 @@ void usage(char *error) {
 void wait_until_ready(int expected)
 {
        int ready = 0, all = 0;
-        char buf[100];
        int loops = 0;
-        ssize_t len;
-        
        do {
                if (loops++ > 0)
                        sleep(1);
-                len = read_file(LITMUS_STATS_FILE, buf, sizeof(buf) - 1);
+                if (!read_litmus_stats(&ready, &all))
-                if (len < 0) {
+                        perror("read_litmus_stats");
-                        fprintf(stderr,
+        } while (expected > ready || (!expected && ready < all));
-                                "(EE) Error while reading '%s': %m.\n"
-                                "(EE) Ignoring -w option.\n",
-                                LITMUS_STATS_FILE);
-                        break;
-                } else {
-                        len = sscanf(buf,
-                                     "real-time tasks   = %d\n"
-                                     "ready for release = %d\n",
-                                     &all, &ready);
-                        if (len != 2) {
-                                fprintf(stderr, 
-                                        "(EE) Could not parse '%s'.\n"
-                                        "(EE) Ignoring -w option.\n",
-                                        LITMUS_STATS_FILE);
-                                break;
-                        }
-                }
-        } while (expected > ready || ready < all);
 }
 int main(int argc, char** argv)
@@ -69,7 +48,7 @@ int main(int argc, char** argv)
        int wait = 0;
        int expected = 0;
        int opt;
-      
        while ((opt = getopt(argc, argv, OPTSTR)) != -1) {
                switch (opt) {
                case 'd':
@@ -79,6 +58,7 @@ int main(int argc, char** argv)
                        wait = 1;
                        break;
                case 'f':
+                        wait = 1;
                        expected = atoi(optarg);
                        break;
                case ':':
@@ -99,7 +79,7 @@ int main(int argc, char** argv)
                perror("release task system");
                exit(1);
        }
-        
        printf("Released %d real-time tasks.\n", released);
        return 0;
diff --git a/bin/rt_launch.c b/bin/rt_launch.c
index 84a5e6c..db7a8b4 100644
--- a/bin/rt_launch.c
+++ b/bin/rt_launch.c
@@ -29,7 +29,7 @@ int launch(void *task_info_p) {
 }
 void usage(char *error) {
-        fprintf(stderr, "%s\nUsage: rt_launch [-w][-v][-p cpu][-c hrt | srt | be] wcet period program [arg1 arg2 ...]\n"
+        fprintf(stderr, "%s\nUsage: rt_launch [-w][-v][-p cpu][-q prio][-c hrt | srt | be] wcet period program [arg1 arg2 ...]\n"
                        "\t-w\tSynchronous release\n"
                        "\t-v\tVerbose\n"
                        "\t-p\tcpu (or initial cpu)\n"
@@ -41,9 +41,9 @@ void usage(char *error) {
 }
-#define OPTSTR "p:c:vw"
+#define OPTSTR "p:c:vwq:"
-int main(int argc, char** argv) 
+int main(int argc, char** argv)
 {
        int ret;
        lt_t wcet;
@@ -54,7 +54,8 @@ int main(int argc, char** argv)
        int verbose = 0;
        int wait = 0;
        startup_info_t info;
-        task_class_t rt_class = RT_CLASS_HARD;
+        task_class_t cls = RT_CLASS_HARD;
+        unsigned int priority = LITMUS_LOWEST_PRIORITY;
        while ((opt = getopt(argc, argv, OPTSTR)) != -1) {
                switch (opt) {
@@ -68,9 +69,14 @@ int main(int argc, char** argv)
                        cpu = atoi(optarg);
                        migrate = 1;
                        break;
+                case 'q':
+                        priority = atoi(optarg);
+                        if (!litmus_is_valid_fixed_prio(priority))
+                                usage("Invalid priority.");
+                        break;
                case 'c':
-                        rt_class = str2class(optarg);
+                        cls = str2class(optarg);
-                        if (rt_class == -1)
+                        if (cls == -1)
                                usage("Unknown task class.");
                        break;
@@ -87,7 +93,7 @@ int main(int argc, char** argv)
        signal(SIGUSR1, SIG_IGN);
        if (argc - optind < 3)
-                usage("Arguments missing.");       
+                usage("Arguments missing.");
        wcet   = ms2lt(atoi(argv[optind + 0]));
        period = ms2lt(atoi(argv[optind + 1]));
        if (wcet <= 0)
@@ -107,13 +113,12 @@ int main(int argc, char** argv)
                if (ret < 0)
                        bail_out("could not migrate to target partition");
        }
-        ret = __create_rt_task(launch, &info, cpu, wcet, period, rt_class);
+        ret = __create_rt_task(launch, &info, cpu, wcet, period, priority, cls);
-        
        if (ret < 0)
                bail_out("could not create rt child process");
        else if (verbose)
                printf("%d\n", ret);
-        return 0;       
+        return 0;
 }
diff --git a/bin/rtspin.c b/bin/rtspin.c
index cbfaee2..6632027 100644
--- a/bin/rtspin.c
+++ b/bin/rtspin.c
@@ -4,6 +4,7 @@
 #include <stdlib.h>
 #include <unistd.h>
 #include <time.h>
+#include <string.h>
 #include <assert.h>
@@ -21,8 +22,10 @@ static void usage(char *error) {
                "       rt_spin -l\n"
                "\n"
                "COMMON-OPTS = [-w] [-p PARTITION] [-c CLASS] [-s SCALE]\n"
+                "              [-X LOCKING-PROTOCOL] [-L CRITICAL SECTION LENGTH] [-Q RESOURCE-ID]"
                "\n"
-                "WCET and PERIOD are milliseconds, DURATION is seconds.\n");
+                "WCET and PERIOD are milliseconds, DURATION is seconds.\n"
+                "CRITICAL SECTION LENGTH is in milliseconds.\n");
        exit(EXIT_FAILURE);
 }
@@ -77,7 +80,7 @@ static void get_exec_times(const char *file, const int column,
                for (cur_col = 1; cur_col < column; ++cur_col) {
                        /* discard input until we get to the column we want */
-                        fscanf(fstream, "%*s,");
+                        int unused __attribute__ ((unused)) = fscanf(fstream, "%*s,");
                }
                /* get the desired exec. time */
@@ -150,31 +153,37 @@ static void debug_delay_loop(void)
        }
 }
-static int job(double exec_time, double program_end)
+static int job(double exec_time, double program_end, int lock_od, double cs_length)
 {
-        int exit = 0;
+        double chunk1, chunk2;
-        if (wctime() > program_end) {
-                exit = 1;
+        if (wctime() > program_end)
-        }
+                return 0;
        else {
-                LITMUS_TRY {
+                if (lock_od >= 0) {
+                        /* simulate critical section somewhere in the middle */
+                        chunk1 = drand48() * (exec_time - cs_length);
+                        chunk2 = exec_time - cs_length - chunk1;
+                        /* non-critical section */
+                        loop_for(chunk1, program_end + 1);
+                        /* critical section */
+                        litmus_lock(lock_od);
+                        loop_for(cs_length, program_end + 1);
+                        litmus_unlock(lock_od);
+                        /* non-critical section */
+                        loop_for(chunk2, program_end + 2);
+                } else {
                        loop_for(exec_time, program_end + 1);
                }
-                LITMUS_CATCH(SIG_BUDGET) {
-                        fprintf(stdout, "Exhausted budget! Finishing job NOW!\n");
-                }
-                END_LITMUS_TRY;
-        }
-        if (!exit) {
                sleep_next_period();
+                return 1;
        }
-        return !exit;
 }
-#define OPTSTR "p:c:wlveio:f:s:q:"
+#define OPTSTR "p:c:wlveio:f:s:q:X:L:Q:"
 int main(int argc, char** argv)
 {
        int ret;
@@ -191,11 +200,18 @@ int main(int argc, char** argv)
        const char *file = NULL;
        int want_enforcement = 0;
        int want_signals = 0;
-        double duration = 0, start;
+        double duration = 0, start = 0;
        double *exec_times = NULL;
        double scale = 1.0;
-        task_class_t rt_class = RT_CLASS_HARD;
+        task_class_t cls = RT_CLASS_HARD;
-        int cur_job, num_jobs;
+        int cur_job = 0, num_jobs = 0;
+        /* locking */
+        int lock_od = -1;
+        int resource_id = 0;
+        const char *lock_namespace = "./rtspin-locks";
+        int protocol = -1;
+        double cs_length = 1; /* millisecond */
        progname = argv[0];
@@ -214,8 +230,8 @@ int main(int argc, char** argv)
                                usage("Invalid priority.");
                        break;
                case 'c':
-                        rt_class = str2class(optarg);
+                        cls = str2class(optarg);
-                        if (rt_class == -1)
+                        if (cls == -1)
                                usage("Unknown task class.");
                        break;
                case 'e':
@@ -236,6 +252,21 @@ int main(int argc, char** argv)
                case 's':
                        scale = atof(optarg);
                        break;
+                case 'X':
+                        protocol = lock_protocol_for_name(optarg);
+                        if (protocol < 0)
+                                usage("Unknown locking protocol specified.");
+                        break;
+                case 'L':
+                        cs_length = atof(optarg);
+                        if (cs_length <= 0)
+                                usage("Invalid critical section length.");
+                        break;
+                case 'Q':
+                        resource_id = atoi(optarg);
+                        if (resource_id <= 0 && strcmp(optarg, "0"))
+                                usage("Invalid resource ID.");
+                        break;
                case ':':
                        usage("Argument missing.");
                        break;
@@ -251,6 +282,8 @@ int main(int argc, char** argv)
                return 0;
        }
+        srand(getpid());
        if (file) {
                get_exec_times(file, column, &num_jobs, &exec_times);
@@ -296,12 +329,12 @@ int main(int argc, char** argv)
                        bail_out("could not migrate to target partition");
        }
-        ret = sporadic_task_ns(wcet, period, 0, cpu, priority, rt_class,
+        ret = sporadic_task_ns(wcet, period, 0, cpu, priority, cls,
-                               want_enforcement ? PRECISE_ENFORCEMENT
+                                want_enforcement ? PRECISE_ENFORCEMENT
-                                                : NO_ENFORCEMENT,
+                                                 : NO_ENFORCEMENT,
-                                   want_signals ? PRECISE_SIGNALS
+                                want_signals ? PRECISE_SIGNALS
-                                                                : NO_SIGNALS,
+                                                 : NO_SIGNALS,
-                               migrate);
+                                migrate);
        if (ret < 0)
                bail_out("could not setup rt task params");
@@ -316,6 +349,15 @@ int main(int argc, char** argv)
        if (ret != 0)
                bail_out("could not become RT task");
+        if (protocol >= 0) {
+                /* open reference to semaphore */
+                lock_od = litmus_open_lock(protocol, resource_id, lock_namespace, &cpu);
+                if (lock_od < 0) {
+                        perror("litmus_open_lock");
+                        usage("Could not open lock.");
+                }
+        }
        if (wait) {
                ret = wait_for_ts_release();
                if (ret != 0)
@@ -329,14 +371,13 @@ int main(int argc, char** argv)
                for (cur_job = 0; cur_job < num_jobs; ++cur_job) {
                        /* convert job's length to seconds */
                        job(exec_times[cur_job] * 0.001 * scale,
-                                        start + duration);
+                            start + duration,
+                            lock_od, cs_length * 0.001);
                }
        } else {
-                /* conver to seconds and scale */
+                /* convert to seconds and scale */
-                int run = 1;
+                while (job(wcet_ms * 0.001 * scale, start + duration,
-                while (run) {
+                           lock_od, cs_length * 0.001));
-                        run = job(wcet_ms * 0.001 * scale, start + duration);
-                }
        }
        ret = task_mode(BACKGROUND_TASK);
diff --git a/bin/uncache.c b/bin/uncache.c
new file mode 100644
index 0000000..b6f6913
--- /dev/null
+++ b/bin/uncache.c
@@ -0,0 +1,381 @@
+#include <stdio.h>
+#include <stdlib.h>
+#include <unistd.h>
+#include <time.h>
+#include <sched.h>
+#include <assert.h>
+#include <string.h>
+#include <stdint.h>
+#include <inttypes.h>
+#include <sys/fcntl.h>
+#include <sys/mman.h>
+/* Test tool for validating Litmus's uncache device.     */
+/* Tool also reports basic cache vs. sysmem statistics.  */
+/* Compile with '-O2' for significantly greater margins  */
+/* in performance between cache and sysmem:              */
+/* (Intel Xeon X5650)                                    */
+/*    -g -> uncache is 30x slower                        */
+/*    -O2 -> uncache is >100x slower                     */
+/* System page size in bytes; set once in main() from sysconf(_SC_PAGE_SIZE). */
+int PAGE_SIZE;
+/* Number of pages mapped by the timing test (do_data()). */
+#define NR_PAGES 16
+/* Device node that is mmap()ed to obtain uncacheable pages. */
+#define UNCACHE_DEV "/dev/litmus/uncache"
+/* volatile forces a read from memory (or cache) on every reference. Note
+   that volatile does not keep data out of the cache! */
+typedef volatile char* pbuf_t;
+/* Writes val to the first byte of every page in [addr, addr + size).
+   addr must be page aligned. The whole sweep is repeated
+   nr_pages * PAGE_SIZE times. Always returns 0.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int linear_write(pbuf_t addr, int size, char val)
+{
+        pbuf_t end = addr + size;
+        pbuf_t step;
+        int nr_pages = (unsigned long)(end - addr)/PAGE_SIZE;
+        int times = nr_pages * PAGE_SIZE;
+        int i;
+        for (i = 0; i < times; ++i)
+                for(step = addr; step < end; step += PAGE_SIZE)
+                        *step = val;
+        return 0;
+}
+/* Reads the first byte of every page in [addr, addr + size) and checks it
+   against val; the sweep is repeated nr_pages * PAGE_SIZE times.
+   Returns 0 if every read matched, -1 at the first mismatch.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int linear_read(pbuf_t addr, int size, char val)
+{
+        pbuf_t end = addr + size;
+        pbuf_t step;
+        int nr_pages = (unsigned long)(end - addr)/PAGE_SIZE;
+        int times = nr_pages * PAGE_SIZE;
+        int i;
+        for (i = 0; i < times; ++i)
+                for(step = addr; step < end; step += PAGE_SIZE) {
+                        if (*step != val)
+                                return -1;
+                }
+        return 0;
+}
+/* Writes val to *data nr times. Because pbuf_t points to volatile data,
+   every iteration performs a real store. Always returns 0.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int hammer_write(pbuf_t data, char val, int nr)
+{
+        int i;
+        for (i = 0; i < nr; ++i)
+                *data = val;
+        return 0;
+}
+/* Reads *data nr times and compares each value against val.
+   Returns 0 if all reads matched, -1 at the first mismatch.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int hammer_read(pbuf_t data, char val, int nr)
+{
+        int i;
+        for (i = 0; i < nr; ++i) {
+                if (*data != val)
+                        return -1;
+        }
+        return 0;
+}
+/* Runs the access pattern 'trials' times on data: HAMMER_TIME writes of
+   VAL to the first byte, followed by HAMMER_TIME reads that must all
+   return VAL. The page-by-page linear sweep is compiled out (#if 0), so
+   size is currently unused.
+   Returns 0 on success; prints which step failed and returns -1 otherwise.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int test(pbuf_t data, int size, int trials)
+{
+        const int HAMMER_TIME = 10000;  /* can't cache this! */
+        const char VAL = 0x55;
+        int t;
+        for(t = 0; t < trials; ++t) {
+#if 0
+                if (linear_write(data, size, VAL) != 0) {
+                        printf("failed linear_write()\n");
+                        return -1;
+                }
+                if (linear_read(data, size, VAL) != 0) {
+                        printf("failed linear_read()\n");
+                        return -1;
+                }
+#endif
+                /* hammer at the first byte in the array */
+                if (hammer_write(data, VAL, HAMMER_TIME) != 0) {
+                        printf("failed hammer_write()\n");
+                        return -1;
+                }
+                if (hammer_read(data, VAL, HAMMER_TIME) != 0) {
+                        printf("failed hammer_read()\n");
+                        return -1;
+                }
+        }
+        return 0;
+}
+/* Stores sec/nsec in *ts so that 0 <= tv_nsec < 1000000000, carrying whole
+   seconds between the two fields. nsec may be negative or exceed one
+   second on entry.
+   The carry test is '>=': with '>' an input of exactly 1000000000 ns was
+   stored as-is, leaving an out-of-range tv_nsec.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline void timespec_normalize(struct timespec* ts, time_t sec, int64_t nsec)
+{
+        while(nsec >= 1000000000LL) {
+                /* empty asm that marks nsec as read and written; presumably
+                   keeps the compiler from rewriting the loop as a division
+                   (same idiom as Linux's set_normalized_timespec) */
+                __asm__("" : "+rm"(nsec));
+                nsec -= 1000000000LL;
+                ++sec;
+        }
+        while(nsec < 0) {
+                __asm__("" : "+rm"(nsec));
+                nsec += 1000000000LL;
+                --sec;
+        }
+        ts->tv_sec = sec;
+        ts->tv_nsec = nsec;
+}
+/* Returns lhs - rhs as a normalized timespec.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline struct timespec timespec_sub(struct timespec lhs, struct timespec rhs)
+{
+        struct timespec delta;
+        timespec_normalize(&delta, lhs.tv_sec - rhs.tv_sec, lhs.tv_nsec - rhs.tv_nsec);
+        return delta;
+}
+/* Returns lhs + rhs as a normalized timespec.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline struct timespec timespec_add(struct timespec lhs, struct timespec rhs)
+{
+        struct timespec sum;
+        timespec_normalize(&sum, lhs.tv_sec + rhs.tv_sec, lhs.tv_nsec + rhs.tv_nsec);
+        return sum;
+}
+/* Converts ts to whole microseconds; the sub-microsecond part of tv_nsec
+   is truncated.
+   static: a plain 'inline' definition provides no external definition in
+   C99/C11, so a call that is not inlined would fail to link. */
+static inline int64_t timespec_to_us(struct timespec ts)
+{
+        /* widen first so the multiplication is done in 64 bits even where
+           time_t is narrower */
+        int64_t t = (int64_t)ts.tv_sec * 1000000LL;
+        t += ts.tv_nsec / 1000LL;
+        return t;
+}
+/* Maps NR_PAGES pages -- from the uncache device when do_uncache is
+   non-zero, anonymous (cacheable) memory otherwise -- runs test() on the
+   mapping and measures the thread CPU time it consumed.
+   On success returns 0 and, if time is non-NULL, stores the elapsed
+   microseconds in *time. Returns -1 if the mapping cannot be set up or
+   test() fails. The process tries to switch to SCHED_FIFO for the
+   measurement and is not switched back afterwards. */
+int do_data(int do_uncache, int64_t* time)
+{
+        int size;
+        int prot = PROT_READ | PROT_WRITE;
+        int flags = MAP_PRIVATE;
+        pbuf_t data;
+        struct sched_param fifo_params;
+        struct timespec start, end;
+        int64_t elapsed;
+        int trials = 1000;
+        printf("Running data access test.\n");
+        /* best effort: the result is not checked */
+        mlockall(MCL_CURRENT | MCL_FUTURE);
+        memset(&fifo_params, 0, sizeof(fifo_params));
+        fifo_params.sched_priority = sched_get_priority_max(SCHED_FIFO);
+        size = PAGE_SIZE*NR_PAGES;
+        printf("Allocating %d %s pages.\n", NR_PAGES, (do_uncache) ?
+                                        "uncacheable" : "cacheable");
+        if (do_uncache) {
+                int fd = open(UNCACHE_DEV, O_RDWR);
+                if (fd < 0) {
+                        /* report why; the generic failure message below
+                           is still printed */
+                        perror("open " UNCACHE_DEV);
+                        data = MAP_FAILED;
+                }
+                else {
+                        data = mmap(NULL, size, prot, flags, fd, 0);
+                        /* the mapping stays valid after the descriptor
+                           is closed */
+                        close(fd);
+                }
+        }
+        else {
+                /* Accessed data will probably fit in L1, so this will go VERY fast.
+                   Code should also have little-to-no pipeline stalls. */
+                flags |= MAP_ANONYMOUS;
+                data = mmap(NULL, size, prot, flags, -1, 0);
+        }
+        if (data == MAP_FAILED) {
+                printf("Failed to alloc data! "
+                           "Are you running Litmus? "
+                           "Is Litmus broken?\n");
+                return -1;
+        }
+        else {
+                /* %p requires a void pointer argument */
+                printf("Data allocated at %p.\n", (void*)data);
+        }
+        printf("Beginning tests...\n");
+        if (sched_setscheduler(getpid(), SCHED_FIFO, &fifo_params)) {
+                printf("(Could not become SCHED_FIFO task.) Are you running as root?\n");
+        }
+        /* observations suggest that no warmup phase is needed. */
+        clock_gettime(CLOCK_THREAD_CPUTIME_ID, &start);
+        if (test(data, size, trials) != 0) {
+                printf("Test failed!\n");
+                munmap((char*)data, size);
+                return -1;
+        }
+        clock_gettime(CLOCK_THREAD_CPUTIME_ID, &end);
+        elapsed = timespec_to_us(timespec_sub(end, start));
+        /* PRId64 matches int64_t on every ABI; %ld only does on LP64 */
+        printf("%s Time: %" PRId64 "us\n", (do_uncache) ?
+                                        "Uncache" : "Cache", elapsed);
+        munmap((char*)data, size);
+        if(time)
+                *time = elapsed;
+        return 0;
+}
+/* Compares the runtime of cached vs. uncached accesses: runs do_data()
+   once on cacheable and once on uncacheable pages and prints the
+   uncached/cached time ratio.
+   Returns 0 if both runs succeed and the ratio is at least thresh;
+   returns -1 if a run fails, the cached run took no measurable time, or
+   the ratio is below thresh. */
+int do_data_compare(void)
+{
+        const double thresh = 1.3;
+        int ret = 0;
+        double ratio;
+        int64_t cache_time = 0, uncache_time = 0;
+        printf("Timing cached pages...\n");
+        ret = do_data(0, &cache_time);
+        if (ret != 0)
+                goto out;
+        printf("Timing uncached pages...\n");
+        ret = do_data(1, &uncache_time);
+        if (ret != 0)
+                goto out;
+        if (cache_time <= 0) {
+                /* below microsecond resolution: the ratio would be inf/nan */
+                printf("Cached run took no measurable time; cannot compute ratio.\n");
+                ret = -1;
+                goto out;
+        }
+        ratio = (double)uncache_time/(double)cache_time;
+        printf("Uncached/Cached Ratio: %f\n", ratio);
+        if (ratio < thresh) {
+                printf("Ratio is unexpectedly small (< %f)! "
+                                " Uncache broken? Are you on kvm?\n", thresh);
+                ret = -1;
+        }
+out:
+        return ret;
+}
+/* Tries to max out uncache allocations. Each round maps up to max_mmaps
+   regions of mmap_size bytes from the uncache device and unmaps them
+   again; the region size doubles after every fully successful round and
+   the test stops at the first mmap() failure.
+   Under normal conditions (non-mlock), pages should spill into swap.
+   Uncache pages are not locked in memory.
+   Returns 0 once the limit was hit, -1 if the bookkeeping array cannot be
+   allocated or the uncache device cannot be opened. */
+int do_max_alloc(void)
+{
+        int fd;
+        int good = 1;
+        int count = 0;
+        uint64_t mmap_size = PAGE_SIZE; /* start at one page per mmap */
+        /* half of default limit on ubuntu. (see /proc/sys/vm/max_map_count) */
+        int max_mmaps = 32765;
+        pbuf_t* maps = calloc(max_mmaps, sizeof(*maps));
+        if (!maps) {
+                printf("failed to alloc pointers for pages\n");
+                return -1;
+        }
+        printf("Testing max amount of uncache data. System may get wonkie (OOM Killer)!\n");
+        fd = open(UNCACHE_DEV, O_RDWR);
+        if (fd < 0) {
+                /* without the device the first mmap() would fail and the
+                   run would be reported as a successful "max out" */
+                perror("open " UNCACHE_DEV);
+                free(maps);
+                return -1;
+        }
+        do {
+                int i;
+                int nr_pages = mmap_size/PAGE_SIZE;
+                printf("Testing mmaps of %d pages.\n", nr_pages);
+                count = 0;
+                for (i = 0; (i < max_mmaps) && good; ++i) {
+                        pbuf_t data = mmap(NULL, mmap_size, PROT_READ | PROT_WRITE, MAP_PRIVATE | MAP_POPULATE, fd, 0);
+                        if (data != MAP_FAILED) {
+                                maps[i] = data;
+                                ++count;
+                        }
+                        else {
+                                perror(NULL);
+                                good = 0;
+                        }
+                }
+                for (i = 0; i < count; ++i) {
+                        if (maps[i])
+                                munmap((char*)(maps[i]), mmap_size);
+                }
+                memset(maps, 0, sizeof(maps[0])*max_mmaps);
+                /* only grow after a fully successful round, so that the
+                   summary below reports the size 'count' refers to */
+                if (good)
+                        mmap_size *= 2; /* let's do it again with bigger allocations */
+        }while(good);
+        free(maps);
+        close(fd);
+        /* PRIu64 matches uint64_t on every ABI; %lu only does on LP64 */
+        printf("Maxed out allocs with %d mmaps of %" PRIu64 " pages in size.\n",
+                count, mmap_size/PAGE_SIZE);
+        return 0;
+}
+/* Which test main() runs; chosen with the command line options in OPTSTR. */
+typedef enum
+{
+        UNCACHE,        /* -u (default): do_data() on uncache-device pages */
+        CACHE,          /* -c: do_data() on anonymous (cacheable) pages */
+        COMPARE,        /* -x: do_data_compare() */
+        MAX_ALLOC       /* -a: do_max_alloc() */
+} test_t;
+/* getopt() option string; none of the options takes an argument. */
+#define OPTSTR "ucxa"
+/* Selects one test from the command line (-u uncached timing [default],
+   -c cached timing, -x cached vs. uncached comparison, -a allocation
+   limit), runs it and returns its result: 0 on success, -1 on failure.
+   Exits early if the options are invalid or the page size cannot be
+   determined. */
+int main(int argc, char** argv)
+{
+        int ret;
+        test_t test = UNCACHE;
+        int opt;
+        PAGE_SIZE = sysconf(_SC_PAGE_SIZE);
+        if (PAGE_SIZE <= 0) {
+                /* the tests use PAGE_SIZE as a mapping size and as a divisor */
+                printf("could not determine page size\n");
+                exit(-1);
+        }
+        while((opt = getopt(argc, argv, OPTSTR)) != -1) {
+                switch(opt) {
+                        case 'c':
+                                test = CACHE;
+                                break;
+                        case 'u':
+                                test = UNCACHE;
+                                break;
+                        case 'x':
+                                test = COMPARE;
+                                break;
+                        case 'a':
+                                test = MAX_ALLOC;
+                                break;
+                        case ':':
+                                printf("missing option\n");
+                                exit(-1);
+                        case '?':
+                        default:
+                                printf("bad argument\n");
+                                exit(-1);
+                }
+        }
+        printf("Page Size: %d\n", PAGE_SIZE);
+        switch(test)
+        {
+        case CACHE:
+                ret = do_data(0, NULL);
+                break;
+        case UNCACHE:
+                ret = do_data(1, NULL);
+                break;
+        case COMPARE:
+                ret = do_data_compare();
+                break;
+        case MAX_ALLOC:
+                ret = do_max_alloc();
+                break;
+        default:
+                printf("invalid test\n");
+                ret = -1;
+                break;
+        }
+        if (ret != 0) {
+                printf("Test failed.\n");
+        }
+        return ret;
+}
diff --git a/gpu/aux_threads.c b/gpu/aux_threads.c
index 1e168c6..1711c40 100644
--- a/gpu/aux_threads.c
+++ b/gpu/aux_threads.c
@@ -1,4 +1,4 @@
-/* based_mt_task.c -- A basic multi-threaded real-time task skeleton. 
+/* based_mt_task.c -- A basic multi-threaded real-time task skeleton.
 *
 * This (by itself useless) task demos how to setup a multi-threaded LITMUS^RT
 * real-time task. Familiarity with the single threaded example (base_task.c)
@@ -48,7 +48,7 @@ struct thread_context {
 void* rt_thread(void *tcontext);
 void* aux_thread(void *tcontext);
-/* Declare the periodically invoked job. 
+/* Declare the periodically invoked job.
 * Returns 1 -> task should exit.
 *         0 -> task should continue.
 */
@@ -112,7 +112,7 @@ int main(int argc, char** argv)
        ctx = calloc(NUM_AUX_THREADS, sizeof(struct thread_context));
        task = calloc(NUM_AUX_THREADS, sizeof(pthread_t));
-        
        //lt_t delay = ms2lt(1000);
        /*****
@@ -199,9 +199,9 @@ int main(int argc, char** argv)
                        printf("child %d: %fs\n", i, time);
                }
        }
-        
-        /***** 
+        /*****
         * 6) Clean up, maybe print results and stats, and exit.
         */
        return 0;
@@ -271,7 +271,7 @@ void* rt_thread(void *tcontext)
        wait_for_ts_release();
-        /* The task is now executing as a real-time task if the call didn't fail. 
+        /* The task is now executing as a real-time task if the call didn't fail.
         */
@@ -304,7 +304,7 @@ void* rt_thread(void *tcontext)
        return ctx;
 }
-int job(void) 
+int job(void)
 {
        /* Do real-time calculation. */
diff --git a/gpu/dgl.c b/gpu/dgl.c
index dc68ead..42a3ae2 100644
--- a/gpu/dgl.c
+++ b/gpu/dgl.c
@@ -177,7 +177,7 @@ void* rt_thread(void* _ctx)
                        xfprintf(stdout, "ikglp od = %d\n", ctx->ikglp);
        }
-        
        for (i = 0; i < NUM_SEMS; i++) {
                if(!USE_PRIOQ) {
                        ctx->od[i] = open_fifo_sem(ctx->fd, i+1);
@@ -208,29 +208,29 @@ void* rt_thread(void* _ctx)
                int last = (first + NEST_DEPTH - 1 >= NUM_SEMS) ? NUM_SEMS - 1 : first + NEST_DEPTH - 1;
                int dgl_size = last - first + 1;
                int dgl[dgl_size];
-                
                // construct the DGL
                for(i = first; i <= last; ++i) {
                        dgl[i-first] = ctx->od[i];
                }
-                
-                
                if(NUM_REPLICAS) {
                        replica = litmus_lock(ctx->ikglp);
                        xfprintf(stdout, "[%d] got ikglp replica %d.\n", ctx->id, replica);
                }
-                
                litmus_dgl_lock(dgl, dgl_size);
                xfprintf(stdout, "[%d] acquired dgl.\n", ctx->id);
-                
                do_exit = job(ctx);
-                
                xfprintf(stdout, "[%d] unlocking dgl.\n", ctx->id);
                litmus_dgl_unlock(dgl, dgl_size);
-                
-                if(NUM_REPLICAS) {              
+                if(NUM_REPLICAS) {
                        xfprintf(stdout, "[%d]: freeing ikglp replica %d.\n", ctx->id, replica);
                        litmus_unlock(ctx->ikglp);
                }
@@ -249,7 +249,7 @@ void* rt_thread(void* _ctx)
        return NULL;
 }
-void dirty_kb(int kb) 
+void dirty_kb(int kb)
 {
        int32_t one_kb[256];
        int32_t sum = 0;
diff --git a/gpu/ikglptest.c b/gpu/ikglptest.c
index f802801..30623b7 100644
--- a/gpu/ikglptest.c
+++ b/gpu/ikglptest.c
@@ -172,7 +172,7 @@ struct avg_info feedback(int _a, int _b)
        }
        stdev = sqrtf(devsum/(NUM_SAMPLES-1));
-        
        ret.avg = avg;
        ret.stdev = stdev;
@@ -189,10 +189,10 @@ struct avg_info feedback(int _a, int _b)
 int main(int argc, char** argv)
 {
        int i;
-        struct thread_context* ctx;
+        struct thread_context* ctx = NULL;
-        struct thread_context* aux_ctx;
+        struct thread_context* aux_ctx = NULL;
-        pthread_t*           task;
+        pthread_t*           task = NULL;
-        pthread_t*           aux_task;
+        pthread_t*           aux_task = NULL;
        int fd;
        int opt;
@@ -291,7 +291,7 @@ int main(int argc, char** argv)
                        }
                }
        }
-        
        printf("Best:\ta = %d\tb = %d\t(b-a) = %d\tavg = %6.2f\tstdev = %6.2f\n", best_a, best_b, best_b - best_a, best.avg, best.stdev);
        printf("2nd:\ta = %d\tb = %d\t(b-a) = %d\tavg = %6.2f\tstdev = %6.2f\n", second_best_a, second_best_b, second_best_b - second_best_a, second_best.avg, second_best.stdev);
@@ -308,7 +308,7 @@ int main(int argc, char** argv)
                        }
        printf("Aaron:\tavg = %6.2f\tstd = %6.2f\n", avg_accum/TRIALS, std_accum/TRIALS);
-        
@@ -385,7 +385,7 @@ int affinity_distance(struct thread_context* ctx, int a, int b)
 {
        int i;
        int dist;
-        
        if(a >= 0 && b >= 0) {
                for(i = 0; i <= 3; ++i) {
                        if(a>>i == b>>i) {
@@ -397,25 +397,25 @@ int affinity_distance(struct thread_context* ctx, int a, int b)
        }
        else {
                dist = 0;
-        }       
+        }
-        
 out:
-        //printf("[%d]: distance: %d -> %d = %d\n", ctx->id, a, b, dist);       
+        //printf("[%d]: distance: %d -> %d = %d\n", ctx->id, a, b, dist);
-        
        ++(ctx->mig_count[dist]);
-        
        return dist;
-        
 //      int groups[] = {2, 4, 8};
 //      int i;
-//      
+//
 //      if(a < 0 || b < 0)
 //              return (sizeof(groups)/sizeof(groups[0]));  // worst affinity
-//      
+//
 //      // no migration
 //      if(a == b)
 //              return 0;
-//      
+//
 //      for(i = 0; i < sizeof(groups)/sizeof(groups[0]); ++i) {
 //              if(a/groups[i] == b/groups[i])
 //                      return (i+1);
@@ -441,7 +441,7 @@ void* rt_thread(void* _ctx)
 {
        int i;
        int do_exit = 0;
-        int last_replica = -1;  
+        int last_replica = -1;
        struct thread_context *ctx = (struct thread_context*)_ctx;
@@ -472,13 +472,13 @@ void* rt_thread(void* _ctx)
                                                                          IKGLP_OPTIMAL_FIFO_LEN :
                                                                          IKGLP_UNLIMITED_FIFO_LEN,
                                                                ENABLE_AFFINITY
-                                                                );      
+                                                                );
        }
        if(ctx->kexclu < 0)
                perror("open_kexclu_sem");
        else
                printf("kexclu od = %d\n", ctx->kexclu);
-        
        for (i = 0; i < NUM_SEMS; ++i) {
                if(!USE_PRIOQ) {
                        ctx->od[i] = open_fifo_sem(ctx->fd, i + ctx->kexclu + 2);
@@ -508,21 +508,21 @@ void* rt_thread(void* _ctx)
                int dgl_size = last - first + 1;
                int replica = -1;
                int distance;
-                
-                int dgl[dgl_size];              
+                int dgl[dgl_size];
-                
                // construct the DGL
                for(i = first; i <= last; ++i) {
                        dgl[i-first] = ctx->od[i];
-                }               
+                }
-                
                replica = litmus_lock(ctx->kexclu);
                //printf("[%d] got kexclu replica %d.\n", ctx->id, replica);
                //fflush(stdout);
                distance = affinity_distance(ctx, replica, last_replica);
-                
                if(USE_DYNAMIC_GROUP_LOCKS) {
                        litmus_dgl_lock(dgl, dgl_size);
                }
@@ -531,24 +531,24 @@ void* rt_thread(void* _ctx)
                                litmus_lock(dgl[i]);
                        }
                }
-                
                //do_exit = nested_job(ctx, &count, &first, affinity_cost[distance]);
                do_exit = job(ctx, affinity_cost[distance]);
-                
                if(USE_DYNAMIC_GROUP_LOCKS) {
                        litmus_dgl_unlock(dgl, dgl_size);
                }
                else {
                        for(i = dgl_size - 1; i >= 0; --i) {
                                litmus_unlock(dgl[i]);
-                        }                       
+                        }
-                }               
+                }
-                
                //printf("[%d]: freeing kexclu replica %d.\n", ctx->id, replica);
                //fflush(stdout);
                litmus_unlock(ctx->kexclu);
-                
                last_replica = replica;
                if(SLEEP_BETWEEN_JOBS && !do_exit) {
@@ -567,7 +567,7 @@ void* rt_thread(void* _ctx)
         */
        TH_CALL( task_mode(BACKGROUND_TASK) );
-        for(i = 0; i < sizeof(ctx->mig_count)/sizeof(ctx->mig_count[0]); ++i) 
+        for(i = 0; i < sizeof(ctx->mig_count)/sizeof(ctx->mig_count[0]); ++i)
        {
                printf("[%d]: mig_count[%d] = %d\n", ctx->id, i, ctx->mig_count[i]);
        }
@@ -608,15 +608,15 @@ void* rt_thread(void* _ctx)
 //}
-void dirty_kb(int kb) 
+void dirty_kb(int kb)
-{       
+{
        int32_t one_kb[256];
        int32_t sum = 0;
        int32_t i;
        if(!kb)
-                return; 
+                return;
-        
        for (i = 0; i < 256; i++)
                sum += one_kb[i];
        kb--;
@@ -630,9 +630,9 @@ void dirty_kb(int kb)
 int job(struct thread_context* ctx, int runfactor)
 {
        //struct timespec tosleep = {0, 100000}; // 0.1 ms
-        
        //printf("[%d]: runfactor = %d\n", ctx->id, runfactor);
-        
        //dirty_kb(8 * runfactor);
        dirty_kb(1 * runfactor);
        //nanosleep(&tosleep, NULL);
diff --git a/gpu/locktest.c b/gpu/locktest.c
index bc4fc54..6a1219a 100644
--- a/gpu/locktest.c
+++ b/gpu/locktest.c
@@ -177,7 +177,7 @@ void* rt_thread(void* _ctx)
        return NULL;
 }
-void dirty_kb(int kb) 
+void dirty_kb(int kb)
 {
        int32_t one_kb[256];
        int32_t sum = 0;
diff --git a/gpu/nested.c b/gpu/nested.c
index 8c39152..edec46b 100644
--- a/gpu/nested.c
+++ b/gpu/nested.c
@@ -180,7 +180,7 @@ void* rt_thread(void* _ctx)
                int first = (int)(NUM_SEMS * (rand_r(&(ctx->rand)) / (RAND_MAX + 1.0)));
                int count = NEST_DEPTH;
                do_exit = nested_job(ctx, &count, &first);
-                
                if(SLEEP_BETWEEN_JOBS && !do_exit) {
                        sleep_next_period();
                }
@@ -226,7 +226,7 @@ int nested_job(struct thread_context* ctx, int *count, int *next)
-void dirty_kb(int kb) 
+void dirty_kb(int kb)
 {
        int32_t one_kb[256];
        int32_t sum = 0;
diff --git a/gpu/rtspin_fake_cuda.cpp b/gpu/rtspin_fake_cuda.cpp
index 78e4f60..247a74c 100644
--- a/gpu/rtspin_fake_cuda.cpp
+++ b/gpu/rtspin_fake_cuda.cpp
@@ -119,7 +119,7 @@ char *h_state_data = 0;
                mmap(NULL, s ,   \
                                PROT_READ | PROT_WRITE,  \
                                MAP_PRIVATE | MAP_ANONYMOUS | MAP_LOCKED,  \
-                                -1, 0) 
+                                -1, 0)
 #else
 #define c_malloc(s) malloc(s)
 #endif
@@ -144,38 +144,38 @@ cudaError_t cudaGetLastError()
 ////////////////////////////////////////////////////////////////////////
 struct ce_lock_state
-{       
+{
        int locks[2];
        size_t num_locks;
        size_t budget_remaining;
        bool locked;
-        
        ce_lock_state(int device_a, enum cudaMemcpyKind kind, size_t size, int device_b = -1) {
                num_locks = (device_a != -1) + (device_b != -1);
-                
                if(device_a != -1) {
                        locks[0] = (kind == cudaMemcpyHostToDevice) ?
                        CE_SEND_LOCKS[device_a] : CE_RECV_LOCKS[device_a];
                }
-                
                if(device_b != -1) {
                        assert(kind == cudaMemcpyDeviceToDevice);
-                        
                        locks[1] = CE_RECV_LOCKS[device_b];
-                        
                        if(locks[1] < locks[0]) {
                                int temp = locks[1];
                                locks[1] = locks[0];
                                locks[0] = temp;
                        }
                }
-                
                if(!ENABLE_CHUNKING)
                        budget_remaining = size;
                else
                        budget_remaining = CHUNK_SIZE;
        }
-        
        void lock() {
                if(USE_DYNAMIC_GROUP_LOCKS) {
                        litmus_dgl_lock(locks, num_locks);
@@ -189,7 +189,7 @@ struct ce_lock_state
                }
                locked = true;
        }
-        
        void unlock() {
                if(USE_DYNAMIC_GROUP_LOCKS) {
                        litmus_dgl_unlock(locks, num_locks);
@@ -204,15 +204,15 @@ struct ce_lock_state
                }
                locked = false;
        }
-        
        void refresh() {
                budget_remaining = CHUNK_SIZE;
        }
-        
        bool budgetIsAvailable(size_t tosend) {
                return(tosend >= budget_remaining);
        }
-        
        void decreaseBudget(size_t spent) {
                budget_remaining -= spent;
        }
@@ -225,53 +225,53 @@ cudaError_t __chunkMemcpy(void* a_dst, const void* a_src, size_t count,
 {
    cudaError_t ret = cudaSuccess;
    int remaining = count;
-    
    char* dst = (char*)a_dst;
    const char* src = (const char*)a_src;
-    
        // disable chunking, if needed, by setting chunk_size equal to the
        // amount of data to be copied.
        int chunk_size = (ENABLE_CHUNKING) ? CHUNK_SIZE : count;
        int i = 0;
-        
    while(remaining != 0)
    {
        int bytesToCopy = std::min(remaining, chunk_size);
-                
                if(state && state->budgetIsAvailable(bytesToCopy) && state->locked) {
                        //cutilSafeCall( cudaStreamSynchronize(streams[CUR_DEVICE]) );
                        ret = cudaGetLastError();
-                        
                        if(ret != cudaSuccess)
                        {
                                break;
                        }
-                        
                        state->unlock();
                        state->refresh(); // replentish.
                                                          // we can only run out of
                                                          // budget if chunking is enabled.
                                                          // we presume that init budget would
                                                          // be set to cover entire memcpy
-                                                          // if chunking were disabled.                 
+                                                          // if chunking were disabled.
                }
-                
                if(state && !state->locked) {
                        state->lock();
                }
-                
        //ret = cudaMemcpy(dst+i*chunk_size, src+i*chunk_size, bytesToCopy, kind);
                //cudaMemcpyAsync(dst+i*chunk_size, src+i*chunk_size, bytesToCopy, kind, streams[CUR_DEVICE]);
                if(state) {
                        state->decreaseBudget(bytesToCopy);
                }
-                
 //              if(ret != cudaSuccess)
 //              {
 //                      break;
-//              }               
+//              }
-                
        ++i;
        remaining -= bytesToCopy;
    }
@@ -281,7 +281,7 @@ cudaError_t __chunkMemcpy(void* a_dst, const void* a_src, size_t count,
 cudaError_t chunkMemcpy(void* a_dst, const void* a_src, size_t count,
                                                enum cudaMemcpyKind kind,
                                                int device_a = -1,  // device_a == -1 disables locking
-                                                bool do_locking = true, 
+                                                bool do_locking = true,
                                                int device_b = -1)
 {
        cudaError_t ret;
@@ -317,7 +317,7 @@ inline uint64_t timespec_to_ns(const struct timespec& t)
 inline struct timespec ns_to_timespec(const uint64_t& ns)
 {
        struct timespec temp = {ns/1e9, ns - ns/1e9};
-        return(temp);   
+        return(temp);
 }
 inline uint64_t clock_gettime_ns(clockid_t clk_id)
@@ -366,9 +366,9 @@ static void allocate_locks()
 {
        // allocate k-FMLP lock
        int fd = open("semaphores", O_RDONLY | O_CREAT, S_IRUSR | S_IWUSR);
-        
        int base_name = GPU_PARTITION * 1000;
-        
        if(USE_KFMLP) {
                KEXCLU_LOCK = open_kfmlp_gpu_sem(fd,
                                                                                 base_name,  /* name */
@@ -397,7 +397,7 @@ static void allocate_locks()
 //                                                                               NUM_SIMULT_USERS,
 //                                                                               ENABLE_AFFINITY,
 //                                                                               RELAX_FIFO_MAX_LEN
-//                                                                               );             
+//                                                                               );
        }
        if(KEXCLU_LOCK < 0)
                perror("open_kexclu_sem");
@@ -406,31 +406,31 @@ static void allocate_locks()
        {
                open_sem_t opensem = (!USE_PRIOQ) ? open_fifo_sem : open_prioq_sem;
                const char* opensem_label = (!USE_PRIOQ) ? "open_fifo_sem" : "open_prioq_sem";
-                
                // allocate the engine locks.
                for (int i = 0; i < MAX_GPUS; ++i)
                {
                        EE_LOCKS[i] = opensem(fd, (i+1)*10 + base_name);
                        if(EE_LOCKS[i] < 0)
                                perror(opensem_label);
-                        
                        CE_SEND_LOCKS[i] = opensem(fd, (i+1)*10 + base_name + 1);
                        if(CE_SEND_LOCKS[i] < 0)
-                                perror(opensem_label);                  
+                                perror(opensem_label);
-                        
                        if(NUM_SIMULT_USERS == 3)
                        {
                                // allocate a separate lock for the second copy engine
                                CE_RECV_LOCKS[i] = opensem(fd, (i+1)*10 + base_name + 2);
                                if(CE_RECV_LOCKS[i] < 0)
-                                        perror(opensem_label);                                  
+                                        perror(opensem_label);
                        }
                        else
                        {
                                // share a single lock for the single copy engine
                                CE_RECV_LOCKS[i] = CE_SEND_LOCKS[i];
                        }
-                }               
+                }
        }
 }
@@ -449,22 +449,22 @@ static void allocate_host_memory()
 //              h_send_data = (char *)c_malloc(send_alloc_bytes);
 //              memset(h_send_data, 0x55, send_alloc_bytes);  // write some random value
 //              // this will open a connection to GPU 0 if there is no active context, so
-//              // expect long stalls.  LAME.   
+//              // expect long stalls.  LAME.
 //              cutilSafeCall( cudaHostRegister(h_send_data, send_alloc_bytes, cudaHostRegisterPortable) );
 //      }
-//      
+//
 //      if(recv_alloc_bytes > 0)
-//      {       
+//      {
 //              h_recv_data = (char *)c_malloc(recv_alloc_bytes);
 //              memset(h_recv_data, 0xAA, recv_alloc_bytes);
-//              cutilSafeCall( cudaHostRegister(h_recv_data, recv_alloc_bytes, cudaHostRegisterPortable) );     
+//              cutilSafeCall( cudaHostRegister(h_recv_data, recv_alloc_bytes, cudaHostRegisterPortable) );
 //      }
-//      
+//
 //      if(state_alloc_bytes > 0)
-//      {               
+//      {
 //              h_state_data = (char *)c_malloc(state_alloc_bytes);
 //              memset(h_state_data, 0xCC, state_alloc_bytes);  // write some random value
-//              cutilSafeCall( cudaHostRegister(h_state_data, state_alloc_bytes, cudaHostRegisterPortable) );   
+//              cutilSafeCall( cudaHostRegister(h_state_data, state_alloc_bytes, cudaHostRegisterPortable) );
 //      }
        printf("Host memory allocated.\n");
@@ -477,28 +477,28 @@ static void allocate_device_memory()
 //      for(int i = 0; i < GPU_PARTITION_SIZE; ++i)
 //      {
 //              int which_device = GPU_PARTITION*GPU_PARTITION_SIZE + i;
-//              
+//
 //              if(ENABLE_WAIT) gpu_mgmt_mutexes[which_device].lock();
-//              
+//
 //              cutilSafeCall( cudaSetDevice(which_device) );
 //              cutilSafeCall( cudaDeviceSetLimit(cudaLimitPrintfFifoSize, 0) );
 //              cutilSafeCall( cudaDeviceSetLimit(cudaLimitMallocHeapSize, 0) );
-//              
+//
 //              cutilSafeCall( cudaStreamCreate(&streams[which_device]) );
-//              
+//
 //              /* pre-allocate memory, pray there's enough to go around */
 //              if(SEND_SIZE > 0) {
-//                      cutilSafeCall( cudaMalloc((void**)&d_send_data[which_device], SEND_SIZE) );     
+//                      cutilSafeCall( cudaMalloc((void**)&d_send_data[which_device], SEND_SIZE) );
 //              }
 //              if(RECV_SIZE > 0) {
 //                      cutilSafeCall( cudaMalloc((void**)&h_recv_data[which_device], RECV_SIZE) );
 //              }
 //              if(STATE_SIZE > 0) {
 //                      cutilSafeCall( cudaMalloc((void**)&h_state_data[which_device], STATE_SIZE) );
-//              }               
+//              }
-//              
+//
 //              if(ENABLE_WAIT) gpu_mgmt_mutexes[which_device].unlock();
-//      }       
+//      }
        printf("Device memory allocated.\n");
 }
@@ -508,39 +508,39 @@ static void configure_gpus()
 //      // SUSPEND WHEN BLOCKED!!
 //      cutilSafeCall( cudaSetDeviceFlags(cudaDeviceScheduleBlockingSync) );
-//      
+//
 //      // establish a connection to each GPU.
 //      for(int i = 0; i < GPU_PARTITION_SIZE; ++i)
 //      {
 //              int which_device = GPU_PARTITION*GPU_PARTITION_SIZE + i;
-//              
+//
 //              if(ENABLE_WAIT) gpu_mgmt_mutexes[which_device].lock();
-//              
+//
 //              cutilSafeCall( cudaSetDevice(which_device) );
 //              cutilSafeCall( cudaDeviceSetLimit(cudaLimitPrintfFifoSize, 0) );
 //              cutilSafeCall( cudaDeviceSetLimit(cudaLimitMallocHeapSize, 0) );
-//              
+//
 //              cutilSafeCall( cudaStreamCreate(&streams[which_device]) );
-//              
+//
 //              // enable P2P migrations.
 //              // we assume all GPUs are on the same I/O hub.
 //              for(int j = 0; j < GPU_PARTITION_SIZE; ++j)
 //              {
 //                      int other_device = GPU_PARTITION*GPU_PARTITION_SIZE + j;
-//                      
+//
 //                      if(which_device != other_device)
 //                      {
 //                              cutilSafeCall( cudaDeviceEnablePeerAccess(other_device, 0) );
 //                      }
 //              }
-//              
+//
 //              if(i == 0)
 //              {
 //                      struct cudaDeviceProp pi;
 //                      cudaGetDeviceProperties(&pi, i);
 //                      gpuCyclesPerSecond = pi.clockRate * 1000; /* khz -> hz */
-//              }               
+//              }
-//              
+//
 //              if(ENABLE_WAIT) gpu_mgmt_mutexes[which_device].unlock();
 //      }
@@ -580,7 +580,7 @@ static void catchExit(void)
                        for(int i = 0; i < GPU_PARTITION_SIZE; ++i)
                        {
                                int which_device = GPU_PARTITION*GPU_PARTITION_SIZE + i;
-                                
                                litmus_unlock(EE_LOCKS[which_device]);
                                litmus_unlock(CE_SEND_LOCKS[which_device]);
                                if(NUM_SIMULT_USERS == 2) {
@@ -588,11 +588,11 @@ static void catchExit(void)
                                }
                        }
                }
-                
                if(CUR_DEVICE >= 0) {
                        unregister_nv_device(CUR_DEVICE);
                }
-                
                litmus_unlock(KEXCLU_LOCK);
        }
 }
@@ -604,18 +604,18 @@ static void migrateToGPU(int destination)
                if(MIGRATE_VIA_SYSMEM)
                {
                        chunkMemcpy(h_state_data, d_state_data[LAST_DEVICE], STATE_SIZE,
-                                                cudaMemcpyDeviceToHost, LAST_DEVICE, useEngineLocks());                 
+                                                cudaMemcpyDeviceToHost, LAST_DEVICE, useEngineLocks());
                }
        }
-        
-//      cutilSafeCall( cudaSetDevice(destination) );            
+//      cutilSafeCall( cudaSetDevice(destination) );
-        
        if(!BROADCAST_STATE && STATE_SIZE > 0)
        {
                if(MIGRATE_VIA_SYSMEM)
                {
                        chunkMemcpy(d_state_data[CUR_DEVICE], h_state_data, STATE_SIZE,
-                                                cudaMemcpyHostToDevice, CUR_DEVICE, useEngineLocks());                  
+                                                cudaMemcpyHostToDevice, CUR_DEVICE, useEngineLocks());
                }
                else
                {
@@ -633,15 +633,15 @@ static void migrateToGPU(int destination)
 static void broadcastState(int from)
 {
        if(STATE_SIZE > 0)
-        {               
+        {
                assert(CUR_DEVICE == from);
-                
                if(MIGRATE_VIA_SYSMEM)
                {
                        chunkMemcpy(h_state_data, d_state_data[from], STATE_SIZE,
                                                cudaMemcpyDeviceToHost, from, useEngineLocks());
-                }       
+                }
-        
                for(int i = 0; i < GPU_PARTITION_SIZE; ++i)
                {
                        int which_device = GPU_PARTITION*GPU_PARTITION_SIZE + i;
@@ -652,7 +652,7 @@ static void broadcastState(int from)
 //                                      cutilSafeCall( cudaSetDevice(which_device) );
                                        CUR_DEVICE = which_device; // temporary
                                        chunkMemcpy(d_state_data[which_device], h_state_data, STATE_SIZE,
-                                                                cudaMemcpyHostToDevice, which_device, useEngineLocks());                                        
+                                                                cudaMemcpyHostToDevice, which_device, useEngineLocks());
                                }
                                else
                                {
@@ -662,11 +662,11 @@ static void broadcastState(int from)
                                                                cudaMemcpyDeviceToDevice,
                                                                from,
                                                                useEngineLocks(),
-                                                                which_device);  
+                                                                which_device);
                                }
                        }
                }
-                
                if(MIGRATE_VIA_SYSMEM && CUR_DEVICE != from)
                {
 //                      cutilSafeCall( cudaSetDevice(from) );
@@ -714,18 +714,18 @@ static void gpu_loop_for(double gpu_sec_time, double emergency_exit)
                }
                if(useEngineLocks()) litmus_lock(EE_LOCKS[CUR_DEVICE]);
-                
 //              docudaspin <<<numblocks,blocksz, 0, streams[CUR_DEVICE]>>> (numcycles);
 //              cutilSafeCall( cudaStreamSynchronize(streams[CUR_DEVICE]) );
-                
                if(useEngineLocks()) litmus_unlock(EE_LOCKS[CUR_DEVICE]);
-                
                if(RECV_SIZE > 0)
                {
                        chunkMemcpy(h_recv_data, d_recv_data[CUR_DEVICE], RECV_SIZE,
                                                cudaMemcpyDeviceToHost, CUR_DEVICE, useEngineLocks());
                }
-                
                if(BROADCAST_STATE)
                {
                        broadcastState(CUR_DEVICE);
@@ -802,7 +802,7 @@ int main(int argc, char** argv)
        int num_tasks = 0;
        double gpu_sec_ms = 0;
-        
        while ((opt = getopt(argc, argv, OPTSTR)) != -1) {
 //              printf("opt = %c optarg = %s\n", opt, optarg);
                switch (opt) {
@@ -858,7 +858,7 @@ int main(int argc, char** argv)
                        break;
                case 'r':
                        RELAX_FIFO_MAX_LEN = true;
-                        break;                          
+                        break;
                case 'L':
                        USE_KFMLP = true;
                        break;
@@ -949,13 +949,13 @@ int main(int argc, char** argv)
                {
                        printf("%d creating release shared memory\n", getpid());
                        shared_memory_object::remove("release_barrier_memory");
-                        release_segment_ptr = new managed_shared_memory(create_only, "release_barrier_memory", 4*1024);                 
+                        release_segment_ptr = new managed_shared_memory(create_only, "release_barrier_memory", 4*1024);
-                        
                        printf("%d creating release barrier for %d users\n", getpid(), num_tasks);
                        release_barrier = release_segment_ptr->construct<barrier>("barrier release_barrier")(num_tasks);
-                        
                        init_release_time = release_segment_ptr->construct<uint64_t>("uint64_t instance")();
-                        *init_release_time = 0;         
+                        *init_release_time = 0;
                }
                else
                {
@@ -972,13 +972,13 @@ int main(int argc, char** argv)
                                        sleep(1);
                                }
                        }while(segment_ptr == NULL);
-                        
                        release_barrier = segment_ptr->find<barrier>("barrier release_barrier").first;
                        init_release_time = segment_ptr->find<uint64_t>("uint64_t instance").first;
                }
        }
-        
-        
        if(GPU_TASK)
        {
                if(ENABLE_WAIT)
@@ -1019,7 +1019,7 @@ int main(int argc, char** argv)
                SEND_SIZE *= scale;
                RECV_SIZE *= scale;
                STATE_SIZE *= scale;
-                
                init_cuda();
        }
@@ -1036,16 +1036,16 @@ int main(int argc, char** argv)
        if (ret != 0)
                bail_out("could not become RT task");
-        
-        
        uint64_t jobCount = 0;
        blitz::Array<uint64_t, 1> responseTimeLog(num_jobs+1);
-        
        struct timespec spec;
        uint64_t release;
        uint64_t finish;
-                
-        
        if (ENABLE_WAIT) {
                printf("Waiting for release.\n");
                ret = wait_for_ts_release();
@@ -1056,14 +1056,14 @@ int main(int argc, char** argv)
        {
                sleep_next_period();
        }
-        
        clock_gettime(CLOCK_MONOTONIC, &spec);
        release = timespec_to_ns(spec);
        if (!__sync_bool_compare_and_swap(init_release_time, 0, release))
        {
                release = *init_release_time;
        }
-                
        releaseTime = wctime();
        double failsafeEnd = releaseTime + duration;
@@ -1087,7 +1087,7 @@ int main(int argc, char** argv)
                        clock_gettime(CLOCK_MONOTONIC, &spec);
                        finish = timespec_to_ns(spec);
-                        responseTimeLog(min(num_jobs,jobCount++)) = finish - release;   
+                        responseTimeLog(min(num_jobs,jobCount++)) = finish - release;
                        // this is an estimated upper-bound on release time.  it may be off by several microseconds.
 #ifdef RESET_RELEASE_ON_MISS
@@ -1097,11 +1097,11 @@ int main(int argc, char** argv)
 #else
                        release = release + period; // allow things to get progressively later.
 #endif
-                        
                        sleep_next_period();
                        clock_gettime(CLOCK_MONOTONIC, &spec);
                        release = min(timespec_to_ns(spec), release);
-                        
                } while(keepGoing);
        }
@@ -1147,13 +1147,13 @@ int main(int argc, char** argv)
                }
        }
-        
        if (ENABLE_WAIT)
        {
                printf("%d waiting at exit barrier\n", getpid());
                release_barrier->wait();
        }
-        
        char gpu_using_str[] = "GPU\n";
        char cpu_only_str[] = "CPU\n";
@@ -1166,7 +1166,7 @@ int main(int argc, char** argv)
                   // average
                   blitz::mean(USED(responseTimeLog)),
                   // average pct of period
-                   100.0*(blitz::mean(USED(responseTimeLog))/period),                      
+                   100.0*(blitz::mean(USED(responseTimeLog))/period),
                   // min
                   blitz::min(USED(responseTimeLog)),
                   // max
@@ -1182,6 +1182,6 @@ int main(int argc, char** argv)
                   // flag gpu-using tasks
                   ((GPU_TASK) ? gpu_using_str : cpu_only_str)
                   );
-        
        return 0;
 }
diff --git a/include/litmus.h b/include/litmus.h
index a4f6c61..0b2c407 100644
--- a/include/litmus.h
+++ b/include/litmus.h
@@ -77,12 +77,12 @@ typedef enum  {
        FIFO_MUTEX      = 6,
        IKGLP_SEM       = 7,
        KFMLP_SEM       = 8,
-        
        IKGLP_SIMPLE_GPU_AFF_OBS = 9,
        IKGLP_GPU_AFF_OBS = 10,
        KFMLP_SIMPLE_GPU_AFF_OBS = 11,
        KFMLP_GPU_AFF_OBS = 12,
-        
        PRIOQ_MUTEX = 13,
 } obj_type_t;
@@ -97,6 +97,13 @@ static inline int od_open(int fd, obj_type_t type, int obj_id)
        return od_openx(fd, type, obj_id, 0);
 }
+int litmus_open_lock(
+        obj_type_t protocol,    /* which locking protocol to use, e.g., FMLP_SEM */
+        int lock_id,            /* numerical id of the lock, user-specified */
+        const char* name_space, /* path to a shared file (not spelled "namespace": that is a C++ keyword) */
+        void *config_param);    /* any extra info needed by the protocol (such
+                                 * as CPU under SRP and PCP), may be NULL */
 /* real-time locking protocol support */
 int litmus_lock(int od);
 int litmus_unlock(int od);
@@ -109,7 +116,7 @@ int litmus_unlock(int od);
 *   litmus_dgl_unlock({A, B, C, D}, 4);
 */
 int litmus_dgl_lock(int* ods, int dgl_size);
-int litmus_dgl_unlock(int* ods, int dgl_size);  
+int litmus_dgl_unlock(int* ods, int dgl_size);
 /* nvidia graphics cards */
 int register_nv_device(int nv_device_id);
@@ -129,9 +136,9 @@ void exit_litmus(void);
 typedef int (*rt_fn_t)(void*);
 /* These two functions configure the RT task to use enforced exe budgets */
-int create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, int wcet, int period);
+int create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, lt_t wcet, lt_t period, unsigned int prio);
-int __create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, int wcet,
+int __create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, lt_t wcet,
-                     int period, task_class_t cls);
+                     lt_t period, unsigned int priority, task_class_t cls);
 /*      per-task modes */
 enum rt_task_mode_t {
@@ -153,6 +160,7 @@ int wait_for_ts_release();
 int wait_for_ts_release2(struct timespec *release);
 int release_ts(lt_t *delay);
 int get_nr_ts_release_waiters(void);
+int read_litmus_stats(int *ready, int *total);
 int enable_aux_rt_tasks(int flags);
@@ -177,7 +185,7 @@ double wctime(void);
 /* semaphore allocation */
 typedef int (*open_sem_t)(int fd, int name);
-        
 static inline int open_fmlp_sem(int fd, int name)
 {
        return od_open(fd, FMLP_SEM, name);
@@ -214,7 +222,7 @@ static inline int open_fifo_sem(int fd, int name)
 {
        return od_open(fd, FIFO_MUTEX, name);
 }
-        
 static inline int open_prioq_sem(int fd, int name)
 {
        return od_open(fd, PRIOQ_MUTEX, name);
@@ -228,7 +236,7 @@ int open_ikglp_sem(int fd, int name, unsigned int nr_replicas);
 int open_kfmlp_gpu_sem(int fd, int name,
        unsigned int num_gpus, unsigned int gpu_offset, unsigned int rho,
        int affinity_aware /* bool */);
-        
 /* -- Example Configurations --
 *
 * Optimal IKGLP Configuration:
@@ -262,13 +270,13 @@ int open_kfmlp_gpu_sem(int fd, int name,
 *  - rho > 0
 *  - num_gpus > 0
 */
-// takes names 'name' and 'name+1'      
+// takes names 'name' and 'name+1'
 int open_gpusync_token_lock(int fd, int name,
                unsigned int num_gpus, unsigned int gpu_offset,
                unsigned int rho, unsigned int max_in_fifos,
                unsigned int max_fifo_len,
                int enable_affinity_heuristics /* bool */);
-        
 /* syscall overhead measuring */
 int null_call(cycles_t *timestamp);
@@ -296,11 +304,11 @@ printf("%s:%d:%d\n",__FUNCTION__,__LINE__,temp); \
 __inject_action(temp); \
 }while(0);
 */
-        
 #define inject_action(COUNT) \
 do { \
 }while(0);
-        
 /* Litmus signal handling */
diff --git a/include/tests.h b/include/tests.h
index ed2b409..4ca21f8 100644
--- a/include/tests.h
+++ b/include/tests.h
@@ -7,8 +7,11 @@
 #define fail(fmt, args...)                                              \
        do {                                                            \
-                fprintf(stderr, "\n!! TEST FAILURE " fmt "\n   at %s:%d (%s)\n", \
+                fprintf(stderr, "\n!! TEST FAILURE " fmt                \
-                        ## args, __FILE__, __LINE__, __FUNCTION__);     \
+                        "\n   at %s:%d (%s)"                            \
+                        "\n   in task PID=%d\n",                        \
+                        ## args, __FILE__, __LINE__, __FUNCTION__,      \
+                        getpid());                                      \
                fflush(stderr);                                         \
                exit(200);                                              \
        } while (0)
diff --git a/src/kernel_iface.c b/src/kernel_iface.c
index 4cc1af5..e446102 100644
--- a/src/kernel_iface.c
+++ b/src/kernel_iface.c
@@ -56,9 +56,8 @@ ssize_t read_file(const char* fname, void* buf, size_t maxlen)
                return got;
 }
-int get_nr_ts_release_waiters(void)
+int read_litmus_stats(int *ready, int *all)
 {
-        int ready = 0, all = 0;
        char buf[100];
        ssize_t len;
@@ -67,11 +66,17 @@ int get_nr_ts_release_waiters(void)
                len = sscanf(buf,
                             "real-time tasks   = %d\n"
                             "ready for release = %d\n",
-                             &all, &ready);
+                             all, ready);
-        if (len == 2)
+        return len == 2;
+}
+int get_nr_ts_release_waiters(void) /* returns the "ready for release" count, or -1 if it is unavailable */
+{
+        int ready, all; /* 'all' is filled in by read_litmus_stats() but not used here */
+        if (read_litmus_stats(&ready, &all)) /* non-zero iff both counters were parsed */
                return ready;
        else
-                return len;
+                return -1; /* read_litmus_stats() reported failure */
 }
 /* thread-local pointer to control page */
diff --git a/src/litmus.c b/src/litmus.c
index ba47e45..7cdffcc 100644
--- a/src/litmus.c
+++ b/src/litmus.c
@@ -3,7 +3,10 @@
 #include <stdio.h>
 #include <string.h>
 #include <signal.h>
+#include <fcntl.h>
 #include <sys/mman.h>
+#include <sys/types.h>
 #include <sched.h> /* for cpu sets */
@@ -32,7 +35,7 @@ static struct {
        {IKGLP_GPU_AFF_OBS, "IKGLP-GPU"},
        {KFMLP_SIMPLE_GPU_AFF_OBS, "KFMLP-GPU-SIMPLE"},
        {KFMLP_GPU_AFF_OBS, "KFMLP-GPU"},
-        
        {PRIOQ_MUTEX, "PRIOQ"},
 };
@@ -60,6 +63,23 @@ const char* name_for_lock_protocol(int id)
        return "<UNKNOWN>";
 }
+/* Obtain an object descriptor for lock 'lock_id' of type 'protocol'. */
+/* The file 'name_space' is created if missing, passed to od_openx(), and closed again before returning. */
+/* Returns -1 if the file cannot be opened; otherwise the result of od_openx(). */
+int litmus_open_lock(
+        obj_type_t protocol,
+        int lock_id,
+        const char* name_space, /* not "namespace": that is a reserved word in C++ */
+        void *config_param)
+{
+        int fd, od;
+        /* Read-only is enough: the descriptor is only handed to od_openx(), and */
+        /* the tests create these files with mode S_IRUSR, which O_RDWR cannot open. */
+        fd = open(name_space, O_RDONLY | O_CREAT, S_IRUSR | S_IWUSR);
+        if (fd < 0)
+                return -1;
+        od = od_openx(fd, protocol, lock_id, config_param);
+        close(fd);
+        return od;
+}
 void show_rt_param(struct rt_task* tp)
 {
@@ -171,7 +191,7 @@ int open_kfmlp_gpu_sem(int fd, int name,
        unsigned int num_replicas;
        struct gpu_affinity_observer_args aff_args;
        int aff_type;
-        
        // number of GPU tokens
        num_replicas = num_gpus * rho;
@@ -181,20 +201,20 @@ int open_kfmlp_gpu_sem(int fd, int name,
                perror("open_kfmlp_sem");
                return -1;
        }
-        
        // create the affinity method to use.
        // "no affinity" -> KFMLP_SIMPLE_GPU_AFF_OBS
        aff_args.obs.lock_od = lock_od;
        aff_args.replica_to_gpu_offset = gpu_offset;
        aff_args.rho = rho;
-        
        aff_type = (affinity_aware) ? KFMLP_GPU_AFF_OBS : KFMLP_SIMPLE_GPU_AFF_OBS;
        affinity_od = od_openx(fd, aff_type, name+1, &aff_args);
        if(affinity_od < 0) {
                perror("open_kfmlp_aff");
                return -1;
-        }       
+        }
-        
        return lock_od;
 }
@@ -209,28 +229,28 @@ int open_kfmlp_gpu_sem(int fd, int name,
 //
 //      // number of GPU tokens
 //      num_replicas = num_gpus * num_simult_users;
-//      
+//
 //      // create the GPU token lock
 //      lock_od = open_ikglp_sem(fd, name, (void*)&num_replicas);
 //      if(lock_od < 0) {
 //              perror("open_ikglp_sem");
 //              return -1;
 //      }
-//      
+//
 //      // create the affinity method to use.
 //      // "no affinity" -> KFMLP_SIMPLE_GPU_AFF_OBS
 //      aff_args.obs.lock_od = lock_od;
 //      aff_args.replica_to_gpu_offset = gpu_offset;
 //      aff_args.nr_simult_users = num_simult_users;
 //      aff_args.relaxed_rules = (relax_max_fifo_len) ? 1 : 0;
-//      
+//
 //      aff_type = (affinity_aware) ? IKGLP_GPU_AFF_OBS : IKGLP_SIMPLE_GPU_AFF_OBS;
 //      affinity_od = od_openx(fd, aff_type, name+1, &aff_args);
 //      if(affinity_od < 0) {
 //              perror("open_ikglp_aff");
 //              return -1;
-//      }       
+//      }
-//      
+//
 //      return lock_od;
 //}
@@ -243,7 +263,7 @@ int open_ikglp_sem(int fd, int name, unsigned int nr_replicas)
                .nr_replicas = nr_replicas,
                .max_in_fifos = IKGLP_M_IN_FIFOS,
                .max_fifo_len = IKGLP_OPTIMAL_FIFO_LEN};
-        
        return od_openx(fd, IKGLP_SEM, name, &args);
 }
@@ -257,7 +277,7 @@ int open_gpusync_token_lock(int fd, int name,
 {
        int lock_od;
        int affinity_od;
-        
        struct ikglp_args args = {
                .nr_replicas = num_gpus*rho,
                .max_in_fifos = max_in_fifos,
@@ -265,41 +285,37 @@ int open_gpusync_token_lock(int fd, int name,
        };
        struct gpu_affinity_observer_args aff_args;
        int aff_type;
-        
        if (!num_gpus || !rho) {
                perror("open_gpusync_sem");
                return -1;
        }
-        
        if ((max_in_fifos != IKGLP_UNLIMITED_IN_FIFOS) &&
                (max_fifo_len != IKGLP_UNLIMITED_FIFO_LEN) &&
                (max_in_fifos > args.nr_replicas * max_fifo_len)) {
                perror("open_gpusync_sem");
                return(-1);
        }
-        
        lock_od = od_openx(fd, IKGLP_SEM, name, &args);
        if(lock_od < 0) {
                perror("open_gpusync_sem");
                return -1;
        }
-        
        // create the affinity method to use.
        aff_args.obs.lock_od = lock_od;
        aff_args.replica_to_gpu_offset = gpu_offset;
        aff_args.rho = rho;
        aff_args.relaxed_rules = (max_fifo_len == IKGLP_UNLIMITED_FIFO_LEN) ? 1 : 0;
-        
        aff_type = (enable_affinity_heuristics) ? IKGLP_GPU_AFF_OBS : IKGLP_SIMPLE_GPU_AFF_OBS;
        affinity_od = od_openx(fd, aff_type, name+1, &aff_args);
        if(affinity_od < 0) {
                perror("open_gpusync_affinity");
                return -1;
        }
-        
        return lock_od;
 }
diff --git a/src/signal.c b/src/signal.c
index bfe18b9..397a797 100644
--- a/src/signal.c
+++ b/src/signal.c
@@ -28,7 +28,7 @@ static void reg_litmus_signals(unsigned long litmus_sig_mask,
 {
        int ret;
-        if (litmus_sig_mask | SIG_BUDGET_MASK) { 
+        if (litmus_sig_mask & SIG_BUDGET_MASK) { /* bit test; '|' was true for every mask value */
                ret = sigaction(SIG_BUDGET, pAction, NULL);
                check("SIG_BUDGET");
        }
diff --git a/src/task.c b/src/task.c
index 26fc15a..9317cc7 100644
--- a/src/task.c
+++ b/src/task.c
@@ -40,15 +40,16 @@ int __launch_rt_task(rt_fn_t rt_prog, void *rt_arg, rt_setup_fn_t setup,
        return rt_task;
 }
-int __create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, int wcet, int period,
+int __create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, lt_t wcet, lt_t period,
-                     task_class_t rt_class)
+                     unsigned int priority, task_class_t cls)
 {
        struct rt_task params;
        params.cpu       = cpu;
        params.period    = period;
        params.exec_cost = wcet;
-        params.cls       = rt_class;
+        params.cls       = cls;
        params.phase     = 0;
+        params.priority = priority;
        /* enforce budget for tasks that might not use sleep_next_period() */
        params.budget_policy = QUANTUM_ENFORCEMENT;
@@ -56,8 +57,9 @@ int __create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, int wcet, int period,
                                (rt_setup_fn_t) set_rt_task_param, &params);
 }
-int create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, int wcet, int period) {
+int create_rt_task(rt_fn_t rt_prog, void *arg, int cpu, lt_t wcet, lt_t period,
-        return __create_rt_task(rt_prog, arg, cpu, wcet, period, RT_CLASS_HARD);
+                   unsigned int priority) { /* wrapper around __create_rt_task() that fixes the class to RT_CLASS_HARD */
+        return __create_rt_task(rt_prog, arg, cpu, wcet, period, priority, RT_CLASS_HARD); /* all other arguments are forwarded unchanged */
 }
diff --git a/tests/fdso.c b/tests/fdso.c
index 8e320cf..c06e28c 100644
--- a/tests/fdso.c
+++ b/tests/fdso.c
@@ -16,7 +16,7 @@ TESTCASE(fmlp_not_active, C_EDF | PFAIR | LINUX,
 {
        int fd;
-        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        ASSERT(fd != -1);
@@ -57,7 +57,7 @@ TESTCASE(not_inherit_od, GSN_EDF | PSN_EDF,
 {
        int fd, od, pid, status;
-        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( od = open_fmlp_sem(fd, 0) );
diff --git a/tests/locks.c b/tests/locks.c
index d7ebfe2..9a928b3 100644
--- a/tests/locks.c
+++ b/tests/locks.c
@@ -11,7 +11,7 @@ TESTCASE(not_lock_fmlp_be, GSN_EDF | PSN_EDF | P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( od = open_fmlp_sem(fd, 0) );
@@ -34,7 +34,7 @@ TESTCASE(not_lock_srp_be, PSN_EDF | P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".srp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".srp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        /* BE tasks may not open SRP semaphores */
@@ -51,7 +51,7 @@ TESTCASE(lock_srp, PSN_EDF | P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".srp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".srp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( sporadic_partitioned(10, 100, 0) );
        SYSCALL( task_mode(LITMUS_RT_TASK) );
@@ -83,7 +83,7 @@ TESTCASE(lock_fmlp, PSN_EDF | GSN_EDF | P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( sporadic_partitioned(10, 100, 0) );
        SYSCALL( task_mode(LITMUS_RT_TASK) );
diff --git a/tests/nesting.c b/tests/nesting.c
new file mode 100644
index 0000000..b294334
--- /dev/null
+++ b/tests/nesting.c
@@ -0,0 +1,468 @@
+#include <fcntl.h>
+#include <unistd.h>
+#include <stdio.h>
+#include "tests.h"
+#include "litmus.h"
+TESTCASE(lock_fmlp_nesting, PSN_EDF | GSN_EDF | P_FP,
+         "FMLP no nesting allowed")
+{ /* Two FMLP semaphores: each is usable alone; locking one while holding the other is expected to fail. */
+        int fd, od, od2;
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) ); /* namespace file for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od = open_fmlp_sem(fd, 0) );
+        SYSCALL( od2 = open_fmlp_sem(fd, 1) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold od ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the nested request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( close(fd) );
+        SYSCALL( remove(".fmlp_locks") ); /* delete the namespace file opened above */
+}
+TESTCASE(lock_fmlp_srp_nesting, PSN_EDF | P_FP,
+         "FMLP no nesting with SRP resources allowed")
+{ /* One FMLP and one SRP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int fd, od, od2;
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) ); /* namespace file shared by both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od = open_fmlp_sem(fd, 0) ); /* od: FMLP */
+        SYSCALL( od2 = open_srp_sem(fd, 1) ); /* od2: SRP */
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the FMLP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the SRP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( close(fd) );
+        SYSCALL( remove(".fmlp_locks") ); /* delete the namespace file opened above */
+}
+TESTCASE(lock_srp_nesting, PSN_EDF | P_FP,
+         "SRP nesting allowed")
+{ /* Two SRP semaphores: nested acquisition is expected to succeed in both orders. */
+        int fd, od, od2;
+        SYSCALL( fd = open(".fmlp_locks", O_RDONLY | O_CREAT, S_IRUSR) ); /* NOTE(review): file is named .fmlp_locks although only SRP semaphores are opened */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od = open_srp_sem(fd, 0) );
+        SYSCALL( od2 = open_srp_sem(fd, 1) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* nest od2 inside od */
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* nest od inside od2 */
+        SYSCALL( litmus_lock(od) );
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( close(fd) );
+        SYSCALL( remove(".fmlp_locks") ); /* delete the namespace file opened above */
+}
+TESTCASE(lock_pcp_nesting, P_FP,
+         "PCP nesting allowed")
+{ /* Two PCP semaphores: nested acquisition is expected to succeed in both orders. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(PCP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(PCP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* nest od2 inside od */
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* nest od inside od2 */
+        SYSCALL( litmus_lock(od) );
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_mpcp_pcp_no_nesting, P_FP,
+         "PCP and MPCP nesting not allowed")
+{ /* One PCP and one MPCP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(PCP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(MPCP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the PCP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the MPCP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_fmlp_pcp_no_nesting, P_FP,
+         "PCP and FMLP nesting not allowed")
+{ /* One PCP and one FMLP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(PCP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(FMLP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the PCP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the FMLP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_dpcp_pcp_no_nesting, P_FP,
+         "PCP and DPCP nesting not allowed")
+{ /* One PCP and one DPCP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        int cpu = 0; /* passed by address as config_param when opening the DPCP semaphore */
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(PCP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(DPCP_SEM, 1, namespace, &cpu) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the PCP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the DPCP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_mpcp_srp_no_nesting, P_FP,
+         "SRP and MPCP nesting not allowed")
+{ /* One SRP and one MPCP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(SRP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(MPCP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the SRP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the MPCP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_dpcp_srp_no_nesting, P_FP,
+         "SRP and DPCP nesting not allowed")
+{ /* One SRP and one DPCP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        int cpu = 0; /* passed by address as config_param when opening the DPCP semaphore */
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(SRP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(DPCP_SEM, 1, namespace, &cpu) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the SRP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the DPCP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_fmlp_mpcp_no_nesting, P_FP,
+         "MPCP and FMLP nesting not allowed")
+{ /* One MPCP and one FMLP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(MPCP_SEM, 0, namespace, NULL) );
+        SYSCALL( od2 = litmus_open_lock(FMLP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the MPCP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the FMLP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(lock_fmlp_dpcp_no_nesting, P_FP,
+         "DPCP and FMLP nesting not allowed")
+{ /* One DPCP and one FMLP semaphore: each is usable alone; nesting them in either order is expected to fail. */
+        int od, od2;
+        const char* namespace = ".pcp_locks"; /* file passed to litmus_open_lock() for both semaphores */
+        int cpu = 0; /* passed by address as config_param when opening the DPCP semaphore */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(DPCP_SEM, 0, namespace, &cpu) );
+        SYSCALL( od2 = litmus_open_lock(FMLP_SEM, 1, namespace, NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold the DPCP lock ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the FMLP request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(namespace) ); /* delete the namespace file */
+}
+TESTCASE(mpcp_nesting, P_FP,
+         "MPCP no nesting allowed")
+{ /* Two MPCP semaphores: each is usable alone; locking one while holding the other is expected to fail. */
+        int od, od2;
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(MPCP_SEM, 0, ".mpcp_locks", NULL) );
+        SYSCALL( od2 = litmus_open_lock(MPCP_SEM, 1, ".mpcp_locks", NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold od ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the nested request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(".mpcp_locks") ); /* delete the namespace file */
+}
+TESTCASE(mpcpvs_nesting, P_FP,
+         "MPCP-VS no nesting allowed")
+{ /* Two MPCP-VS semaphores: each is usable alone; locking one while holding the other is expected to fail. */
+        int od, od2;
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(MPCP_VS_SEM, 0, ".mpcp_locks", NULL) );
+        SYSCALL( od2 = litmus_open_lock(MPCP_VS_SEM, 1, ".mpcp_locks", NULL) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold od ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the nested request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(".mpcp_locks") ); /* delete the namespace file */
+}
+TESTCASE(dpcp_nesting, P_FP,
+         "DPCP no nesting allowed")
+{ /* Two DPCP semaphores: each is usable alone; locking one while holding the other is expected to fail. */
+        int od, od2;
+        int cpu = 0; /* passed by address as config_param for both DPCP semaphores */
+        SYSCALL( sporadic_partitioned(10, 100, 0) );
+        SYSCALL( task_mode(LITMUS_RT_TASK) );
+        SYSCALL( od  = litmus_open_lock(DPCP_SEM, 0, ".dpcp_locks", &cpu) );
+        SYSCALL( od2 = litmus_open_lock(DPCP_SEM, 1, ".dpcp_locks", &cpu) );
+        SYSCALL( litmus_lock(od) ); /* sanity check: each lock can be taken and released on its own */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) );
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( litmus_lock(od) ); /* hold od ... */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od2)); /* ... the nested request is expected to fail with EBUSY */
+        SYSCALL( litmus_unlock(od) );
+        SYSCALL( litmus_lock(od2) ); /* same check with the roles swapped */
+        SYSCALL_FAILS(EBUSY, litmus_lock(od));
+        SYSCALL( litmus_unlock(od2) );
+        SYSCALL( od_close(od) );
+        SYSCALL( od_close(od2) );
+        SYSCALL( remove(".dpcp_locks") ); /* delete the namespace file */
+}
diff --git a/tests/pcp.c b/tests/pcp.c
index 88d1be3..8e1204f 100644
--- a/tests/pcp.c
+++ b/tests/pcp.c
@@ -1,6 +1,8 @@
 #include <fcntl.h>
 #include <unistd.h>
 #include <stdio.h>
+#include <sys/wait.h> /* for waitpid() */
 #include "tests.h"
 #include "litmus.h"
@@ -11,7 +13,7 @@ TESTCASE(lock_pcp, P_FP,
 {
        int fd, od, cpu = 0;
-        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( sporadic_partitioned(10, 100, cpu) );
        SYSCALL( task_mode(LITMUS_RT_TASK) );
@@ -37,12 +39,218 @@ TESTCASE(lock_pcp, P_FP,
        SYSCALL( remove(".pcp_locks") );
 }
+TESTCASE(pcp_inheritance, P_FP,
+         "PCP priority inheritance")
+{ /* Three forked tasks share CPU 0; asserts the high-priority task's blocking on a PCP semaphore stays within 0.1s..1s. */
+        int fd, od, cpu = 0;
+        int child_hi, child_lo, child_middle, status, waiters;
+        lt_t delay = ms2lt(100); /* handed to release_ts() below */
+        double start, stop;
+        struct rt_task params; /* base parameters; each child overrides priority and phase before applying them */
+        params.cpu        = 0;
+        params.exec_cost  =  ms2lt(10000);
+        params.period     = ms2lt(100000);
+        params.relative_deadline = params.period;
+        params.phase      = 0;
+        params.cls        = RT_CLASS_HARD;
+        params.budget_policy = NO_ENFORCEMENT;
+        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT, S_IRUSR) ); /* NOTE(review): fd is never closed and the file never removed in this test */
+        child_lo = FORK_TASK( /* presumably runs the body in a forked child and yields its pid -- confirm in tests.h */
+                params.priority = LITMUS_LOWEST_PRIORITY;
+                params.phase    = 0;
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( od = open_pcp_sem(fd, 0, cpu) );
+                SYSCALL( wait_for_ts_release() );
+                SYSCALL( litmus_lock(od) );
+                start = cputime(); /* keep the semaphore held for 0.25 units of cputime() */
+                while (cputime() - start < 0.25)
+                        ;
+                SYSCALL( litmus_unlock(od) );
+                SYSCALL(sleep_next_period() );
+                );
+        child_middle = FORK_TASK( /* never touches the semaphore; only busy-loops */
+                params.priority = LITMUS_HIGHEST_PRIORITY + 1; /* presumably one level below the highest priority -- confirm ordering */
+                params.phase    = ms2lt(100);
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( wait_for_ts_release() );
+                start = cputime(); /* spins for 5 units of cputime(), far beyond the 1s bound asserted in child_hi */
+                while (cputime() - start < 5)
+                        ;
+                SYSCALL( sleep_next_period() );
+                );
+        child_hi = FORK_TASK( /* the task whose blocking time is measured */
+                params.priority = LITMUS_HIGHEST_PRIORITY;
+                params.phase    = ms2lt(50);
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( od = open_pcp_sem(fd, 0, cpu) );
+                SYSCALL( wait_for_ts_release() );
+                start = wctime(); /* wall-clock timestamps bracket the lock/unlock pair */
+                /* block on semaphore */
+                SYSCALL( litmus_lock(od) );
+                SYSCALL( litmus_unlock(od) );
+                stop  = wctime();
+                /* Assert we had some blocking. */
+                ASSERT( stop - start > 0.1);
+                /* Assert we woke up 'soonish' after the sleep. */
+                ASSERT( stop - start < 1 ); /* presumably would be exceeded if child_middle's 5s spin delayed child_lo's unlock */
+                SYSCALL( kill(child_middle, SIGUSR2) ); /* measurement done: terminate the two helper tasks */
+                SYSCALL( kill(child_lo, SIGUSR2) );
+                );
+        do { /* poll until all three children are waiting for the synchronous release */
+                waiters = get_nr_ts_release_waiters();
+                ASSERT( waiters >= 0 );
+        } while (waiters != 3);
+        SYSCALL( be_migrate_to(1) ); /* parent moves to CPU 1; the children were migrated to params.cpu (0) */
+        waiters = release_ts(&delay); /* NOTE(review): the return value is stored but never checked */
+        SYSCALL( waitpid(child_hi, &status, 0) );
+        ASSERT( status == 0 );
+        SYSCALL( waitpid(child_lo, &status, 0) );
+        ASSERT( status ==  SIGUSR2); /* NOTE(review): compares the raw wait status; WIFSIGNALED()/WTERMSIG() would be the portable check */
+        SYSCALL( waitpid(child_middle, &status, 0) );
+        ASSERT( status ==  SIGUSR2);
+}
+TESTCASE(srp_ceiling_blocking, P_FP | PSN_EDF,
+         "SRP ceiling blocking")
+{ /* Three forked tasks share CPU 0; asserts the high-priority task sees (almost) no delay when locking an SRP semaphore. */
+        int fd, od;
+        int child_hi, child_lo, child_middle, status, waiters;
+        lt_t delay = ms2lt(100); /* handed to release_ts() below */
+        double start, stop;
+        struct rt_task params; /* base parameters; each child overrides priority, phase and (for two of them) the deadline */
+        params.cpu        = 0;
+        params.exec_cost  =  ms2lt(10000);
+        params.period     = ms2lt(100000);
+        params.relative_deadline = params.period;
+        params.phase      = 0;
+        params.cls        = RT_CLASS_HARD;
+        params.budget_policy = NO_ENFORCEMENT;
+        SYSCALL( fd = open(".srp_locks", O_RDONLY | O_CREAT, S_IRUSR) ); /* NOTE(review): fd is never closed and the file never removed in this test */
+        child_lo = FORK_TASK( /* presumably runs the body in a forked child and yields its pid -- confirm in tests.h */
+                params.priority = LITMUS_LOWEST_PRIORITY;
+                params.phase    = 0;
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( od = open_srp_sem(fd, 0) );
+                SYSCALL( wait_for_ts_release() );
+                SYSCALL( litmus_lock(od) );
+                start = cputime(); /* keep the semaphore held for 0.25 units of cputime() */
+                while (cputime() - start < 0.25)
+                        ;
+                SYSCALL( litmus_unlock(od) );
+                );
+        child_middle = FORK_TASK( /* never touches the semaphore; only busy-loops */
+                params.priority = LITMUS_HIGHEST_PRIORITY + 1; /* presumably one level below the highest priority -- confirm ordering */
+                params.phase    = ms2lt(100);
+                params.relative_deadline -= ms2lt(110); /* shorter deadline than child_lo; presumably orders the tasks under PSN_EDF -- confirm */
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( wait_for_ts_release() );
+                start = cputime(); /* spins for 5 units of cputime() */
+                while (cputime() - start < 5)
+                        ;
+                );
+        child_hi = FORK_TASK( /* the task whose lock latency is measured */
+                params.priority = LITMUS_HIGHEST_PRIORITY;
+                params.phase    = ms2lt(50);
+                params.relative_deadline -= ms2lt(200); /* shortest relative deadline of the three tasks */
+                SYSCALL( set_rt_task_param(gettid(), &params) );
+                SYSCALL( be_migrate_to(params.cpu) );
+                SYSCALL( task_mode(LITMUS_RT_TASK) );
+                SYSCALL( od = open_srp_sem(fd, 0) );
+                SYSCALL( wait_for_ts_release() );
+                start = wctime(); /* wall-clock timestamps bracket the lock/unlock pair */
+                /* block on semaphore */
+                SYSCALL( litmus_lock(od) );
+                SYSCALL( litmus_unlock(od) );
+                stop  = wctime();
+                /* Assert we had "no" blocking (modulo qemu overheads). */
+                ASSERT( stop - start < 0.01); /* presumably any SRP ceiling blocking happens before this job starts running -- confirm */
+                SYSCALL( kill(child_middle, SIGUSR2) ); /* measurement done: terminate the two helper tasks */
+                SYSCALL( kill(child_lo, SIGUSR2) );
+                );
+        do { /* poll until all three children are waiting for the synchronous release */
+                waiters = get_nr_ts_release_waiters();
+                ASSERT( waiters >= 0 );
+        } while (waiters != 3);
+        SYSCALL( be_migrate_to(1) ); /* parent moves to CPU 1; the children were migrated to params.cpu (0) */
+        waiters = release_ts(&delay); /* NOTE(review): the return value is stored but never checked */
+        SYSCALL( waitpid(child_hi, &status, 0) );
+        ASSERT( status == 0 );
+        SYSCALL( waitpid(child_lo, &status, 0) );
+        ASSERT( status ==  SIGUSR2); /* NOTE(review): compares the raw wait status; WIFSIGNALED()/WTERMSIG() would be the portable check */
+        SYSCALL( waitpid(child_middle, &status, 0) );
+        ASSERT( status ==  SIGUSR2);
+}
 TESTCASE(lock_dpcp, P_FP,
         "DPCP acquisition and release")
 {
        int fd, od, cpu = 1;
-        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( sporadic_partitioned(10, 100, 0) );
        SYSCALL( task_mode(LITMUS_RT_TASK) );
@@ -73,7 +281,7 @@ TESTCASE(not_lock_pcp_be, P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        /* BE tasks are not even allowed to open a PCP semaphore */
        SYSCALL_FAILS(EPERM, od = open_pcp_sem(fd, 0, 1) );
@@ -95,7 +303,7 @@ TESTCASE(lock_mpcp, P_FP,
 {
        int fd, od;
-        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT) );
+        SYSCALL( fd = open(".pcp_locks", O_RDONLY | O_CREAT, S_IRUSR) );
        SYSCALL( sporadic_partitioned(10, 100, 0) );
        SYSCALL( task_mode(LITMUS_RT_TASK) );
author	Glenn Elliott <gelliott@cs.unc.edu>	2013-03-13 15:33:57 -0400
committer	Glenn Elliott <gelliott@cs.unc.edu>	2013-03-13 15:33:57 -0400
commit	944a78c21028da69fb53c0aec3e9dfdb048d47e4 (patch)
tree	bdbc77b3c0ff1337670a7e5d0f9d438388c1a866
parent	f338b34ea0fb6136ea3895a07161ece030c4b998 (diff)
parent	1ff4fc699f01f0ad1359fad48b00c9d3be1b28b4 (diff)