author     Bjoern Brandenburg <bbb@mpi-sws.org>    2017-03-10 09:46:05 -0500
committer  Bjoern Brandenburg <bbb@mpi-sws.org>    2017-05-26 17:12:27 -0400
commit     cbe61859a233702ed8e6723b3b133d1f2ae1ae2c
tree       e5c20aa3f19feeb5b899bfb3302b5956d86fe526
parent     4673107e2ff7c218ecac2de9eedeb61153940bbe
IRQ tracing: clarify use of per-core counters
Make it a bit more obvious what these counters are used for and how.
Question for future work: can we return to using only a single
per-core counter?
-rw-r--r--  litmus/trace.c | 60
1 file changed, 28 insertions(+), 32 deletions(-)
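After this patch, each core keeps one plain per-CPU counter that only it consumes (for CPU overhead timestamps) and one atomic, cache-line-aligned counter that message timestamps consume, possibly on behalf of another core. Below is a condensed sketch of that scheme; the local_irq_count and msg_irq_count names and the per-CPU primitives are taken from the diff that follows, while the sketch_* helper names are illustrative only and the snippet is not a drop-in piece of litmus/trace.c.

#include <linux/percpu.h>
#include <linux/atomic.h>

/* Local counter: only its own CPU reads and resets it, and the trace points
 * run with interrupts disabled, so a plain per-CPU integer suffices. */
DEFINE_PER_CPU(unsigned int, local_irq_count);

/* Message counter: remote CPUs snapshot it, so it must be atomic; the
 * cache-line alignment avoids false sharing with neighboring per-CPU data. */
DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, msg_irq_count);

/* Called from the IRQ path with preemptions disabled: bump both counters. */
static void sketch_irq_fired(void)
{
	this_cpu_inc(local_irq_count);             /* cheap, non-atomic */
	atomic_inc(this_cpu_ptr(&msg_irq_count));  /* visible to remote readers */
}

/* Snapshots read and reset in one step so no interrupt is counted twice. */
static unsigned int sketch_snapshot_local(void)
{
	return this_cpu_xchg(local_irq_count, 0);
}

static unsigned int sketch_snapshot_msg_for(int cpu)
{
	return atomic_xchg(&per_cpu(msg_irq_count, cpu), 0);
}

CPU-local overhead timestamps drain the first counter; message timestamps, which may be recorded for another core, drain the second.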
diff --git a/litmus/trace.c b/litmus/trace.c
index 937b1c4d0975..7d698aac257d 100644
--- a/litmus/trace.c
+++ b/litmus/trace.c
@@ -16,8 +16,8 @@ static struct ftdev msg_overhead_dev;
 #define cpu_trace_ts_buf(cpu) cpu_overhead_dev.minor[(cpu)].buf
 #define msg_trace_ts_buf(cpu) msg_overhead_dev.minor[(cpu)].buf
 
-DEFINE_PER_CPU(atomic_t, irq_fired_count;)
-DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, cpu_irq_fired_count);
+DEFINE_PER_CPU(unsigned int, local_irq_count;)
+DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, msg_irq_count);
 
 static DEFINE_PER_CPU(unsigned int, cpu_ts_seq_no);
 static DEFINE_PER_CPU(atomic_t, msg_ts_seq_no);
@@ -27,42 +27,28 @@ static int64_t cycle_offset[NR_CPUS][NR_CPUS];
 void ft_irq_fired(void)
 {
 	/* Only called with preemptions disabled. */
-	atomic_inc(this_cpu_ptr(&irq_fired_count));
-	atomic_inc(this_cpu_ptr(&cpu_irq_fired_count));
+	/* local counter => not atomic, trace points disable interrupts */
+	this_cpu_inc(local_irq_count);
+	/* counter for messages => read remotely */
+	atomic_inc(this_cpu_ptr(&msg_irq_count));
 
 	if (has_control_page(current))
 		get_control_page(current)->irq_count++;
 }
 
-static inline void clear_irq_fired(void)
+static inline unsigned int snapshot_local_irqs(void)
 {
-	atomic_set(raw_cpu_ptr(&irq_fired_count), 0);
+	return this_cpu_xchg(local_irq_count, 0);
 }
 
-static inline unsigned int get_and_clear_irq_fired(void)
+static inline unsigned int snapshot_msg_irq_for(int cpu)
 {
-	/* This is potentially not atomic since we might migrate if
-	 * preemptions are not disabled. As a tradeoff between
-	 * accuracy and tracing overheads, this seems acceptable.
-	 * If it proves to be a problem, then one could add a callback
-	 * from the migration code to invalidate irq_fired_count.
-	 */
-	return atomic_xchg(raw_cpu_ptr(&irq_fired_count), 0);
-}
-
-static inline unsigned int get_and_clear_irq_fired_for_cpu(int cpu)
-{
-	return atomic_xchg(&per_cpu(irq_fired_count, cpu), 0);
-}
-
-static inline void cpu_clear_irq_fired(void)
-{
-	atomic_set(raw_cpu_ptr(&cpu_irq_fired_count), 0);
+	return atomic_xchg(&per_cpu(msg_irq_count, cpu), 0);
 }
 
-static inline unsigned int cpu_get_and_clear_irq_fired(void)
+static inline unsigned int snapshot_msg_irq_locally(void)
 {
-	return atomic_xchg(raw_cpu_ptr(&cpu_irq_fired_count), 0);
+	return atomic_xchg(raw_cpu_ptr(&msg_irq_count), 0);
 }
 
 static inline void save_irq_flags(struct timestamp *ts, unsigned int irq_count)
@@ -141,11 +127,21 @@ static inline void __write_record(
 
 		ts->cpu = cpu;
 
-		if (record_irq) {
-			if (local_cpu)
-				irq_count = cpu_get_and_clear_irq_fired();
-			else
-				irq_count = get_and_clear_irq_fired_for_cpu(cpu);
+		switch (record_irq) {
+		case LOCAL_IRQ_COUNT:
+			if (is_cpu_timestamp)
+				irq_count = snapshot_local_irqs();
+			else
+				irq_count = snapshot_msg_irq_locally();
+			break;
+		case REMOTE_IRQ_COUNT:
+			irq_count = snapshot_msg_irq_for(other_cpu);
+			break;
+		case NO_IRQ_COUNT:
+			/* fall through */
+		default:
+			/* do nothing */
+			break;
 		}
 
 		save_irq_flags(ts, irq_count - hide_irq);
@@ -301,7 +297,7 @@ static void __add_timestamp_user(struct timestamp *pre_recorded)
 		*ts = *pre_recorded;
 		ts->seq_no = seq_no;
 		ts->cpu = raw_smp_processor_id();
-		save_irq_flags(ts, get_and_clear_irq_fired());
+		save_irq_flags(ts, snapshot_local_irqs());
 		ft_buffer_finish_write(buf, ts);
 	}
 
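On the future-work question, one consideration visible in this diff is that the two counters serve two independent timestamp streams: CPU overhead timestamps drain local_irq_count, while message timestamps (possibly recorded for another core) drain msg_irq_count. A single per-core counter would have to stay atomic, since remote cores reset it with atomic_xchg(), and whichever stream snapshots it first would zero the count the other stream still needs. The following is a hedged sketch of that hypothetical single-counter variant; none of these names appear in the patch.

#include <linux/percpu.h>
#include <linux/atomic.h>

/* Hypothetical: one shared per-core counter for both timestamp streams. */
DEFINE_PER_CPU_SHARED_ALIGNED(atomic_t, shared_irq_count);

static void shared_irq_fired(void)
{
	/* Must remain an atomic increment, because remote cores also reset
	 * this counter; the cheap this_cpu_inc() of local_irq_count would no
	 * longer be usable on the hot IRQ path. */
	atomic_inc(this_cpu_ptr(&shared_irq_count));
}

static unsigned int shared_snapshot(int cpu)
{
	/* Read-and-reset: after a CPU timestamp takes this snapshot, a later
	 * message timestamp on the same core sees zero even if interrupts
	 * fired since that stream's own previous timestamp (and vice versa). */
	return atomic_xchg(&per_cpu(shared_irq_count, cpu), 0);
}

Whether that loss of per-stream accuracy would be acceptable is exactly the question the commit message leaves open.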