aboutsummaryrefslogtreecommitdiffstats
path: root/arch
diff options
context:
space:
mode:
authorCliff Wickman <cpw@sgi.com>2010-06-02 17:22:01 -0400
committerIngo Molnar <mingo@elte.hu>2010-06-08 15:13:44 -0400
commite8e5e8a8048006a12d7777a93baebd6e39496101 (patch)
treec3da45e649920e77b14907fa3b33dde1b8d9328d /arch
parent12a6611fa16e9c6d2f844fe2175d219c6e9bd95d (diff)
x86, UV: BAU tunables into a debugfs file
Make the Broadcast Assist Unit driver's nine tuning values variable by making them accessible through a read/write debugfs file. The file will normally be mounted as /sys/kernel/debug/sgi_uv/bau_tunables. The tunables are kept in each cpu's per-cpu BAU structure. The patch also does a little name improvement, and corrects the reset of two destination timeout counters. Signed-off-by: Cliff Wickman <cpw@sgi.com> Cc: gregkh@suse.de LKML-Reference: <E1OJvNx-0004Zx-Uo@eag09.americas.sgi.com> Signed-off-by: Ingo Molnar <mingo@elte.hu>
Diffstat (limited to 'arch')
-rw-r--r--arch/x86/include/asm/uv/uv_bau.h53
-rw-r--r--arch/x86/kernel/tlb_uv.c281
2 files changed, 278 insertions, 56 deletions
diff --git a/arch/x86/include/asm/uv/uv_bau.h b/arch/x86/include/asm/uv/uv_bau.h
index 458e04c626a2..e5543c1a80ca 100644
--- a/arch/x86/include/asm/uv/uv_bau.h
+++ b/arch/x86/include/asm/uv/uv_bau.h
@@ -45,10 +45,14 @@
45#define UV_DESC_BASE_PNODE_SHIFT 49 45#define UV_DESC_BASE_PNODE_SHIFT 49
46#define UV_PAYLOADQ_PNODE_SHIFT 49 46#define UV_PAYLOADQ_PNODE_SHIFT 49
47#define UV_PTC_BASENAME "sgi_uv/ptc_statistics" 47#define UV_PTC_BASENAME "sgi_uv/ptc_statistics"
48#define UV_BAU_BASENAME "sgi_uv/bau_tunables"
49#define UV_BAU_TUNABLES_DIR "sgi_uv"
50#define UV_BAU_TUNABLES_FILE "bau_tunables"
51#define WHITESPACE " \t\n"
48#define uv_physnodeaddr(x) ((__pa((unsigned long)(x)) & uv_mmask)) 52#define uv_physnodeaddr(x) ((__pa((unsigned long)(x)) & uv_mmask))
49#define UV_ENABLE_INTD_SOFT_ACK_MODE_SHIFT 15 53#define UV_ENABLE_INTD_SOFT_ACK_MODE_SHIFT 15
50#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHIFT 16 54#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD_SHIFT 16
51#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD 0x000000000bUL 55#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD 0x0000000009UL
52/* [19:16] SOFT_ACK timeout period 19: 1 is urgency 7 17:16 1 is multiplier */ 56/* [19:16] SOFT_ACK timeout period 19: 1 is urgency 7 17:16 1 is multiplier */
53#define BAU_MISC_CONTROL_MULT_MASK 3 57#define BAU_MISC_CONTROL_MULT_MASK 3
54 58
@@ -70,25 +74,23 @@
70#define DESC_STATUS_DESTINATION_TIMEOUT 2 74#define DESC_STATUS_DESTINATION_TIMEOUT 2
71#define DESC_STATUS_SOURCE_TIMEOUT 3 75#define DESC_STATUS_SOURCE_TIMEOUT 3
72 76
77#define TIMEOUT_DELAY 10
73/* 78/*
74 * source side threshholds at which message retries print a warning 79 * delay for 'plugged' timeout retries, in microseconds
75 */
76#define SOURCE_TIMEOUT_LIMIT 20
77#define DESTINATION_TIMEOUT_LIMIT 20
78
79/*
80 * misc. delays, in microseconds
81 */ 80 */
82#define THROTTLE_DELAY 10 81#define PLUGGED_DELAY 10
83#define TIMEOUT_DELAY 10
84#define BIOS_TO 1000
85/* BIOS is assumed to set the destination timeout to 1003520 nanoseconds */
86 82
87/* 83/*
88 * threshholds at which to use IPI to free resources 84 * threshholds at which to use IPI to free resources
89 */ 85 */
86/* after this # consecutive 'plugged' timeouts, use IPI to release resources */
90#define PLUGSB4RESET 100 87#define PLUGSB4RESET 100
91#define TIMEOUTSB4RESET 100 88/* after this many consecutive timeouts, use IPI to release resources */
89#define TIMEOUTSB4RESET 1
90/* at this number uses of IPI to release resources, giveup the request */
91#define IPI_RESET_LIMIT 1
92/* after this # consecutive successes, bump up the throttle if it was lowered */
93#define COMPLETE_THRESHOLD 5
92 94
93/* 95/*
94 * number of entries in the destination side payload queue 96 * number of entries in the destination side payload queue
@@ -108,6 +110,13 @@
108#define FLUSH_COMPLETE 4 110#define FLUSH_COMPLETE 4
109 111
110/* 112/*
113 * tuning the action when the numalink network is extremely delayed
114 */
115#define CONGESTED_RESPONSE_US 1000 /* 'long' response time, in microseconds */
116#define CONGESTED_REPS 10 /* long delays averaged over this many broadcasts */
117#define CONGESTED_PERIOD 30 /* time for the bau to be disabled, in seconds */
118
119/*
111 * Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor) 120 * Distribution: 32 bytes (256 bits) (bytes 0-0x1f of descriptor)
112 * If the 'multilevel' flag in the header portion of the descriptor 121 * If the 'multilevel' flag in the header portion of the descriptor
113 * has been set to 0, then endpoint multi-unicast mode is selected. 122 * has been set to 0, then endpoint multi-unicast mode is selected.
@@ -323,14 +332,13 @@ struct bau_control {
323 struct bau_control *uvhub_master; 332 struct bau_control *uvhub_master;
324 struct bau_control *socket_master; 333 struct bau_control *socket_master;
325 unsigned long timeout_interval; 334 unsigned long timeout_interval;
335 unsigned long set_bau_on_time;
326 atomic_t active_descriptor_count; 336 atomic_t active_descriptor_count;
327 int max_concurrent;
328 int max_concurrent_constant;
329 int retry_message_scans;
330 int plugged_tries; 337 int plugged_tries;
331 int timeout_tries; 338 int timeout_tries;
332 int ipi_attempts; 339 int ipi_attempts;
333 int conseccompletes; 340 int conseccompletes;
341 int set_bau_off;
334 short cpu; 342 short cpu;
335 short uvhub_cpu; 343 short uvhub_cpu;
336 short uvhub; 344 short uvhub;
@@ -343,6 +351,19 @@ struct bau_control {
343 spinlock_t masks_lock; 351 spinlock_t masks_lock;
344 spinlock_t uvhub_lock; 352 spinlock_t uvhub_lock;
345 spinlock_t queue_lock; 353 spinlock_t queue_lock;
354 /* tunables */
355 int max_bau_concurrent;
356 int max_bau_concurrent_constant;
357 int plugged_delay;
358 int plugsb4reset;
359 int timeoutsb4reset;
360 int ipi_reset_limit;
361 int complete_threshold;
362 int congested_response_us;
363 int congested_reps;
364 int congested_period;
365 cycles_t period_time;
366 long period_requests;
346}; 367};
347 368
348/* 369/*
diff --git a/arch/x86/kernel/tlb_uv.c b/arch/x86/kernel/tlb_uv.c
index 5506836c4a82..c8661779c51e 100644
--- a/arch/x86/kernel/tlb_uv.c
+++ b/arch/x86/kernel/tlb_uv.c
@@ -8,6 +8,7 @@
8 */ 8 */
9#include <linux/seq_file.h> 9#include <linux/seq_file.h>
10#include <linux/proc_fs.h> 10#include <linux/proc_fs.h>
11#include <linux/debugfs.h>
11#include <linux/kernel.h> 12#include <linux/kernel.h>
12#include <linux/slab.h> 13#include <linux/slab.h>
13 14
@@ -42,12 +43,22 @@ static int timeout_base_ns[] = {
42 167772160 43 167772160
43}; 44};
44static int timeout_us; 45static int timeout_us;
46static int nobau;
45 47
46#define UV_INTD_SOFT_ACK_TIMEOUT_PERIOD 0x000000000bUL 48/* tunables: */
47 49static int max_bau_concurrent = MAX_BAU_CONCURRENT;
48static int uv_bau_max_concurrent __read_mostly; 50static int max_bau_concurrent_constant = MAX_BAU_CONCURRENT;
51static int plugged_delay = PLUGGED_DELAY;
52static int plugsb4reset = PLUGSB4RESET;
53static int timeoutsb4reset = TIMEOUTSB4RESET;
54static int ipi_reset_limit = IPI_RESET_LIMIT;
55static int complete_threshold = COMPLETE_THRESHOLD;
56static int congested_response_us = CONGESTED_RESPONSE_US;
57static int congested_reps = CONGESTED_REPS;
58static int congested_period = CONGESTED_PERIOD;
59static struct dentry *tunables_dir;
60static struct dentry *tunables_file;
49 61
50static int nobau;
51static int __init setup_nobau(char *arg) 62static int __init setup_nobau(char *arg)
52{ 63{
53 nobau = 1; 64 nobau = 1;
@@ -539,23 +550,24 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
539 unsigned long index; 550 unsigned long index;
540 cycles_t time1; 551 cycles_t time1;
541 cycles_t time2; 552 cycles_t time2;
553 cycles_t elapsed;
542 struct ptc_stats *stat = &per_cpu(ptcstats, bcp->cpu); 554 struct ptc_stats *stat = &per_cpu(ptcstats, bcp->cpu);
543 struct bau_control *smaster = bcp->socket_master; 555 struct bau_control *smaster = bcp->socket_master;
544 struct bau_control *hmaster = bcp->uvhub_master; 556 struct bau_control *hmaster = bcp->uvhub_master;
545 557
546 /* 558 /*
547 * Spin here while there are hmaster->max_concurrent or more active 559 * Spin here while there are hmaster->max_bau_concurrent or more active
548 * descriptors. This is the per-uvhub 'throttle'. 560 * descriptors. This is the per-uvhub 'throttle'.
549 */ 561 */
550 if (!atomic_inc_unless_ge(&hmaster->uvhub_lock, 562 if (!atomic_inc_unless_ge(&hmaster->uvhub_lock,
551 &hmaster->active_descriptor_count, 563 &hmaster->active_descriptor_count,
552 hmaster->max_concurrent)) { 564 hmaster->max_bau_concurrent)) {
553 stat->s_throttles++; 565 stat->s_throttles++;
554 do { 566 do {
555 cpu_relax(); 567 cpu_relax();
556 } while (!atomic_inc_unless_ge(&hmaster->uvhub_lock, 568 } while (!atomic_inc_unless_ge(&hmaster->uvhub_lock,
557 &hmaster->active_descriptor_count, 569 &hmaster->active_descriptor_count,
558 hmaster->max_concurrent)); 570 hmaster->max_bau_concurrent));
559 } 571 }
560 572
561 while (hmaster->uvhub_quiesce) 573 while (hmaster->uvhub_quiesce)
@@ -609,9 +621,9 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
609 * that case hardware immediately returns the ERROR 621 * that case hardware immediately returns the ERROR
610 * that looks like a destination timeout. 622 * that looks like a destination timeout.
611 */ 623 */
612 udelay(TIMEOUT_DELAY); 624 udelay(bcp->plugged_delay);
613 bcp->plugged_tries++; 625 bcp->plugged_tries++;
614 if (bcp->plugged_tries >= PLUGSB4RESET) { 626 if (bcp->plugged_tries >= bcp->plugsb4reset) {
615 bcp->plugged_tries = 0; 627 bcp->plugged_tries = 0;
616 quiesce_local_uvhub(hmaster); 628 quiesce_local_uvhub(hmaster);
617 spin_lock(&hmaster->queue_lock); 629 spin_lock(&hmaster->queue_lock);
@@ -623,10 +635,10 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
623 stat->s_resets_plug++; 635 stat->s_resets_plug++;
624 } 636 }
625 } else if (completion_status == FLUSH_RETRY_TIMEOUT) { 637 } else if (completion_status == FLUSH_RETRY_TIMEOUT) {
626 hmaster->max_concurrent = 1; 638 hmaster->max_bau_concurrent = 1;
627 bcp->timeout_tries++; 639 bcp->timeout_tries++;
628 udelay(TIMEOUT_DELAY); 640 udelay(TIMEOUT_DELAY);
629 if (bcp->timeout_tries >= TIMEOUTSB4RESET) { 641 if (bcp->timeout_tries >= bcp->timeoutsb4reset) {
630 bcp->timeout_tries = 0; 642 bcp->timeout_tries = 0;
631 quiesce_local_uvhub(hmaster); 643 quiesce_local_uvhub(hmaster);
632 spin_lock(&hmaster->queue_lock); 644 spin_lock(&hmaster->queue_lock);
@@ -638,7 +650,7 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
638 stat->s_resets_timeout++; 650 stat->s_resets_timeout++;
639 } 651 }
640 } 652 }
641 if (bcp->ipi_attempts >= 3) { 653 if (bcp->ipi_attempts >= bcp->ipi_reset_limit) {
642 bcp->ipi_attempts = 0; 654 bcp->ipi_attempts = 0;
643 completion_status = FLUSH_GIVEUP; 655 completion_status = FLUSH_GIVEUP;
644 break; 656 break;
@@ -648,9 +660,14 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
648 (completion_status == FLUSH_RETRY_TIMEOUT)); 660 (completion_status == FLUSH_RETRY_TIMEOUT));
649 time2 = get_cycles(); 661 time2 = get_cycles();
650 662
651 if ((completion_status == FLUSH_COMPLETE) && (bcp->conseccompletes > 5) 663 bcp->plugged_tries = 0;
652 && (hmaster->max_concurrent < hmaster->max_concurrent_constant)) 664 bcp->timeout_tries = 0;
653 hmaster->max_concurrent++; 665
666 if ((completion_status == FLUSH_COMPLETE) &&
667 (bcp->conseccompletes > bcp->complete_threshold) &&
668 (hmaster->max_bau_concurrent <
669 hmaster->max_bau_concurrent_constant))
670 hmaster->max_bau_concurrent++;
654 671
655 /* 672 /*
656 * hold any cpu not timing out here; no other cpu currently held by 673 * hold any cpu not timing out here; no other cpu currently held by
@@ -661,9 +678,10 @@ const struct cpumask *uv_flush_send_and_wait(struct bau_desc *bau_desc,
661 atomic_dec(&hmaster->active_descriptor_count); 678 atomic_dec(&hmaster->active_descriptor_count);
662 679
663 /* guard against cycles wrap */ 680 /* guard against cycles wrap */
664 if (time2 > time1) 681 if (time2 > time1) {
665 stat->s_time += (time2 - time1); 682 elapsed = time2 - time1;
666 else 683 stat->s_time += elapsed;
684 } else
667 stat->s_requestor--; /* don't count this one */ 685 stat->s_requestor--; /* don't count this one */
668 if (completion_status == FLUSH_COMPLETE && try > 1) 686 if (completion_status == FLUSH_COMPLETE && try > 1)
669 stat->s_retriesok++; 687 stat->s_retriesok++;
@@ -730,10 +748,12 @@ const struct cpumask *uv_flush_tlb_others(const struct cpumask *cpumask,
730 struct ptc_stats *stat; 748 struct ptc_stats *stat;
731 struct bau_control *bcp; 749 struct bau_control *bcp;
732 750
751 /* kernel was booted 'nobau' */
733 if (nobau) 752 if (nobau)
734 return cpumask; 753 return cpumask;
735 754
736 bcp = &per_cpu(bau_control, cpu); 755 bcp = &per_cpu(bau_control, cpu);
756
737 /* 757 /*
738 * Each sending cpu has a per-cpu mask which it fills from the caller's 758 * Each sending cpu has a per-cpu mask which it fills from the caller's
739 * cpu mask. Only remote cpus are converted to uvhubs and copied. 759 * cpu mask. Only remote cpus are converted to uvhubs and copied.
@@ -970,6 +990,7 @@ static int uv_ptc_seq_show(struct seq_file *file, void *data)
970 stat->s_resets_plug, stat->s_resets_timeout, 990 stat->s_resets_plug, stat->s_resets_timeout,
971 stat->s_giveup, stat->s_stimeout, 991 stat->s_giveup, stat->s_stimeout,
972 stat->s_busy, stat->s_throttles); 992 stat->s_busy, stat->s_throttles);
993
973 /* destination side statistics */ 994 /* destination side statistics */
974 seq_printf(file, 995 seq_printf(file,
975 "%lx %ld %ld %ld %ld %ld %ld %ld %ld %ld %ld %ld\n", 996 "%lx %ld %ld %ld %ld %ld %ld %ld %ld %ld %ld %ld\n",
@@ -986,9 +1007,28 @@ static int uv_ptc_seq_show(struct seq_file *file, void *data)
986} 1007}
987 1008
988/* 1009/*
1010 * Display the tunables thru debugfs
1011 */
1012static ssize_t tunables_read(struct file *file, char __user *userbuf,
1013 size_t count, loff_t *ppos)
1014{
1015 char buf[300];
1016 int ret;
1017
1018 ret = snprintf(buf, 300, "%s %s %s\n%d %d %d %d %d %d %d %d %d\n",
1019 "max_bau_concurrent plugged_delay plugsb4reset",
1020 "timeoutsb4reset ipi_reset_limit complete_threshold",
1021 "congested_response_us congested_reps congested_period",
1022 max_bau_concurrent, plugged_delay, plugsb4reset,
1023 timeoutsb4reset, ipi_reset_limit, complete_threshold,
1024 congested_response_us, congested_reps, congested_period);
1025
1026 return simple_read_from_buffer(userbuf, count, ppos, buf, ret);
1027}
1028
1029/*
989 * -1: resetf the statistics 1030 * -1: resetf the statistics
990 * 0: display meaning of the statistics 1031 * 0: display meaning of the statistics
991 * >0: maximum concurrent active descriptors per uvhub (throttle)
992 */ 1032 */
993static ssize_t uv_ptc_proc_write(struct file *file, const char __user *user, 1033static ssize_t uv_ptc_proc_write(struct file *file, const char __user *user,
994 size_t count, loff_t *data) 1034 size_t count, loff_t *data)
@@ -997,7 +1037,6 @@ static ssize_t uv_ptc_proc_write(struct file *file, const char __user *user,
997 long input_arg; 1037 long input_arg;
998 char optstr[64]; 1038 char optstr[64];
999 struct ptc_stats *stat; 1039 struct ptc_stats *stat;
1000 struct bau_control *bcp;
1001 1040
1002 if (count == 0 || count > sizeof(optstr)) 1041 if (count == 0 || count > sizeof(optstr))
1003 return -EINVAL; 1042 return -EINVAL;
@@ -1078,24 +1117,149 @@ static ssize_t uv_ptc_proc_write(struct file *file, const char __user *user,
1078 stat = &per_cpu(ptcstats, cpu); 1117 stat = &per_cpu(ptcstats, cpu);
1079 memset(stat, 0, sizeof(struct ptc_stats)); 1118 memset(stat, 0, sizeof(struct ptc_stats));
1080 } 1119 }
1081 } else { 1120 }
1082 uv_bau_max_concurrent = input_arg; 1121
1083 bcp = &per_cpu(bau_control, smp_processor_id()); 1122 return count;
1084 if (uv_bau_max_concurrent < 1 || 1123}
1085 uv_bau_max_concurrent > bcp->cpus_in_uvhub) { 1124
1086 printk(KERN_DEBUG 1125static int local_atoi(const char *name)
1087 "Error: BAU max concurrent %d; %d is invalid\n", 1126{
1088 bcp->max_concurrent, uv_bau_max_concurrent); 1127 int val = 0;
1089 return -EINVAL; 1128
1090 } 1129 for (;; name++) {
1091 printk(KERN_DEBUG "Set BAU max concurrent:%d\n", 1130 switch (*name) {
1092 uv_bau_max_concurrent); 1131 case '0' ... '9':
1093 for_each_present_cpu(cpu) { 1132 val = 10*val+(*name-'0');
1094 bcp = &per_cpu(bau_control, cpu); 1133 break;
1095 bcp->max_concurrent = uv_bau_max_concurrent; 1134 default:
1135 return val;
1096 } 1136 }
1097 } 1137 }
1138}
1139
1140/*
1141 * set the tunables
1142 * 0 values reset them to defaults
1143 */
1144static ssize_t tunables_write(struct file *file, const char __user *user,
1145 size_t count, loff_t *data)
1146{
1147 int cpu;
1148 int cnt = 0;
1149 int val;
1150 char *p;
1151 char *q;
1152 char instr[64];
1153 struct bau_control *bcp;
1098 1154
1155 if (count == 0 || count > sizeof(instr)-1)
1156 return -EINVAL;
1157 if (copy_from_user(instr, user, count))
1158 return -EFAULT;
1159
1160 instr[count] = '\0';
1161 /* count the fields */
1162 p = instr + strspn(instr, WHITESPACE);
1163 q = p;
1164 for (; *p; p = q + strspn(q, WHITESPACE)) {
1165 q = p + strcspn(p, WHITESPACE);
1166 cnt++;
1167 if (q == p)
1168 break;
1169 }
1170 if (cnt != 9) {
1171 printk(KERN_INFO "bau tunable error: should be 9 numbers\n");
1172 return -EINVAL;
1173 }
1174
1175 p = instr + strspn(instr, WHITESPACE);
1176 q = p;
1177 for (cnt = 0; *p; p = q + strspn(q, WHITESPACE), cnt++) {
1178 q = p + strcspn(p, WHITESPACE);
1179 val = local_atoi(p);
1180 switch (cnt) {
1181 case 0:
1182 if (val == 0) {
1183 max_bau_concurrent = MAX_BAU_CONCURRENT;
1184 max_bau_concurrent_constant =
1185 MAX_BAU_CONCURRENT;
1186 continue;
1187 }
1188 bcp = &per_cpu(bau_control, smp_processor_id());
1189 if (val < 1 || val > bcp->cpus_in_uvhub) {
1190 printk(KERN_DEBUG
1191 "Error: BAU max concurrent %d is invalid\n",
1192 val);
1193 return -EINVAL;
1194 }
1195 max_bau_concurrent = val;
1196 max_bau_concurrent_constant = val;
1197 continue;
1198 case 1:
1199 if (val == 0)
1200 plugged_delay = PLUGGED_DELAY;
1201 else
1202 plugged_delay = val;
1203 continue;
1204 case 2:
1205 if (val == 0)
1206 plugsb4reset = PLUGSB4RESET;
1207 else
1208 plugsb4reset = val;
1209 continue;
1210 case 3:
1211 if (val == 0)
1212 timeoutsb4reset = TIMEOUTSB4RESET;
1213 else
1214 timeoutsb4reset = val;
1215 continue;
1216 case 4:
1217 if (val == 0)
1218 ipi_reset_limit = IPI_RESET_LIMIT;
1219 else
1220 ipi_reset_limit = val;
1221 continue;
1222 case 5:
1223 if (val == 0)
1224 complete_threshold = COMPLETE_THRESHOLD;
1225 else
1226 complete_threshold = val;
1227 continue;
1228 case 6:
1229 if (val == 0)
1230 congested_response_us = CONGESTED_RESPONSE_US;
1231 else
1232 congested_response_us = val;
1233 continue;
1234 case 7:
1235 if (val == 0)
1236 congested_reps = CONGESTED_REPS;
1237 else
1238 congested_reps = val;
1239 continue;
1240 case 8:
1241 if (val == 0)
1242 congested_period = CONGESTED_PERIOD;
1243 else
1244 congested_period = val;
1245 continue;
1246 }
1247 if (q == p)
1248 break;
1249 }
1250 for_each_present_cpu(cpu) {
1251 bcp = &per_cpu(bau_control, cpu);
1252 bcp->max_bau_concurrent = max_bau_concurrent;
1253 bcp->max_bau_concurrent_constant = max_bau_concurrent;
1254 bcp->plugged_delay = plugged_delay;
1255 bcp->plugsb4reset = plugsb4reset;
1256 bcp->timeoutsb4reset = timeoutsb4reset;
1257 bcp->ipi_reset_limit = ipi_reset_limit;
1258 bcp->complete_threshold = complete_threshold;
1259 bcp->congested_response_us = congested_response_us;
1260 bcp->congested_reps = congested_reps;
1261 bcp->congested_period = congested_period;
1262 }
1099 return count; 1263 return count;
1100} 1264}
1101 1265
@@ -1111,6 +1275,11 @@ static int uv_ptc_proc_open(struct inode *inode, struct file *file)
1111 return seq_open(file, &uv_ptc_seq_ops); 1275 return seq_open(file, &uv_ptc_seq_ops);
1112} 1276}
1113 1277
1278static int tunables_open(struct inode *inode, struct file *file)
1279{
1280 return 0;
1281}
1282
1114static const struct file_operations proc_uv_ptc_operations = { 1283static const struct file_operations proc_uv_ptc_operations = {
1115 .open = uv_ptc_proc_open, 1284 .open = uv_ptc_proc_open,
1116 .read = seq_read, 1285 .read = seq_read,
@@ -1119,6 +1288,12 @@ static const struct file_operations proc_uv_ptc_operations = {
1119 .release = seq_release, 1288 .release = seq_release,
1120}; 1289};
1121 1290
1291static const struct file_operations tunables_fops = {
1292 .open = tunables_open,
1293 .read = tunables_read,
1294 .write = tunables_write,
1295};
1296
1122static int __init uv_ptc_init(void) 1297static int __init uv_ptc_init(void)
1123{ 1298{
1124 struct proc_dir_entry *proc_uv_ptc; 1299 struct proc_dir_entry *proc_uv_ptc;
@@ -1133,6 +1308,20 @@ static int __init uv_ptc_init(void)
1133 UV_PTC_BASENAME); 1308 UV_PTC_BASENAME);
1134 return -EINVAL; 1309 return -EINVAL;
1135 } 1310 }
1311
1312 tunables_dir = debugfs_create_dir(UV_BAU_TUNABLES_DIR, NULL);
1313 if (!tunables_dir) {
1314 printk(KERN_ERR "unable to create debugfs directory %s\n",
1315 UV_BAU_TUNABLES_DIR);
1316 return -EINVAL;
1317 }
1318 tunables_file = debugfs_create_file(UV_BAU_TUNABLES_FILE, 0600,
1319 tunables_dir, NULL, &tunables_fops);
1320 if (!tunables_file) {
1321 printk(KERN_ERR "unable to create debugfs file %s\n",
1322 UV_BAU_TUNABLES_FILE);
1323 return -EINVAL;
1324 }
1136 return 0; 1325 return 0;
1137} 1326}
1138 1327
@@ -1336,15 +1525,12 @@ static void uv_init_per_cpu(int nuvhubs)
1336 bcp = &per_cpu(bau_control, cpu); 1525 bcp = &per_cpu(bau_control, cpu);
1337 memset(bcp, 0, sizeof(struct bau_control)); 1526 memset(bcp, 0, sizeof(struct bau_control));
1338 spin_lock_init(&bcp->masks_lock); 1527 spin_lock_init(&bcp->masks_lock);
1339 bcp->max_concurrent = uv_bau_max_concurrent;
1340 pnode = uv_cpu_hub_info(cpu)->pnode; 1528 pnode = uv_cpu_hub_info(cpu)->pnode;
1341 uvhub = uv_cpu_hub_info(cpu)->numa_blade_id; 1529 uvhub = uv_cpu_hub_info(cpu)->numa_blade_id;
1342 bdp = &uvhub_descs[uvhub]; 1530 bdp = &uvhub_descs[uvhub];
1343 bdp->num_cpus++; 1531 bdp->num_cpus++;
1344 bdp->uvhub = uvhub; 1532 bdp->uvhub = uvhub;
1345 bdp->pnode = pnode; 1533 bdp->pnode = pnode;
1346 /* time interval to catch a hardware stay-busy bug */
1347 bcp->timeout_interval = microsec_2_cycles(2*timeout_us);
1348 /* kludge: assume uv_hub.h is constant */ 1534 /* kludge: assume uv_hub.h is constant */
1349 socket = (cpu_physical_id(cpu)>>5)&1; 1535 socket = (cpu_physical_id(cpu)>>5)&1;
1350 if (socket >= bdp->num_sockets) 1536 if (socket >= bdp->num_sockets)
@@ -1380,6 +1566,21 @@ static void uv_init_per_cpu(int nuvhubs)
1380 } 1566 }
1381 } 1567 }
1382 kfree(uvhub_descs); 1568 kfree(uvhub_descs);
1569 for_each_present_cpu(cpu) {
1570 bcp = &per_cpu(bau_control, cpu);
1571 /* time interval to catch a hardware stay-busy bug */
1572 bcp->timeout_interval = microsec_2_cycles(2*timeout_us);
1573 bcp->max_bau_concurrent = max_bau_concurrent;
1574 bcp->max_bau_concurrent_constant = max_bau_concurrent;
1575 bcp->plugged_delay = plugged_delay;
1576 bcp->plugsb4reset = plugsb4reset;
1577 bcp->timeoutsb4reset = timeoutsb4reset;
1578 bcp->ipi_reset_limit = ipi_reset_limit;
1579 bcp->complete_threshold = complete_threshold;
1580 bcp->congested_response_us = congested_response_us;
1581 bcp->congested_reps = congested_reps;
1582 bcp->congested_period = congested_period;
1583 }
1383} 1584}
1384 1585
1385/* 1586/*
@@ -1404,7 +1605,7 @@ static int __init uv_bau_init(void)
1404 zalloc_cpumask_var_node(&per_cpu(uv_flush_tlb_mask, cur_cpu), 1605 zalloc_cpumask_var_node(&per_cpu(uv_flush_tlb_mask, cur_cpu),
1405 GFP_KERNEL, cpu_to_node(cur_cpu)); 1606 GFP_KERNEL, cpu_to_node(cur_cpu));
1406 1607
1407 uv_bau_max_concurrent = MAX_BAU_CONCURRENT; 1608 max_bau_concurrent = MAX_BAU_CONCURRENT;
1408 uv_nshift = uv_hub_info->m_val; 1609 uv_nshift = uv_hub_info->m_val;
1409 uv_mmask = (1UL << uv_hub_info->m_val) - 1; 1610 uv_mmask = (1UL << uv_hub_info->m_val) - 1;
1410 nuvhubs = uv_num_possible_blades(); 1611 nuvhubs = uv_num_possible_blades();
@@ -1437,4 +1638,4 @@ static int __init uv_bau_init(void)
1437 return 0; 1638 return 0;
1438} 1639}
1439core_initcall(uv_bau_init); 1640core_initcall(uv_bau_init);
1440core_initcall(uv_ptc_init); 1641fs_initcall(uv_ptc_init);