diff options
Diffstat (limited to 'lib')
| -rw-r--r-- | lib/Kconfig | 8 | ||||
| -rw-r--r-- | lib/Kconfig.debug | 42 | ||||
| -rw-r--r-- | lib/Makefile | 2 | ||||
| -rw-r--r-- | lib/debugobjects.c | 11 | ||||
| -rw-r--r-- | lib/dynamic_debug.c | 190 | ||||
| -rw-r--r-- | lib/jedec_ddr_data.c | 135 | ||||
| -rw-r--r-- | lib/kobject.c | 14 | ||||
| -rw-r--r-- | lib/list_debug.c | 22 | ||||
| -rw-r--r-- | lib/raid6/Makefile | 2 | ||||
| -rw-r--r-- | lib/raid6/algos.c | 127 | ||||
| -rw-r--r-- | lib/raid6/mktables.c | 25 | ||||
| -rw-r--r-- | lib/raid6/recov.c | 15 | ||||
| -rw-r--r-- | lib/raid6/recov_ssse3.c | 335 | ||||
| -rw-r--r-- | lib/raid6/test/Makefile | 2 | ||||
| -rw-r--r-- | lib/raid6/test/test.c | 32 | ||||
| -rw-r--r-- | lib/raid6/x86.h | 15 | ||||
| -rw-r--r-- | lib/rational.c | 2 |
17 files changed, 823 insertions, 156 deletions
diff --git a/lib/Kconfig b/lib/Kconfig index 4a8aba2e5cc0..0e25c03939e3 100644 --- a/lib/Kconfig +++ b/lib/Kconfig | |||
| @@ -353,6 +353,14 @@ config CORDIC | |||
| 353 | This option provides an implementation of the CORDIC algorithm; | 353 | This option provides an implementation of the CORDIC algorithm; |
| 354 | calculations are in fixed point. Module will be called cordic. | 354 | calculations are in fixed point. Module will be called cordic. |
| 355 | 355 | ||
| 356 | config DDR | ||
| 357 | bool "JEDEC DDR data" | ||
| 358 | help | ||
| 359 | Data from JEDEC specs for DDR SDRAM memories, | ||
| 360 | particularly the AC timing parameters and addressing | ||
| 361 | information. This data is useful for drivers handling | ||
| 362 | DDR SDRAM controllers. | ||
| 363 | |||
| 356 | config MPILIB | 364 | config MPILIB |
| 357 | tristate | 365 | tristate |
| 358 | select CLZ_TAB | 366 | select CLZ_TAB |
diff --git a/lib/Kconfig.debug b/lib/Kconfig.debug index 6777153f18f3..a42d3ae39648 100644 --- a/lib/Kconfig.debug +++ b/lib/Kconfig.debug | |||
| @@ -3,12 +3,16 @@ config PRINTK_TIME | |||
| 3 | bool "Show timing information on printks" | 3 | bool "Show timing information on printks" |
| 4 | depends on PRINTK | 4 | depends on PRINTK |
| 5 | help | 5 | help |
| 6 | Selecting this option causes timing information to be | 6 | Selecting this option causes time stamps of the printk() |
| 7 | included in printk output. This allows you to measure | 7 | messages to be added to the output of the syslog() system |
| 8 | the interval between kernel operations, including bootup | 8 | call and at the console. |
| 9 | operations. This is useful for identifying long delays | 9 | |
| 10 | in kernel startup. Or add printk.time=1 at boot-time. | 10 | The timestamp is always recorded internally, and exported |
| 11 | See Documentation/kernel-parameters.txt | 11 | to /dev/kmsg. This flag just specifies if the timestamp should |
| 12 | be included, not that the timestamp is recorded. | ||
| 13 | |||
| 14 | The behavior is also controlled by the kernel command line | ||
| 15 | parameter printk.time=1. See Documentation/kernel-parameters.txt | ||
| 12 | 16 | ||
| 13 | config DEFAULT_MESSAGE_LOGLEVEL | 17 | config DEFAULT_MESSAGE_LOGLEVEL |
| 14 | int "Default message log level (1-7)" | 18 | int "Default message log level (1-7)" |
| @@ -70,6 +74,15 @@ config STRIP_ASM_SYMS | |||
| 70 | that look like '.Lxxx') so they don't pollute the output of | 74 | that look like '.Lxxx') so they don't pollute the output of |
| 71 | get_wchan() and suchlike. | 75 | get_wchan() and suchlike. |
| 72 | 76 | ||
| 77 | config READABLE_ASM | ||
| 78 | bool "Generate readable assembler code" | ||
| 79 | depends on DEBUG_KERNEL | ||
| 80 | help | ||
| 81 | Disable some compiler optimizations that tend to generate human unreadable | ||
| 82 | assembler output. This may make the kernel slightly slower, but it helps | ||
| 83 | to keep kernel developers who have to stare a lot at assembler listings | ||
| 84 | sane. | ||
| 85 | |||
| 73 | config UNUSED_SYMBOLS | 86 | config UNUSED_SYMBOLS |
| 74 | bool "Enable unused/obsolete exported symbols" | 87 | bool "Enable unused/obsolete exported symbols" |
| 75 | default y if X86 | 88 | default y if X86 |
| @@ -1205,8 +1218,13 @@ config DYNAMIC_DEBUG | |||
| 1205 | otherwise be available at runtime. These messages can then be | 1218 | otherwise be available at runtime. These messages can then be |
| 1206 | enabled/disabled based on various levels of scope - per source file, | 1219 | enabled/disabled based on various levels of scope - per source file, |
| 1207 | function, module, format string, and line number. This mechanism | 1220 | function, module, format string, and line number. This mechanism |
| 1208 | implicitly enables all pr_debug() and dev_dbg() calls. The impact of | 1221 | implicitly compiles in all pr_debug() and dev_dbg() calls, which |
| 1209 | this compile option is a larger kernel text size of about 2%. | 1222 | enlarges the kernel text size by about 2%. |
| 1223 | |||
| 1224 | If a source file is compiled with DEBUG flag set, any | ||
| 1225 | pr_debug() calls in it are enabled by default, but can be | ||
| 1226 | disabled at runtime as below. Note that DEBUG flag is | ||
| 1227 | turned on by many CONFIG_*DEBUG* options. | ||
| 1210 | 1228 | ||
| 1211 | Usage: | 1229 | Usage: |
| 1212 | 1230 | ||
| @@ -1223,16 +1241,16 @@ config DYNAMIC_DEBUG | |||
| 1223 | lineno : line number of the debug statement | 1241 | lineno : line number of the debug statement |
| 1224 | module : module that contains the debug statement | 1242 | module : module that contains the debug statement |
| 1225 | function : function that contains the debug statement | 1243 | function : function that contains the debug statement |
| 1226 | flags : 'p' means the line is turned 'on' for printing | 1244 | flags : '=p' means the line is turned 'on' for printing |
| 1227 | format : the format used for the debug statement | 1245 | format : the format used for the debug statement |
| 1228 | 1246 | ||
| 1229 | From a live system: | 1247 | From a live system: |
| 1230 | 1248 | ||
| 1231 | nullarbor:~ # cat <debugfs>/dynamic_debug/control | 1249 | nullarbor:~ # cat <debugfs>/dynamic_debug/control |
| 1232 | # filename:lineno [module]function flags format | 1250 | # filename:lineno [module]function flags format |
| 1233 | fs/aio.c:222 [aio]__put_ioctx - "__put_ioctx:\040freeing\040%p\012" | 1251 | fs/aio.c:222 [aio]__put_ioctx =_ "__put_ioctx:\040freeing\040%p\012" |
| 1234 | fs/aio.c:248 [aio]ioctx_alloc - "ENOMEM:\040nr_events\040too\040high\012" | 1252 | fs/aio.c:248 [aio]ioctx_alloc =_ "ENOMEM:\040nr_events\040too\040high\012" |
| 1235 | fs/aio.c:1770 [aio]sys_io_cancel - "calling\040cancel\012" | 1253 | fs/aio.c:1770 [aio]sys_io_cancel =_ "calling\040cancel\012" |
| 1236 | 1254 | ||
| 1237 | Example usage: | 1255 | Example usage: |
| 1238 | 1256 | ||
diff --git a/lib/Makefile b/lib/Makefile index 18515f0267c4..74290c9e2864 100644 --- a/lib/Makefile +++ b/lib/Makefile | |||
| @@ -123,6 +123,8 @@ obj-$(CONFIG_SIGNATURE) += digsig.o | |||
| 123 | 123 | ||
| 124 | obj-$(CONFIG_CLZ_TAB) += clz_tab.o | 124 | obj-$(CONFIG_CLZ_TAB) += clz_tab.o |
| 125 | 125 | ||
| 126 | obj-$(CONFIG_DDR) += jedec_ddr_data.o | ||
| 127 | |||
| 126 | hostprogs-y := gen_crc32table | 128 | hostprogs-y := gen_crc32table |
| 127 | clean-files := crc32table.h | 129 | clean-files := crc32table.h |
| 128 | 130 | ||
diff --git a/lib/debugobjects.c b/lib/debugobjects.c index 0ab9ae8057f0..d11808ca4bc4 100644 --- a/lib/debugobjects.c +++ b/lib/debugobjects.c | |||
| @@ -79,30 +79,29 @@ static const char *obj_states[ODEBUG_STATE_MAX] = { | |||
| 79 | [ODEBUG_STATE_NOTAVAILABLE] = "not available", | 79 | [ODEBUG_STATE_NOTAVAILABLE] = "not available", |
| 80 | }; | 80 | }; |
| 81 | 81 | ||
| 82 | static int fill_pool(void) | 82 | static void fill_pool(void) |
| 83 | { | 83 | { |
| 84 | gfp_t gfp = GFP_ATOMIC | __GFP_NORETRY | __GFP_NOWARN; | 84 | gfp_t gfp = GFP_ATOMIC | __GFP_NORETRY | __GFP_NOWARN; |
| 85 | struct debug_obj *new; | 85 | struct debug_obj *new; |
| 86 | unsigned long flags; | 86 | unsigned long flags; |
| 87 | 87 | ||
| 88 | if (likely(obj_pool_free >= ODEBUG_POOL_MIN_LEVEL)) | 88 | if (likely(obj_pool_free >= ODEBUG_POOL_MIN_LEVEL)) |
| 89 | return obj_pool_free; | 89 | return; |
| 90 | 90 | ||
| 91 | if (unlikely(!obj_cache)) | 91 | if (unlikely(!obj_cache)) |
| 92 | return obj_pool_free; | 92 | return; |
| 93 | 93 | ||
| 94 | while (obj_pool_free < ODEBUG_POOL_MIN_LEVEL) { | 94 | while (obj_pool_free < ODEBUG_POOL_MIN_LEVEL) { |
| 95 | 95 | ||
| 96 | new = kmem_cache_zalloc(obj_cache, gfp); | 96 | new = kmem_cache_zalloc(obj_cache, gfp); |
| 97 | if (!new) | 97 | if (!new) |
| 98 | return obj_pool_free; | 98 | return; |
| 99 | 99 | ||
| 100 | raw_spin_lock_irqsave(&pool_lock, flags); | 100 | raw_spin_lock_irqsave(&pool_lock, flags); |
| 101 | hlist_add_head(&new->node, &obj_pool); | 101 | hlist_add_head(&new->node, &obj_pool); |
| 102 | obj_pool_free++; | 102 | obj_pool_free++; |
| 103 | raw_spin_unlock_irqrestore(&pool_lock, flags); | 103 | raw_spin_unlock_irqrestore(&pool_lock, flags); |
| 104 | } | 104 | } |
| 105 | return obj_pool_free; | ||
| 106 | } | 105 | } |
| 107 | 106 | ||
| 108 | /* | 107 | /* |
| @@ -1052,10 +1051,10 @@ static int __init debug_objects_replace_static_objects(void) | |||
| 1052 | cnt++; | 1051 | cnt++; |
| 1053 | } | 1052 | } |
| 1054 | } | 1053 | } |
| 1054 | local_irq_enable(); | ||
| 1055 | 1055 | ||
| 1056 | printk(KERN_DEBUG "ODEBUG: %d of %d active objects replaced\n", cnt, | 1056 | printk(KERN_DEBUG "ODEBUG: %d of %d active objects replaced\n", cnt, |
| 1057 | obj_pool_used); | 1057 | obj_pool_used); |
| 1058 | local_irq_enable(); | ||
| 1059 | return 0; | 1058 | return 0; |
| 1060 | free: | 1059 | free: |
| 1061 | hlist_for_each_entry_safe(obj, node, tmp, &objects, node) { | 1060 | hlist_for_each_entry_safe(obj, node, tmp, &objects, node) { |
diff --git a/lib/dynamic_debug.c b/lib/dynamic_debug.c index 310c753cf83e..7ca29a0a3019 100644 --- a/lib/dynamic_debug.c +++ b/lib/dynamic_debug.c | |||
| @@ -107,20 +107,22 @@ static char *ddebug_describe_flags(struct _ddebug *dp, char *buf, | |||
| 107 | return buf; | 107 | return buf; |
| 108 | } | 108 | } |
| 109 | 109 | ||
| 110 | #define vpr_info_dq(q, msg) \ | 110 | #define vpr_info(fmt, ...) \ |
| 111 | do { \ | 111 | if (verbose) do { pr_info(fmt, ##__VA_ARGS__); } while (0) |
| 112 | if (verbose) \ | 112 | |
| 113 | /* trim last char off format print */ \ | 113 | #define vpr_info_dq(q, msg) \ |
| 114 | pr_info("%s: func=\"%s\" file=\"%s\" " \ | 114 | do { \ |
| 115 | "module=\"%s\" format=\"%.*s\" " \ | 115 | /* trim last char off format print */ \ |
| 116 | "lineno=%u-%u", \ | 116 | vpr_info("%s: func=\"%s\" file=\"%s\" " \ |
| 117 | msg, \ | 117 | "module=\"%s\" format=\"%.*s\" " \ |
| 118 | q->function ? q->function : "", \ | 118 | "lineno=%u-%u", \ |
| 119 | q->filename ? q->filename : "", \ | 119 | msg, \ |
| 120 | q->module ? q->module : "", \ | 120 | q->function ? q->function : "", \ |
| 121 | (int)(q->format ? strlen(q->format) - 1 : 0), \ | 121 | q->filename ? q->filename : "", \ |
| 122 | q->format ? q->format : "", \ | 122 | q->module ? q->module : "", \ |
| 123 | q->first_lineno, q->last_lineno); \ | 123 | (int)(q->format ? strlen(q->format) - 1 : 0), \ |
| 124 | q->format ? q->format : "", \ | ||
| 125 | q->first_lineno, q->last_lineno); \ | ||
| 124 | } while (0) | 126 | } while (0) |
| 125 | 127 | ||
| 126 | /* | 128 | /* |
| @@ -180,12 +182,11 @@ static int ddebug_change(const struct ddebug_query *query, | |||
| 180 | if (newflags == dp->flags) | 182 | if (newflags == dp->flags) |
| 181 | continue; | 183 | continue; |
| 182 | dp->flags = newflags; | 184 | dp->flags = newflags; |
| 183 | if (verbose) | 185 | vpr_info("changed %s:%d [%s]%s =%s\n", |
| 184 | pr_info("changed %s:%d [%s]%s =%s\n", | 186 | trim_prefix(dp->filename), dp->lineno, |
| 185 | trim_prefix(dp->filename), dp->lineno, | 187 | dt->mod_name, dp->function, |
| 186 | dt->mod_name, dp->function, | 188 | ddebug_describe_flags(dp, flagbuf, |
| 187 | ddebug_describe_flags(dp, flagbuf, | 189 | sizeof(flagbuf))); |
| 188 | sizeof(flagbuf))); | ||
| 189 | } | 190 | } |
| 190 | } | 191 | } |
| 191 | mutex_unlock(&ddebug_lock); | 192 | mutex_unlock(&ddebug_lock); |
| @@ -337,7 +338,7 @@ static int check_set(const char **dest, char *src, char *name) | |||
| 337 | * Returns 0 on success, <0 on error. | 338 | * Returns 0 on success, <0 on error. |
| 338 | */ | 339 | */ |
| 339 | static int ddebug_parse_query(char *words[], int nwords, | 340 | static int ddebug_parse_query(char *words[], int nwords, |
| 340 | struct ddebug_query *query) | 341 | struct ddebug_query *query, const char *modname) |
| 341 | { | 342 | { |
| 342 | unsigned int i; | 343 | unsigned int i; |
| 343 | int rc; | 344 | int rc; |
| @@ -347,6 +348,10 @@ static int ddebug_parse_query(char *words[], int nwords, | |||
| 347 | return -EINVAL; | 348 | return -EINVAL; |
| 348 | memset(query, 0, sizeof(*query)); | 349 | memset(query, 0, sizeof(*query)); |
| 349 | 350 | ||
| 351 | if (modname) | ||
| 352 | /* support $modname.dyndbg=<multiple queries> */ | ||
| 353 | query->module = modname; | ||
| 354 | |||
| 350 | for (i = 0 ; i < nwords ; i += 2) { | 355 | for (i = 0 ; i < nwords ; i += 2) { |
| 351 | if (!strcmp(words[i], "func")) | 356 | if (!strcmp(words[i], "func")) |
| 352 | rc = check_set(&query->function, words[i+1], "func"); | 357 | rc = check_set(&query->function, words[i+1], "func"); |
| @@ -410,8 +415,7 @@ static int ddebug_parse_flags(const char *str, unsigned int *flagsp, | |||
| 410 | default: | 415 | default: |
| 411 | return -EINVAL; | 416 | return -EINVAL; |
| 412 | } | 417 | } |
| 413 | if (verbose) | 418 | vpr_info("op='%c'\n", op); |
| 414 | pr_info("op='%c'\n", op); | ||
| 415 | 419 | ||
| 416 | for ( ; *str ; ++str) { | 420 | for ( ; *str ; ++str) { |
| 417 | for (i = ARRAY_SIZE(opt_array) - 1; i >= 0; i--) { | 421 | for (i = ARRAY_SIZE(opt_array) - 1; i >= 0; i--) { |
| @@ -423,8 +427,7 @@ static int ddebug_parse_flags(const char *str, unsigned int *flagsp, | |||
| 423 | if (i < 0) | 427 | if (i < 0) |
| 424 | return -EINVAL; | 428 | return -EINVAL; |
| 425 | } | 429 | } |
| 426 | if (verbose) | 430 | vpr_info("flags=0x%x\n", flags); |
| 427 | pr_info("flags=0x%x\n", flags); | ||
| 428 | 431 | ||
| 429 | /* calculate final *flagsp, *maskp according to mask and op */ | 432 | /* calculate final *flagsp, *maskp according to mask and op */ |
| 430 | switch (op) { | 433 | switch (op) { |
| @@ -441,12 +444,11 @@ static int ddebug_parse_flags(const char *str, unsigned int *flagsp, | |||
| 441 | *flagsp = 0; | 444 | *flagsp = 0; |
| 442 | break; | 445 | break; |
| 443 | } | 446 | } |
| 444 | if (verbose) | 447 | vpr_info("*flagsp=0x%x *maskp=0x%x\n", *flagsp, *maskp); |
| 445 | pr_info("*flagsp=0x%x *maskp=0x%x\n", *flagsp, *maskp); | ||
| 446 | return 0; | 448 | return 0; |
| 447 | } | 449 | } |
| 448 | 450 | ||
| 449 | static int ddebug_exec_query(char *query_string) | 451 | static int ddebug_exec_query(char *query_string, const char *modname) |
| 450 | { | 452 | { |
| 451 | unsigned int flags = 0, mask = 0; | 453 | unsigned int flags = 0, mask = 0; |
| 452 | struct ddebug_query query; | 454 | struct ddebug_query query; |
| @@ -457,7 +459,7 @@ static int ddebug_exec_query(char *query_string) | |||
| 457 | nwords = ddebug_tokenize(query_string, words, MAXWORDS); | 459 | nwords = ddebug_tokenize(query_string, words, MAXWORDS); |
| 458 | if (nwords <= 0) | 460 | if (nwords <= 0) |
| 459 | return -EINVAL; | 461 | return -EINVAL; |
| 460 | if (ddebug_parse_query(words, nwords-1, &query)) | 462 | if (ddebug_parse_query(words, nwords-1, &query, modname)) |
| 461 | return -EINVAL; | 463 | return -EINVAL; |
| 462 | if (ddebug_parse_flags(words[nwords-1], &flags, &mask)) | 464 | if (ddebug_parse_flags(words[nwords-1], &flags, &mask)) |
| 463 | return -EINVAL; | 465 | return -EINVAL; |
| @@ -473,7 +475,7 @@ static int ddebug_exec_query(char *query_string) | |||
| 473 | last error or number of matching callsites. Module name is either | 475 | last error or number of matching callsites. Module name is either |
| 474 | in param (for boot arg) or perhaps in query string. | 476 | in param (for boot arg) or perhaps in query string. |
| 475 | */ | 477 | */ |
| 476 | static int ddebug_exec_queries(char *query) | 478 | static int ddebug_exec_queries(char *query, const char *modname) |
| 477 | { | 479 | { |
| 478 | char *split; | 480 | char *split; |
| 479 | int i, errs = 0, exitcode = 0, rc, nfound = 0; | 481 | int i, errs = 0, exitcode = 0, rc, nfound = 0; |
| @@ -487,10 +489,9 @@ static int ddebug_exec_queries(char *query) | |||
| 487 | if (!query || !*query || *query == '#') | 489 | if (!query || !*query || *query == '#') |
| 488 | continue; | 490 | continue; |
| 489 | 491 | ||
| 490 | if (verbose) | 492 | vpr_info("query %d: \"%s\"\n", i, query); |
| 491 | pr_info("query %d: \"%s\"\n", i, query); | ||
| 492 | 493 | ||
| 493 | rc = ddebug_exec_query(query); | 494 | rc = ddebug_exec_query(query, modname); |
| 494 | if (rc < 0) { | 495 | if (rc < 0) { |
| 495 | errs++; | 496 | errs++; |
| 496 | exitcode = rc; | 497 | exitcode = rc; |
| @@ -498,7 +499,7 @@ static int ddebug_exec_queries(char *query) | |||
| 498 | nfound += rc; | 499 | nfound += rc; |
| 499 | i++; | 500 | i++; |
| 500 | } | 501 | } |
| 501 | pr_info("processed %d queries, with %d matches, %d errs\n", | 502 | vpr_info("processed %d queries, with %d matches, %d errs\n", |
| 502 | i, nfound, errs); | 503 | i, nfound, errs); |
| 503 | 504 | ||
| 504 | if (exitcode) | 505 | if (exitcode) |
| @@ -653,10 +654,9 @@ static ssize_t ddebug_proc_write(struct file *file, const char __user *ubuf, | |||
| 653 | return -EFAULT; | 654 | return -EFAULT; |
| 654 | } | 655 | } |
| 655 | tmpbuf[len] = '\0'; | 656 | tmpbuf[len] = '\0'; |
| 656 | if (verbose) | 657 | vpr_info("read %d bytes from userspace\n", (int)len); |
| 657 | pr_info("read %d bytes from userspace\n", (int)len); | ||
| 658 | 658 | ||
| 659 | ret = ddebug_exec_queries(tmpbuf); | 659 | ret = ddebug_exec_queries(tmpbuf, NULL); |
| 660 | kfree(tmpbuf); | 660 | kfree(tmpbuf); |
| 661 | if (ret < 0) | 661 | if (ret < 0) |
| 662 | return ret; | 662 | return ret; |
| @@ -717,8 +717,7 @@ static void *ddebug_proc_start(struct seq_file *m, loff_t *pos) | |||
| 717 | struct _ddebug *dp; | 717 | struct _ddebug *dp; |
| 718 | int n = *pos; | 718 | int n = *pos; |
| 719 | 719 | ||
| 720 | if (verbose) | 720 | vpr_info("called m=%p *pos=%lld\n", m, (unsigned long long)*pos); |
| 721 | pr_info("called m=%p *pos=%lld\n", m, (unsigned long long)*pos); | ||
| 722 | 721 | ||
| 723 | mutex_lock(&ddebug_lock); | 722 | mutex_lock(&ddebug_lock); |
| 724 | 723 | ||
| @@ -742,9 +741,8 @@ static void *ddebug_proc_next(struct seq_file *m, void *p, loff_t *pos) | |||
| 742 | struct ddebug_iter *iter = m->private; | 741 | struct ddebug_iter *iter = m->private; |
| 743 | struct _ddebug *dp; | 742 | struct _ddebug *dp; |
| 744 | 743 | ||
| 745 | if (verbose) | 744 | vpr_info("called m=%p p=%p *pos=%lld\n", |
| 746 | pr_info("called m=%p p=%p *pos=%lld\n", | 745 | m, p, (unsigned long long)*pos); |
| 747 | m, p, (unsigned long long)*pos); | ||
| 748 | 746 | ||
| 749 | if (p == SEQ_START_TOKEN) | 747 | if (p == SEQ_START_TOKEN) |
| 750 | dp = ddebug_iter_first(iter); | 748 | dp = ddebug_iter_first(iter); |
| @@ -766,8 +764,7 @@ static int ddebug_proc_show(struct seq_file *m, void *p) | |||
| 766 | struct _ddebug *dp = p; | 764 | struct _ddebug *dp = p; |
| 767 | char flagsbuf[10]; | 765 | char flagsbuf[10]; |
| 768 | 766 | ||
| 769 | if (verbose) | 767 | vpr_info("called m=%p p=%p\n", m, p); |
| 770 | pr_info("called m=%p p=%p\n", m, p); | ||
| 771 | 768 | ||
| 772 | if (p == SEQ_START_TOKEN) { | 769 | if (p == SEQ_START_TOKEN) { |
| 773 | seq_puts(m, | 770 | seq_puts(m, |
| @@ -791,8 +788,7 @@ static int ddebug_proc_show(struct seq_file *m, void *p) | |||
| 791 | */ | 788 | */ |
| 792 | static void ddebug_proc_stop(struct seq_file *m, void *p) | 789 | static void ddebug_proc_stop(struct seq_file *m, void *p) |
| 793 | { | 790 | { |
| 794 | if (verbose) | 791 | vpr_info("called m=%p p=%p\n", m, p); |
| 795 | pr_info("called m=%p p=%p\n", m, p); | ||
| 796 | mutex_unlock(&ddebug_lock); | 792 | mutex_unlock(&ddebug_lock); |
| 797 | } | 793 | } |
| 798 | 794 | ||
| @@ -815,8 +811,7 @@ static int ddebug_proc_open(struct inode *inode, struct file *file) | |||
| 815 | struct ddebug_iter *iter; | 811 | struct ddebug_iter *iter; |
| 816 | int err; | 812 | int err; |
| 817 | 813 | ||
| 818 | if (verbose) | 814 | vpr_info("called\n"); |
| 819 | pr_info("called\n"); | ||
| 820 | 815 | ||
| 821 | iter = kzalloc(sizeof(*iter), GFP_KERNEL); | 816 | iter = kzalloc(sizeof(*iter), GFP_KERNEL); |
| 822 | if (iter == NULL) | 817 | if (iter == NULL) |
| @@ -866,12 +861,51 @@ int ddebug_add_module(struct _ddebug *tab, unsigned int n, | |||
| 866 | list_add_tail(&dt->link, &ddebug_tables); | 861 | list_add_tail(&dt->link, &ddebug_tables); |
| 867 | mutex_unlock(&ddebug_lock); | 862 | mutex_unlock(&ddebug_lock); |
| 868 | 863 | ||
| 869 | if (verbose) | 864 | vpr_info("%u debug prints in module %s\n", n, dt->mod_name); |
| 870 | pr_info("%u debug prints in module %s\n", n, dt->mod_name); | ||
| 871 | return 0; | 865 | return 0; |
| 872 | } | 866 | } |
| 873 | EXPORT_SYMBOL_GPL(ddebug_add_module); | 867 | EXPORT_SYMBOL_GPL(ddebug_add_module); |
| 874 | 868 | ||
| 869 | /* helper for ddebug_dyndbg_(boot|module)_param_cb */ | ||
| 870 | static int ddebug_dyndbg_param_cb(char *param, char *val, | ||
| 871 | const char *modname, int on_err) | ||
| 872 | { | ||
| 873 | char *sep; | ||
| 874 | |||
| 875 | sep = strchr(param, '.'); | ||
| 876 | if (sep) { | ||
| 877 | /* needed only for ddebug_dyndbg_boot_param_cb */ | ||
| 878 | *sep = '\0'; | ||
| 879 | modname = param; | ||
| 880 | param = sep + 1; | ||
| 881 | } | ||
| 882 | if (strcmp(param, "dyndbg")) | ||
| 883 | return on_err; /* determined by caller */ | ||
| 884 | |||
| 885 | ddebug_exec_queries((val ? val : "+p"), modname); | ||
| 886 | |||
| 887 | return 0; /* query failure shouldnt stop module load */ | ||
| 888 | } | ||
| 889 | |||
| 890 | /* handle both dyndbg and $module.dyndbg params at boot */ | ||
| 891 | static int ddebug_dyndbg_boot_param_cb(char *param, char *val, | ||
| 892 | const char *unused) | ||
| 893 | { | ||
| 894 | vpr_info("%s=\"%s\"\n", param, val); | ||
| 895 | return ddebug_dyndbg_param_cb(param, val, NULL, 0); | ||
| 896 | } | ||
| 897 | |||
| 898 | /* | ||
| 899 | * modprobe foo finds foo.params in boot-args, strips "foo.", and | ||
| 900 | * passes them to load_module(). This callback gets unknown params, | ||
| 901 | * processes dyndbg params, rejects others. | ||
| 902 | */ | ||
| 903 | int ddebug_dyndbg_module_param_cb(char *param, char *val, const char *module) | ||
| 904 | { | ||
| 905 | vpr_info("module: %s %s=\"%s\"\n", module, param, val); | ||
| 906 | return ddebug_dyndbg_param_cb(param, val, module, -ENOENT); | ||
| 907 | } | ||
| 908 | |||
| 875 | static void ddebug_table_free(struct ddebug_table *dt) | 909 | static void ddebug_table_free(struct ddebug_table *dt) |
| 876 | { | 910 | { |
| 877 | list_del_init(&dt->link); | 911 | list_del_init(&dt->link); |
| @@ -888,8 +922,7 @@ int ddebug_remove_module(const char *mod_name) | |||
| 888 | struct ddebug_table *dt, *nextdt; | 922 | struct ddebug_table *dt, *nextdt; |
| 889 | int ret = -ENOENT; | 923 | int ret = -ENOENT; |
| 890 | 924 | ||
| 891 | if (verbose) | 925 | vpr_info("removing module \"%s\"\n", mod_name); |
| 892 | pr_info("removing module \"%s\"\n", mod_name); | ||
| 893 | 926 | ||
| 894 | mutex_lock(&ddebug_lock); | 927 | mutex_lock(&ddebug_lock); |
| 895 | list_for_each_entry_safe(dt, nextdt, &ddebug_tables, link) { | 928 | list_for_each_entry_safe(dt, nextdt, &ddebug_tables, link) { |
| @@ -940,8 +973,10 @@ static int __init dynamic_debug_init(void) | |||
| 940 | { | 973 | { |
| 941 | struct _ddebug *iter, *iter_start; | 974 | struct _ddebug *iter, *iter_start; |
| 942 | const char *modname = NULL; | 975 | const char *modname = NULL; |
| 976 | char *cmdline; | ||
| 943 | int ret = 0; | 977 | int ret = 0; |
| 944 | int n = 0; | 978 | int n = 0, entries = 0, modct = 0; |
| 979 | int verbose_bytes = 0; | ||
| 945 | 980 | ||
| 946 | if (__start___verbose == __stop___verbose) { | 981 | if (__start___verbose == __stop___verbose) { |
| 947 | pr_warn("_ddebug table is empty in a " | 982 | pr_warn("_ddebug table is empty in a " |
| @@ -952,10 +987,15 @@ static int __init dynamic_debug_init(void) | |||
| 952 | modname = iter->modname; | 987 | modname = iter->modname; |
| 953 | iter_start = iter; | 988 | iter_start = iter; |
| 954 | for (; iter < __stop___verbose; iter++) { | 989 | for (; iter < __stop___verbose; iter++) { |
| 990 | entries++; | ||
| 991 | verbose_bytes += strlen(iter->modname) + strlen(iter->function) | ||
| 992 | + strlen(iter->filename) + strlen(iter->format); | ||
| 993 | |||
| 955 | if (strcmp(modname, iter->modname)) { | 994 | if (strcmp(modname, iter->modname)) { |
| 995 | modct++; | ||
| 956 | ret = ddebug_add_module(iter_start, n, modname); | 996 | ret = ddebug_add_module(iter_start, n, modname); |
| 957 | if (ret) | 997 | if (ret) |
| 958 | goto out_free; | 998 | goto out_err; |
| 959 | n = 0; | 999 | n = 0; |
| 960 | modname = iter->modname; | 1000 | modname = iter->modname; |
| 961 | iter_start = iter; | 1001 | iter_start = iter; |
| @@ -964,29 +1004,45 @@ static int __init dynamic_debug_init(void) | |||
| 964 | } | 1004 | } |
| 965 | ret = ddebug_add_module(iter_start, n, modname); | 1005 | ret = ddebug_add_module(iter_start, n, modname); |
| 966 | if (ret) | 1006 | if (ret) |
| 967 | goto out_free; | 1007 | goto out_err; |
| 1008 | |||
| 1009 | ddebug_init_success = 1; | ||
| 1010 | vpr_info("%d modules, %d entries and %d bytes in ddebug tables," | ||
| 1011 | " %d bytes in (readonly) verbose section\n", | ||
| 1012 | modct, entries, (int)( modct * sizeof(struct ddebug_table)), | ||
| 1013 | verbose_bytes + (int)(__stop___verbose - __start___verbose)); | ||
| 968 | 1014 | ||
| 969 | /* ddebug_query boot param got passed -> set it up */ | 1015 | /* apply ddebug_query boot param, dont unload tables on err */ |
| 970 | if (ddebug_setup_string[0] != '\0') { | 1016 | if (ddebug_setup_string[0] != '\0') { |
| 971 | ret = ddebug_exec_queries(ddebug_setup_string); | 1017 | pr_warn("ddebug_query param name is deprecated," |
| 1018 | " change it to dyndbg\n"); | ||
| 1019 | ret = ddebug_exec_queries(ddebug_setup_string, NULL); | ||
| 972 | if (ret < 0) | 1020 | if (ret < 0) |
| 973 | pr_warn("Invalid ddebug boot param %s", | 1021 | pr_warn("Invalid ddebug boot param %s", |
| 974 | ddebug_setup_string); | 1022 | ddebug_setup_string); |
| 975 | else | 1023 | else |
| 976 | pr_info("%d changes by ddebug_query\n", ret); | 1024 | pr_info("%d changes by ddebug_query\n", ret); |
| 977 | |||
| 978 | /* keep tables even on ddebug_query parse error */ | ||
| 979 | ret = 0; | ||
| 980 | } | 1025 | } |
| 1026 | /* now that ddebug tables are loaded, process all boot args | ||
| 1027 | * again to find and activate queries given in dyndbg params. | ||
| 1028 | * While this has already been done for known boot params, it | ||
| 1029 | * ignored the unknown ones (dyndbg in particular). Reusing | ||
| 1030 | * parse_args avoids ad-hoc parsing. This will also attempt | ||
| 1031 | * to activate queries for not-yet-loaded modules, which is | ||
| 1032 | * slightly noisy if verbose, but harmless. | ||
| 1033 | */ | ||
| 1034 | cmdline = kstrdup(saved_command_line, GFP_KERNEL); | ||
| 1035 | parse_args("dyndbg params", cmdline, NULL, | ||
| 1036 | 0, 0, 0, &ddebug_dyndbg_boot_param_cb); | ||
| 1037 | kfree(cmdline); | ||
| 1038 | return 0; | ||
| 981 | 1039 | ||
| 982 | out_free: | 1040 | out_err: |
| 983 | if (ret) | 1041 | ddebug_remove_all_tables(); |
| 984 | ddebug_remove_all_tables(); | ||
| 985 | else | ||
| 986 | ddebug_init_success = 1; | ||
| 987 | return 0; | 1042 | return 0; |
| 988 | } | 1043 | } |
| 989 | /* Allow early initialization for boot messages via boot param */ | 1044 | /* Allow early initialization for boot messages via boot param */ |
| 990 | arch_initcall(dynamic_debug_init); | 1045 | early_initcall(dynamic_debug_init); |
| 1046 | |||
| 991 | /* Debugfs setup must be done later */ | 1047 | /* Debugfs setup must be done later */ |
| 992 | module_init(dynamic_debug_init_debugfs); | 1048 | fs_initcall(dynamic_debug_init_debugfs); |
diff --git a/lib/jedec_ddr_data.c b/lib/jedec_ddr_data.c new file mode 100644 index 000000000000..6d2cbf1d567f --- /dev/null +++ b/lib/jedec_ddr_data.c | |||
| @@ -0,0 +1,135 @@ | |||
| 1 | /* | ||
| 2 | * DDR addressing details and AC timing parameters from JEDEC specs | ||
| 3 | * | ||
| 4 | * Copyright (C) 2012 Texas Instruments, Inc. | ||
| 5 | * | ||
| 6 | * Aneesh V <aneesh@ti.com> | ||
| 7 | * | ||
| 8 | * This program is free software; you can redistribute it and/or modify | ||
| 9 | * it under the terms of the GNU General Public License version 2 as | ||
| 10 | * published by the Free Software Foundation. | ||
| 11 | */ | ||
| 12 | |||
| 13 | #include <memory/jedec_ddr.h> | ||
| 14 | #include <linux/module.h> | ||
| 15 | |||
| 16 | /* LPDDR2 addressing details from JESD209-2 section 2.4 */ | ||
| 17 | const struct lpddr2_addressing | ||
| 18 | lpddr2_jedec_addressing_table[NUM_DDR_ADDR_TABLE_ENTRIES] = { | ||
| 19 | {B4, T_REFI_15_6, T_RFC_90}, /* 64M */ | ||
| 20 | {B4, T_REFI_15_6, T_RFC_90}, /* 128M */ | ||
| 21 | {B4, T_REFI_7_8, T_RFC_90}, /* 256M */ | ||
| 22 | {B4, T_REFI_7_8, T_RFC_90}, /* 512M */ | ||
| 23 | {B8, T_REFI_7_8, T_RFC_130}, /* 1GS4 */ | ||
| 24 | {B8, T_REFI_3_9, T_RFC_130}, /* 2GS4 */ | ||
| 25 | {B8, T_REFI_3_9, T_RFC_130}, /* 4G */ | ||
| 26 | {B8, T_REFI_3_9, T_RFC_210}, /* 8G */ | ||
| 27 | {B4, T_REFI_7_8, T_RFC_130}, /* 1GS2 */ | ||
| 28 | {B4, T_REFI_3_9, T_RFC_130}, /* 2GS2 */ | ||
| 29 | }; | ||
| 30 | EXPORT_SYMBOL_GPL(lpddr2_jedec_addressing_table); | ||
| 31 | |||
| 32 | /* LPDDR2 AC timing parameters from JESD209-2 section 12 */ | ||
| 33 | const struct lpddr2_timings | ||
| 34 | lpddr2_jedec_timings[NUM_DDR_TIMING_TABLE_ENTRIES] = { | ||
| 35 | /* Speed bin 400(200 MHz) */ | ||
| 36 | [0] = { | ||
| 37 | .max_freq = 200000000, | ||
| 38 | .min_freq = 10000000, | ||
| 39 | .tRPab = 21000, | ||
| 40 | .tRCD = 18000, | ||
| 41 | .tWR = 15000, | ||
| 42 | .tRAS_min = 42000, | ||
| 43 | .tRRD = 10000, | ||
| 44 | .tWTR = 10000, | ||
| 45 | .tXP = 7500, | ||
| 46 | .tRTP = 7500, | ||
| 47 | .tCKESR = 15000, | ||
| 48 | .tDQSCK_max = 5500, | ||
| 49 | .tFAW = 50000, | ||
| 50 | .tZQCS = 90000, | ||
| 51 | .tZQCL = 360000, | ||
| 52 | .tZQinit = 1000000, | ||
| 53 | .tRAS_max_ns = 70000, | ||
| 54 | .tDQSCK_max_derated = 6000, | ||
| 55 | }, | ||
| 56 | /* Speed bin 533(266 MHz) */ | ||
| 57 | [1] = { | ||
| 58 | .max_freq = 266666666, | ||
| 59 | .min_freq = 10000000, | ||
| 60 | .tRPab = 21000, | ||
| 61 | .tRCD = 18000, | ||
| 62 | .tWR = 15000, | ||
| 63 | .tRAS_min = 42000, | ||
| 64 | .tRRD = 10000, | ||
| 65 | .tWTR = 7500, | ||
| 66 | .tXP = 7500, | ||
| 67 | .tRTP = 7500, | ||
| 68 | .tCKESR = 15000, | ||
| 69 | .tDQSCK_max = 5500, | ||
| 70 | .tFAW = 50000, | ||
| 71 | .tZQCS = 90000, | ||
| 72 | .tZQCL = 360000, | ||
| 73 | .tZQinit = 1000000, | ||
| 74 | .tRAS_max_ns = 70000, | ||
| 75 | .tDQSCK_max_derated = 6000, | ||
| 76 | }, | ||
| 77 | /* Speed bin 800(400 MHz) */ | ||
| 78 | [2] = { | ||
| 79 | .max_freq = 400000000, | ||
| 80 | .min_freq = 10000000, | ||
| 81 | .tRPab = 21000, | ||
| 82 | .tRCD = 18000, | ||
| 83 | .tWR = 15000, | ||
| 84 | .tRAS_min = 42000, | ||
| 85 | .tRRD = 10000, | ||
| 86 | .tWTR = 7500, | ||
| 87 | .tXP = 7500, | ||
| 88 | .tRTP = 7500, | ||
| 89 | .tCKESR = 15000, | ||
| 90 | .tDQSCK_max = 5500, | ||
| 91 | .tFAW = 50000, | ||
| 92 | .tZQCS = 90000, | ||
| 93 | .tZQCL = 360000, | ||
| 94 | .tZQinit = 1000000, | ||
| 95 | .tRAS_max_ns = 70000, | ||
| 96 | .tDQSCK_max_derated = 6000, | ||
| 97 | }, | ||
| 98 | /* Speed bin 1066(533 MHz) */ | ||
| 99 | [3] = { | ||
| 100 | .max_freq = 533333333, | ||
| 101 | .min_freq = 10000000, | ||
| 102 | .tRPab = 21000, | ||
| 103 | .tRCD = 18000, | ||
| 104 | .tWR = 15000, | ||
| 105 | .tRAS_min = 42000, | ||
| 106 | .tRRD = 10000, | ||
| 107 | .tWTR = 7500, | ||
| 108 | .tXP = 7500, | ||
| 109 | .tRTP = 7500, | ||
| 110 | .tCKESR = 15000, | ||
| 111 | .tDQSCK_max = 5500, | ||
| 112 | .tFAW = 50000, | ||
| 113 | .tZQCS = 90000, | ||
| 114 | .tZQCL = 360000, | ||
| 115 | .tZQinit = 1000000, | ||
| 116 | .tRAS_max_ns = 70000, | ||
| 117 | .tDQSCK_max_derated = 5620, | ||
| 118 | }, | ||
| 119 | }; | ||
| 120 | EXPORT_SYMBOL_GPL(lpddr2_jedec_timings); | ||
| 121 | |||
| 122 | const struct lpddr2_min_tck lpddr2_jedec_min_tck = { | ||
| 123 | .tRPab = 3, | ||
| 124 | .tRCD = 3, | ||
| 125 | .tWR = 3, | ||
| 126 | .tRASmin = 3, | ||
| 127 | .tRRD = 2, | ||
| 128 | .tWTR = 2, | ||
| 129 | .tXP = 2, | ||
| 130 | .tRTP = 2, | ||
| 131 | .tCKE = 3, | ||
| 132 | .tCKESR = 3, | ||
| 133 | .tFAW = 8 | ||
| 134 | }; | ||
| 135 | EXPORT_SYMBOL_GPL(lpddr2_jedec_min_tck); | ||
diff --git a/lib/kobject.c b/lib/kobject.c index aeefa8bc8b1c..e07ee1fcd6f1 100644 --- a/lib/kobject.c +++ b/lib/kobject.c | |||
| @@ -47,13 +47,11 @@ static int populate_dir(struct kobject *kobj) | |||
| 47 | static int create_dir(struct kobject *kobj) | 47 | static int create_dir(struct kobject *kobj) |
| 48 | { | 48 | { |
| 49 | int error = 0; | 49 | int error = 0; |
| 50 | if (kobject_name(kobj)) { | 50 | error = sysfs_create_dir(kobj); |
| 51 | error = sysfs_create_dir(kobj); | 51 | if (!error) { |
| 52 | if (!error) { | 52 | error = populate_dir(kobj); |
| 53 | error = populate_dir(kobj); | 53 | if (error) |
| 54 | if (error) | 54 | sysfs_remove_dir(kobj); |
| 55 | sysfs_remove_dir(kobj); | ||
| 56 | } | ||
| 57 | } | 55 | } |
| 58 | return error; | 56 | return error; |
| 59 | } | 57 | } |
| @@ -634,7 +632,7 @@ struct kobject *kobject_create(void) | |||
| 634 | /** | 632 | /** |
| 635 | * kobject_create_and_add - create a struct kobject dynamically and register it with sysfs | 633 | * kobject_create_and_add - create a struct kobject dynamically and register it with sysfs |
| 636 | * | 634 | * |
| 637 | * @name: the name for the kset | 635 | * @name: the name for the kobject |
| 638 | * @parent: the parent kobject of this kobject, if any. | 636 | * @parent: the parent kobject of this kobject, if any. |
| 639 | * | 637 | * |
| 640 | * This function creates a kobject structure dynamically and registers it | 638 | * This function creates a kobject structure dynamically and registers it |
diff --git a/lib/list_debug.c b/lib/list_debug.c index 982b850d4e7a..3810b481f940 100644 --- a/lib/list_debug.c +++ b/lib/list_debug.c | |||
| @@ -10,6 +10,7 @@ | |||
| 10 | #include <linux/list.h> | 10 | #include <linux/list.h> |
| 11 | #include <linux/bug.h> | 11 | #include <linux/bug.h> |
| 12 | #include <linux/kernel.h> | 12 | #include <linux/kernel.h> |
| 13 | #include <linux/rculist.h> | ||
| 13 | 14 | ||
| 14 | /* | 15 | /* |
| 15 | * Insert a new entry between two known consecutive entries. | 16 | * Insert a new entry between two known consecutive entries. |
| @@ -75,3 +76,24 @@ void list_del(struct list_head *entry) | |||
| 75 | entry->prev = LIST_POISON2; | 76 | entry->prev = LIST_POISON2; |
| 76 | } | 77 | } |
| 77 | EXPORT_SYMBOL(list_del); | 78 | EXPORT_SYMBOL(list_del); |
| 79 | |||
| 80 | /* | ||
| 81 | * RCU variants. | ||
| 82 | */ | ||
| 83 | void __list_add_rcu(struct list_head *new, | ||
| 84 | struct list_head *prev, struct list_head *next) | ||
| 85 | { | ||
| 86 | WARN(next->prev != prev, | ||
| 87 | "list_add_rcu corruption. next->prev should be " | ||
| 88 | "prev (%p), but was %p. (next=%p).\n", | ||
| 89 | prev, next->prev, next); | ||
| 90 | WARN(prev->next != next, | ||
| 91 | "list_add_rcu corruption. prev->next should be " | ||
| 92 | "next (%p), but was %p. (prev=%p).\n", | ||
| 93 | next, prev->next, prev); | ||
| 94 | new->next = next; | ||
| 95 | new->prev = prev; | ||
| 96 | rcu_assign_pointer(list_next_rcu(prev), new); | ||
| 97 | next->prev = new; | ||
| 98 | } | ||
| 99 | EXPORT_SYMBOL(__list_add_rcu); | ||
diff --git a/lib/raid6/Makefile b/lib/raid6/Makefile index 8a38102770f3..de06dfe165b8 100644 --- a/lib/raid6/Makefile +++ b/lib/raid6/Makefile | |||
| @@ -1,6 +1,6 @@ | |||
| 1 | obj-$(CONFIG_RAID6_PQ) += raid6_pq.o | 1 | obj-$(CONFIG_RAID6_PQ) += raid6_pq.o |
| 2 | 2 | ||
| 3 | raid6_pq-y += algos.o recov.o tables.o int1.o int2.o int4.o \ | 3 | raid6_pq-y += algos.o recov.o recov_ssse3.o tables.o int1.o int2.o int4.o \ |
| 4 | int8.o int16.o int32.o altivec1.o altivec2.o altivec4.o \ | 4 | int8.o int16.o int32.o altivec1.o altivec2.o altivec4.o \ |
| 5 | altivec8.o mmx.o sse1.o sse2.o | 5 | altivec8.o mmx.o sse1.o sse2.o |
| 6 | hostprogs-y += mktables | 6 | hostprogs-y += mktables |
diff --git a/lib/raid6/algos.c b/lib/raid6/algos.c index 8b02f60ffc86..589f5f50ad2e 100644 --- a/lib/raid6/algos.c +++ b/lib/raid6/algos.c | |||
| @@ -17,11 +17,11 @@ | |||
| 17 | */ | 17 | */ |
| 18 | 18 | ||
| 19 | #include <linux/raid/pq.h> | 19 | #include <linux/raid/pq.h> |
| 20 | #include <linux/module.h> | ||
| 21 | #ifndef __KERNEL__ | 20 | #ifndef __KERNEL__ |
| 22 | #include <sys/mman.h> | 21 | #include <sys/mman.h> |
| 23 | #include <stdio.h> | 22 | #include <stdio.h> |
| 24 | #else | 23 | #else |
| 24 | #include <linux/module.h> | ||
| 25 | #include <linux/gfp.h> | 25 | #include <linux/gfp.h> |
| 26 | #if !RAID6_USE_EMPTY_ZERO_PAGE | 26 | #if !RAID6_USE_EMPTY_ZERO_PAGE |
| 27 | /* In .bss so it's zeroed */ | 27 | /* In .bss so it's zeroed */ |
| @@ -34,10 +34,6 @@ struct raid6_calls raid6_call; | |||
| 34 | EXPORT_SYMBOL_GPL(raid6_call); | 34 | EXPORT_SYMBOL_GPL(raid6_call); |
| 35 | 35 | ||
| 36 | const struct raid6_calls * const raid6_algos[] = { | 36 | const struct raid6_calls * const raid6_algos[] = { |
| 37 | &raid6_intx1, | ||
| 38 | &raid6_intx2, | ||
| 39 | &raid6_intx4, | ||
| 40 | &raid6_intx8, | ||
| 41 | #if defined(__ia64__) | 37 | #if defined(__ia64__) |
| 42 | &raid6_intx16, | 38 | &raid6_intx16, |
| 43 | &raid6_intx32, | 39 | &raid6_intx32, |
| @@ -61,6 +57,24 @@ const struct raid6_calls * const raid6_algos[] = { | |||
| 61 | &raid6_altivec4, | 57 | &raid6_altivec4, |
| 62 | &raid6_altivec8, | 58 | &raid6_altivec8, |
| 63 | #endif | 59 | #endif |
| 60 | &raid6_intx1, | ||
| 61 | &raid6_intx2, | ||
| 62 | &raid6_intx4, | ||
| 63 | &raid6_intx8, | ||
| 64 | NULL | ||
| 65 | }; | ||
| 66 | |||
| 67 | void (*raid6_2data_recov)(int, size_t, int, int, void **); | ||
| 68 | EXPORT_SYMBOL_GPL(raid6_2data_recov); | ||
| 69 | |||
| 70 | void (*raid6_datap_recov)(int, size_t, int, void **); | ||
| 71 | EXPORT_SYMBOL_GPL(raid6_datap_recov); | ||
| 72 | |||
| 73 | const struct raid6_recov_calls *const raid6_recov_algos[] = { | ||
| 74 | #if (defined(__i386__) || defined(__x86_64__)) && !defined(__arch_um__) | ||
| 75 | &raid6_recov_ssse3, | ||
| 76 | #endif | ||
| 77 | &raid6_recov_intx1, | ||
| 64 | NULL | 78 | NULL |
| 65 | }; | 79 | }; |
| 66 | 80 | ||
| @@ -72,59 +86,55 @@ const struct raid6_calls * const raid6_algos[] = { | |||
| 72 | #define time_before(x, y) ((x) < (y)) | 86 | #define time_before(x, y) ((x) < (y)) |
| 73 | #endif | 87 | #endif |
| 74 | 88 | ||
| 75 | /* Try to pick the best algorithm */ | 89 | static inline const struct raid6_recov_calls *raid6_choose_recov(void) |
| 76 | /* This code uses the gfmul table as convenient data set to abuse */ | ||
| 77 | |||
| 78 | int __init raid6_select_algo(void) | ||
| 79 | { | 90 | { |
| 80 | const struct raid6_calls * const * algo; | 91 | const struct raid6_recov_calls *const *algo; |
| 81 | const struct raid6_calls * best; | 92 | const struct raid6_recov_calls *best; |
| 82 | char *syndromes; | ||
| 83 | void *dptrs[(65536/PAGE_SIZE)+2]; | ||
| 84 | int i, disks; | ||
| 85 | unsigned long perf, bestperf; | ||
| 86 | int bestprefer; | ||
| 87 | unsigned long j0, j1; | ||
| 88 | 93 | ||
| 89 | disks = (65536/PAGE_SIZE)+2; | 94 | for (best = NULL, algo = raid6_recov_algos; *algo; algo++) |
| 90 | for ( i = 0 ; i < disks-2 ; i++ ) { | 95 | if (!best || (*algo)->priority > best->priority) |
| 91 | dptrs[i] = ((char *)raid6_gfmul) + PAGE_SIZE*i; | 96 | if (!(*algo)->valid || (*algo)->valid()) |
| 92 | } | 97 | best = *algo; |
| 93 | 98 | ||
| 94 | /* Normal code - use a 2-page allocation to avoid D$ conflict */ | 99 | if (best) { |
| 95 | syndromes = (void *) __get_free_pages(GFP_KERNEL, 1); | 100 | raid6_2data_recov = best->data2; |
| 101 | raid6_datap_recov = best->datap; | ||
| 96 | 102 | ||
| 97 | if ( !syndromes ) { | 103 | printk("raid6: using %s recovery algorithm\n", best->name); |
| 98 | printk("raid6: Yikes! No memory available.\n"); | 104 | } else |
| 99 | return -ENOMEM; | 105 | printk("raid6: Yikes! No recovery algorithm found!\n"); |
| 100 | } | ||
| 101 | 106 | ||
| 102 | dptrs[disks-2] = syndromes; | 107 | return best; |
| 103 | dptrs[disks-1] = syndromes + PAGE_SIZE; | 108 | } |
| 109 | |||
| 110 | static inline const struct raid6_calls *raid6_choose_gen( | ||
| 111 | void *(*const dptrs)[(65536/PAGE_SIZE)+2], const int disks) | ||
| 112 | { | ||
| 113 | unsigned long perf, bestperf, j0, j1; | ||
| 114 | const struct raid6_calls *const *algo; | ||
| 115 | const struct raid6_calls *best; | ||
| 104 | 116 | ||
| 105 | bestperf = 0; bestprefer = 0; best = NULL; | 117 | for (bestperf = 0, best = NULL, algo = raid6_algos; *algo; algo++) { |
| 118 | if (!best || (*algo)->prefer >= best->prefer) { | ||
| 119 | if ((*algo)->valid && !(*algo)->valid()) | ||
| 120 | continue; | ||
| 106 | 121 | ||
| 107 | for ( algo = raid6_algos ; *algo ; algo++ ) { | ||
| 108 | if ( !(*algo)->valid || (*algo)->valid() ) { | ||
| 109 | perf = 0; | 122 | perf = 0; |
| 110 | 123 | ||
| 111 | preempt_disable(); | 124 | preempt_disable(); |
| 112 | j0 = jiffies; | 125 | j0 = jiffies; |
| 113 | while ( (j1 = jiffies) == j0 ) | 126 | while ((j1 = jiffies) == j0) |
| 114 | cpu_relax(); | 127 | cpu_relax(); |
| 115 | while (time_before(jiffies, | 128 | while (time_before(jiffies, |
| 116 | j1 + (1<<RAID6_TIME_JIFFIES_LG2))) { | 129 | j1 + (1<<RAID6_TIME_JIFFIES_LG2))) { |
| 117 | (*algo)->gen_syndrome(disks, PAGE_SIZE, dptrs); | 130 | (*algo)->gen_syndrome(disks, PAGE_SIZE, *dptrs); |
| 118 | perf++; | 131 | perf++; |
| 119 | } | 132 | } |
| 120 | preempt_enable(); | 133 | preempt_enable(); |
| 121 | 134 | ||
| 122 | if ( (*algo)->prefer > bestprefer || | 135 | if (perf > bestperf) { |
| 123 | ((*algo)->prefer == bestprefer && | ||
| 124 | perf > bestperf) ) { | ||
| 125 | best = *algo; | ||
| 126 | bestprefer = best->prefer; | ||
| 127 | bestperf = perf; | 136 | bestperf = perf; |
| 137 | best = *algo; | ||
| 128 | } | 138 | } |
| 129 | printk("raid6: %-8s %5ld MB/s\n", (*algo)->name, | 139 | printk("raid6: %-8s %5ld MB/s\n", (*algo)->name, |
| 130 | (perf*HZ) >> (20-16+RAID6_TIME_JIFFIES_LG2)); | 140 | (perf*HZ) >> (20-16+RAID6_TIME_JIFFIES_LG2)); |
| @@ -139,9 +149,46 @@ int __init raid6_select_algo(void) | |||
| 139 | } else | 149 | } else |
| 140 | printk("raid6: Yikes! No algorithm found!\n"); | 150 | printk("raid6: Yikes! No algorithm found!\n"); |
| 141 | 151 | ||
| 152 | return best; | ||
| 153 | } | ||
| 154 | |||
| 155 | |||
| 156 | /* Try to pick the best algorithm */ | ||
| 157 | /* This code uses the gfmul table as convenient data set to abuse */ | ||
| 158 | |||
| 159 | int __init raid6_select_algo(void) | ||
| 160 | { | ||
| 161 | const int disks = (65536/PAGE_SIZE)+2; | ||
| 162 | |||
| 163 | const struct raid6_calls *gen_best; | ||
| 164 | const struct raid6_recov_calls *rec_best; | ||
| 165 | char *syndromes; | ||
| 166 | void *dptrs[(65536/PAGE_SIZE)+2]; | ||
| 167 | int i; | ||
| 168 | |||
| 169 | for (i = 0; i < disks-2; i++) | ||
| 170 | dptrs[i] = ((char *)raid6_gfmul) + PAGE_SIZE*i; | ||
| 171 | |||
| 172 | /* Normal code - use a 2-page allocation to avoid D$ conflict */ | ||
| 173 | syndromes = (void *) __get_free_pages(GFP_KERNEL, 1); | ||
| 174 | |||
| 175 | if (!syndromes) { | ||
| 176 | printk("raid6: Yikes! No memory available.\n"); | ||
| 177 | return -ENOMEM; | ||
| 178 | } | ||
| 179 | |||
| 180 | dptrs[disks-2] = syndromes; | ||
| 181 | dptrs[disks-1] = syndromes + PAGE_SIZE; | ||
| 182 | |||
| 183 | /* select raid gen_syndrome function */ | ||
| 184 | gen_best = raid6_choose_gen(&dptrs, disks); | ||
| 185 | |||
| 186 | /* select raid recover functions */ | ||
| 187 | rec_best = raid6_choose_recov(); | ||
| 188 | |||
| 142 | free_pages((unsigned long)syndromes, 1); | 189 | free_pages((unsigned long)syndromes, 1); |
| 143 | 190 | ||
| 144 | return best ? 0 : -EINVAL; | 191 | return gen_best && rec_best ? 0 : -EINVAL; |
| 145 | } | 192 | } |
| 146 | 193 | ||
| 147 | static void raid6_exit(void) | 194 | static void raid6_exit(void) |
diff --git a/lib/raid6/mktables.c b/lib/raid6/mktables.c index 8a3780902cec..39787db588b0 100644 --- a/lib/raid6/mktables.c +++ b/lib/raid6/mktables.c | |||
| @@ -81,6 +81,31 @@ int main(int argc, char *argv[]) | |||
| 81 | printf("EXPORT_SYMBOL(raid6_gfmul);\n"); | 81 | printf("EXPORT_SYMBOL(raid6_gfmul);\n"); |
| 82 | printf("#endif\n"); | 82 | printf("#endif\n"); |
| 83 | 83 | ||
| 84 | /* Compute vector multiplication table */ | ||
| 85 | printf("\nconst u8 __attribute__((aligned(256)))\n" | ||
| 86 | "raid6_vgfmul[256][32] =\n" | ||
| 87 | "{\n"); | ||
| 88 | for (i = 0; i < 256; i++) { | ||
| 89 | printf("\t{\n"); | ||
| 90 | for (j = 0; j < 16; j += 8) { | ||
| 91 | printf("\t\t"); | ||
| 92 | for (k = 0; k < 8; k++) | ||
| 93 | printf("0x%02x,%c", gfmul(i, j + k), | ||
| 94 | (k == 7) ? '\n' : ' '); | ||
| 95 | } | ||
| 96 | for (j = 0; j < 16; j += 8) { | ||
| 97 | printf("\t\t"); | ||
| 98 | for (k = 0; k < 8; k++) | ||
| 99 | printf("0x%02x,%c", gfmul(i, (j + k) << 4), | ||
| 100 | (k == 7) ? '\n' : ' '); | ||
| 101 | } | ||
| 102 | printf("\t},\n"); | ||
| 103 | } | ||
| 104 | printf("};\n"); | ||
| 105 | printf("#ifdef __KERNEL__\n"); | ||
| 106 | printf("EXPORT_SYMBOL(raid6_vgfmul);\n"); | ||
| 107 | printf("#endif\n"); | ||
| 108 | |||
| 84 | /* Compute power-of-2 table (exponent) */ | 109 | /* Compute power-of-2 table (exponent) */ |
| 85 | v = 1; | 110 | v = 1; |
| 86 | printf("\nconst u8 __attribute__((aligned(256)))\n" | 111 | printf("\nconst u8 __attribute__((aligned(256)))\n" |
diff --git a/lib/raid6/recov.c b/lib/raid6/recov.c index fe275d7b6b36..1805a5cc5daa 100644 --- a/lib/raid6/recov.c +++ b/lib/raid6/recov.c | |||
| @@ -22,7 +22,7 @@ | |||
| 22 | #include <linux/raid/pq.h> | 22 | #include <linux/raid/pq.h> |
| 23 | 23 | ||
| 24 | /* Recover two failed data blocks. */ | 24 | /* Recover two failed data blocks. */ |
| 25 | void raid6_2data_recov(int disks, size_t bytes, int faila, int failb, | 25 | void raid6_2data_recov_intx1(int disks, size_t bytes, int faila, int failb, |
| 26 | void **ptrs) | 26 | void **ptrs) |
| 27 | { | 27 | { |
| 28 | u8 *p, *q, *dp, *dq; | 28 | u8 *p, *q, *dp, *dq; |
| @@ -64,10 +64,9 @@ void raid6_2data_recov(int disks, size_t bytes, int faila, int failb, | |||
| 64 | p++; q++; | 64 | p++; q++; |
| 65 | } | 65 | } |
| 66 | } | 66 | } |
| 67 | EXPORT_SYMBOL_GPL(raid6_2data_recov); | ||
| 68 | 67 | ||
| 69 | /* Recover failure of one data block plus the P block */ | 68 | /* Recover failure of one data block plus the P block */ |
| 70 | void raid6_datap_recov(int disks, size_t bytes, int faila, void **ptrs) | 69 | void raid6_datap_recov_intx1(int disks, size_t bytes, int faila, void **ptrs) |
| 71 | { | 70 | { |
| 72 | u8 *p, *q, *dq; | 71 | u8 *p, *q, *dq; |
| 73 | const u8 *qmul; /* Q multiplier table */ | 72 | const u8 *qmul; /* Q multiplier table */ |
| @@ -96,7 +95,15 @@ void raid6_datap_recov(int disks, size_t bytes, int faila, void **ptrs) | |||
| 96 | q++; dq++; | 95 | q++; dq++; |
| 97 | } | 96 | } |
| 98 | } | 97 | } |
| 99 | EXPORT_SYMBOL_GPL(raid6_datap_recov); | 98 | |
| 99 | |||
| 100 | const struct raid6_recov_calls raid6_recov_intx1 = { | ||
| 101 | .data2 = raid6_2data_recov_intx1, | ||
| 102 | .datap = raid6_datap_recov_intx1, | ||
| 103 | .valid = NULL, | ||
| 104 | .name = "intx1", | ||
| 105 | .priority = 0, | ||
| 106 | }; | ||
| 100 | 107 | ||
| 101 | #ifndef __KERNEL__ | 108 | #ifndef __KERNEL__ |
| 102 | /* Testing only */ | 109 | /* Testing only */ |
diff --git a/lib/raid6/recov_ssse3.c b/lib/raid6/recov_ssse3.c new file mode 100644 index 000000000000..37ae61930559 --- /dev/null +++ b/lib/raid6/recov_ssse3.c | |||
| @@ -0,0 +1,335 @@ | |||
| 1 | /* | ||
| 2 | * Copyright (C) 2012 Intel Corporation | ||
| 3 | * | ||
| 4 | * This program is free software; you can redistribute it and/or | ||
| 5 | * modify it under the terms of the GNU General Public License | ||
| 6 | * as published by the Free Software Foundation; version 2 | ||
| 7 | * of the License. | ||
| 8 | */ | ||
| 9 | |||
| 10 | #if (defined(__i386__) || defined(__x86_64__)) && !defined(__arch_um__) | ||
| 11 | |||
| 12 | #include <linux/raid/pq.h> | ||
| 13 | #include "x86.h" | ||
| 14 | |||
| 15 | static int raid6_has_ssse3(void) | ||
| 16 | { | ||
| 17 | return boot_cpu_has(X86_FEATURE_XMM) && | ||
| 18 | boot_cpu_has(X86_FEATURE_XMM2) && | ||
| 19 | boot_cpu_has(X86_FEATURE_SSSE3); | ||
| 20 | } | ||
| 21 | |||
| 22 | void raid6_2data_recov_ssse3(int disks, size_t bytes, int faila, int failb, | ||
| 23 | void **ptrs) | ||
| 24 | { | ||
| 25 | u8 *p, *q, *dp, *dq; | ||
| 26 | const u8 *pbmul; /* P multiplier table for B data */ | ||
| 27 | const u8 *qmul; /* Q multiplier table (for both) */ | ||
| 28 | static const u8 __aligned(16) x0f[16] = { | ||
| 29 | 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, | ||
| 30 | 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f}; | ||
| 31 | |||
| 32 | p = (u8 *)ptrs[disks-2]; | ||
| 33 | q = (u8 *)ptrs[disks-1]; | ||
| 34 | |||
| 35 | /* Compute syndrome with zero for the missing data pages | ||
| 36 | Use the dead data pages as temporary storage for | ||
| 37 | delta p and delta q */ | ||
| 38 | dp = (u8 *)ptrs[faila]; | ||
| 39 | ptrs[faila] = (void *)raid6_empty_zero_page; | ||
| 40 | ptrs[disks-2] = dp; | ||
| 41 | dq = (u8 *)ptrs[failb]; | ||
| 42 | ptrs[failb] = (void *)raid6_empty_zero_page; | ||
| 43 | ptrs[disks-1] = dq; | ||
| 44 | |||
| 45 | raid6_call.gen_syndrome(disks, bytes, ptrs); | ||
| 46 | |||
| 47 | /* Restore pointer table */ | ||
| 48 | ptrs[faila] = dp; | ||
| 49 | ptrs[failb] = dq; | ||
| 50 | ptrs[disks-2] = p; | ||
| 51 | ptrs[disks-1] = q; | ||
| 52 | |||
| 53 | /* Now, pick the proper data tables */ | ||
| 54 | pbmul = raid6_vgfmul[raid6_gfexi[failb-faila]]; | ||
| 55 | qmul = raid6_vgfmul[raid6_gfinv[raid6_gfexp[faila] ^ | ||
| 56 | raid6_gfexp[failb]]]; | ||
| 57 | |||
| 58 | kernel_fpu_begin(); | ||
| 59 | |||
| 60 | asm volatile("movdqa %0,%%xmm7" : : "m" (x0f[0])); | ||
| 61 | |||
| 62 | #ifdef CONFIG_X86_64 | ||
| 63 | asm volatile("movdqa %0,%%xmm6" : : "m" (qmul[0])); | ||
| 64 | asm volatile("movdqa %0,%%xmm14" : : "m" (pbmul[0])); | ||
| 65 | asm volatile("movdqa %0,%%xmm15" : : "m" (pbmul[16])); | ||
| 66 | #endif | ||
| 67 | |||
| 68 | /* Now do it... */ | ||
| 69 | while (bytes) { | ||
| 70 | #ifdef CONFIG_X86_64 | ||
| 71 | /* xmm6, xmm14, xmm15 */ | ||
| 72 | |||
| 73 | asm volatile("movdqa %0,%%xmm1" : : "m" (q[0])); | ||
| 74 | asm volatile("movdqa %0,%%xmm9" : : "m" (q[16])); | ||
| 75 | asm volatile("movdqa %0,%%xmm0" : : "m" (p[0])); | ||
| 76 | asm volatile("movdqa %0,%%xmm8" : : "m" (p[16])); | ||
| 77 | asm volatile("pxor %0,%%xmm1" : : "m" (dq[0])); | ||
| 78 | asm volatile("pxor %0,%%xmm9" : : "m" (dq[16])); | ||
| 79 | asm volatile("pxor %0,%%xmm0" : : "m" (dp[0])); | ||
| 80 | asm volatile("pxor %0,%%xmm8" : : "m" (dp[16])); | ||
| 81 | |||
| 82 | /* xmm0/8 = px */ | ||
| 83 | |||
| 84 | asm volatile("movdqa %xmm6,%xmm4"); | ||
| 85 | asm volatile("movdqa %0,%%xmm5" : : "m" (qmul[16])); | ||
| 86 | asm volatile("movdqa %xmm6,%xmm12"); | ||
| 87 | asm volatile("movdqa %xmm5,%xmm13"); | ||
| 88 | asm volatile("movdqa %xmm1,%xmm3"); | ||
| 89 | asm volatile("movdqa %xmm9,%xmm11"); | ||
| 90 | asm volatile("movdqa %xmm0,%xmm2"); /* xmm2/10 = px */ | ||
| 91 | asm volatile("movdqa %xmm8,%xmm10"); | ||
| 92 | asm volatile("psraw $4,%xmm1"); | ||
| 93 | asm volatile("psraw $4,%xmm9"); | ||
| 94 | asm volatile("pand %xmm7,%xmm3"); | ||
| 95 | asm volatile("pand %xmm7,%xmm11"); | ||
| 96 | asm volatile("pand %xmm7,%xmm1"); | ||
| 97 | asm volatile("pand %xmm7,%xmm9"); | ||
| 98 | asm volatile("pshufb %xmm3,%xmm4"); | ||
| 99 | asm volatile("pshufb %xmm11,%xmm12"); | ||
| 100 | asm volatile("pshufb %xmm1,%xmm5"); | ||
| 101 | asm volatile("pshufb %xmm9,%xmm13"); | ||
| 102 | asm volatile("pxor %xmm4,%xmm5"); | ||
| 103 | asm volatile("pxor %xmm12,%xmm13"); | ||
| 104 | |||
| 105 | /* xmm5/13 = qx */ | ||
| 106 | |||
| 107 | asm volatile("movdqa %xmm14,%xmm4"); | ||
| 108 | asm volatile("movdqa %xmm15,%xmm1"); | ||
| 109 | asm volatile("movdqa %xmm14,%xmm12"); | ||
| 110 | asm volatile("movdqa %xmm15,%xmm9"); | ||
| 111 | asm volatile("movdqa %xmm2,%xmm3"); | ||
| 112 | asm volatile("movdqa %xmm10,%xmm11"); | ||
| 113 | asm volatile("psraw $4,%xmm2"); | ||
| 114 | asm volatile("psraw $4,%xmm10"); | ||
| 115 | asm volatile("pand %xmm7,%xmm3"); | ||
| 116 | asm volatile("pand %xmm7,%xmm11"); | ||
| 117 | asm volatile("pand %xmm7,%xmm2"); | ||
| 118 | asm volatile("pand %xmm7,%xmm10"); | ||
| 119 | asm volatile("pshufb %xmm3,%xmm4"); | ||
| 120 | asm volatile("pshufb %xmm11,%xmm12"); | ||
| 121 | asm volatile("pshufb %xmm2,%xmm1"); | ||
| 122 | asm volatile("pshufb %xmm10,%xmm9"); | ||
| 123 | asm volatile("pxor %xmm4,%xmm1"); | ||
| 124 | asm volatile("pxor %xmm12,%xmm9"); | ||
| 125 | |||
| 126 | /* xmm1/9 = pbmul[px] */ | ||
| 127 | asm volatile("pxor %xmm5,%xmm1"); | ||
| 128 | asm volatile("pxor %xmm13,%xmm9"); | ||
| 129 | /* xmm1/9 = db = DQ */ | ||
| 130 | asm volatile("movdqa %%xmm1,%0" : "=m" (dq[0])); | ||
| 131 | asm volatile("movdqa %%xmm9,%0" : "=m" (dq[16])); | ||
| 132 | |||
| 133 | asm volatile("pxor %xmm1,%xmm0"); | ||
| 134 | asm volatile("pxor %xmm9,%xmm8"); | ||
| 135 | asm volatile("movdqa %%xmm0,%0" : "=m" (dp[0])); | ||
| 136 | asm volatile("movdqa %%xmm8,%0" : "=m" (dp[16])); | ||
| 137 | |||
| 138 | bytes -= 32; | ||
| 139 | p += 32; | ||
| 140 | q += 32; | ||
| 141 | dp += 32; | ||
| 142 | dq += 32; | ||
| 143 | #else | ||
| 144 | asm volatile("movdqa %0,%%xmm1" : : "m" (*q)); | ||
| 145 | asm volatile("movdqa %0,%%xmm0" : : "m" (*p)); | ||
| 146 | asm volatile("pxor %0,%%xmm1" : : "m" (*dq)); | ||
| 147 | asm volatile("pxor %0,%%xmm0" : : "m" (*dp)); | ||
| 148 | |||
| 149 | /* 1 = dq ^ q | ||
| 150 | * 0 = dp ^ p | ||
| 151 | */ | ||
| 152 | asm volatile("movdqa %0,%%xmm4" : : "m" (qmul[0])); | ||
| 153 | asm volatile("movdqa %0,%%xmm5" : : "m" (qmul[16])); | ||
| 154 | |||
| 155 | asm volatile("movdqa %xmm1,%xmm3"); | ||
| 156 | asm volatile("psraw $4,%xmm1"); | ||
| 157 | asm volatile("pand %xmm7,%xmm3"); | ||
| 158 | asm volatile("pand %xmm7,%xmm1"); | ||
| 159 | asm volatile("pshufb %xmm3,%xmm4"); | ||
| 160 | asm volatile("pshufb %xmm1,%xmm5"); | ||
| 161 | asm volatile("pxor %xmm4,%xmm5"); | ||
| 162 | |||
| 163 | asm volatile("movdqa %xmm0,%xmm2"); /* xmm2 = px */ | ||
| 164 | |||
| 165 | /* xmm5 = qx */ | ||
| 166 | |||
| 167 | asm volatile("movdqa %0,%%xmm4" : : "m" (pbmul[0])); | ||
| 168 | asm volatile("movdqa %0,%%xmm1" : : "m" (pbmul[16])); | ||
| 169 | asm volatile("movdqa %xmm2,%xmm3"); | ||
| 170 | asm volatile("psraw $4,%xmm2"); | ||
| 171 | asm volatile("pand %xmm7,%xmm3"); | ||
| 172 | asm volatile("pand %xmm7,%xmm2"); | ||
| 173 | asm volatile("pshufb %xmm3,%xmm4"); | ||
| 174 | asm volatile("pshufb %xmm2,%xmm1"); | ||
| 175 | asm volatile("pxor %xmm4,%xmm1"); | ||
| 176 | |||
| 177 | /* xmm1 = pbmul[px] */ | ||
| 178 | asm volatile("pxor %xmm5,%xmm1"); | ||
| 179 | /* xmm1 = db = DQ */ | ||
| 180 | asm volatile("movdqa %%xmm1,%0" : "=m" (*dq)); | ||
| 181 | |||
| 182 | asm volatile("pxor %xmm1,%xmm0"); | ||
| 183 | asm volatile("movdqa %%xmm0,%0" : "=m" (*dp)); | ||
| 184 | |||
| 185 | bytes -= 16; | ||
| 186 | p += 16; | ||
| 187 | q += 16; | ||
| 188 | dp += 16; | ||
| 189 | dq += 16; | ||
| 190 | #endif | ||
| 191 | } | ||
| 192 | |||
| 193 | kernel_fpu_end(); | ||
| 194 | } | ||
| 195 | |||
| 196 | |||
| 197 | void raid6_datap_recov_ssse3(int disks, size_t bytes, int faila, void **ptrs) | ||
| 198 | { | ||
| 199 | u8 *p, *q, *dq; | ||
| 200 | const u8 *qmul; /* Q multiplier table */ | ||
| 201 | static const u8 __aligned(16) x0f[16] = { | ||
| 202 | 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, | ||
| 203 | 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f, 0x0f}; | ||
| 204 | |||
| 205 | p = (u8 *)ptrs[disks-2]; | ||
| 206 | q = (u8 *)ptrs[disks-1]; | ||
| 207 | |||
| 208 | /* Compute syndrome with zero for the missing data page | ||
| 209 | Use the dead data page as temporary storage for delta q */ | ||
| 210 | dq = (u8 *)ptrs[faila]; | ||
| 211 | ptrs[faila] = (void *)raid6_empty_zero_page; | ||
| 212 | ptrs[disks-1] = dq; | ||
| 213 | |||
| 214 | raid6_call.gen_syndrome(disks, bytes, ptrs); | ||
| 215 | |||
| 216 | /* Restore pointer table */ | ||
| 217 | ptrs[faila] = dq; | ||
| 218 | ptrs[disks-1] = q; | ||
| 219 | |||
| 220 | /* Now, pick the proper data tables */ | ||
| 221 | qmul = raid6_vgfmul[raid6_gfinv[raid6_gfexp[faila]]]; | ||
| 222 | |||
| 223 | kernel_fpu_begin(); | ||
| 224 | |||
| 225 | asm volatile("movdqa %0, %%xmm7" : : "m" (x0f[0])); | ||
| 226 | |||
| 227 | while (bytes) { | ||
| 228 | #ifdef CONFIG_X86_64 | ||
| 229 | asm volatile("movdqa %0, %%xmm3" : : "m" (dq[0])); | ||
| 230 | asm volatile("movdqa %0, %%xmm4" : : "m" (dq[16])); | ||
| 231 | asm volatile("pxor %0, %%xmm3" : : "m" (q[0])); | ||
| 232 | asm volatile("movdqa %0, %%xmm0" : : "m" (qmul[0])); | ||
| 233 | |||
| 234 | /* xmm3 = q[0] ^ dq[0] */ | ||
| 235 | |||
| 236 | asm volatile("pxor %0, %%xmm4" : : "m" (q[16])); | ||
| 237 | asm volatile("movdqa %0, %%xmm1" : : "m" (qmul[16])); | ||
| 238 | |||
| 239 | /* xmm4 = q[16] ^ dq[16] */ | ||
| 240 | |||
| 241 | asm volatile("movdqa %xmm3, %xmm6"); | ||
| 242 | asm volatile("movdqa %xmm4, %xmm8"); | ||
| 243 | |||
| 244 | /* xmm4 = xmm8 = q[16] ^ dq[16] */ | ||
| 245 | |||
| 246 | asm volatile("psraw $4, %xmm3"); | ||
| 247 | asm volatile("pand %xmm7, %xmm6"); | ||
| 248 | asm volatile("pand %xmm7, %xmm3"); | ||
| 249 | asm volatile("pshufb %xmm6, %xmm0"); | ||
| 250 | asm volatile("pshufb %xmm3, %xmm1"); | ||
| 251 | asm volatile("movdqa %0, %%xmm10" : : "m" (qmul[0])); | ||
| 252 | asm volatile("pxor %xmm0, %xmm1"); | ||
| 253 | asm volatile("movdqa %0, %%xmm11" : : "m" (qmul[16])); | ||
| 254 | |||
| 255 | /* xmm1 = qmul[q[0] ^ dq[0]] */ | ||
| 256 | |||
| 257 | asm volatile("psraw $4, %xmm4"); | ||
| 258 | asm volatile("pand %xmm7, %xmm8"); | ||
| 259 | asm volatile("pand %xmm7, %xmm4"); | ||
| 260 | asm volatile("pshufb %xmm8, %xmm10"); | ||
| 261 | asm volatile("pshufb %xmm4, %xmm11"); | ||
| 262 | asm volatile("movdqa %0, %%xmm2" : : "m" (p[0])); | ||
| 263 | asm volatile("pxor %xmm10, %xmm11"); | ||
| 264 | asm volatile("movdqa %0, %%xmm12" : : "m" (p[16])); | ||
| 265 | |||
| 266 | /* xmm11 = qmul[q[16] ^ dq[16]] */ | ||
| 267 | |||
| 268 | asm volatile("pxor %xmm1, %xmm2"); | ||
| 269 | |||
| 270 | /* xmm2 = p[0] ^ qmul[q[0] ^ dq[0]] */ | ||
| 271 | |||
| 272 | asm volatile("pxor %xmm11, %xmm12"); | ||
| 273 | |||
| 274 | /* xmm12 = p[16] ^ qmul[q[16] ^ dq[16]] */ | ||
| 275 | |||
| 276 | asm volatile("movdqa %%xmm1, %0" : "=m" (dq[0])); | ||
| 277 | asm volatile("movdqa %%xmm11, %0" : "=m" (dq[16])); | ||
| 278 | |||
| 279 | asm volatile("movdqa %%xmm2, %0" : "=m" (p[0])); | ||
| 280 | asm volatile("movdqa %%xmm12, %0" : "=m" (p[16])); | ||
| 281 | |||
| 282 | bytes -= 32; | ||
| 283 | p += 32; | ||
| 284 | q += 32; | ||
| 285 | dq += 32; | ||
| 286 | |||
| 287 | #else | ||
| 288 | asm volatile("movdqa %0, %%xmm3" : : "m" (dq[0])); | ||
| 289 | asm volatile("movdqa %0, %%xmm0" : : "m" (qmul[0])); | ||
| 290 | asm volatile("pxor %0, %%xmm3" : : "m" (q[0])); | ||
| 291 | asm volatile("movdqa %0, %%xmm1" : : "m" (qmul[16])); | ||
| 292 | |||
| 293 | /* xmm3 = *q ^ *dq */ | ||
| 294 | |||
| 295 | asm volatile("movdqa %xmm3, %xmm6"); | ||
| 296 | asm volatile("movdqa %0, %%xmm2" : : "m" (p[0])); | ||
| 297 | asm volatile("psraw $4, %xmm3"); | ||
| 298 | asm volatile("pand %xmm7, %xmm6"); | ||
| 299 | asm volatile("pand %xmm7, %xmm3"); | ||
| 300 | asm volatile("pshufb %xmm6, %xmm0"); | ||
| 301 | asm volatile("pshufb %xmm3, %xmm1"); | ||
| 302 | asm volatile("pxor %xmm0, %xmm1"); | ||
| 303 | |||
| 304 | /* xmm1 = qmul[*q ^ *dq */ | ||
| 305 | |||
| 306 | asm volatile("pxor %xmm1, %xmm2"); | ||
| 307 | |||
| 308 | /* xmm2 = *p ^ qmul[*q ^ *dq] */ | ||
| 309 | |||
| 310 | asm volatile("movdqa %%xmm1, %0" : "=m" (dq[0])); | ||
| 311 | asm volatile("movdqa %%xmm2, %0" : "=m" (p[0])); | ||
| 312 | |||
| 313 | bytes -= 16; | ||
| 314 | p += 16; | ||
| 315 | q += 16; | ||
| 316 | dq += 16; | ||
| 317 | #endif | ||
| 318 | } | ||
| 319 | |||
| 320 | kernel_fpu_end(); | ||
| 321 | } | ||
| 322 | |||
| 323 | const struct raid6_recov_calls raid6_recov_ssse3 = { | ||
| 324 | .data2 = raid6_2data_recov_ssse3, | ||
| 325 | .datap = raid6_datap_recov_ssse3, | ||
| 326 | .valid = raid6_has_ssse3, | ||
| 327 | #ifdef CONFIG_X86_64 | ||
| 328 | .name = "ssse3x2", | ||
| 329 | #else | ||
| 330 | .name = "ssse3x1", | ||
| 331 | #endif | ||
| 332 | .priority = 1, | ||
| 333 | }; | ||
| 334 | |||
| 335 | #endif | ||
diff --git a/lib/raid6/test/Makefile b/lib/raid6/test/Makefile index aa651697b6dc..c76151d94764 100644 --- a/lib/raid6/test/Makefile +++ b/lib/raid6/test/Makefile | |||
| @@ -23,7 +23,7 @@ RANLIB = ranlib | |||
| 23 | all: raid6.a raid6test | 23 | all: raid6.a raid6test |
| 24 | 24 | ||
| 25 | raid6.a: int1.o int2.o int4.o int8.o int16.o int32.o mmx.o sse1.o sse2.o \ | 25 | raid6.a: int1.o int2.o int4.o int8.o int16.o int32.o mmx.o sse1.o sse2.o \ |
| 26 | altivec1.o altivec2.o altivec4.o altivec8.o recov.o algos.o \ | 26 | altivec1.o altivec2.o altivec4.o altivec8.o recov.o recov_ssse3.o algos.o \ |
| 27 | tables.o | 27 | tables.o |
| 28 | rm -f $@ | 28 | rm -f $@ |
| 29 | $(AR) cq $@ $^ | 29 | $(AR) cq $@ $^ |
diff --git a/lib/raid6/test/test.c b/lib/raid6/test/test.c index 7a930318b17d..5a485b7a7d3c 100644 --- a/lib/raid6/test/test.c +++ b/lib/raid6/test/test.c | |||
| @@ -90,25 +90,35 @@ static int test_disks(int i, int j) | |||
| 90 | int main(int argc, char *argv[]) | 90 | int main(int argc, char *argv[]) |
| 91 | { | 91 | { |
| 92 | const struct raid6_calls *const *algo; | 92 | const struct raid6_calls *const *algo; |
| 93 | const struct raid6_recov_calls *const *ra; | ||
| 93 | int i, j; | 94 | int i, j; |
| 94 | int err = 0; | 95 | int err = 0; |
| 95 | 96 | ||
| 96 | makedata(); | 97 | makedata(); |
| 97 | 98 | ||
| 98 | for (algo = raid6_algos; *algo; algo++) { | 99 | for (ra = raid6_recov_algos; *ra; ra++) { |
| 99 | if (!(*algo)->valid || (*algo)->valid()) { | 100 | if ((*ra)->valid && !(*ra)->valid()) |
| 100 | raid6_call = **algo; | 101 | continue; |
| 102 | raid6_2data_recov = (*ra)->data2; | ||
| 103 | raid6_datap_recov = (*ra)->datap; | ||
| 101 | 104 | ||
| 102 | /* Nuke syndromes */ | 105 | printf("using recovery %s\n", (*ra)->name); |
| 103 | memset(data[NDISKS-2], 0xee, 2*PAGE_SIZE); | ||
| 104 | 106 | ||
| 105 | /* Generate assumed good syndrome */ | 107 | for (algo = raid6_algos; *algo; algo++) { |
| 106 | raid6_call.gen_syndrome(NDISKS, PAGE_SIZE, | 108 | if (!(*algo)->valid || (*algo)->valid()) { |
| 107 | (void **)&dataptrs); | 109 | raid6_call = **algo; |
| 108 | 110 | ||
| 109 | for (i = 0; i < NDISKS-1; i++) | 111 | /* Nuke syndromes */ |
| 110 | for (j = i+1; j < NDISKS; j++) | 112 | memset(data[NDISKS-2], 0xee, 2*PAGE_SIZE); |
| 111 | err += test_disks(i, j); | 113 | |
| 114 | /* Generate assumed good syndrome */ | ||
| 115 | raid6_call.gen_syndrome(NDISKS, PAGE_SIZE, | ||
| 116 | (void **)&dataptrs); | ||
| 117 | |||
| 118 | for (i = 0; i < NDISKS-1; i++) | ||
| 119 | for (j = i+1; j < NDISKS; j++) | ||
| 120 | err += test_disks(i, j); | ||
| 121 | } | ||
| 112 | } | 122 | } |
| 113 | printf("\n"); | 123 | printf("\n"); |
| 114 | } | 124 | } |
diff --git a/lib/raid6/x86.h b/lib/raid6/x86.h index cb2a8c91c886..d55d63232c55 100644 --- a/lib/raid6/x86.h +++ b/lib/raid6/x86.h | |||
| @@ -35,24 +35,29 @@ static inline void kernel_fpu_end(void) | |||
| 35 | { | 35 | { |
| 36 | } | 36 | } |
| 37 | 37 | ||
| 38 | #define __aligned(x) __attribute__((aligned(x))) | ||
| 39 | |||
| 38 | #define X86_FEATURE_MMX (0*32+23) /* Multimedia Extensions */ | 40 | #define X86_FEATURE_MMX (0*32+23) /* Multimedia Extensions */ |
| 39 | #define X86_FEATURE_FXSR (0*32+24) /* FXSAVE and FXRSTOR instructions | 41 | #define X86_FEATURE_FXSR (0*32+24) /* FXSAVE and FXRSTOR instructions |
| 40 | * (fast save and restore) */ | 42 | * (fast save and restore) */ |
| 41 | #define X86_FEATURE_XMM (0*32+25) /* Streaming SIMD Extensions */ | 43 | #define X86_FEATURE_XMM (0*32+25) /* Streaming SIMD Extensions */ |
| 42 | #define X86_FEATURE_XMM2 (0*32+26) /* Streaming SIMD Extensions-2 */ | 44 | #define X86_FEATURE_XMM2 (0*32+26) /* Streaming SIMD Extensions-2 */ |
| 45 | #define X86_FEATURE_XMM3 (4*32+ 0) /* "pni" SSE-3 */ | ||
| 46 | #define X86_FEATURE_SSSE3 (4*32+ 9) /* Supplemental SSE-3 */ | ||
| 47 | #define X86_FEATURE_AVX (4*32+28) /* Advanced Vector Extensions */ | ||
| 43 | #define X86_FEATURE_MMXEXT (1*32+22) /* AMD MMX extensions */ | 48 | #define X86_FEATURE_MMXEXT (1*32+22) /* AMD MMX extensions */ |
| 44 | 49 | ||
| 45 | /* Should work well enough on modern CPUs for testing */ | 50 | /* Should work well enough on modern CPUs for testing */ |
| 46 | static inline int boot_cpu_has(int flag) | 51 | static inline int boot_cpu_has(int flag) |
| 47 | { | 52 | { |
| 48 | u32 eax = (flag >> 5) ? 0x80000001 : 1; | 53 | u32 eax = (flag & 0x20) ? 0x80000001 : 1; |
| 49 | u32 edx; | 54 | u32 ecx, edx; |
| 50 | 55 | ||
| 51 | asm volatile("cpuid" | 56 | asm volatile("cpuid" |
| 52 | : "+a" (eax), "=d" (edx) | 57 | : "+a" (eax), "=d" (edx), "=c" (ecx) |
| 53 | : : "ecx", "ebx"); | 58 | : : "ebx"); |
| 54 | 59 | ||
| 55 | return (edx >> (flag & 31)) & 1; | 60 | return ((flag & 0x80 ? ecx : edx) >> (flag & 31)) & 1; |
| 56 | } | 61 | } |
| 57 | 62 | ||
| 58 | #endif /* ndef __KERNEL__ */ | 63 | #endif /* ndef __KERNEL__ */ |
diff --git a/lib/rational.c b/lib/rational.c index d326da3976f5..f0aa21c2a762 100644 --- a/lib/rational.c +++ b/lib/rational.c | |||
| @@ -1,7 +1,7 @@ | |||
| 1 | /* | 1 | /* |
| 2 | * rational fractions | 2 | * rational fractions |
| 3 | * | 3 | * |
| 4 | * Copyright (C) 2009 emlix GmbH, Oskar Schirmer <os@emlix.com> | 4 | * Copyright (C) 2009 emlix GmbH, Oskar Schirmer <oskar@scara.com> |
| 5 | * | 5 | * |
| 6 | * helper functions when coping with rational numbers | 6 | * helper functions when coping with rational numbers |
| 7 | */ | 7 | */ |
