diff options
author | Joonwoo Park <joonwpark81@gmail.com> | 2008-07-08 05:37:54 -0400 |
---|---|---|
committer | David S. Miller <davem@davemloft.net> | 2008-07-08 05:37:54 -0400 |
commit | 3b76d08190e6b420ed3f5534aa99ee29d82d731f (patch) | |
tree | 90f5f3b38148529946d3b0807d6cdd80445ed1cf /lib/ts_bm.c | |
parent | b9c796783151678d08b1ec1ef410685b2515ba51 (diff) |
textsearch: ts_bm: support case insensitive searching in Boyer-Moore algorithm
Add support for case insensitive search to Boyer-Moore algorithm.
Signed-off-by: Joonwoo Park <joonwpark81@gmail.com>
Signed-off-by: Patrick McHardy <kaber@trash.net>
Signed-off-by: David S. Miller <davem@davemloft.net>
Diffstat (limited to 'lib/ts_bm.c')
-rw-r--r-- | lib/ts_bm.c | 26 |
1 files changed, 20 insertions, 6 deletions
diff --git a/lib/ts_bm.c b/lib/ts_bm.c index 4a7fce72898e..9e66ee4020e9 100644 --- a/lib/ts_bm.c +++ b/lib/ts_bm.c | |||
@@ -39,6 +39,7 @@ | |||
39 | #include <linux/module.h> | 39 | #include <linux/module.h> |
40 | #include <linux/types.h> | 40 | #include <linux/types.h> |
41 | #include <linux/string.h> | 41 | #include <linux/string.h> |
42 | #include <linux/ctype.h> | ||
42 | #include <linux/textsearch.h> | 43 | #include <linux/textsearch.h> |
43 | 44 | ||
44 | /* Alphabet size, use ASCII */ | 45 | /* Alphabet size, use ASCII */ |
@@ -64,6 +65,7 @@ static unsigned int bm_find(struct ts_config *conf, struct ts_state *state) | |||
64 | unsigned int i, text_len, consumed = state->offset; | 65 | unsigned int i, text_len, consumed = state->offset; |
65 | const u8 *text; | 66 | const u8 *text; |
66 | int shift = bm->patlen - 1, bs; | 67 | int shift = bm->patlen - 1, bs; |
68 | const u8 icase = conf->flags & TS_IGNORECASE; | ||
67 | 69 | ||
68 | for (;;) { | 70 | for (;;) { |
69 | text_len = conf->get_next_block(consumed, &text, conf, state); | 71 | text_len = conf->get_next_block(consumed, &text, conf, state); |
@@ -75,7 +77,9 @@ static unsigned int bm_find(struct ts_config *conf, struct ts_state *state) | |||
75 | DEBUGP("Searching in position %d (%c)\n", | 77 | DEBUGP("Searching in position %d (%c)\n", |
76 | shift, text[shift]); | 78 | shift, text[shift]); |
77 | for (i = 0; i < bm->patlen; i++) | 79 | for (i = 0; i < bm->patlen; i++) |
78 | if (text[shift-i] != bm->pattern[bm->patlen-1-i]) | 80 | if ((icase ? toupper(text[shift-i]) |
81 | : text[shift-i]) | ||
82 | != bm->pattern[bm->patlen-1-i]) | ||
79 | goto next; | 83 | goto next; |
80 | 84 | ||
81 | /* London calling... */ | 85 | /* London calling... */ |
@@ -111,14 +115,18 @@ static int subpattern(u8 *pattern, int i, int j, int g) | |||
111 | return ret; | 115 | return ret; |
112 | } | 116 | } |
113 | 117 | ||
114 | static void compute_prefix_tbl(struct ts_bm *bm) | 118 | static void compute_prefix_tbl(struct ts_bm *bm, int flags) |
115 | { | 119 | { |
116 | int i, j, g; | 120 | int i, j, g; |
117 | 121 | ||
118 | for (i = 0; i < ASIZE; i++) | 122 | for (i = 0; i < ASIZE; i++) |
119 | bm->bad_shift[i] = bm->patlen; | 123 | bm->bad_shift[i] = bm->patlen; |
120 | for (i = 0; i < bm->patlen - 1; i++) | 124 | for (i = 0; i < bm->patlen - 1; i++) { |
121 | bm->bad_shift[bm->pattern[i]] = bm->patlen - 1 - i; | 125 | bm->bad_shift[bm->pattern[i]] = bm->patlen - 1 - i; |
126 | if (flags & TS_IGNORECASE) | ||
127 | bm->bad_shift[tolower(bm->pattern[i])] | ||
128 | = bm->patlen - 1 - i; | ||
129 | } | ||
122 | 130 | ||
123 | /* Compute the good shift array, used to match reocurrences | 131 | /* Compute the good shift array, used to match reocurrences |
124 | * of a subpattern */ | 132 | * of a subpattern */ |
@@ -135,10 +143,11 @@ static void compute_prefix_tbl(struct ts_bm *bm) | |||
135 | } | 143 | } |
136 | 144 | ||
137 | static struct ts_config *bm_init(const void *pattern, unsigned int len, | 145 | static struct ts_config *bm_init(const void *pattern, unsigned int len, |
138 | gfp_t gfp_mask) | 146 | gfp_t gfp_mask, int flags) |
139 | { | 147 | { |
140 | struct ts_config *conf; | 148 | struct ts_config *conf; |
141 | struct ts_bm *bm; | 149 | struct ts_bm *bm; |
150 | int i; | ||
142 | unsigned int prefix_tbl_len = len * sizeof(unsigned int); | 151 | unsigned int prefix_tbl_len = len * sizeof(unsigned int); |
143 | size_t priv_size = sizeof(*bm) + len + prefix_tbl_len; | 152 | size_t priv_size = sizeof(*bm) + len + prefix_tbl_len; |
144 | 153 | ||
@@ -146,11 +155,16 @@ static struct ts_config *bm_init(const void *pattern, unsigned int len, | |||
146 | if (IS_ERR(conf)) | 155 | if (IS_ERR(conf)) |
147 | return conf; | 156 | return conf; |
148 | 157 | ||
158 | conf->flags = flags; | ||
149 | bm = ts_config_priv(conf); | 159 | bm = ts_config_priv(conf); |
150 | bm->patlen = len; | 160 | bm->patlen = len; |
151 | bm->pattern = (u8 *) bm->good_shift + prefix_tbl_len; | 161 | bm->pattern = (u8 *) bm->good_shift + prefix_tbl_len; |
152 | memcpy(bm->pattern, pattern, len); | 162 | if (flags & TS_IGNORECASE) |
153 | compute_prefix_tbl(bm); | 163 | for (i = 0; i < len; i++) |
164 | bm->pattern[i] = toupper(((u8 *)pattern)[i]); | ||
165 | else | ||
166 | memcpy(bm->pattern, pattern, len); | ||
167 | compute_prefix_tbl(bm, flags); | ||
154 | 168 | ||
155 | return conf; | 169 | return conf; |
156 | } | 170 | } |