aboutsummaryrefslogtreecommitdiffstats
path: root/fs/cifs/cifs_unicode.c
diff options
context:
space:
mode:
authorJeff Layton <jlayton@redhat.com>2009-04-30 06:46:15 -0400
committerSteve French <sfrench@us.ibm.com>2009-04-30 11:44:59 -0400
commit7fabf0c9479fef9fdb9528a5fbdb1cb744a744a4 (patch)
treea44ab17abeefb87a623d62c344d4aa4b4f1a4b7f /fs/cifs/cifs_unicode.c
parent66345f50f070ae7412a28543ee197cb5eff73598 (diff)
cifs: add replacement for cifs_strtoUCS_le called cifs_from_ucs2
Add a replacement function for cifs_strtoUCS_le. cifs_from_ucs2 takes args for the source and destination length so that we can ensure that the function is confined within the intended buffers. Signed-off-by: Jeff Layton <jlayton@redhat.com> Acked-by: Suresh Jayaraman <sjayaraman@suse.de> Signed-off-by: Steve French <sfrench@us.ibm.com>
Diffstat (limited to 'fs/cifs/cifs_unicode.c')
-rw-r--r--fs/cifs/cifs_unicode.c124
1 files changed, 124 insertions, 0 deletions
diff --git a/fs/cifs/cifs_unicode.c b/fs/cifs/cifs_unicode.c
index 7d75272a6b3f..8389f359b03d 100644
--- a/fs/cifs/cifs_unicode.c
+++ b/fs/cifs/cifs_unicode.c
@@ -26,6 +26,130 @@
26#include "cifs_debug.h" 26#include "cifs_debug.h"
27 27
28/* 28/*
29 * cifs_mapchar - convert a little-endian char to proper char in codepage
30 * @target - where converted character should be copied
31 * @src_char - 2 byte little-endian source character
32 * @cp - codepage to which character should be converted
33 * @mapchar - should character be mapped according to mapchars mount option?
34 *
35 * This function handles the conversion of a single character. It is the
36 * responsibility of the caller to ensure that the target buffer is large
37 * enough to hold the result of the conversion (at least NLS_MAX_CHARSET_SIZE).
38 */
39static int
40cifs_mapchar(char *target, const __le16 src_char, const struct nls_table *cp,
41 bool mapchar)
42{
43 int len = 1;
44
45 if (!mapchar)
46 goto cp_convert;
47
48 /*
49 * BB: Cannot handle remapping UNI_SLASH until all the calls to
50 * build_path_from_dentry are modified, as they use slash as
51 * separator.
52 */
53 switch (le16_to_cpu(src_char)) {
54 case UNI_COLON:
55 *target = ':';
56 break;
57 case UNI_ASTERIK:
58 *target = '*';
59 break;
60 case UNI_QUESTION:
61 *target = '?';
62 break;
63 case UNI_PIPE:
64 *target = '|';
65 break;
66 case UNI_GRTRTHAN:
67 *target = '>';
68 break;
69 case UNI_LESSTHAN:
70 *target = '<';
71 break;
72 default:
73 goto cp_convert;
74 }
75
76out:
77 return len;
78
79cp_convert:
80 len = cp->uni2char(le16_to_cpu(src_char), target,
81 NLS_MAX_CHARSET_SIZE);
82 if (len <= 0) {
83 *target = '?';
84 len = 1;
85 }
86 goto out;
87}
88
89/*
90 * cifs_from_ucs2 - convert utf16le string to local charset
91 * @to - destination buffer
92 * @from - source buffer
93 * @tolen - destination buffer size (in bytes)
94 * @fromlen - source buffer size (in bytes)
95 * @codepage - codepage to which characters should be converted
96 * @mapchar - should characters be remapped according to the mapchars option?
97 *
98 * Convert a little-endian ucs2le string (as sent by the server) to a string
99 * in the provided codepage. The tolen and fromlen parameters are to ensure
100 * that the code doesn't walk off of the end of the buffer (which is always
101 * a danger if the alignment of the source buffer is off). The destination
102 * string is always properly null terminated and fits in the destination
103 * buffer. Returns the length of the destination string in bytes (including
104 * null terminator).
105 *
106 * Note that some windows versions actually send multiword UTF-16 characters
107 * instead of straight UCS-2. The linux nls routines however aren't able to
108 * deal with those characters properly. In the event that we get some of
109 * those characters, they won't be translated properly.
110 */
111int
112cifs_from_ucs2(char *to, const __le16 *from, int tolen, int fromlen,
113 const struct nls_table *codepage, bool mapchar)
114{
115 int i, charlen, safelen;
116 int outlen = 0;
117 int nullsize = nls_nullsize(codepage);
118 int fromwords = fromlen / 2;
119 char tmp[NLS_MAX_CHARSET_SIZE];
120
121 /*
122 * because the chars can be of varying widths, we need to take care
123 * not to overflow the destination buffer when we get close to the
124 * end of it. Until we get to this offset, we don't need to check
125 * for overflow however.
126 */
127 safelen = tolen - (NLS_MAX_CHARSET_SIZE + nullsize);
128
129 for (i = 0; i < fromwords && from[i]; i++) {
130 /*
131 * check to see if converting this character might make the
132 * conversion bleed into the null terminator
133 */
134 if (outlen >= safelen) {
135 charlen = cifs_mapchar(tmp, from[i], codepage, mapchar);
136 if ((outlen + charlen) > (tolen - nullsize))
137 break;
138 }
139
140 /* put converted char into 'to' buffer */
141 charlen = cifs_mapchar(&to[outlen], from[i], codepage, mapchar);
142 outlen += charlen;
143 }
144
145 /* properly null-terminate string */
146 for (i = 0; i < nullsize; i++)
147 to[outlen++] = 0;
148
149 return outlen;
150}
151
152/*
29 * NAME: cifs_strfromUCS() 153 * NAME: cifs_strfromUCS()
30 * 154 *
31 * FUNCTION: Convert little-endian unicode string to character string 155 * FUNCTION: Convert little-endian unicode string to character string