cifs: add replacement for cifs_strtoUCS_le called cifs_from_ucs2

Add a replacement function for cifs_strtoUCS_le. cifs_from_ucs2 takes args for the source and destination length so that we can ensure that the function is confined within the intended buffers. Signed-off-by: Jeff Layton <jlayton@redhat.com> Acked-by: Suresh Jayaraman <sjayaraman@suse.de> Signed-off-by: Steve French <sfrench@us.ibm.com>
author: Jeff Layton <jlayton@redhat.com> 2009-04-30 06:46:15 -0400
committer: Steve French <sfrench@us.ibm.com> 2009-04-30 11:44:59 -0400
commit: 7fabf0c9479fef9fdb9528a5fbdb1cb744a744a4 (patch)
tree: a44ab17abeefb87a623d62c344d4aa4b4f1a4b7f /fs/cifs/cifs_unicode.c
parent: 66345f50f070ae7412a28543ee197cb5eff73598 (diff)
1 files changed, 124 insertions, 0 deletions
diff --git a/fs/cifs/cifs_unicode.c b/fs/cifs/cifs_unicode.c
index 7d75272a6b3f..8389f359b03d 100644
--- a/fs/cifs/cifs_unicode.c
+++ b/fs/cifs/cifs_unicode.c
@@ -26,6 +26,130 @@
 #include "cifs_debug.h"
 /*
+ * cifs_mapchar - convert a little-endian char to proper char in codepage
+ * @target - where converted character should be copied
+ * @src_char - 2 byte little-endian source character
+ * @cp - codepage to which character should be converted
+ * @mapchar - should character be mapped according to mapchars mount option?
+ *
+ * This function handles the conversion of a single character. It is the
+ * responsibility of the caller to ensure that the target buffer is large
+ * enough to hold the result of the conversion (at least NLS_MAX_CHARSET_SIZE).
+ */
+static int
+cifs_mapchar(char *target, const __le16 src_char, const struct nls_table *cp,
+             bool mapchar)
+{
+        int len = 1;
+        if (!mapchar)
+                goto cp_convert;
+        /*
+         * BB: Cannot handle remapping UNI_SLASH until all the calls to
+         *     build_path_from_dentry are modified, as they use slash as
+         *     separator.
+         */
+        switch (le16_to_cpu(src_char)) {
+        case UNI_COLON:
+                *target = ':';
+                break;
+        case UNI_ASTERIK:
+                *target = '*';
+                break;
+        case UNI_QUESTION:
+                *target = '?';
+                break;
+        case UNI_PIPE:
+                *target = '|';
+                break;
+        case UNI_GRTRTHAN:
+                *target = '>';
+                break;
+        case UNI_LESSTHAN:
+                *target = '<';
+                break;
+        default:
+                goto cp_convert;
+        }
+out:
+        return len;
+cp_convert:
+        len = cp->uni2char(le16_to_cpu(src_char), target,
+                           NLS_MAX_CHARSET_SIZE);
+        if (len <= 0) {
+                *target = '?';
+                len = 1;
+        }
+        goto out;
+}
+/*
+ * cifs_from_ucs2 - convert utf16le string to local charset
+ * @to - destination buffer
+ * @from - source buffer
+ * @tolen - destination buffer size (in bytes)
+ * @fromlen - source buffer size (in bytes)
+ * @codepage - codepage to which characters should be converted
+ * @mapchar - should characters be remapped according to the mapchars option?
+ *
+ * Convert a little-endian ucs2le string (as sent by the server) to a string
+ * in the provided codepage. The tolen and fromlen parameters are to ensure
+ * that the code doesn't walk off of the end of the buffer (which is always
+ * a danger if the alignment of the source buffer is off). The destination
+ * string is always properly null terminated and fits in the destination
+ * buffer. Returns the length of the destination string in bytes (including
+ * null terminator).
+ *
+ * Note that some windows versions actually send multiword UTF-16 characters
+ * instead of straight UCS-2. The linux nls routines however aren't able to
+ * deal with those characters properly. In the event that we get some of
+ * those characters, they won't be translated properly.
+ */
+int
+cifs_from_ucs2(char *to, const __le16 *from, int tolen, int fromlen,
+                 const struct nls_table *codepage, bool mapchar)
+{
+        int i, charlen, safelen;
+        int outlen = 0;
+        int nullsize = nls_nullsize(codepage);
+        int fromwords = fromlen / 2;
+        char tmp[NLS_MAX_CHARSET_SIZE];
+        /*
+         * because the chars can be of varying widths, we need to take care
+         * not to overflow the destination buffer when we get close to the
+         * end of it. Until we get to this offset, we don't need to check
+         * for overflow however.
+         */
+        safelen = tolen - (NLS_MAX_CHARSET_SIZE + nullsize);
+        for (i = 0; i < fromwords && from[i]; i++) {
+                /*
+                 * check to see if converting this character might make the
+                 * conversion bleed into the null terminator
+                 */
+                if (outlen >= safelen) {
+                        charlen = cifs_mapchar(tmp, from[i], codepage, mapchar);
+                        if ((outlen + charlen) > (tolen - nullsize))
+                                break;
+                }
+                /* put converted char into 'to' buffer */
+                charlen = cifs_mapchar(&to[outlen], from[i], codepage, mapchar);
+                outlen += charlen;
+        }
+        /* properly null-terminate string */
+        for (i = 0; i < nullsize; i++)
+                to[outlen++] = 0;
+        return outlen;
+}
+/*
 * NAME:        cifs_strfromUCS()
 *
 * FUNCTION:    Convert little-endian unicode string to character string
author	Jeff Layton <jlayton@redhat.com>	2009-04-30 06:46:15 -0400
committer	Steve French <sfrench@us.ibm.com>	2009-04-30 11:44:59 -0400
commit	7fabf0c9479fef9fdb9528a5fbdb1cb744a744a4 (patch)
tree	a44ab17abeefb87a623d62c344d4aa4b4f1a4b7f /fs/cifs/cifs_unicode.c
parent	66345f50f070ae7412a28543ee197cb5eff73598 (diff)

diff --git a/fs/cifs/cifs_unicode.c b/fs/cifs/cifs_unicode.c index 7d75272a6b3f..8389f359b03d 100644 --- a/fs/cifs/cifs_unicode.c +++ b/fs/cifs/cifs_unicode.c
@@ -26,6 +26,130 @@
26	#include "cifs_debug.h"	26	#include "cifs_debug.h"
27		27
28	/*	28	/*
		29	* cifs_mapchar - convert a little-endian char to proper char in codepage
		30	* @target - where converted character should be copied
		31	* @src_char - 2 byte little-endian source character
		32	* @cp - codepage to which character should be converted
		33	* @mapchar - should character be mapped according to mapchars mount option?
		34	*
		35	* This function handles the conversion of a single character. It is the
		36	* responsibility of the caller to ensure that the target buffer is large
		37	* enough to hold the result of the conversion (at least NLS_MAX_CHARSET_SIZE).
		38	*/
		39	static int
		40	cifs_mapchar(char target, const __le16 src_char, const struct nls_table cp,
		41	bool mapchar)
		42	{
		43	int len = 1;
		44
		45	if (!mapchar)
		46	goto cp_convert;
		47
		48	/*
		49	* BB: Cannot handle remapping UNI_SLASH until all the calls to
		50	* build_path_from_dentry are modified, as they use slash as
		51	* separator.
		52	*/
		53	switch (le16_to_cpu(src_char)) {
		54	case UNI_COLON:
		55	*target = ':';
		56	break;
		57	case UNI_ASTERIK:
		58	target = '';
		59	break;
		60	case UNI_QUESTION:
		61	*target = '?';
		62	break;
		63	case UNI_PIPE:
		64	*target = '\|';
		65	break;
		66	case UNI_GRTRTHAN:
		67	*target = '>';
		68	break;
		69	case UNI_LESSTHAN:
		70	*target = '<';
		71	break;
		72	default:
		73	goto cp_convert;
		74	}
		75
		76	out:
		77	return len;
		78
		79	cp_convert:
		80	len = cp->uni2char(le16_to_cpu(src_char), target,
		81	NLS_MAX_CHARSET_SIZE);
		82	if (len <= 0) {
		83	*target = '?';
		84	len = 1;
		85	}
		86	goto out;
		87	}
		88
		89	/*
		90	* cifs_from_ucs2 - convert utf16le string to local charset
		91	* @to - destination buffer
		92	* @from - source buffer
		93	* @tolen - destination buffer size (in bytes)
		94	* @fromlen - source buffer size (in bytes)
		95	* @codepage - codepage to which characters should be converted
		96	* @mapchar - should characters be remapped according to the mapchars option?
		97	*
		98	* Convert a little-endian ucs2le string (as sent by the server) to a string
		99	* in the provided codepage. The tolen and fromlen parameters are to ensure
		100	* that the code doesn't walk off of the end of the buffer (which is always
		101	* a danger if the alignment of the source buffer is off). The destination
		102	* string is always properly null terminated and fits in the destination
		103	* buffer. Returns the length of the destination string in bytes (including
		104	* null terminator).
		105	*
		106	* Note that some windows versions actually send multiword UTF-16 characters
		107	* instead of straight UCS-2. The linux nls routines however aren't able to
		108	* deal with those characters properly. In the event that we get some of
		109	* those characters, they won't be translated properly.
		110	*/
		111	int
		112	cifs_from_ucs2(char to, const __le16 from, int tolen, int fromlen,
		113	const struct nls_table *codepage, bool mapchar)
		114	{
		115	int i, charlen, safelen;
		116	int outlen = 0;
		117	int nullsize = nls_nullsize(codepage);
		118	int fromwords = fromlen / 2;
		119	char tmp[NLS_MAX_CHARSET_SIZE];
		120
		121	/*
		122	* because the chars can be of varying widths, we need to take care
		123	* not to overflow the destination buffer when we get close to the
		124	* end of it. Until we get to this offset, we don't need to check
		125	* for overflow however.
		126	*/
		127	safelen = tolen - (NLS_MAX_CHARSET_SIZE + nullsize);
		128
		129	for (i = 0; i < fromwords && from[i]; i++) {
		130	/*
		131	* check to see if converting this character might make the
		132	* conversion bleed into the null terminator
		133	*/
		134	if (outlen >= safelen) {
		135	charlen = cifs_mapchar(tmp, from[i], codepage, mapchar);
		136	if ((outlen + charlen) > (tolen - nullsize))
		137	break;
		138	}
		139
		140	/* put converted char into 'to' buffer */
		141	charlen = cifs_mapchar(&to[outlen], from[i], codepage, mapchar);
		142	outlen += charlen;
		143	}
		144
		145	/* properly null-terminate string */
		146	for (i = 0; i < nullsize; i++)
		147	to[outlen++] = 0;
		148
		149	return outlen;
		150	}
		151
		152	/*
29	* NAME: cifs_strfromUCS()	153	* NAME: cifs_strfromUCS()
30	*	154	*
31	* FUNCTION: Convert little-endian unicode string to character string	155	* FUNCTION: Convert little-endian unicode string to character string