Blame view

fs/cifs/cifs_unicode.c 16 KB
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
1
2
3
  /*
   *   fs/cifs/cifs_unicode.c
   *
d185cda77   Steve French   [CIFS] rename cif...
4
   *   Copyright (c) International Business Machines  Corp., 2000,2009
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
5
6
7
8
   *   Modified by Steve French (sfrench@us.ibm.com)
   *
   *   This program is free software;  you can redistribute it and/or modify
   *   it under the terms of the GNU General Public License as published by
221601c3d   Steve French   [CIFS] whitespace...
9
   *   the Free Software Foundation; either version 2 of the License, or
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
10
   *   (at your option) any later version.
221601c3d   Steve French   [CIFS] whitespace...
11
   *
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
12
13
14
15
16
17
   *   This program is distributed in the hope that it will be useful,
   *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
   *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
   *   the GNU General Public License for more details.
   *
   *   You should have received a copy of the GNU General Public License
221601c3d   Steve French   [CIFS] whitespace...
18
   *   along with this program;  if not, write to the Free Software
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
19
20
21
   *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
   */
  #include <linux/fs.h>
5a0e3ad6a   Tejun Heo   include cleanup: ...
22
  #include <linux/slab.h>
2baa26825   Steve French   Remap reserved po...
23
  #include "cifs_fs_sb.h"
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
24
25
26
  #include "cifs_unicode.h"
  #include "cifs_uniupr.h"
  #include "cifspdu.h"
3979877e5   Steve French   [CIFS] Support fo...
27
  #include "cifsglob.h"
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
28
  #include "cifs_debug.h"
2baa26825   Steve French   Remap reserved po...
29
30
31
32
33
34
35
36
37
38
39
40
41
  int cifs_remap(struct cifs_sb_info *cifs_sb)
  {
  	int map_type;
  
  	if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MAP_SFM_CHR)
  		map_type = SFM_MAP_UNI_RSVD;
  	else if (cifs_sb->mnt_cifs_flags & CIFS_MOUNT_MAP_SPECIAL_CHR)
  		map_type = SFU_MAP_UNI_RSVD;
  	else
  		map_type = NO_MAP_UNI_RSVD;
  
  	return map_type;
  }
b693855fe   Steve French   Allow conversion ...
42
43
44
  /* Convert character using the SFU - "Services for Unix" remapping range */
  static bool
  convert_sfu_char(const __u16 src_char, char *target)
7fabf0c94   Jeff Layton   cifs: add replace...
45
  {
7fabf0c94   Jeff Layton   cifs: add replace...
46
47
48
49
50
  	/*
  	 * BB: Cannot handle remapping UNI_SLASH until all the calls to
  	 *     build_path_from_dentry are modified, as they use slash as
  	 *     separator.
  	 */
ba2dbf30d   Jeff Layton   cifs: clean up un...
51
  	switch (src_char) {
7fabf0c94   Jeff Layton   cifs: add replace...
52
53
54
  	case UNI_COLON:
  		*target = ':';
  		break;
581ade4d1   Jeff Layton   cifs: clean up va...
55
  	case UNI_ASTERISK:
7fabf0c94   Jeff Layton   cifs: add replace...
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
  		*target = '*';
  		break;
  	case UNI_QUESTION:
  		*target = '?';
  		break;
  	case UNI_PIPE:
  		*target = '|';
  		break;
  	case UNI_GRTRTHAN:
  		*target = '>';
  		break;
  	case UNI_LESSTHAN:
  		*target = '<';
  		break;
  	default:
b693855fe   Steve French   Allow conversion ...
71
  		return false;
7fabf0c94   Jeff Layton   cifs: add replace...
72
  	}
b693855fe   Steve French   Allow conversion ...
73
74
  	return true;
  }
7fabf0c94   Jeff Layton   cifs: add replace...
75

b693855fe   Steve French   Allow conversion ...
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
  /* Convert character using the SFM - "Services for Mac" remapping range */
  static bool
  convert_sfm_char(const __u16 src_char, char *target)
  {
  	switch (src_char) {
  	case SFM_COLON:
  		*target = ':';
  		break;
  	case SFM_ASTERISK:
  		*target = '*';
  		break;
  	case SFM_QUESTION:
  		*target = '?';
  		break;
  	case SFM_PIPE:
  		*target = '|';
  		break;
  	case SFM_GRTRTHAN:
  		*target = '>';
  		break;
  	case SFM_LESSTHAN:
  		*target = '<';
  		break;
  	case SFM_SLASH:
  		*target = '\\';
  		break;
45e8a2583   Steve French   File names with t...
102
103
104
105
106
107
  	case SFM_SPACE:
  		*target = ' ';
  		break;
  	case SFM_PERIOD:
  		*target = '.';
  		break;
b693855fe   Steve French   Allow conversion ...
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
  	default:
  		return false;
  	}
  	return true;
  }
  
  
  /*
   * cifs_mapchar - convert a host-endian char to proper char in codepage
   * @target - where converted character should be copied
   * @src_char - 2 byte host-endian source character
   * @cp - codepage to which character should be converted
   * @map_type - How should the 7 NTFS/SMB reserved characters be mapped to UCS2?
   *
   * This function handles the conversion of a single character. It is the
   * responsibility of the caller to ensure that the target buffer is large
   * enough to hold the result of the conversion (at least NLS_MAX_CHARSET_SIZE).
   */
  static int
b29103076   Nakajima Akira   Fix to convert SU...
127
  cifs_mapchar(char *target, const __u16 *from, const struct nls_table *cp,
b693855fe   Steve French   Allow conversion ...
128
129
130
  	     int maptype)
  {
  	int len = 1;
b29103076   Nakajima Akira   Fix to convert SU...
131
132
133
  	__u16 src_char;
  
  	src_char = *from;
b693855fe   Steve French   Allow conversion ...
134
135
136
137
138
139
  
  	if ((maptype == SFM_MAP_UNI_RSVD) && convert_sfm_char(src_char, target))
  		return len;
  	else if ((maptype == SFU_MAP_UNI_RSVD) &&
  		  convert_sfu_char(src_char, target))
  		return len;
7fabf0c94   Jeff Layton   cifs: add replace...
140

b693855fe   Steve French   Allow conversion ...
141
  	/* if character not one of seven in special remap set */
ba2dbf30d   Jeff Layton   cifs: clean up un...
142
  	len = cp->uni2char(src_char, target, NLS_MAX_CHARSET_SIZE);
b29103076   Nakajima Akira   Fix to convert SU...
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
  	if (len <= 0)
  		goto surrogate_pair;
  
  	return len;
  
  surrogate_pair:
  	/* convert SURROGATE_PAIR and IVS */
  	if (strcmp(cp->charset, "utf8"))
  		goto unknown;
  	len = utf16s_to_utf8s(from, 3, UTF16_LITTLE_ENDIAN, target, 6);
  	if (len <= 0)
  		goto unknown;
  	return len;
  
  unknown:
  	*target = '?';
  	len = 1;
b693855fe   Steve French   Allow conversion ...
160
  	return len;
7fabf0c94   Jeff Layton   cifs: add replace...
161
162
163
  }
  
  /*
acbbb76a2   Steve French   CIFS: Rename *UCS...
164
   * cifs_from_utf16 - convert utf16le string to local charset
7fabf0c94   Jeff Layton   cifs: add replace...
165
166
167
168
169
170
171
   * @to - destination buffer
   * @from - source buffer
   * @tolen - destination buffer size (in bytes)
   * @fromlen - source buffer size (in bytes)
   * @codepage - codepage to which characters should be converted
   * @mapchar - should characters be remapped according to the mapchars option?
   *
acbbb76a2   Steve French   CIFS: Rename *UCS...
172
   * Convert a little-endian utf16le string (as sent by the server) to a string
7fabf0c94   Jeff Layton   cifs: add replace...
173
174
175
176
177
178
179
180
   * in the provided codepage. The tolen and fromlen parameters are to ensure
   * that the code doesn't walk off of the end of the buffer (which is always
   * a danger if the alignment of the source buffer is off). The destination
   * string is always properly null terminated and fits in the destination
   * buffer. Returns the length of the destination string in bytes (including
   * null terminator).
   *
   * Note that some windows versions actually send multiword UTF-16 characters
acbbb76a2   Steve French   CIFS: Rename *UCS...
181
   * instead of straight UTF16-2. The linux nls routines however aren't able to
7fabf0c94   Jeff Layton   cifs: add replace...
182
183
184
185
   * deal with those characters properly. In the event that we get some of
   * those characters, they won't be translated properly.
   */
  int
acbbb76a2   Steve French   CIFS: Rename *UCS...
186
  cifs_from_utf16(char *to, const __le16 *from, int tolen, int fromlen,
b693855fe   Steve French   Allow conversion ...
187
  		const struct nls_table *codepage, int map_type)
7fabf0c94   Jeff Layton   cifs: add replace...
188
189
190
191
192
193
  {
  	int i, charlen, safelen;
  	int outlen = 0;
  	int nullsize = nls_nullsize(codepage);
  	int fromwords = fromlen / 2;
  	char tmp[NLS_MAX_CHARSET_SIZE];
b29103076   Nakajima Akira   Fix to convert SU...
194
  	__u16 ftmp[3];		/* ftmp[3] = 3array x 2bytes = 6bytes UTF-16 */
7fabf0c94   Jeff Layton   cifs: add replace...
195
196
197
198
199
200
201
202
  
  	/*
  	 * because the chars can be of varying widths, we need to take care
  	 * not to overflow the destination buffer when we get close to the
  	 * end of it. Until we get to this offset, we don't need to check
  	 * for overflow however.
  	 */
  	safelen = tolen - (NLS_MAX_CHARSET_SIZE + nullsize);
ba2dbf30d   Jeff Layton   cifs: clean up un...
203
  	for (i = 0; i < fromwords; i++) {
b29103076   Nakajima Akira   Fix to convert SU...
204
205
  		ftmp[0] = get_unaligned_le16(&from[i]);
  		if (ftmp[0] == 0)
ba2dbf30d   Jeff Layton   cifs: clean up un...
206
  			break;
b29103076   Nakajima Akira   Fix to convert SU...
207
208
209
210
211
212
213
214
  		if (i + 1 < fromwords)
  			ftmp[1] = get_unaligned_le16(&from[i + 1]);
  		else
  			ftmp[1] = 0;
  		if (i + 2 < fromwords)
  			ftmp[2] = get_unaligned_le16(&from[i + 2]);
  		else
  			ftmp[2] = 0;
ba2dbf30d   Jeff Layton   cifs: clean up un...
215

7fabf0c94   Jeff Layton   cifs: add replace...
216
217
218
219
220
  		/*
  		 * check to see if converting this character might make the
  		 * conversion bleed into the null terminator
  		 */
  		if (outlen >= safelen) {
b693855fe   Steve French   Allow conversion ...
221
  			charlen = cifs_mapchar(tmp, ftmp, codepage, map_type);
7fabf0c94   Jeff Layton   cifs: add replace...
222
223
224
225
226
  			if ((outlen + charlen) > (tolen - nullsize))
  				break;
  		}
  
  		/* put converted char into 'to' buffer */
b693855fe   Steve French   Allow conversion ...
227
  		charlen = cifs_mapchar(&to[outlen], ftmp, codepage, map_type);
7fabf0c94   Jeff Layton   cifs: add replace...
228
  		outlen += charlen;
b29103076   Nakajima Akira   Fix to convert SU...
229
230
231
232
233
234
235
236
237
238
239
  
  		/* charlen (=bytes of UTF-8 for 1 character)
  		 * 4bytes UTF-8(surrogate pair) is charlen=4
  		 *   (4bytes UTF-16 code)
  		 * 7-8bytes UTF-8(IVS) is charlen=3+4 or 4+4
  		 *   (2 UTF-8 pairs divided to 2 UTF-16 pairs) */
  		if (charlen == 4)
  			i++;
  		else if (charlen >= 5)
  			/* 5-6bytes UTF-8 */
  			i += 2;
7fabf0c94   Jeff Layton   cifs: add replace...
240
241
242
243
244
245
246
247
248
249
  	}
  
  	/* properly null-terminate string */
  	for (i = 0; i < nullsize; i++)
  		to[outlen++] = 0;
  
  	return outlen;
  }
  
  /*
acbbb76a2   Steve French   CIFS: Rename *UCS...
250
   * NAME:	cifs_strtoUTF16()
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
251
252
253
254
255
   *
   * FUNCTION:	Convert character string to unicode string
   *
   */
  int
acbbb76a2   Steve French   CIFS: Rename *UCS...
256
  cifs_strtoUTF16(__le16 *to, const char *from, int len,
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
257
258
259
260
  	      const struct nls_table *codepage)
  {
  	int charlen;
  	int i;
ba2dbf30d   Jeff Layton   cifs: clean up un...
261
  	wchar_t wchar_to; /* needed to quiet sparse */
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
262

fd3ba42c7   Frediano Ziglio   Convert properly ...
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
  	/* special case for utf8 to handle no plane0 chars */
  	if (!strcmp(codepage->charset, "utf8")) {
  		/*
  		 * convert utf8 -> utf16, we assume we have enough space
  		 * as caller should have assumed conversion does not overflow
  		 * in destination len is length in wchar_t units (16bits)
  		 */
  		i  = utf8s_to_utf16s(from, len, UTF16_LITTLE_ENDIAN,
  				       (wchar_t *) to, len);
  
  		/* if success terminate and exit */
  		if (i >= 0)
  			goto success;
  		/*
  		 * if fails fall back to UCS encoding as this
  		 * function should not return negative values
  		 * currently can fail only if source contains
  		 * invalid encoded characters
  		 */
  	}
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
283
  	for (i = 0; len && *from; i++, from += charlen, len -= charlen) {
ba2dbf30d   Jeff Layton   cifs: clean up un...
284
  		charlen = codepage->char2uni(from, len, &wchar_to);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
285
  		if (charlen < 1) {
f96637be0   Joe Perches   [CIFS] cifs: Rena...
286
287
288
  			cifs_dbg(VFS, "strtoUTF16: char2uni of 0x%x returned %d
  ",
  				 *from, charlen);
69114089b   Steve French   [CIFS] Reduce spa...
289
  			/* A question mark */
ba2dbf30d   Jeff Layton   cifs: clean up un...
290
  			wchar_to = 0x003f;
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
291
  			charlen = 1;
ba2dbf30d   Jeff Layton   cifs: clean up un...
292
293
  		}
  		put_unaligned_le16(wchar_to, &to[i]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
294
  	}
fd3ba42c7   Frediano Ziglio   Convert properly ...
295
  success:
ba2dbf30d   Jeff Layton   cifs: clean up un...
296
  	put_unaligned_le16(0, &to[i]);
1da177e4c   Linus Torvalds   Linux-2.6.12-rc2
297
298
  	return i;
  }
066ce6899   Jeff Layton   cifs: rename cifs...
299
  /*
b29103076   Nakajima Akira   Fix to convert SU...
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
   * cifs_utf16_bytes - how long will a string be after conversion?
   * @utf16 - pointer to input string
   * @maxbytes - don't go past this many bytes of input string
   * @codepage - destination codepage
   *
   * Walk a utf16le string and return the number of bytes that the string will
   * be after being converted to the given charset, not including any null
   * termination required. Don't walk past maxbytes in the source buffer.
   */
  int
  cifs_utf16_bytes(const __le16 *from, int maxbytes,
  		const struct nls_table *codepage)
  {
  	int i;
  	int charlen, outlen = 0;
  	int maxwords = maxbytes / 2;
  	char tmp[NLS_MAX_CHARSET_SIZE];
  	__u16 ftmp[3];
  
  	for (i = 0; i < maxwords; i++) {
  		ftmp[0] = get_unaligned_le16(&from[i]);
  		if (ftmp[0] == 0)
  			break;
  		if (i + 1 < maxwords)
  			ftmp[1] = get_unaligned_le16(&from[i + 1]);
  		else
  			ftmp[1] = 0;
  		if (i + 2 < maxwords)
  			ftmp[2] = get_unaligned_le16(&from[i + 2]);
  		else
  			ftmp[2] = 0;
  
  		charlen = cifs_mapchar(tmp, ftmp, codepage, NO_MAP_UNI_RSVD);
  		outlen += charlen;
  	}
  
  	return outlen;
  }
  
  /*
acbbb76a2   Steve French   CIFS: Rename *UCS...
340
341
   * cifs_strndup_from_utf16 - copy a string from wire format to the local
   * codepage
066ce6899   Jeff Layton   cifs: rename cifs...
342
343
344
345
346
347
348
349
350
351
   * @src - source string
   * @maxlen - don't walk past this many bytes in the source string
   * @is_unicode - is this a unicode string?
   * @codepage - destination codepage
   *
   * Take a string given by the server, convert it to the local codepage and
   * put it in a new buffer. Returns a pointer to the new string or NULL on
   * error.
   */
  char *
acbbb76a2   Steve French   CIFS: Rename *UCS...
352
353
  cifs_strndup_from_utf16(const char *src, const int maxlen,
  			const bool is_unicode, const struct nls_table *codepage)
066ce6899   Jeff Layton   cifs: rename cifs...
354
355
356
357
358
  {
  	int len;
  	char *dst;
  
  	if (is_unicode) {
acbbb76a2   Steve French   CIFS: Rename *UCS...
359
  		len = cifs_utf16_bytes((__le16 *) src, maxlen, codepage);
066ce6899   Jeff Layton   cifs: rename cifs...
360
361
362
363
  		len += nls_nullsize(codepage);
  		dst = kmalloc(len, GFP_KERNEL);
  		if (!dst)
  			return NULL;
acbbb76a2   Steve French   CIFS: Rename *UCS...
364
  		cifs_from_utf16(dst, (__le16 *) src, len, maxlen, codepage,
b693855fe   Steve French   Allow conversion ...
365
  			       NO_MAP_UNI_RSVD);
066ce6899   Jeff Layton   cifs: rename cifs...
366
367
368
369
370
371
372
373
374
375
376
  	} else {
  		len = strnlen(src, maxlen);
  		len++;
  		dst = kmalloc(len, GFP_KERNEL);
  		if (!dst)
  			return NULL;
  		strlcpy(dst, src, len);
  	}
  
  	return dst;
  }
a4153cb1d   Steve French   Allow conversion ...
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
  static __le16 convert_to_sfu_char(char src_char)
  {
  	__le16 dest_char;
  
  	switch (src_char) {
  	case ':':
  		dest_char = cpu_to_le16(UNI_COLON);
  		break;
  	case '*':
  		dest_char = cpu_to_le16(UNI_ASTERISK);
  		break;
  	case '?':
  		dest_char = cpu_to_le16(UNI_QUESTION);
  		break;
  	case '<':
  		dest_char = cpu_to_le16(UNI_LESSTHAN);
  		break;
  	case '>':
  		dest_char = cpu_to_le16(UNI_GRTRTHAN);
  		break;
  	case '|':
  		dest_char = cpu_to_le16(UNI_PIPE);
  		break;
  	default:
  		dest_char = 0;
  	}
  
  	return dest_char;
  }
45e8a2583   Steve French   File names with t...
406
  static __le16 convert_to_sfm_char(char src_char, bool end_of_string)
a4153cb1d   Steve French   Allow conversion ...
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
  {
  	__le16 dest_char;
  
  	switch (src_char) {
  	case ':':
  		dest_char = cpu_to_le16(SFM_COLON);
  		break;
  	case '*':
  		dest_char = cpu_to_le16(SFM_ASTERISK);
  		break;
  	case '?':
  		dest_char = cpu_to_le16(SFM_QUESTION);
  		break;
  	case '<':
  		dest_char = cpu_to_le16(SFM_LESSTHAN);
  		break;
  	case '>':
  		dest_char = cpu_to_le16(SFM_GRTRTHAN);
  		break;
  	case '|':
  		dest_char = cpu_to_le16(SFM_PIPE);
  		break;
45e8a2583   Steve French   File names with t...
429
430
431
432
433
434
435
436
437
438
439
440
  	case '.':
  		if (end_of_string)
  			dest_char = cpu_to_le16(SFM_PERIOD);
  		else
  			dest_char = 0;
  		break;
  	case ' ':
  		if (end_of_string)
  			dest_char = cpu_to_le16(SFM_SPACE);
  		else
  			dest_char = 0;
  		break;
a4153cb1d   Steve French   Allow conversion ...
441
442
443
444
445
446
  	default:
  		dest_char = 0;
  	}
  
  	return dest_char;
  }
84cdf74e8   Jeff Layton   cifs: fix unalign...
447
448
449
450
451
452
453
  /*
   * Convert 16 bit Unicode pathname to wire format from string in current code
   * page. Conversion may involve remapping up the six characters that are
   * only legal in POSIX-like OS (if they are present in the string). Path
   * names are little endian 16 bit Unicode on the wire
   */
  int
acbbb76a2   Steve French   CIFS: Rename *UCS...
454
  cifsConvertToUTF16(__le16 *target, const char *source, int srclen,
a4153cb1d   Steve French   Allow conversion ...
455
  		 const struct nls_table *cp, int map_chars)
84cdf74e8   Jeff Layton   cifs: fix unalign...
456
  {
ce36d9ab3   Steve French   [CIFS] fix mount ...
457
458
  	int i, charlen;
  	int j = 0;
84cdf74e8   Jeff Layton   cifs: fix unalign...
459
  	char src_char;
581ade4d1   Jeff Layton   cifs: clean up va...
460
461
  	__le16 dst_char;
  	wchar_t tmp;
b29103076   Nakajima Akira   Fix to convert SU...
462
463
464
  	wchar_t *wchar_to;	/* UTF-16 */
  	int ret;
  	unicode_t u;
84cdf74e8   Jeff Layton   cifs: fix unalign...
465

a4153cb1d   Steve French   Allow conversion ...
466
  	if (map_chars == NO_MAP_UNI_RSVD)
acbbb76a2   Steve French   CIFS: Rename *UCS...
467
  		return cifs_strtoUTF16(target, source, PATH_MAX, cp);
84cdf74e8   Jeff Layton   cifs: fix unalign...
468

b29103076   Nakajima Akira   Fix to convert SU...
469
  	wchar_to = kzalloc(6, GFP_KERNEL);
ce36d9ab3   Steve French   [CIFS] fix mount ...
470
  	for (i = 0; i < srclen; j++) {
84cdf74e8   Jeff Layton   cifs: fix unalign...
471
  		src_char = source[i];
11379b5e3   Jeff Layton   cifs: fix cifsCon...
472
  		charlen = 1;
a4153cb1d   Steve French   Allow conversion ...
473
474
475
  
  		/* check if end of string */
  		if (src_char == 0)
acbbb76a2   Steve French   CIFS: Rename *UCS...
476
  			goto ctoUTF16_out;
a4153cb1d   Steve French   Allow conversion ...
477
478
479
480
  
  		/* see if we must remap this char */
  		if (map_chars == SFU_MAP_UNI_RSVD)
  			dst_char = convert_to_sfu_char(src_char);
45e8a2583   Steve French   File names with t...
481
482
483
484
485
486
487
488
489
490
  		else if (map_chars == SFM_MAP_UNI_RSVD) {
  			bool end_of_string;
  
  			if (i == srclen - 1)
  				end_of_string = true;
  			else
  				end_of_string = false;
  
  			dst_char = convert_to_sfm_char(src_char, end_of_string);
  		} else
a4153cb1d   Steve French   Allow conversion ...
491
  			dst_char = 0;
84cdf74e8   Jeff Layton   cifs: fix unalign...
492
493
494
495
496
  		/*
  		 * FIXME: We can not handle remapping backslash (UNI_SLASH)
  		 * until all the calls to build_path_from_dentry are modified,
  		 * as they use backslash as separator.
  		 */
a4153cb1d   Steve French   Allow conversion ...
497
  		if (dst_char == 0) {
581ade4d1   Jeff Layton   cifs: clean up va...
498
499
  			charlen = cp->char2uni(source + i, srclen - i, &tmp);
  			dst_char = cpu_to_le16(tmp);
84cdf74e8   Jeff Layton   cifs: fix unalign...
500
501
502
503
  			/*
  			 * if no match, use question mark, which at least in
  			 * some cases serves as wild card
  			 */
b29103076   Nakajima Akira   Fix to convert SU...
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
  			if (charlen > 0)
  				goto ctoUTF16;
  
  			/* convert SURROGATE_PAIR */
  			if (strcmp(cp->charset, "utf8") || !wchar_to)
  				goto unknown;
  			if (*(source + i) & 0x80) {
  				charlen = utf8_to_utf32(source + i, 6, &u);
  				if (charlen < 0)
  					goto unknown;
  			} else
  				goto unknown;
  			ret  = utf8s_to_utf16s(source + i, charlen,
  					       UTF16_LITTLE_ENDIAN,
  					       wchar_to, 6);
  			if (ret < 0)
  				goto unknown;
  
  			i += charlen;
  			dst_char = cpu_to_le16(*wchar_to);
  			if (charlen <= 3)
  				/* 1-3bytes UTF-8 to 2bytes UTF-16 */
  				put_unaligned(dst_char, &target[j]);
  			else if (charlen == 4) {
  				/* 4bytes UTF-8(surrogate pair) to 4bytes UTF-16
  				 * 7-8bytes UTF-8(IVS) divided to 2 UTF-16
  				 *   (charlen=3+4 or 4+4) */
  				put_unaligned(dst_char, &target[j]);
  				dst_char = cpu_to_le16(*(wchar_to + 1));
  				j++;
  				put_unaligned(dst_char, &target[j]);
  			} else if (charlen >= 5) {
  				/* 5-6bytes UTF-8 to 6bytes UTF-16 */
  				put_unaligned(dst_char, &target[j]);
  				dst_char = cpu_to_le16(*(wchar_to + 1));
  				j++;
  				put_unaligned(dst_char, &target[j]);
  				dst_char = cpu_to_le16(*(wchar_to + 2));
  				j++;
  				put_unaligned(dst_char, &target[j]);
84cdf74e8   Jeff Layton   cifs: fix unalign...
544
  			}
b29103076   Nakajima Akira   Fix to convert SU...
545
546
547
548
549
  			continue;
  
  unknown:
  			dst_char = cpu_to_le16(0x003f);
  			charlen = 1;
84cdf74e8   Jeff Layton   cifs: fix unalign...
550
  		}
b29103076   Nakajima Akira   Fix to convert SU...
551
552
  
  ctoUTF16:
11379b5e3   Jeff Layton   cifs: fix cifsCon...
553
554
555
556
557
  		/*
  		 * character may take more than one byte in the source string,
  		 * but will take exactly two bytes in the target string
  		 */
  		i += charlen;
581ade4d1   Jeff Layton   cifs: clean up va...
558
  		put_unaligned(dst_char, &target[j]);
84cdf74e8   Jeff Layton   cifs: fix unalign...
559
  	}
acbbb76a2   Steve French   CIFS: Rename *UCS...
560
  ctoUTF16_out:
ce36d9ab3   Steve French   [CIFS] fix mount ...
561
  	put_unaligned(0, &target[j]); /* Null terminate target unicode string */
b29103076   Nakajima Akira   Fix to convert SU...
562
  	kfree(wchar_to);
c73f69398   Jeff Layton   cifs: fix return ...
563
  	return j;
84cdf74e8   Jeff Layton   cifs: fix unalign...
564
  }
2503a0dba   Pavel Shilovsky   CIFS: Add SMB2 su...
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
  
  #ifdef CONFIG_CIFS_SMB2
  /*
   * cifs_local_to_utf16_bytes - how long will a string be after conversion?
   * @from - pointer to input string
   * @maxbytes - don't go past this many bytes of input string
   * @codepage - source codepage
   *
   * Walk a string and return the number of bytes that the string will
   * be after being converted to the given charset, not including any null
   * termination required. Don't walk past maxbytes in the source buffer.
   */
  
  static int
  cifs_local_to_utf16_bytes(const char *from, int len,
  			  const struct nls_table *codepage)
  {
  	int charlen;
  	int i;
  	wchar_t wchar_to;
  
  	for (i = 0; len && *from; i++, from += charlen, len -= charlen) {
  		charlen = codepage->char2uni(from, len, &wchar_to);
  		/* Failed conversion defaults to a question mark */
  		if (charlen < 1)
  			charlen = 1;
  	}
  	return 2 * i; /* UTF16 characters are two bytes */
  }
  
  /*
   * cifs_strndup_to_utf16 - copy a string to wire format from the local codepage
   * @src - source string
   * @maxlen - don't walk past this many bytes in the source string
   * @utf16_len - the length of the allocated string in bytes (including null)
   * @cp - source codepage
   * @remap - map special chars
   *
   * Take a string convert it from the local codepage to UTF16 and
   * put it in a new buffer. Returns a pointer to the new string or NULL on
   * error.
   */
  __le16 *
  cifs_strndup_to_utf16(const char *src, const int maxlen, int *utf16_len,
  		      const struct nls_table *cp, int remap)
  {
  	int len;
  	__le16 *dst;
  
  	len = cifs_local_to_utf16_bytes(src, maxlen, cp);
  	len += 2; /* NULL */
  	dst = kmalloc(len, GFP_KERNEL);
  	if (!dst) {
  		*utf16_len = 0;
  		return NULL;
  	}
  	cifsConvertToUTF16(dst, src, strlen(src), cp, remap);
  	*utf16_len = len;
  	return dst;
  }
  #endif /* CONFIG_CIFS_SMB2 */