/*
 * linux/fs/nls/nls_base.c
 *
 * Native language support--charsets and unicode translations.
 * By Gordon Chaffee 1996, 1997
 *
 * Unicode based case conversion 1999 by Wolfram Pienkoss
 *
 */

#include <linux/module.h>
#include <linux/string.h>
#include <linux/nls.h>
#include <linux/kernel.h>
#include <linux/errno.h>
#include <linux/kmod.h>
#include <linux/spinlock.h>
#include <asm/byteorder.h>

201da177e4SLinus Torvalds static struct nls_table default_table;
211da177e4SLinus Torvalds static struct nls_table *tables = &default_table;
221da177e4SLinus Torvalds static DEFINE_SPINLOCK(nls_lock);
231da177e4SLinus Torvalds
/*
 * Sample implementation from Unicode home page.
 * http://www.stonehand.com/unicode/standard/fss-utf.html
 *
 * One entry describes one UTF-8 sequence length.
 */
struct utf8_table {
	int	cmask;	/* lead-byte bits that carry the length marker */
	int	cval;	/* value of those bits for this sequence length */
	int	shift;	/* how far the lead byte's payload is shifted left */
	long	lmask;	/* payload mask, i.e. largest value of this length */
	long	lval;	/* smallest value that is allowed to use this length */
};

36b9ec0339SDenys Vlasenko static const struct utf8_table utf8_table[] =
371da177e4SLinus Torvalds {
381da177e4SLinus Torvalds {0x80, 0x00, 0*6, 0x7F, 0, /* 1 byte sequence */},
391da177e4SLinus Torvalds {0xE0, 0xC0, 1*6, 0x7FF, 0x80, /* 2 byte sequence */},
401da177e4SLinus Torvalds {0xF0, 0xE0, 2*6, 0xFFFF, 0x800, /* 3 byte sequence */},
411da177e4SLinus Torvalds {0xF8, 0xF0, 3*6, 0x1FFFFF, 0x10000, /* 4 byte sequence */},
421da177e4SLinus Torvalds {0xFC, 0xF8, 4*6, 0x3FFFFFF, 0x200000, /* 5 byte sequence */},
431da177e4SLinus Torvalds {0xFE, 0xFC, 5*6, 0x7FFFFFFF, 0x4000000, /* 6 byte sequence */},
441da177e4SLinus Torvalds {0, /* end of table */}
451da177e4SLinus Torvalds };
461da177e4SLinus Torvalds
/* Largest code point accepted here, and the number of code points per plane. */
#define UNICODE_MAX	0x0010ffff
#define PLANE_SIZE	0x00010000

/*
 * A 16-bit unit v is a surrogate when (v & SURROGATE_MASK) == SURROGATE_PAIR.
 * SURROGATE_LOW is set in the second (low) half of a pair, and
 * SURROGATE_BITS extracts the 10 payload bits each half carries.
 */
#define SURROGATE_MASK	0xfffff800
#define SURROGATE_PAIR	0x0000d800
#define SURROGATE_LOW	0x00000400
#define SURROGATE_BITS	0x000003ff

/*
 * Decode the single UTF-8 sequence starting at @s.
 *
 * @s:     input bytes
 * @inlen: number of bytes that may be read from @s
 * @pu:    receives the decoded code point on success
 *
 * Returns the number of input bytes consumed, or -1 when the input is empty,
 * truncated or malformed, when the value is encoded with more bytes than
 * necessary, lies above UNICODE_MAX, or falls in the surrogate range.
 * *@pu is only written on success.
 */
int utf8_to_utf32(const u8 *s, int inlen, unicode_t *pu)
{
	unsigned long l;
	int c0, c, nc;
	const struct utf8_table *t;

	/* Without this the lead byte would be read from an empty buffer. */
	if (inlen <= 0)
		return -1;

	nc = 0;
	c0 = *s;
	l = c0;
	for (t = utf8_table; t->cmask; t++) {
		nc++;
		if ((c0 & t->cmask) == t->cval) {
			/* Lead byte announces an nc-byte sequence: validate. */
			l &= t->lmask;
			if (l < t->lval || l > UNICODE_MAX ||
					(l & SURROGATE_MASK) == SURROGATE_PAIR)
				return -1;
			*pu = (unicode_t) l;
			return nc;
		}
		/* Another byte is needed; make sure the caller supplied it. */
		if (inlen <= nc)
			return -1;
		s++;
		/* A continuation byte is 10xxxxxx; c keeps its low six bits. */
		c = (*s ^ 0x80) & 0xFF;
		if (c & 0xC0)
			return -1;
		l = (l << 6) | c;
	}
	return -1;
}
EXPORT_SYMBOL(utf8_to_utf32);

/*
 * Encode code point @u as UTF-8 into @s.
 *
 * @u:      code point to encode
 * @s:      output buffer; when NULL nothing is done and 0 is returned
 * @maxout: number of bytes available at @s
 *
 * Returns the number of bytes written, or -1 when @u is above UNICODE_MAX,
 * is a surrogate, or does not fit into @maxout bytes.  A zero or negative
 * @maxout never causes a write.
 */
int utf32_to_utf8(unicode_t u, u8 *s, int maxout)
{
	unsigned long l;
	int c, nc;
	const struct utf8_table *t;

	if (!s)
		return 0;

	l = u;
	if (l > UNICODE_MAX || (l & SURROGATE_MASK) == SURROGATE_PAIR)
		return -1;

	nc = 0;
	/*
	 * Each table step stands for one more output byte, so the remaining
	 * room is consumed in lock-step.  Testing "maxout > 0" (rather than
	 * plain non-zero) keeps a negative size from being treated as
	 * unlimited room.
	 */
	for (t = utf8_table; t->cmask && maxout > 0; t++, maxout--) {
		nc++;
		if (l <= t->lmask) {
			c = t->shift;
			/* Lead byte: length marker plus the topmost payload bits. */
			*s = (u8) (t->cval | (l >> c));
			/* Trailing bytes: six payload bits each, high to low. */
			while (c > 0) {
				c -= 6;
				s++;
				*s = (u8) (0x80 | ((l >> c) & 0x3F));
			}
			return nc;
		}
	}
	return -1;
}
EXPORT_SYMBOL(utf32_to_utf8);

/*
 * Store the 16-bit unit @c at @s in the byte order selected by @endian.
 * Any value other than the two explicit orders stores @c unchanged.
 */
static inline void put_utf16(wchar_t *s, unsigned c, enum utf16_endian endian)
{
	if (endian == UTF16_LITTLE_ENDIAN)
		*s = __cpu_to_le16(c);
	else if (endian == UTF16_BIG_ENDIAN)
		*s = __cpu_to_be16(c);
	else
		*s = (wchar_t) c;
}

/*
 * Convert a UTF-8 string to UTF-16.
 *
 * @s:      UTF-8 input; conversion also stops at a NUL byte
 * @inlen:  number of input bytes
 * @endian: byte order of the produced units (see put_utf16())
 * @pwcs:   output buffer
 * @maxout: room in @pwcs, counted in 16-bit units
 *
 * Returns the number of units written, or -EINVAL as soon as
 * utf8_to_utf32() rejects a sequence.  A code point that needs a surrogate
 * pair ends the conversion when fewer than two units of room remain.
 */
int utf8s_to_utf16s(const u8 *s, int inlen, enum utf16_endian endian,
		wchar_t *pwcs, int maxout)
{
	u16 *out = pwcs;
	unicode_t cp;
	int len;

	while (inlen > 0 && maxout > 0 && *s) {
		/* Bytes below 0x80 map to a single unit with the same value. */
		if (!(*s & 0x80)) {
			put_utf16(out++, *s++, endian);
			inlen--;
			maxout--;
			continue;
		}

		len = utf8_to_utf32(s, inlen, &cp);
		if (len < 0)
			return -EINVAL;
		s += len;
		inlen -= len;

		/* Below PLANE_SIZE the code point fits into one unit. */
		if (cp < PLANE_SIZE) {
			put_utf16(out++, cp, endian);
			maxout--;
			continue;
		}

		/* Otherwise split it into a high/low surrogate pair. */
		if (maxout < 2)
			break;
		cp -= PLANE_SIZE;
		put_utf16(out++,
			  SURROGATE_PAIR | ((cp >> 10) & SURROGATE_BITS),
			  endian);
		put_utf16(out++,
			  SURROGATE_PAIR | SURROGATE_LOW | (cp & SURROGATE_BITS),
			  endian);
		maxout -= 2;
	}
	return out - pwcs;
}
EXPORT_SYMBOL(utf8s_to_utf16s);

get_utf16(unsigned c,enum utf16_endian endian)17474675a58SAlan Stern static inline unsigned long get_utf16(unsigned c, enum utf16_endian endian)
17574675a58SAlan Stern {
17674675a58SAlan Stern switch (endian) {
17774675a58SAlan Stern default:
17874675a58SAlan Stern return c;
17974675a58SAlan Stern case UTF16_LITTLE_ENDIAN:
18074675a58SAlan Stern return __le16_to_cpu(c);
18174675a58SAlan Stern case UTF16_BIG_ENDIAN:
18274675a58SAlan Stern return __be16_to_cpu(c);
18374675a58SAlan Stern }
18474675a58SAlan Stern }
18574675a58SAlan Stern
/*
 * Convert a UTF-16 string to UTF-8.
 *
 * @pwcs:   UTF-16 input; conversion also stops at a zero unit
 * @inlen:  number of input units
 * @endian: byte order of the input units (see get_utf16())
 * @s:      output buffer
 * @maxout: room in @s, in bytes
 *
 * Returns the number of bytes written.  Input that cannot be converted is
 * dropped silently: a low surrogate without a preceding high one, a high
 * surrogate not followed by a low one, and any character for which
 * utf32_to_utf8() returns -1.  A high surrogate that is the very last input
 * unit ends the conversion.
 */
int utf16s_to_utf8s(const wchar_t *pwcs, int inlen, enum utf16_endian endian,
		u8 *s, int maxout)
{
	u8 *out = s;
	unsigned long cp, low;
	int len;

	while (inlen > 0 && maxout > 0) {
		cp = get_utf16(*pwcs, endian);
		if (!cp)
			break;
		pwcs++;
		inlen--;

		/* Values up to 0x7f are copied as a single byte. */
		if (cp <= 0x7f) {
			*out++ = (u8) cp;
			maxout--;
			continue;
		}

		if ((cp & SURROGATE_MASK) == SURROGATE_PAIR) {
			/* Stray low half: ignore character and move on. */
			if (cp & SURROGATE_LOW)
				continue;
			if (inlen <= 0)
				break;
			/*
			 * Peek at the next unit.  It is only consumed when it
			 * really is the low half; otherwise the high half is
			 * ignored and the next unit is handled on its own.
			 */
			low = get_utf16(*pwcs, endian);
			if ((low & SURROGATE_MASK) != SURROGATE_PAIR ||
					!(low & SURROGATE_LOW))
				continue;
			cp = PLANE_SIZE + ((cp & SURROGATE_BITS) << 10)
					+ (low & SURROGATE_BITS);
			pwcs++;
			inlen--;
		}

		len = utf32_to_utf8(cp, out, maxout);
		/* On -1 the character is ignored and conversion moves on. */
		if (len != -1) {
			out += len;
			maxout -= len;
		}
	}
	return out - s;
}
EXPORT_SYMBOL(utf16s_to_utf8s);

__register_nls(struct nls_table * nls,struct module * owner)235479e64c2SAl Viro int __register_nls(struct nls_table *nls, struct module *owner)
2361da177e4SLinus Torvalds {
2371da177e4SLinus Torvalds struct nls_table ** tmp = &tables;
2381da177e4SLinus Torvalds
2391da177e4SLinus Torvalds if (nls->next)
2401da177e4SLinus Torvalds return -EBUSY;
2411da177e4SLinus Torvalds
242479e64c2SAl Viro nls->owner = owner;
2431da177e4SLinus Torvalds spin_lock(&nls_lock);
2441da177e4SLinus Torvalds while (*tmp) {
2451da177e4SLinus Torvalds if (nls == *tmp) {
2461da177e4SLinus Torvalds spin_unlock(&nls_lock);
2471da177e4SLinus Torvalds return -EBUSY;
2481da177e4SLinus Torvalds }
2491da177e4SLinus Torvalds tmp = &(*tmp)->next;
2501da177e4SLinus Torvalds }
2511da177e4SLinus Torvalds nls->next = tables;
2521da177e4SLinus Torvalds tables = nls;
2531da177e4SLinus Torvalds spin_unlock(&nls_lock);
2541da177e4SLinus Torvalds return 0;
2551da177e4SLinus Torvalds }
256479e64c2SAl Viro EXPORT_SYMBOL(__register_nls);
2571da177e4SLinus Torvalds
unregister_nls(struct nls_table * nls)2581da177e4SLinus Torvalds int unregister_nls(struct nls_table * nls)
2591da177e4SLinus Torvalds {
2601da177e4SLinus Torvalds struct nls_table ** tmp = &tables;
2611da177e4SLinus Torvalds
2621da177e4SLinus Torvalds spin_lock(&nls_lock);
2631da177e4SLinus Torvalds while (*tmp) {
2641da177e4SLinus Torvalds if (nls == *tmp) {
2651da177e4SLinus Torvalds *tmp = nls->next;
2661da177e4SLinus Torvalds spin_unlock(&nls_lock);
2671da177e4SLinus Torvalds return 0;
2681da177e4SLinus Torvalds }
2691da177e4SLinus Torvalds tmp = &(*tmp)->next;
2701da177e4SLinus Torvalds }
2711da177e4SLinus Torvalds spin_unlock(&nls_lock);
2721da177e4SLinus Torvalds return -EINVAL;
2731da177e4SLinus Torvalds }
2741da177e4SLinus Torvalds
find_nls(const char * charset)275*c1ed39ecSWinston Wen static struct nls_table *find_nls(const char *charset)
2761da177e4SLinus Torvalds {
2771da177e4SLinus Torvalds struct nls_table *nls;
2781da177e4SLinus Torvalds spin_lock(&nls_lock);
2791da177e4SLinus Torvalds for (nls = tables; nls; nls = nls->next) {
2801da177e4SLinus Torvalds if (!strcmp(nls->charset, charset))
2811da177e4SLinus Torvalds break;
2821da177e4SLinus Torvalds if (nls->alias && !strcmp(nls->alias, charset))
2831da177e4SLinus Torvalds break;
2841da177e4SLinus Torvalds }
2851da177e4SLinus Torvalds if (nls && !try_module_get(nls->owner))
2861da177e4SLinus Torvalds nls = NULL;
2871da177e4SLinus Torvalds spin_unlock(&nls_lock);
2881da177e4SLinus Torvalds return nls;
2891da177e4SLinus Torvalds }
2901da177e4SLinus Torvalds
/*
 * Return the table for @charset.  The lookup goes through
 * try_then_request_module() with the module name "nls_<charset>".
 * Returns NULL when no table could be found.
 */
struct nls_table *load_nls(const char *charset)
{
	struct nls_table *nls;

	nls = try_then_request_module(find_nls(charset), "nls_%s", charset);
	return nls;
}

unload_nls(struct nls_table * nls)2961da177e4SLinus Torvalds void unload_nls(struct nls_table *nls)
2971da177e4SLinus Torvalds {
2986d729e44SThomas Gleixner if (nls)
2991da177e4SLinus Torvalds module_put(nls->owner);
3001da177e4SLinus Torvalds }
3011da177e4SLinus Torvalds
/* Default charset -> Unicode map: every byte maps to the same code point. */
static const wchar_t charset2uni[256] = {
	/* 0x00 */
	0x0000, 0x0001, 0x0002, 0x0003, 0x0004, 0x0005, 0x0006, 0x0007,
	0x0008, 0x0009, 0x000a, 0x000b, 0x000c, 0x000d, 0x000e, 0x000f,
	/* 0x10 */
	0x0010, 0x0011, 0x0012, 0x0013, 0x0014, 0x0015, 0x0016, 0x0017,
	0x0018, 0x0019, 0x001a, 0x001b, 0x001c, 0x001d, 0x001e, 0x001f,
	/* 0x20 */
	0x0020, 0x0021, 0x0022, 0x0023, 0x0024, 0x0025, 0x0026, 0x0027,
	0x0028, 0x0029, 0x002a, 0x002b, 0x002c, 0x002d, 0x002e, 0x002f,
	/* 0x30 */
	0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037,
	0x0038, 0x0039, 0x003a, 0x003b, 0x003c, 0x003d, 0x003e, 0x003f,
	/* 0x40 */
	0x0040, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, 0x0046, 0x0047,
	0x0048, 0x0049, 0x004a, 0x004b, 0x004c, 0x004d, 0x004e, 0x004f,
	/* 0x50 */
	0x0050, 0x0051, 0x0052, 0x0053, 0x0054, 0x0055, 0x0056, 0x0057,
	0x0058, 0x0059, 0x005a, 0x005b, 0x005c, 0x005d, 0x005e, 0x005f,
	/* 0x60 */
	0x0060, 0x0061, 0x0062, 0x0063, 0x0064, 0x0065, 0x0066, 0x0067,
	0x0068, 0x0069, 0x006a, 0x006b, 0x006c, 0x006d, 0x006e, 0x006f,
	/* 0x70 */
	0x0070, 0x0071, 0x0072, 0x0073, 0x0074, 0x0075, 0x0076, 0x0077,
	0x0078, 0x0079, 0x007a, 0x007b, 0x007c, 0x007d, 0x007e, 0x007f,
	/* 0x80 */
	0x0080, 0x0081, 0x0082, 0x0083, 0x0084, 0x0085, 0x0086, 0x0087,
	0x0088, 0x0089, 0x008a, 0x008b, 0x008c, 0x008d, 0x008e, 0x008f,
	/* 0x90 */
	0x0090, 0x0091, 0x0092, 0x0093, 0x0094, 0x0095, 0x0096, 0x0097,
	0x0098, 0x0099, 0x009a, 0x009b, 0x009c, 0x009d, 0x009e, 0x009f,
	/* 0xa0 */
	0x00a0, 0x00a1, 0x00a2, 0x00a3, 0x00a4, 0x00a5, 0x00a6, 0x00a7,
	0x00a8, 0x00a9, 0x00aa, 0x00ab, 0x00ac, 0x00ad, 0x00ae, 0x00af,
	/* 0xb0 */
	0x00b0, 0x00b1, 0x00b2, 0x00b3, 0x00b4, 0x00b5, 0x00b6, 0x00b7,
	0x00b8, 0x00b9, 0x00ba, 0x00bb, 0x00bc, 0x00bd, 0x00be, 0x00bf,
	/* 0xc0 */
	0x00c0, 0x00c1, 0x00c2, 0x00c3, 0x00c4, 0x00c5, 0x00c6, 0x00c7,
	0x00c8, 0x00c9, 0x00ca, 0x00cb, 0x00cc, 0x00cd, 0x00ce, 0x00cf,
	/* 0xd0 */
	0x00d0, 0x00d1, 0x00d2, 0x00d3, 0x00d4, 0x00d5, 0x00d6, 0x00d7,
	0x00d8, 0x00d9, 0x00da, 0x00db, 0x00dc, 0x00dd, 0x00de, 0x00df,
	/* 0xe0 */
	0x00e0, 0x00e1, 0x00e2, 0x00e3, 0x00e4, 0x00e5, 0x00e6, 0x00e7,
	0x00e8, 0x00e9, 0x00ea, 0x00eb, 0x00ec, 0x00ed, 0x00ee, 0x00ef,
	/* 0xf0 */
	0x00f0, 0x00f1, 0x00f2, 0x00f3, 0x00f4, 0x00f5, 0x00f6, 0x00f7,
	0x00f8, 0x00f9, 0x00fa, 0x00fb, 0x00fc, 0x00fd, 0x00fe, 0x00ff,
};

/*
 * Unicode page 0x00 -> default charset: each low byte maps to itself.
 * The comment in front of a row gives the index of its first entry.
 */
static const unsigned char page00[256] = {
	/* 0x00 */ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
	/* 0x08 */ 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
	/* 0x10 */ 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
	/* 0x18 */ 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
	/* 0x20 */ 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27,
	/* 0x28 */ 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f,
	/* 0x30 */ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
	/* 0x38 */ 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f,
	/* 0x40 */ 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47,
	/* 0x48 */ 0x48, 0x49, 0x4a, 0x4b, 0x4c, 0x4d, 0x4e, 0x4f,
	/* 0x50 */ 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57,
	/* 0x58 */ 0x58, 0x59, 0x5a, 0x5b, 0x5c, 0x5d, 0x5e, 0x5f,
	/* 0x60 */ 0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67,
	/* 0x68 */ 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f,
	/* 0x70 */ 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77,
	/* 0x78 */ 0x78, 0x79, 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f,

	/* 0x80 */ 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
	/* 0x88 */ 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
	/* 0x90 */ 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
	/* 0x98 */ 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
	/* 0xa0 */ 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
	/* 0xa8 */ 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
	/* 0xb0 */ 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
	/* 0xb8 */ 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
	/* 0xc0 */ 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
	/* 0xc8 */ 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
	/* 0xd0 */ 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
	/* 0xd8 */ 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
	/* 0xe0 */ 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
	/* 0xe8 */ 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
	/* 0xf0 */ 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
	/* 0xf8 */ 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
};

421b9ec0339SDenys Vlasenko static const unsigned char *const page_uni2charset[256] = {
4221da177e4SLinus Torvalds page00
4231da177e4SLinus Torvalds };
4241da177e4SLinus Torvalds
/*
 * Lower-case map of the default charset: 0x41-0x5a ('A'-'Z') map to
 * 0x61-0x7a, every other byte maps to itself.
 * The comment in front of a row gives the index of its first entry.
 */
static const unsigned char charset2lower[256] = {
	/* 0x00 */ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
	/* 0x08 */ 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
	/* 0x10 */ 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
	/* 0x18 */ 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
	/* 0x20 */ 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27,
	/* 0x28 */ 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f,
	/* 0x30 */ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
	/* 0x38 */ 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f,
	/* 0x40 */ 0x40, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67,
	/* 0x48 */ 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f,
	/* 0x50 */ 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77,
	/* 0x58 */ 0x78, 0x79, 0x7a, 0x5b, 0x5c, 0x5d, 0x5e, 0x5f,
	/* 0x60 */ 0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67,
	/* 0x68 */ 0x68, 0x69, 0x6a, 0x6b, 0x6c, 0x6d, 0x6e, 0x6f,
	/* 0x70 */ 0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77,
	/* 0x78 */ 0x78, 0x79, 0x7a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f,

	/* 0x80 */ 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
	/* 0x88 */ 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
	/* 0x90 */ 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
	/* 0x98 */ 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
	/* 0xa0 */ 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
	/* 0xa8 */ 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
	/* 0xb0 */ 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
	/* 0xb8 */ 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
	/* 0xc0 */ 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
	/* 0xc8 */ 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
	/* 0xd0 */ 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
	/* 0xd8 */ 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
	/* 0xe0 */ 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
	/* 0xe8 */ 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
	/* 0xf0 */ 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
	/* 0xf8 */ 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
};

/*
 * Upper-case map of the default charset: 0x61-0x7a ('a'-'z') map to
 * 0x41-0x5a, every other byte maps to itself.
 * The comment in front of a row gives the index of its first entry.
 */
static const unsigned char charset2upper[256] = {
	/* 0x00 */ 0x00, 0x01, 0x02, 0x03, 0x04, 0x05, 0x06, 0x07,
	/* 0x08 */ 0x08, 0x09, 0x0a, 0x0b, 0x0c, 0x0d, 0x0e, 0x0f,
	/* 0x10 */ 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17,
	/* 0x18 */ 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f,
	/* 0x20 */ 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27,
	/* 0x28 */ 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f,
	/* 0x30 */ 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
	/* 0x38 */ 0x38, 0x39, 0x3a, 0x3b, 0x3c, 0x3d, 0x3e, 0x3f,
	/* 0x40 */ 0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47,
	/* 0x48 */ 0x48, 0x49, 0x4a, 0x4b, 0x4c, 0x4d, 0x4e, 0x4f,
	/* 0x50 */ 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57,
	/* 0x58 */ 0x58, 0x59, 0x5a, 0x5b, 0x5c, 0x5d, 0x5e, 0x5f,
	/* 0x60 */ 0x60, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47,
	/* 0x68 */ 0x48, 0x49, 0x4a, 0x4b, 0x4c, 0x4d, 0x4e, 0x4f,
	/* 0x70 */ 0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57,
	/* 0x78 */ 0x58, 0x59, 0x5a, 0x7b, 0x7c, 0x7d, 0x7e, 0x7f,

	/* 0x80 */ 0x80, 0x81, 0x82, 0x83, 0x84, 0x85, 0x86, 0x87,
	/* 0x88 */ 0x88, 0x89, 0x8a, 0x8b, 0x8c, 0x8d, 0x8e, 0x8f,
	/* 0x90 */ 0x90, 0x91, 0x92, 0x93, 0x94, 0x95, 0x96, 0x97,
	/* 0x98 */ 0x98, 0x99, 0x9a, 0x9b, 0x9c, 0x9d, 0x9e, 0x9f,
	/* 0xa0 */ 0xa0, 0xa1, 0xa2, 0xa3, 0xa4, 0xa5, 0xa6, 0xa7,
	/* 0xa8 */ 0xa8, 0xa9, 0xaa, 0xab, 0xac, 0xad, 0xae, 0xaf,
	/* 0xb0 */ 0xb0, 0xb1, 0xb2, 0xb3, 0xb4, 0xb5, 0xb6, 0xb7,
	/* 0xb8 */ 0xb8, 0xb9, 0xba, 0xbb, 0xbc, 0xbd, 0xbe, 0xbf,
	/* 0xc0 */ 0xc0, 0xc1, 0xc2, 0xc3, 0xc4, 0xc5, 0xc6, 0xc7,
	/* 0xc8 */ 0xc8, 0xc9, 0xca, 0xcb, 0xcc, 0xcd, 0xce, 0xcf,
	/* 0xd0 */ 0xd0, 0xd1, 0xd2, 0xd3, 0xd4, 0xd5, 0xd6, 0xd7,
	/* 0xd8 */ 0xd8, 0xd9, 0xda, 0xdb, 0xdc, 0xdd, 0xde, 0xdf,
	/* 0xe0 */ 0xe0, 0xe1, 0xe2, 0xe3, 0xe4, 0xe5, 0xe6, 0xe7,
	/* 0xe8 */ 0xe8, 0xe9, 0xea, 0xeb, 0xec, 0xed, 0xee, 0xef,
	/* 0xf0 */ 0xf0, 0xf1, 0xf2, 0xf3, 0xf4, 0xf5, 0xf6, 0xf7,
	/* 0xf8 */ 0xf8, 0xf9, 0xfa, 0xfb, 0xfc, 0xfd, 0xfe, 0xff,
};


/*
 * Default table: translate the Unicode value @uni into one charset byte.
 *
 * Returns 1 after storing the byte in out[0], -ENAMETOOLONG when @boundlen
 * leaves no room, or -EINVAL when the page for the high byte of @uni is
 * absent or the entry for the low byte is zero.
 */
static int uni2char(wchar_t uni, unsigned char *out, int boundlen)
{
	const unsigned char *page;
	unsigned char lo = uni & 0x00ff;
	unsigned char hi = (uni & 0xff00) >> 8;

	if (boundlen <= 0)
		return -ENAMETOOLONG;

	page = page_uni2charset[hi];
	if (!page || !page[lo])
		return -EINVAL;

	out[0] = page[lo];
	return 1;
}

/*
 * Default table: translate the first byte of @rawstring to Unicode.
 *
 * The result is always stored in *@uni.  Returns 1 (one byte consumed), or
 * -EINVAL when the byte maps to 0x0000.  @boundlen is not examined.
 */
static int char2uni(const unsigned char *rawstring, int boundlen, wchar_t *uni)
{
	wchar_t wc = charset2uni[*rawstring];

	*uni = wc;
	return wc == 0x0000 ? -EINVAL : 1;
}

5231da177e4SLinus Torvalds static struct nls_table default_table = {
5241da177e4SLinus Torvalds .charset = "default",
5251da177e4SLinus Torvalds .uni2char = uni2char,
5261da177e4SLinus Torvalds .char2uni = char2uni,
5271da177e4SLinus Torvalds .charset2lower = charset2lower,
5281da177e4SLinus Torvalds .charset2upper = charset2upper,
5291da177e4SLinus Torvalds };
5301da177e4SLinus Torvalds
5311da177e4SLinus Torvalds /* Returns a simple default translation table */
load_nls_default(void)5321da177e4SLinus Torvalds struct nls_table *load_nls_default(void)
5331da177e4SLinus Torvalds {
5341da177e4SLinus Torvalds struct nls_table *default_nls;
5351da177e4SLinus Torvalds
5361da177e4SLinus Torvalds default_nls = load_nls(CONFIG_NLS_DEFAULT);
5371da177e4SLinus Torvalds if (default_nls != NULL)
5381da177e4SLinus Torvalds return default_nls;
5391da177e4SLinus Torvalds else
5401da177e4SLinus Torvalds return &default_table;
5411da177e4SLinus Torvalds }
5421da177e4SLinus Torvalds
5431da177e4SLinus Torvalds EXPORT_SYMBOL(unregister_nls);
5441da177e4SLinus Torvalds EXPORT_SYMBOL(unload_nls);
5451da177e4SLinus Torvalds EXPORT_SYMBOL(load_nls);
5461da177e4SLinus Torvalds EXPORT_SYMBOL(load_nls_default);
5471da177e4SLinus Torvalds
5481da177e4SLinus Torvalds MODULE_LICENSE("Dual BSD/GPL");
549