Commit | Line | Data |
---|---|---|
9d53690f GKB |
1 | /* SPDX-License-Identifier: GPL-2.0 */ |
2 | #include <linux/module.h> | |
3 | #include <linux/kernel.h> | |
4 | #include <linux/string.h> | |
5 | #include <linux/slab.h> | |
6 | #include <linux/parser.h> | |
7 | #include <linux/errno.h> | |
8 | #include <linux/unicode.h> | |
9 | ||
10 | #include "utf8n.h" | |
11 | ||
12 | int utf8_validate(const struct unicode_map *um, const struct qstr *str) | |
13 | { | |
14 | const struct utf8data *data = utf8nfdi(um->version); | |
15 | ||
16 | if (utf8nlen(data, str->name, str->len) < 0) | |
17 | return -1; | |
18 | return 0; | |
19 | } | |
20 | EXPORT_SYMBOL(utf8_validate); | |
21 | ||
22 | int utf8_strncmp(const struct unicode_map *um, | |
23 | const struct qstr *s1, const struct qstr *s2) | |
24 | { | |
25 | const struct utf8data *data = utf8nfdi(um->version); | |
26 | struct utf8cursor cur1, cur2; | |
27 | int c1, c2; | |
28 | ||
29 | if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) | |
30 | return -EINVAL; | |
31 | ||
32 | if (utf8ncursor(&cur2, data, s2->name, s2->len) < 0) | |
33 | return -EINVAL; | |
34 | ||
35 | do { | |
36 | c1 = utf8byte(&cur1); | |
37 | c2 = utf8byte(&cur2); | |
38 | ||
39 | if (c1 < 0 || c2 < 0) | |
40 | return -EINVAL; | |
41 | if (c1 != c2) | |
42 | return 1; | |
43 | } while (c1); | |
44 | ||
45 | return 0; | |
46 | } | |
47 | EXPORT_SYMBOL(utf8_strncmp); | |
48 | ||
49 | int utf8_strncasecmp(const struct unicode_map *um, | |
50 | const struct qstr *s1, const struct qstr *s2) | |
51 | { | |
52 | const struct utf8data *data = utf8nfdicf(um->version); | |
53 | struct utf8cursor cur1, cur2; | |
54 | int c1, c2; | |
55 | ||
56 | if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) | |
57 | return -EINVAL; | |
58 | ||
59 | if (utf8ncursor(&cur2, data, s2->name, s2->len) < 0) | |
60 | return -EINVAL; | |
61 | ||
62 | do { | |
63 | c1 = utf8byte(&cur1); | |
64 | c2 = utf8byte(&cur2); | |
65 | ||
66 | if (c1 < 0 || c2 < 0) | |
67 | return -EINVAL; | |
68 | if (c1 != c2) | |
69 | return 1; | |
70 | } while (c1); | |
71 | ||
72 | return 0; | |
73 | } | |
74 | EXPORT_SYMBOL(utf8_strncasecmp); | |
75 | ||
3ae72562 GKB |
76 | /* String cf is expected to be a valid UTF-8 casefolded |
77 | * string. | |
78 | */ | |
79 | int utf8_strncasecmp_folded(const struct unicode_map *um, | |
80 | const struct qstr *cf, | |
81 | const struct qstr *s1) | |
82 | { | |
83 | const struct utf8data *data = utf8nfdicf(um->version); | |
84 | struct utf8cursor cur1; | |
85 | int c1, c2; | |
86 | int i = 0; | |
87 | ||
88 | if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) | |
89 | return -EINVAL; | |
90 | ||
91 | do { | |
92 | c1 = utf8byte(&cur1); | |
93 | c2 = cf->name[i++]; | |
94 | if (c1 < 0) | |
95 | return -EINVAL; | |
96 | if (c1 != c2) | |
97 | return 1; | |
98 | } while (c1); | |
99 | ||
100 | return 0; | |
101 | } | |
102 | EXPORT_SYMBOL(utf8_strncasecmp_folded); | |
103 | ||
9d53690f GKB |
104 | int utf8_casefold(const struct unicode_map *um, const struct qstr *str, |
105 | unsigned char *dest, size_t dlen) | |
106 | { | |
107 | const struct utf8data *data = utf8nfdicf(um->version); | |
108 | struct utf8cursor cur; | |
109 | size_t nlen = 0; | |
110 | ||
111 | if (utf8ncursor(&cur, data, str->name, str->len) < 0) | |
112 | return -EINVAL; | |
113 | ||
114 | for (nlen = 0; nlen < dlen; nlen++) { | |
115 | int c = utf8byte(&cur); | |
116 | ||
117 | dest[nlen] = c; | |
118 | if (!c) | |
119 | return nlen; | |
120 | if (c == -1) | |
121 | break; | |
122 | } | |
123 | return -EINVAL; | |
124 | } | |
125 | ||
126 | EXPORT_SYMBOL(utf8_casefold); | |
127 | ||
128 | int utf8_normalize(const struct unicode_map *um, const struct qstr *str, | |
129 | unsigned char *dest, size_t dlen) | |
130 | { | |
131 | const struct utf8data *data = utf8nfdi(um->version); | |
132 | struct utf8cursor cur; | |
133 | ssize_t nlen = 0; | |
134 | ||
135 | if (utf8ncursor(&cur, data, str->name, str->len) < 0) | |
136 | return -EINVAL; | |
137 | ||
138 | for (nlen = 0; nlen < dlen; nlen++) { | |
139 | int c = utf8byte(&cur); | |
140 | ||
141 | dest[nlen] = c; | |
142 | if (!c) | |
143 | return nlen; | |
144 | if (c == -1) | |
145 | break; | |
146 | } | |
147 | return -EINVAL; | |
148 | } | |
149 | ||
150 | EXPORT_SYMBOL(utf8_normalize); | |
151 | ||
152 | static int utf8_parse_version(const char *version, unsigned int *maj, | |
153 | unsigned int *min, unsigned int *rev) | |
154 | { | |
155 | substring_t args[3]; | |
156 | char version_string[12]; | |
aa28b98d | 157 | static const struct match_token token[] = { |
9d53690f GKB |
158 | {1, "%d.%d.%d"}, |
159 | {0, NULL} | |
160 | }; | |
161 | ||
162 | strncpy(version_string, version, sizeof(version_string)); | |
163 | ||
164 | if (match_token(version_string, token, args) != 1) | |
165 | return -EINVAL; | |
166 | ||
167 | if (match_int(&args[0], maj) || match_int(&args[1], min) || | |
168 | match_int(&args[2], rev)) | |
169 | return -EINVAL; | |
170 | ||
171 | return 0; | |
172 | } | |
173 | ||
174 | struct unicode_map *utf8_load(const char *version) | |
175 | { | |
176 | struct unicode_map *um = NULL; | |
177 | int unicode_version; | |
178 | ||
179 | if (version) { | |
180 | unsigned int maj, min, rev; | |
181 | ||
182 | if (utf8_parse_version(version, &maj, &min, &rev) < 0) | |
183 | return ERR_PTR(-EINVAL); | |
184 | ||
185 | if (!utf8version_is_supported(maj, min, rev)) | |
186 | return ERR_PTR(-EINVAL); | |
187 | ||
188 | unicode_version = UNICODE_AGE(maj, min, rev); | |
189 | } else { | |
190 | unicode_version = utf8version_latest(); | |
191 | printk(KERN_WARNING"UTF-8 version not specified. " | |
192 | "Assuming latest supported version (%d.%d.%d).", | |
193 | (unicode_version >> 16) & 0xff, | |
194 | (unicode_version >> 8) & 0xff, | |
195 | (unicode_version & 0xff)); | |
196 | } | |
197 | ||
198 | um = kzalloc(sizeof(struct unicode_map), GFP_KERNEL); | |
199 | if (!um) | |
200 | return ERR_PTR(-ENOMEM); | |
201 | ||
202 | um->charset = "UTF-8"; | |
203 | um->version = unicode_version; | |
204 | ||
205 | return um; | |
206 | } | |
207 | EXPORT_SYMBOL(utf8_load); | |
208 | ||
/*
 * utf8_unload - free a unicode map.
 * @um: map to release; handed straight to kfree()
 */
void utf8_unload(struct unicode_map *um)
{
	kfree(um);
}
EXPORT_SYMBOL(utf8_unload);
214 | ||
215 | MODULE_LICENSE("GPL v2"); |