| /* SPDX-License-Identifier: GPL-2.0 */ |
| #include <linux/module.h> |
| #include <linux/kernel.h> |
| #include <linux/string.h> |
| #include <linux/slab.h> |
| #include <linux/parser.h> |
| #include <linux/errno.h> |
| #include <linux/unicode.h> |
| #include <linux/fs.h> |
| |
| #include "utf8n.h" |
| |
| int utf8_validate(const struct unicode_map *um, const struct qstr *str) |
| { |
| const struct utf8data *data = utf8nfdi(um->version); |
| |
| if (utf8nlen(data, str->name, str->len) < 0) |
| return -1; |
| return 0; |
| } |
| EXPORT_SYMBOL(utf8_validate); |
| |
| int utf8_strncmp(const struct unicode_map *um, |
| const struct qstr *s1, const struct qstr *s2) |
| { |
| const struct utf8data *data = utf8nfdi(um->version); |
| struct utf8cursor cur1, cur2; |
| int c1, c2; |
| |
| if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) |
| return -EINVAL; |
| |
| if (utf8ncursor(&cur2, data, s2->name, s2->len) < 0) |
| return -EINVAL; |
| |
| do { |
| c1 = utf8byte(&cur1); |
| c2 = utf8byte(&cur2); |
| |
| if (c1 < 0 || c2 < 0) |
| return -EINVAL; |
| if (c1 != c2) |
| return 1; |
| } while (c1); |
| |
| return 0; |
| } |
| EXPORT_SYMBOL(utf8_strncmp); |
| |
| int utf8_strncasecmp(const struct unicode_map *um, |
| const struct qstr *s1, const struct qstr *s2) |
| { |
| const struct utf8data *data = utf8nfdicf(um->version); |
| struct utf8cursor cur1, cur2; |
| int c1, c2; |
| |
| if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) |
| return -EINVAL; |
| |
| if (utf8ncursor(&cur2, data, s2->name, s2->len) < 0) |
| return -EINVAL; |
| |
| do { |
| c1 = utf8byte(&cur1); |
| c2 = utf8byte(&cur2); |
| |
| if (c1 < 0 || c2 < 0) |
| return -EINVAL; |
| if (c1 != c2) |
| return 1; |
| } while (c1); |
| |
| return 0; |
| } |
| EXPORT_SYMBOL(utf8_strncasecmp); |
| |
| /* String cf is expected to be a valid UTF-8 casefolded |
| * string. |
| */ |
| int utf8_strncasecmp_folded(const struct unicode_map *um, |
| const struct qstr *cf, |
| const struct qstr *s1) |
| { |
| const struct utf8data *data = utf8nfdicf(um->version); |
| struct utf8cursor cur1; |
| int c1, c2; |
| int i = 0; |
| |
| if (utf8ncursor(&cur1, data, s1->name, s1->len) < 0) |
| return -EINVAL; |
| |
| do { |
| c1 = utf8byte(&cur1); |
| c2 = cf->name[i++]; |
| if (c1 < 0) |
| return -EINVAL; |
| if (c1 != c2) |
| return 1; |
| } while (c1); |
| |
| return 0; |
| } |
| EXPORT_SYMBOL(utf8_strncasecmp_folded); |
| |
| int utf8_casefold(const struct unicode_map *um, const struct qstr *str, |
| unsigned char *dest, size_t dlen) |
| { |
| const struct utf8data *data = utf8nfdicf(um->version); |
| struct utf8cursor cur; |
| size_t nlen = 0; |
| |
| if (utf8ncursor(&cur, data, str->name, str->len) < 0) |
| return -EINVAL; |
| |
| for (nlen = 0; nlen < dlen; nlen++) { |
| int c = utf8byte(&cur); |
| |
| dest[nlen] = c; |
| if (!c) |
| return nlen; |
| if (c == -1) |
| break; |
| } |
| return -EINVAL; |
| } |
| |
| EXPORT_SYMBOL(utf8_casefold); |
| |
| int utf8_normalize(const struct unicode_map *um, const struct qstr *str, |
| unsigned char *dest, size_t dlen) |
| { |
| const struct utf8data *data = utf8nfdi(um->version); |
| struct utf8cursor cur; |
| ssize_t nlen = 0; |
| |
| if (utf8ncursor(&cur, data, str->name, str->len) < 0) |
| return -EINVAL; |
| |
| for (nlen = 0; nlen < dlen; nlen++) { |
| int c = utf8byte(&cur); |
| |
| dest[nlen] = c; |
| if (!c) |
| return nlen; |
| if (c == -1) |
| break; |
| } |
| return -EINVAL; |
| } |
| |
| EXPORT_SYMBOL(utf8_normalize); |
| |
| static int utf8_parse_version(const char *version, unsigned int *maj, |
| unsigned int *min, unsigned int *rev) |
| { |
| substring_t args[3]; |
| char version_string[12]; |
| static const struct match_token token[] = { |
| {1, "%d.%d.%d"}, |
| {0, NULL} |
| }; |
| |
| strncpy(version_string, version, sizeof(version_string)); |
| |
| if (match_token(version_string, token, args) != 1) |
| return -EINVAL; |
| |
| if (match_int(&args[0], maj) || match_int(&args[1], min) || |
| match_int(&args[2], rev)) |
| return -EINVAL; |
| |
| return 0; |
| } |
| |
| struct unicode_map *utf8_load(const char *version) |
| { |
| struct unicode_map *um = NULL; |
| int unicode_version; |
| |
| if (version) { |
| unsigned int maj, min, rev; |
| |
| if (utf8_parse_version(version, &maj, &min, &rev) < 0) |
| return ERR_PTR(-EINVAL); |
| |
| if (!utf8version_is_supported(maj, min, rev)) |
| return ERR_PTR(-EINVAL); |
| |
| unicode_version = UNICODE_AGE(maj, min, rev); |
| } else { |
| unicode_version = utf8version_latest(); |
| printk(KERN_WARNING"UTF-8 version not specified. " |
| "Assuming latest supported version (%d.%d.%d).", |
| (unicode_version >> 16) & 0xff, |
| (unicode_version >> 8) & 0xff, |
| (unicode_version & 0xff)); |
| } |
| |
| um = kzalloc(sizeof(struct unicode_map), GFP_KERNEL); |
| if (!um) |
| return ERR_PTR(-ENOMEM); |
| |
| um->charset = "UTF-8"; |
| um->version = unicode_version; |
| |
| return um; |
| } |
| EXPORT_SYMBOL(utf8_load); |
| |
| void utf8_unload(struct unicode_map *um) |
| { |
| kfree(um); |
| } |
| EXPORT_SYMBOL(utf8_unload); |
| |
| static ssize_t latest_version_show(struct kobject *kobj, |
| struct kobj_attribute *attr, char *buf) |
| { |
| int l = utf8version_latest(); |
| |
| return snprintf(buf, PAGE_SIZE, "%d.%d.%d\n", |
| UNICODE_AGE_MAJ(l), UNICODE_AGE_MIN(l), |
| UNICODE_AGE_REV(l)); |
| } |
| |
| #define UNICODE_ATTR(x) \ |
| static struct kobj_attribute x ## _attr = __ATTR_RO(x) |
| |
| UNICODE_ATTR(latest_version); |
| |
| static struct attribute *encoding_attrs[] = { |
| &latest_version_attr.attr, |
| NULL, |
| }; |
| static const struct attribute_group encoding_attr_group = { |
| .attrs = encoding_attrs, |
| }; |
| |
| static struct kobject *unicode_kobj; |
| static struct kobject *utf8_kobj; |
| |
| static int __init unicode_init(void) |
| { |
| int ret = 0; |
| |
| unicode_kobj = kobject_create_and_add("unicode", fs_kobj); |
| if (!unicode_kobj) |
| return -ENOMEM; |
| |
| utf8_kobj = kobject_create_and_add("utf-8", unicode_kobj); |
| if (!utf8_kobj) { |
| ret = -ENOMEM; |
| goto fail_unicode; |
| } |
| |
| ret = sysfs_create_group(utf8_kobj, &encoding_attr_group); |
| if (ret) |
| goto fail_utf8; |
| |
| return 0; |
| |
| fail_utf8: |
| kobject_put(utf8_kobj); |
| fail_unicode: |
| kobject_put(unicode_kobj); |
| return ret; |
| } |
| fs_initcall(unicode_init); |
| |
| MODULE_LICENSE("GPL v2"); |