18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0 28c2ecf20Sopenharmony_ci/* 38c2ecf20Sopenharmony_ci * linux/fs/hfsplus/unicode.c 48c2ecf20Sopenharmony_ci * 58c2ecf20Sopenharmony_ci * Copyright (C) 2001 68c2ecf20Sopenharmony_ci * Brad Boyer (flar@allandria.com) 78c2ecf20Sopenharmony_ci * (C) 2003 Ardis Technologies <roman@ardistech.com> 88c2ecf20Sopenharmony_ci * 98c2ecf20Sopenharmony_ci * Handler routines for unicode strings 108c2ecf20Sopenharmony_ci */ 118c2ecf20Sopenharmony_ci 128c2ecf20Sopenharmony_ci#include <linux/types.h> 138c2ecf20Sopenharmony_ci#include <linux/nls.h> 148c2ecf20Sopenharmony_ci#include "hfsplus_fs.h" 158c2ecf20Sopenharmony_ci#include "hfsplus_raw.h" 168c2ecf20Sopenharmony_ci 178c2ecf20Sopenharmony_ci/* Fold the case of a unicode char, given the 16 bit value */ 188c2ecf20Sopenharmony_ci/* Returns folded char, or 0 if ignorable */ 198c2ecf20Sopenharmony_cistatic inline u16 case_fold(u16 c) 208c2ecf20Sopenharmony_ci{ 218c2ecf20Sopenharmony_ci u16 tmp; 228c2ecf20Sopenharmony_ci 238c2ecf20Sopenharmony_ci tmp = hfsplus_case_fold_table[c >> 8]; 248c2ecf20Sopenharmony_ci if (tmp) 258c2ecf20Sopenharmony_ci tmp = hfsplus_case_fold_table[tmp + (c & 0xff)]; 268c2ecf20Sopenharmony_ci else 278c2ecf20Sopenharmony_ci tmp = c; 288c2ecf20Sopenharmony_ci return tmp; 298c2ecf20Sopenharmony_ci} 308c2ecf20Sopenharmony_ci 318c2ecf20Sopenharmony_ci/* Compare unicode strings, return values like normal strcmp */ 328c2ecf20Sopenharmony_ciint hfsplus_strcasecmp(const struct hfsplus_unistr *s1, 338c2ecf20Sopenharmony_ci const struct hfsplus_unistr *s2) 348c2ecf20Sopenharmony_ci{ 358c2ecf20Sopenharmony_ci u16 len1, len2, c1, c2; 368c2ecf20Sopenharmony_ci const hfsplus_unichr *p1, *p2; 378c2ecf20Sopenharmony_ci 388c2ecf20Sopenharmony_ci len1 = be16_to_cpu(s1->length); 398c2ecf20Sopenharmony_ci len2 = be16_to_cpu(s2->length); 408c2ecf20Sopenharmony_ci p1 = s1->unicode; 418c2ecf20Sopenharmony_ci p2 = s2->unicode; 428c2ecf20Sopenharmony_ci 438c2ecf20Sopenharmony_ci while (1) { 448c2ecf20Sopenharmony_ci c1 = c2 = 0; 458c2ecf20Sopenharmony_ci 468c2ecf20Sopenharmony_ci while (len1 && !c1) { 478c2ecf20Sopenharmony_ci c1 = case_fold(be16_to_cpu(*p1)); 488c2ecf20Sopenharmony_ci p1++; 498c2ecf20Sopenharmony_ci len1--; 508c2ecf20Sopenharmony_ci } 518c2ecf20Sopenharmony_ci while (len2 && !c2) { 528c2ecf20Sopenharmony_ci c2 = case_fold(be16_to_cpu(*p2)); 538c2ecf20Sopenharmony_ci p2++; 548c2ecf20Sopenharmony_ci len2--; 558c2ecf20Sopenharmony_ci } 568c2ecf20Sopenharmony_ci 578c2ecf20Sopenharmony_ci if (c1 != c2) 588c2ecf20Sopenharmony_ci return (c1 < c2) ? -1 : 1; 598c2ecf20Sopenharmony_ci if (!c1 && !c2) 608c2ecf20Sopenharmony_ci return 0; 618c2ecf20Sopenharmony_ci } 628c2ecf20Sopenharmony_ci} 638c2ecf20Sopenharmony_ci 648c2ecf20Sopenharmony_ci/* Compare names as a sequence of 16-bit unsigned integers */ 658c2ecf20Sopenharmony_ciint hfsplus_strcmp(const struct hfsplus_unistr *s1, 668c2ecf20Sopenharmony_ci const struct hfsplus_unistr *s2) 678c2ecf20Sopenharmony_ci{ 688c2ecf20Sopenharmony_ci u16 len1, len2, c1, c2; 698c2ecf20Sopenharmony_ci const hfsplus_unichr *p1, *p2; 708c2ecf20Sopenharmony_ci int len; 718c2ecf20Sopenharmony_ci 728c2ecf20Sopenharmony_ci len1 = be16_to_cpu(s1->length); 738c2ecf20Sopenharmony_ci len2 = be16_to_cpu(s2->length); 748c2ecf20Sopenharmony_ci p1 = s1->unicode; 758c2ecf20Sopenharmony_ci p2 = s2->unicode; 768c2ecf20Sopenharmony_ci 778c2ecf20Sopenharmony_ci for (len = min(len1, len2); len > 0; len--) { 788c2ecf20Sopenharmony_ci c1 = be16_to_cpu(*p1); 798c2ecf20Sopenharmony_ci c2 = be16_to_cpu(*p2); 808c2ecf20Sopenharmony_ci if (c1 != c2) 818c2ecf20Sopenharmony_ci return c1 < c2 ? -1 : 1; 828c2ecf20Sopenharmony_ci p1++; 838c2ecf20Sopenharmony_ci p2++; 848c2ecf20Sopenharmony_ci } 858c2ecf20Sopenharmony_ci 868c2ecf20Sopenharmony_ci return len1 < len2 ? -1 : 878c2ecf20Sopenharmony_ci len1 > len2 ? 1 : 0; 888c2ecf20Sopenharmony_ci} 898c2ecf20Sopenharmony_ci 908c2ecf20Sopenharmony_ci 918c2ecf20Sopenharmony_ci#define Hangul_SBase 0xac00 928c2ecf20Sopenharmony_ci#define Hangul_LBase 0x1100 938c2ecf20Sopenharmony_ci#define Hangul_VBase 0x1161 948c2ecf20Sopenharmony_ci#define Hangul_TBase 0x11a7 958c2ecf20Sopenharmony_ci#define Hangul_SCount 11172 968c2ecf20Sopenharmony_ci#define Hangul_LCount 19 978c2ecf20Sopenharmony_ci#define Hangul_VCount 21 988c2ecf20Sopenharmony_ci#define Hangul_TCount 28 998c2ecf20Sopenharmony_ci#define Hangul_NCount (Hangul_VCount * Hangul_TCount) 1008c2ecf20Sopenharmony_ci 1018c2ecf20Sopenharmony_ci 1028c2ecf20Sopenharmony_cistatic u16 *hfsplus_compose_lookup(u16 *p, u16 cc) 1038c2ecf20Sopenharmony_ci{ 1048c2ecf20Sopenharmony_ci int i, s, e; 1058c2ecf20Sopenharmony_ci 1068c2ecf20Sopenharmony_ci s = 1; 1078c2ecf20Sopenharmony_ci e = p[1]; 1088c2ecf20Sopenharmony_ci if (!e || cc < p[s * 2] || cc > p[e * 2]) 1098c2ecf20Sopenharmony_ci return NULL; 1108c2ecf20Sopenharmony_ci do { 1118c2ecf20Sopenharmony_ci i = (s + e) / 2; 1128c2ecf20Sopenharmony_ci if (cc > p[i * 2]) 1138c2ecf20Sopenharmony_ci s = i + 1; 1148c2ecf20Sopenharmony_ci else if (cc < p[i * 2]) 1158c2ecf20Sopenharmony_ci e = i - 1; 1168c2ecf20Sopenharmony_ci else 1178c2ecf20Sopenharmony_ci return hfsplus_compose_table + p[i * 2 + 1]; 1188c2ecf20Sopenharmony_ci } while (s <= e); 1198c2ecf20Sopenharmony_ci return NULL; 1208c2ecf20Sopenharmony_ci} 1218c2ecf20Sopenharmony_ci 1228c2ecf20Sopenharmony_ciint hfsplus_uni2asc(struct super_block *sb, 1238c2ecf20Sopenharmony_ci const struct hfsplus_unistr *ustr, 1248c2ecf20Sopenharmony_ci char *astr, int *len_p) 1258c2ecf20Sopenharmony_ci{ 1268c2ecf20Sopenharmony_ci const hfsplus_unichr *ip; 1278c2ecf20Sopenharmony_ci struct nls_table *nls = HFSPLUS_SB(sb)->nls; 1288c2ecf20Sopenharmony_ci u8 *op; 1298c2ecf20Sopenharmony_ci u16 cc, c0, c1; 1308c2ecf20Sopenharmony_ci u16 *ce1, *ce2; 1318c2ecf20Sopenharmony_ci int i, len, ustrlen, res, compose; 1328c2ecf20Sopenharmony_ci 1338c2ecf20Sopenharmony_ci op = astr; 1348c2ecf20Sopenharmony_ci ip = ustr->unicode; 1358c2ecf20Sopenharmony_ci ustrlen = be16_to_cpu(ustr->length); 1368c2ecf20Sopenharmony_ci len = *len_p; 1378c2ecf20Sopenharmony_ci ce1 = NULL; 1388c2ecf20Sopenharmony_ci compose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags); 1398c2ecf20Sopenharmony_ci 1408c2ecf20Sopenharmony_ci while (ustrlen > 0) { 1418c2ecf20Sopenharmony_ci c0 = be16_to_cpu(*ip++); 1428c2ecf20Sopenharmony_ci ustrlen--; 1438c2ecf20Sopenharmony_ci /* search for single decomposed char */ 1448c2ecf20Sopenharmony_ci if (likely(compose)) 1458c2ecf20Sopenharmony_ci ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c0); 1468c2ecf20Sopenharmony_ci if (ce1) 1478c2ecf20Sopenharmony_ci cc = ce1[0]; 1488c2ecf20Sopenharmony_ci else 1498c2ecf20Sopenharmony_ci cc = 0; 1508c2ecf20Sopenharmony_ci if (cc) { 1518c2ecf20Sopenharmony_ci /* start of a possibly decomposed Hangul char */ 1528c2ecf20Sopenharmony_ci if (cc != 0xffff) 1538c2ecf20Sopenharmony_ci goto done; 1548c2ecf20Sopenharmony_ci if (!ustrlen) 1558c2ecf20Sopenharmony_ci goto same; 1568c2ecf20Sopenharmony_ci c1 = be16_to_cpu(*ip) - Hangul_VBase; 1578c2ecf20Sopenharmony_ci if (c1 < Hangul_VCount) { 1588c2ecf20Sopenharmony_ci /* compose the Hangul char */ 1598c2ecf20Sopenharmony_ci cc = (c0 - Hangul_LBase) * Hangul_VCount; 1608c2ecf20Sopenharmony_ci cc = (cc + c1) * Hangul_TCount; 1618c2ecf20Sopenharmony_ci cc += Hangul_SBase; 1628c2ecf20Sopenharmony_ci ip++; 1638c2ecf20Sopenharmony_ci ustrlen--; 1648c2ecf20Sopenharmony_ci if (!ustrlen) 1658c2ecf20Sopenharmony_ci goto done; 1668c2ecf20Sopenharmony_ci c1 = be16_to_cpu(*ip) - Hangul_TBase; 1678c2ecf20Sopenharmony_ci if (c1 > 0 && c1 < Hangul_TCount) { 1688c2ecf20Sopenharmony_ci cc += c1; 1698c2ecf20Sopenharmony_ci ip++; 1708c2ecf20Sopenharmony_ci ustrlen--; 1718c2ecf20Sopenharmony_ci } 1728c2ecf20Sopenharmony_ci goto done; 1738c2ecf20Sopenharmony_ci } 1748c2ecf20Sopenharmony_ci } 1758c2ecf20Sopenharmony_ci while (1) { 1768c2ecf20Sopenharmony_ci /* main loop for common case of not composed chars */ 1778c2ecf20Sopenharmony_ci if (!ustrlen) 1788c2ecf20Sopenharmony_ci goto same; 1798c2ecf20Sopenharmony_ci c1 = be16_to_cpu(*ip); 1808c2ecf20Sopenharmony_ci if (likely(compose)) 1818c2ecf20Sopenharmony_ci ce1 = hfsplus_compose_lookup( 1828c2ecf20Sopenharmony_ci hfsplus_compose_table, c1); 1838c2ecf20Sopenharmony_ci if (ce1) 1848c2ecf20Sopenharmony_ci break; 1858c2ecf20Sopenharmony_ci switch (c0) { 1868c2ecf20Sopenharmony_ci case 0: 1878c2ecf20Sopenharmony_ci c0 = 0x2400; 1888c2ecf20Sopenharmony_ci break; 1898c2ecf20Sopenharmony_ci case '/': 1908c2ecf20Sopenharmony_ci c0 = ':'; 1918c2ecf20Sopenharmony_ci break; 1928c2ecf20Sopenharmony_ci } 1938c2ecf20Sopenharmony_ci res = nls->uni2char(c0, op, len); 1948c2ecf20Sopenharmony_ci if (res < 0) { 1958c2ecf20Sopenharmony_ci if (res == -ENAMETOOLONG) 1968c2ecf20Sopenharmony_ci goto out; 1978c2ecf20Sopenharmony_ci *op = '?'; 1988c2ecf20Sopenharmony_ci res = 1; 1998c2ecf20Sopenharmony_ci } 2008c2ecf20Sopenharmony_ci op += res; 2018c2ecf20Sopenharmony_ci len -= res; 2028c2ecf20Sopenharmony_ci c0 = c1; 2038c2ecf20Sopenharmony_ci ip++; 2048c2ecf20Sopenharmony_ci ustrlen--; 2058c2ecf20Sopenharmony_ci } 2068c2ecf20Sopenharmony_ci ce2 = hfsplus_compose_lookup(ce1, c0); 2078c2ecf20Sopenharmony_ci if (ce2) { 2088c2ecf20Sopenharmony_ci i = 1; 2098c2ecf20Sopenharmony_ci while (i < ustrlen) { 2108c2ecf20Sopenharmony_ci ce1 = hfsplus_compose_lookup(ce2, 2118c2ecf20Sopenharmony_ci be16_to_cpu(ip[i])); 2128c2ecf20Sopenharmony_ci if (!ce1) 2138c2ecf20Sopenharmony_ci break; 2148c2ecf20Sopenharmony_ci i++; 2158c2ecf20Sopenharmony_ci ce2 = ce1; 2168c2ecf20Sopenharmony_ci } 2178c2ecf20Sopenharmony_ci cc = ce2[0]; 2188c2ecf20Sopenharmony_ci if (cc) { 2198c2ecf20Sopenharmony_ci ip += i; 2208c2ecf20Sopenharmony_ci ustrlen -= i; 2218c2ecf20Sopenharmony_ci goto done; 2228c2ecf20Sopenharmony_ci } 2238c2ecf20Sopenharmony_ci } 2248c2ecf20Sopenharmony_cisame: 2258c2ecf20Sopenharmony_ci switch (c0) { 2268c2ecf20Sopenharmony_ci case 0: 2278c2ecf20Sopenharmony_ci cc = 0x2400; 2288c2ecf20Sopenharmony_ci break; 2298c2ecf20Sopenharmony_ci case '/': 2308c2ecf20Sopenharmony_ci cc = ':'; 2318c2ecf20Sopenharmony_ci break; 2328c2ecf20Sopenharmony_ci default: 2338c2ecf20Sopenharmony_ci cc = c0; 2348c2ecf20Sopenharmony_ci } 2358c2ecf20Sopenharmony_cidone: 2368c2ecf20Sopenharmony_ci res = nls->uni2char(cc, op, len); 2378c2ecf20Sopenharmony_ci if (res < 0) { 2388c2ecf20Sopenharmony_ci if (res == -ENAMETOOLONG) 2398c2ecf20Sopenharmony_ci goto out; 2408c2ecf20Sopenharmony_ci *op = '?'; 2418c2ecf20Sopenharmony_ci res = 1; 2428c2ecf20Sopenharmony_ci } 2438c2ecf20Sopenharmony_ci op += res; 2448c2ecf20Sopenharmony_ci len -= res; 2458c2ecf20Sopenharmony_ci } 2468c2ecf20Sopenharmony_ci res = 0; 2478c2ecf20Sopenharmony_ciout: 2488c2ecf20Sopenharmony_ci *len_p = (char *)op - astr; 2498c2ecf20Sopenharmony_ci return res; 2508c2ecf20Sopenharmony_ci} 2518c2ecf20Sopenharmony_ci 2528c2ecf20Sopenharmony_ci/* 2538c2ecf20Sopenharmony_ci * Convert one or more ASCII characters into a single unicode character. 2548c2ecf20Sopenharmony_ci * Returns the number of ASCII characters corresponding to the unicode char. 2558c2ecf20Sopenharmony_ci */ 2568c2ecf20Sopenharmony_cistatic inline int asc2unichar(struct super_block *sb, const char *astr, int len, 2578c2ecf20Sopenharmony_ci wchar_t *uc) 2588c2ecf20Sopenharmony_ci{ 2598c2ecf20Sopenharmony_ci int size = HFSPLUS_SB(sb)->nls->char2uni(astr, len, uc); 2608c2ecf20Sopenharmony_ci if (size <= 0) { 2618c2ecf20Sopenharmony_ci *uc = '?'; 2628c2ecf20Sopenharmony_ci size = 1; 2638c2ecf20Sopenharmony_ci } 2648c2ecf20Sopenharmony_ci switch (*uc) { 2658c2ecf20Sopenharmony_ci case 0x2400: 2668c2ecf20Sopenharmony_ci *uc = 0; 2678c2ecf20Sopenharmony_ci break; 2688c2ecf20Sopenharmony_ci case ':': 2698c2ecf20Sopenharmony_ci *uc = '/'; 2708c2ecf20Sopenharmony_ci break; 2718c2ecf20Sopenharmony_ci } 2728c2ecf20Sopenharmony_ci return size; 2738c2ecf20Sopenharmony_ci} 2748c2ecf20Sopenharmony_ci 2758c2ecf20Sopenharmony_ci/* Decomposes a non-Hangul unicode character. */ 2768c2ecf20Sopenharmony_cistatic u16 *hfsplus_decompose_nonhangul(wchar_t uc, int *size) 2778c2ecf20Sopenharmony_ci{ 2788c2ecf20Sopenharmony_ci int off; 2798c2ecf20Sopenharmony_ci 2808c2ecf20Sopenharmony_ci off = hfsplus_decompose_table[(uc >> 12) & 0xf]; 2818c2ecf20Sopenharmony_ci if (off == 0 || off == 0xffff) 2828c2ecf20Sopenharmony_ci return NULL; 2838c2ecf20Sopenharmony_ci 2848c2ecf20Sopenharmony_ci off = hfsplus_decompose_table[off + ((uc >> 8) & 0xf)]; 2858c2ecf20Sopenharmony_ci if (!off) 2868c2ecf20Sopenharmony_ci return NULL; 2878c2ecf20Sopenharmony_ci 2888c2ecf20Sopenharmony_ci off = hfsplus_decompose_table[off + ((uc >> 4) & 0xf)]; 2898c2ecf20Sopenharmony_ci if (!off) 2908c2ecf20Sopenharmony_ci return NULL; 2918c2ecf20Sopenharmony_ci 2928c2ecf20Sopenharmony_ci off = hfsplus_decompose_table[off + (uc & 0xf)]; 2938c2ecf20Sopenharmony_ci *size = off & 3; 2948c2ecf20Sopenharmony_ci if (*size == 0) 2958c2ecf20Sopenharmony_ci return NULL; 2968c2ecf20Sopenharmony_ci return hfsplus_decompose_table + (off / 4); 2978c2ecf20Sopenharmony_ci} 2988c2ecf20Sopenharmony_ci 2998c2ecf20Sopenharmony_ci/* 3008c2ecf20Sopenharmony_ci * Try to decompose a unicode character as Hangul. Return 0 if @uc is not 3018c2ecf20Sopenharmony_ci * precomposed Hangul, otherwise return the length of the decomposition. 3028c2ecf20Sopenharmony_ci * 3038c2ecf20Sopenharmony_ci * This function was adapted from sample code from the Unicode Standard 3048c2ecf20Sopenharmony_ci * Annex #15: Unicode Normalization Forms, version 3.2.0. 3058c2ecf20Sopenharmony_ci * 3068c2ecf20Sopenharmony_ci * Copyright (C) 1991-2018 Unicode, Inc. All rights reserved. Distributed 3078c2ecf20Sopenharmony_ci * under the Terms of Use in http://www.unicode.org/copyright.html. 3088c2ecf20Sopenharmony_ci */ 3098c2ecf20Sopenharmony_cistatic int hfsplus_try_decompose_hangul(wchar_t uc, u16 *result) 3108c2ecf20Sopenharmony_ci{ 3118c2ecf20Sopenharmony_ci int index; 3128c2ecf20Sopenharmony_ci int l, v, t; 3138c2ecf20Sopenharmony_ci 3148c2ecf20Sopenharmony_ci index = uc - Hangul_SBase; 3158c2ecf20Sopenharmony_ci if (index < 0 || index >= Hangul_SCount) 3168c2ecf20Sopenharmony_ci return 0; 3178c2ecf20Sopenharmony_ci 3188c2ecf20Sopenharmony_ci l = Hangul_LBase + index / Hangul_NCount; 3198c2ecf20Sopenharmony_ci v = Hangul_VBase + (index % Hangul_NCount) / Hangul_TCount; 3208c2ecf20Sopenharmony_ci t = Hangul_TBase + index % Hangul_TCount; 3218c2ecf20Sopenharmony_ci 3228c2ecf20Sopenharmony_ci result[0] = l; 3238c2ecf20Sopenharmony_ci result[1] = v; 3248c2ecf20Sopenharmony_ci if (t != Hangul_TBase) { 3258c2ecf20Sopenharmony_ci result[2] = t; 3268c2ecf20Sopenharmony_ci return 3; 3278c2ecf20Sopenharmony_ci } 3288c2ecf20Sopenharmony_ci return 2; 3298c2ecf20Sopenharmony_ci} 3308c2ecf20Sopenharmony_ci 3318c2ecf20Sopenharmony_ci/* Decomposes a single unicode character. */ 3328c2ecf20Sopenharmony_cistatic u16 *decompose_unichar(wchar_t uc, int *size, u16 *hangul_buffer) 3338c2ecf20Sopenharmony_ci{ 3348c2ecf20Sopenharmony_ci u16 *result; 3358c2ecf20Sopenharmony_ci 3368c2ecf20Sopenharmony_ci /* Hangul is handled separately */ 3378c2ecf20Sopenharmony_ci result = hangul_buffer; 3388c2ecf20Sopenharmony_ci *size = hfsplus_try_decompose_hangul(uc, result); 3398c2ecf20Sopenharmony_ci if (*size == 0) 3408c2ecf20Sopenharmony_ci result = hfsplus_decompose_nonhangul(uc, size); 3418c2ecf20Sopenharmony_ci return result; 3428c2ecf20Sopenharmony_ci} 3438c2ecf20Sopenharmony_ci 3448c2ecf20Sopenharmony_ciint hfsplus_asc2uni(struct super_block *sb, 3458c2ecf20Sopenharmony_ci struct hfsplus_unistr *ustr, int max_unistr_len, 3468c2ecf20Sopenharmony_ci const char *astr, int len) 3478c2ecf20Sopenharmony_ci{ 3488c2ecf20Sopenharmony_ci int size, dsize, decompose; 3498c2ecf20Sopenharmony_ci u16 *dstr, outlen = 0; 3508c2ecf20Sopenharmony_ci wchar_t c; 3518c2ecf20Sopenharmony_ci u16 dhangul[3]; 3528c2ecf20Sopenharmony_ci 3538c2ecf20Sopenharmony_ci decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags); 3548c2ecf20Sopenharmony_ci while (outlen < max_unistr_len && len > 0) { 3558c2ecf20Sopenharmony_ci size = asc2unichar(sb, astr, len, &c); 3568c2ecf20Sopenharmony_ci 3578c2ecf20Sopenharmony_ci if (decompose) 3588c2ecf20Sopenharmony_ci dstr = decompose_unichar(c, &dsize, dhangul); 3598c2ecf20Sopenharmony_ci else 3608c2ecf20Sopenharmony_ci dstr = NULL; 3618c2ecf20Sopenharmony_ci if (dstr) { 3628c2ecf20Sopenharmony_ci if (outlen + dsize > max_unistr_len) 3638c2ecf20Sopenharmony_ci break; 3648c2ecf20Sopenharmony_ci do { 3658c2ecf20Sopenharmony_ci ustr->unicode[outlen++] = cpu_to_be16(*dstr++); 3668c2ecf20Sopenharmony_ci } while (--dsize > 0); 3678c2ecf20Sopenharmony_ci } else 3688c2ecf20Sopenharmony_ci ustr->unicode[outlen++] = cpu_to_be16(c); 3698c2ecf20Sopenharmony_ci 3708c2ecf20Sopenharmony_ci astr += size; 3718c2ecf20Sopenharmony_ci len -= size; 3728c2ecf20Sopenharmony_ci } 3738c2ecf20Sopenharmony_ci ustr->length = cpu_to_be16(outlen); 3748c2ecf20Sopenharmony_ci if (len > 0) 3758c2ecf20Sopenharmony_ci return -ENAMETOOLONG; 3768c2ecf20Sopenharmony_ci return 0; 3778c2ecf20Sopenharmony_ci} 3788c2ecf20Sopenharmony_ci 3798c2ecf20Sopenharmony_ci/* 3808c2ecf20Sopenharmony_ci * Hash a string to an integer as appropriate for the HFS+ filesystem. 3818c2ecf20Sopenharmony_ci * Composed unicode characters are decomposed and case-folding is performed 3828c2ecf20Sopenharmony_ci * if the appropriate bits are (un)set on the superblock. 3838c2ecf20Sopenharmony_ci */ 3848c2ecf20Sopenharmony_ciint hfsplus_hash_dentry(const struct dentry *dentry, struct qstr *str) 3858c2ecf20Sopenharmony_ci{ 3868c2ecf20Sopenharmony_ci struct super_block *sb = dentry->d_sb; 3878c2ecf20Sopenharmony_ci const char *astr; 3888c2ecf20Sopenharmony_ci const u16 *dstr; 3898c2ecf20Sopenharmony_ci int casefold, decompose, size, len; 3908c2ecf20Sopenharmony_ci unsigned long hash; 3918c2ecf20Sopenharmony_ci wchar_t c; 3928c2ecf20Sopenharmony_ci u16 c2; 3938c2ecf20Sopenharmony_ci u16 dhangul[3]; 3948c2ecf20Sopenharmony_ci 3958c2ecf20Sopenharmony_ci casefold = test_bit(HFSPLUS_SB_CASEFOLD, &HFSPLUS_SB(sb)->flags); 3968c2ecf20Sopenharmony_ci decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags); 3978c2ecf20Sopenharmony_ci hash = init_name_hash(dentry); 3988c2ecf20Sopenharmony_ci astr = str->name; 3998c2ecf20Sopenharmony_ci len = str->len; 4008c2ecf20Sopenharmony_ci while (len > 0) { 4018c2ecf20Sopenharmony_ci int dsize; 4028c2ecf20Sopenharmony_ci size = asc2unichar(sb, astr, len, &c); 4038c2ecf20Sopenharmony_ci astr += size; 4048c2ecf20Sopenharmony_ci len -= size; 4058c2ecf20Sopenharmony_ci 4068c2ecf20Sopenharmony_ci if (decompose) 4078c2ecf20Sopenharmony_ci dstr = decompose_unichar(c, &dsize, dhangul); 4088c2ecf20Sopenharmony_ci else 4098c2ecf20Sopenharmony_ci dstr = NULL; 4108c2ecf20Sopenharmony_ci if (dstr) { 4118c2ecf20Sopenharmony_ci do { 4128c2ecf20Sopenharmony_ci c2 = *dstr++; 4138c2ecf20Sopenharmony_ci if (casefold) 4148c2ecf20Sopenharmony_ci c2 = case_fold(c2); 4158c2ecf20Sopenharmony_ci if (!casefold || c2) 4168c2ecf20Sopenharmony_ci hash = partial_name_hash(c2, hash); 4178c2ecf20Sopenharmony_ci } while (--dsize > 0); 4188c2ecf20Sopenharmony_ci } else { 4198c2ecf20Sopenharmony_ci c2 = c; 4208c2ecf20Sopenharmony_ci if (casefold) 4218c2ecf20Sopenharmony_ci c2 = case_fold(c2); 4228c2ecf20Sopenharmony_ci if (!casefold || c2) 4238c2ecf20Sopenharmony_ci hash = partial_name_hash(c2, hash); 4248c2ecf20Sopenharmony_ci } 4258c2ecf20Sopenharmony_ci } 4268c2ecf20Sopenharmony_ci str->hash = end_name_hash(hash); 4278c2ecf20Sopenharmony_ci 4288c2ecf20Sopenharmony_ci return 0; 4298c2ecf20Sopenharmony_ci} 4308c2ecf20Sopenharmony_ci 4318c2ecf20Sopenharmony_ci/* 4328c2ecf20Sopenharmony_ci * Compare strings with HFS+ filename ordering. 4338c2ecf20Sopenharmony_ci * Composed unicode characters are decomposed and case-folding is performed 4348c2ecf20Sopenharmony_ci * if the appropriate bits are (un)set on the superblock. 4358c2ecf20Sopenharmony_ci */ 4368c2ecf20Sopenharmony_ciint hfsplus_compare_dentry(const struct dentry *dentry, 4378c2ecf20Sopenharmony_ci unsigned int len, const char *str, const struct qstr *name) 4388c2ecf20Sopenharmony_ci{ 4398c2ecf20Sopenharmony_ci struct super_block *sb = dentry->d_sb; 4408c2ecf20Sopenharmony_ci int casefold, decompose, size; 4418c2ecf20Sopenharmony_ci int dsize1, dsize2, len1, len2; 4428c2ecf20Sopenharmony_ci const u16 *dstr1, *dstr2; 4438c2ecf20Sopenharmony_ci const char *astr1, *astr2; 4448c2ecf20Sopenharmony_ci u16 c1, c2; 4458c2ecf20Sopenharmony_ci wchar_t c; 4468c2ecf20Sopenharmony_ci u16 dhangul_1[3], dhangul_2[3]; 4478c2ecf20Sopenharmony_ci 4488c2ecf20Sopenharmony_ci casefold = test_bit(HFSPLUS_SB_CASEFOLD, &HFSPLUS_SB(sb)->flags); 4498c2ecf20Sopenharmony_ci decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags); 4508c2ecf20Sopenharmony_ci astr1 = str; 4518c2ecf20Sopenharmony_ci len1 = len; 4528c2ecf20Sopenharmony_ci astr2 = name->name; 4538c2ecf20Sopenharmony_ci len2 = name->len; 4548c2ecf20Sopenharmony_ci dsize1 = dsize2 = 0; 4558c2ecf20Sopenharmony_ci dstr1 = dstr2 = NULL; 4568c2ecf20Sopenharmony_ci 4578c2ecf20Sopenharmony_ci while (len1 > 0 && len2 > 0) { 4588c2ecf20Sopenharmony_ci if (!dsize1) { 4598c2ecf20Sopenharmony_ci size = asc2unichar(sb, astr1, len1, &c); 4608c2ecf20Sopenharmony_ci astr1 += size; 4618c2ecf20Sopenharmony_ci len1 -= size; 4628c2ecf20Sopenharmony_ci 4638c2ecf20Sopenharmony_ci if (decompose) 4648c2ecf20Sopenharmony_ci dstr1 = decompose_unichar(c, &dsize1, 4658c2ecf20Sopenharmony_ci dhangul_1); 4668c2ecf20Sopenharmony_ci if (!decompose || !dstr1) { 4678c2ecf20Sopenharmony_ci c1 = c; 4688c2ecf20Sopenharmony_ci dstr1 = &c1; 4698c2ecf20Sopenharmony_ci dsize1 = 1; 4708c2ecf20Sopenharmony_ci } 4718c2ecf20Sopenharmony_ci } 4728c2ecf20Sopenharmony_ci 4738c2ecf20Sopenharmony_ci if (!dsize2) { 4748c2ecf20Sopenharmony_ci size = asc2unichar(sb, astr2, len2, &c); 4758c2ecf20Sopenharmony_ci astr2 += size; 4768c2ecf20Sopenharmony_ci len2 -= size; 4778c2ecf20Sopenharmony_ci 4788c2ecf20Sopenharmony_ci if (decompose) 4798c2ecf20Sopenharmony_ci dstr2 = decompose_unichar(c, &dsize2, 4808c2ecf20Sopenharmony_ci dhangul_2); 4818c2ecf20Sopenharmony_ci if (!decompose || !dstr2) { 4828c2ecf20Sopenharmony_ci c2 = c; 4838c2ecf20Sopenharmony_ci dstr2 = &c2; 4848c2ecf20Sopenharmony_ci dsize2 = 1; 4858c2ecf20Sopenharmony_ci } 4868c2ecf20Sopenharmony_ci } 4878c2ecf20Sopenharmony_ci 4888c2ecf20Sopenharmony_ci c1 = *dstr1; 4898c2ecf20Sopenharmony_ci c2 = *dstr2; 4908c2ecf20Sopenharmony_ci if (casefold) { 4918c2ecf20Sopenharmony_ci c1 = case_fold(c1); 4928c2ecf20Sopenharmony_ci if (!c1) { 4938c2ecf20Sopenharmony_ci dstr1++; 4948c2ecf20Sopenharmony_ci dsize1--; 4958c2ecf20Sopenharmony_ci continue; 4968c2ecf20Sopenharmony_ci } 4978c2ecf20Sopenharmony_ci c2 = case_fold(c2); 4988c2ecf20Sopenharmony_ci if (!c2) { 4998c2ecf20Sopenharmony_ci dstr2++; 5008c2ecf20Sopenharmony_ci dsize2--; 5018c2ecf20Sopenharmony_ci continue; 5028c2ecf20Sopenharmony_ci } 5038c2ecf20Sopenharmony_ci } 5048c2ecf20Sopenharmony_ci if (c1 < c2) 5058c2ecf20Sopenharmony_ci return -1; 5068c2ecf20Sopenharmony_ci else if (c1 > c2) 5078c2ecf20Sopenharmony_ci return 1; 5088c2ecf20Sopenharmony_ci 5098c2ecf20Sopenharmony_ci dstr1++; 5108c2ecf20Sopenharmony_ci dsize1--; 5118c2ecf20Sopenharmony_ci dstr2++; 5128c2ecf20Sopenharmony_ci dsize2--; 5138c2ecf20Sopenharmony_ci } 5148c2ecf20Sopenharmony_ci 5158c2ecf20Sopenharmony_ci if (len1 < len2) 5168c2ecf20Sopenharmony_ci return -1; 5178c2ecf20Sopenharmony_ci if (len1 > len2) 5188c2ecf20Sopenharmony_ci return 1; 5198c2ecf20Sopenharmony_ci return 0; 5208c2ecf20Sopenharmony_ci} 521