18c2ecf20Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0
28c2ecf20Sopenharmony_ci/*
38c2ecf20Sopenharmony_ci *  linux/fs/hfsplus/unicode.c
48c2ecf20Sopenharmony_ci *
58c2ecf20Sopenharmony_ci * Copyright (C) 2001
68c2ecf20Sopenharmony_ci * Brad Boyer (flar@allandria.com)
78c2ecf20Sopenharmony_ci * (C) 2003 Ardis Technologies <roman@ardistech.com>
88c2ecf20Sopenharmony_ci *
98c2ecf20Sopenharmony_ci * Handler routines for unicode strings
108c2ecf20Sopenharmony_ci */
118c2ecf20Sopenharmony_ci
128c2ecf20Sopenharmony_ci#include <linux/types.h>
138c2ecf20Sopenharmony_ci#include <linux/nls.h>
148c2ecf20Sopenharmony_ci#include "hfsplus_fs.h"
158c2ecf20Sopenharmony_ci#include "hfsplus_raw.h"
168c2ecf20Sopenharmony_ci
178c2ecf20Sopenharmony_ci/* Fold the case of a unicode char, given the 16 bit value */
188c2ecf20Sopenharmony_ci/* Returns folded char, or 0 if ignorable */
198c2ecf20Sopenharmony_cistatic inline u16 case_fold(u16 c)
208c2ecf20Sopenharmony_ci{
218c2ecf20Sopenharmony_ci	u16 tmp;
228c2ecf20Sopenharmony_ci
238c2ecf20Sopenharmony_ci	tmp = hfsplus_case_fold_table[c >> 8];
248c2ecf20Sopenharmony_ci	if (tmp)
258c2ecf20Sopenharmony_ci		tmp = hfsplus_case_fold_table[tmp + (c & 0xff)];
268c2ecf20Sopenharmony_ci	else
278c2ecf20Sopenharmony_ci		tmp = c;
288c2ecf20Sopenharmony_ci	return tmp;
298c2ecf20Sopenharmony_ci}
308c2ecf20Sopenharmony_ci
318c2ecf20Sopenharmony_ci/* Compare unicode strings, return values like normal strcmp */
328c2ecf20Sopenharmony_ciint hfsplus_strcasecmp(const struct hfsplus_unistr *s1,
338c2ecf20Sopenharmony_ci		       const struct hfsplus_unistr *s2)
348c2ecf20Sopenharmony_ci{
358c2ecf20Sopenharmony_ci	u16 len1, len2, c1, c2;
368c2ecf20Sopenharmony_ci	const hfsplus_unichr *p1, *p2;
378c2ecf20Sopenharmony_ci
388c2ecf20Sopenharmony_ci	len1 = be16_to_cpu(s1->length);
398c2ecf20Sopenharmony_ci	len2 = be16_to_cpu(s2->length);
408c2ecf20Sopenharmony_ci	p1 = s1->unicode;
418c2ecf20Sopenharmony_ci	p2 = s2->unicode;
428c2ecf20Sopenharmony_ci
438c2ecf20Sopenharmony_ci	while (1) {
448c2ecf20Sopenharmony_ci		c1 = c2 = 0;
458c2ecf20Sopenharmony_ci
468c2ecf20Sopenharmony_ci		while (len1 && !c1) {
478c2ecf20Sopenharmony_ci			c1 = case_fold(be16_to_cpu(*p1));
488c2ecf20Sopenharmony_ci			p1++;
498c2ecf20Sopenharmony_ci			len1--;
508c2ecf20Sopenharmony_ci		}
518c2ecf20Sopenharmony_ci		while (len2 && !c2) {
528c2ecf20Sopenharmony_ci			c2 = case_fold(be16_to_cpu(*p2));
538c2ecf20Sopenharmony_ci			p2++;
548c2ecf20Sopenharmony_ci			len2--;
558c2ecf20Sopenharmony_ci		}
568c2ecf20Sopenharmony_ci
578c2ecf20Sopenharmony_ci		if (c1 != c2)
588c2ecf20Sopenharmony_ci			return (c1 < c2) ? -1 : 1;
598c2ecf20Sopenharmony_ci		if (!c1 && !c2)
608c2ecf20Sopenharmony_ci			return 0;
618c2ecf20Sopenharmony_ci	}
628c2ecf20Sopenharmony_ci}
638c2ecf20Sopenharmony_ci
648c2ecf20Sopenharmony_ci/* Compare names as a sequence of 16-bit unsigned integers */
658c2ecf20Sopenharmony_ciint hfsplus_strcmp(const struct hfsplus_unistr *s1,
668c2ecf20Sopenharmony_ci		   const struct hfsplus_unistr *s2)
678c2ecf20Sopenharmony_ci{
688c2ecf20Sopenharmony_ci	u16 len1, len2, c1, c2;
698c2ecf20Sopenharmony_ci	const hfsplus_unichr *p1, *p2;
708c2ecf20Sopenharmony_ci	int len;
718c2ecf20Sopenharmony_ci
728c2ecf20Sopenharmony_ci	len1 = be16_to_cpu(s1->length);
738c2ecf20Sopenharmony_ci	len2 = be16_to_cpu(s2->length);
748c2ecf20Sopenharmony_ci	p1 = s1->unicode;
758c2ecf20Sopenharmony_ci	p2 = s2->unicode;
768c2ecf20Sopenharmony_ci
778c2ecf20Sopenharmony_ci	for (len = min(len1, len2); len > 0; len--) {
788c2ecf20Sopenharmony_ci		c1 = be16_to_cpu(*p1);
798c2ecf20Sopenharmony_ci		c2 = be16_to_cpu(*p2);
808c2ecf20Sopenharmony_ci		if (c1 != c2)
818c2ecf20Sopenharmony_ci			return c1 < c2 ? -1 : 1;
828c2ecf20Sopenharmony_ci		p1++;
838c2ecf20Sopenharmony_ci		p2++;
848c2ecf20Sopenharmony_ci	}
858c2ecf20Sopenharmony_ci
868c2ecf20Sopenharmony_ci	return len1 < len2 ? -1 :
878c2ecf20Sopenharmony_ci	       len1 > len2 ? 1 : 0;
888c2ecf20Sopenharmony_ci}
898c2ecf20Sopenharmony_ci
908c2ecf20Sopenharmony_ci
/*
 * Constants for arithmetic Hangul syllable composition/decomposition.
 *
 * S = precomposed syllable, L = first unit, V = second unit, T = optional
 * third unit of a decomposed syllable.  Hangul_TBase itself stands for
 * "no third unit"; real third units start at Hangul_TBase + 1.
 */

/* First code point of each range */
#define Hangul_SBase	0xac00
#define Hangul_LBase	0x1100
#define Hangul_VBase	0x1161
#define Hangul_TBase	0x11a7

/* Number of code points in each range */
#define Hangul_LCount	19
#define Hangul_VCount	21
#define Hangul_TCount	28
/* Syllables sharing one L unit, and precomposed syllables overall (11172) */
#define Hangul_NCount	(Hangul_VCount * Hangul_TCount)
#define Hangul_SCount	(Hangul_LCount * Hangul_NCount)
1008c2ecf20Sopenharmony_ci
1018c2ecf20Sopenharmony_ci
1028c2ecf20Sopenharmony_cistatic u16 *hfsplus_compose_lookup(u16 *p, u16 cc)
1038c2ecf20Sopenharmony_ci{
1048c2ecf20Sopenharmony_ci	int i, s, e;
1058c2ecf20Sopenharmony_ci
1068c2ecf20Sopenharmony_ci	s = 1;
1078c2ecf20Sopenharmony_ci	e = p[1];
1088c2ecf20Sopenharmony_ci	if (!e || cc < p[s * 2] || cc > p[e * 2])
1098c2ecf20Sopenharmony_ci		return NULL;
1108c2ecf20Sopenharmony_ci	do {
1118c2ecf20Sopenharmony_ci		i = (s + e) / 2;
1128c2ecf20Sopenharmony_ci		if (cc > p[i * 2])
1138c2ecf20Sopenharmony_ci			s = i + 1;
1148c2ecf20Sopenharmony_ci		else if (cc < p[i * 2])
1158c2ecf20Sopenharmony_ci			e = i - 1;
1168c2ecf20Sopenharmony_ci		else
1178c2ecf20Sopenharmony_ci			return hfsplus_compose_table + p[i * 2 + 1];
1188c2ecf20Sopenharmony_ci	} while (s <= e);
1198c2ecf20Sopenharmony_ci	return NULL;
1208c2ecf20Sopenharmony_ci}
1218c2ecf20Sopenharmony_ci
1228c2ecf20Sopenharmony_ciint hfsplus_uni2asc(struct super_block *sb,
1238c2ecf20Sopenharmony_ci		const struct hfsplus_unistr *ustr,
1248c2ecf20Sopenharmony_ci		char *astr, int *len_p)
1258c2ecf20Sopenharmony_ci{
1268c2ecf20Sopenharmony_ci	const hfsplus_unichr *ip;
1278c2ecf20Sopenharmony_ci	struct nls_table *nls = HFSPLUS_SB(sb)->nls;
1288c2ecf20Sopenharmony_ci	u8 *op;
1298c2ecf20Sopenharmony_ci	u16 cc, c0, c1;
1308c2ecf20Sopenharmony_ci	u16 *ce1, *ce2;
1318c2ecf20Sopenharmony_ci	int i, len, ustrlen, res, compose;
1328c2ecf20Sopenharmony_ci
1338c2ecf20Sopenharmony_ci	op = astr;
1348c2ecf20Sopenharmony_ci	ip = ustr->unicode;
1358c2ecf20Sopenharmony_ci	ustrlen = be16_to_cpu(ustr->length);
1368c2ecf20Sopenharmony_ci	len = *len_p;
1378c2ecf20Sopenharmony_ci	ce1 = NULL;
1388c2ecf20Sopenharmony_ci	compose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags);
1398c2ecf20Sopenharmony_ci
1408c2ecf20Sopenharmony_ci	while (ustrlen > 0) {
1418c2ecf20Sopenharmony_ci		c0 = be16_to_cpu(*ip++);
1428c2ecf20Sopenharmony_ci		ustrlen--;
1438c2ecf20Sopenharmony_ci		/* search for single decomposed char */
1448c2ecf20Sopenharmony_ci		if (likely(compose))
1458c2ecf20Sopenharmony_ci			ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c0);
1468c2ecf20Sopenharmony_ci		if (ce1)
1478c2ecf20Sopenharmony_ci			cc = ce1[0];
1488c2ecf20Sopenharmony_ci		else
1498c2ecf20Sopenharmony_ci			cc = 0;
1508c2ecf20Sopenharmony_ci		if (cc) {
1518c2ecf20Sopenharmony_ci			/* start of a possibly decomposed Hangul char */
1528c2ecf20Sopenharmony_ci			if (cc != 0xffff)
1538c2ecf20Sopenharmony_ci				goto done;
1548c2ecf20Sopenharmony_ci			if (!ustrlen)
1558c2ecf20Sopenharmony_ci				goto same;
1568c2ecf20Sopenharmony_ci			c1 = be16_to_cpu(*ip) - Hangul_VBase;
1578c2ecf20Sopenharmony_ci			if (c1 < Hangul_VCount) {
1588c2ecf20Sopenharmony_ci				/* compose the Hangul char */
1598c2ecf20Sopenharmony_ci				cc = (c0 - Hangul_LBase) * Hangul_VCount;
1608c2ecf20Sopenharmony_ci				cc = (cc + c1) * Hangul_TCount;
1618c2ecf20Sopenharmony_ci				cc += Hangul_SBase;
1628c2ecf20Sopenharmony_ci				ip++;
1638c2ecf20Sopenharmony_ci				ustrlen--;
1648c2ecf20Sopenharmony_ci				if (!ustrlen)
1658c2ecf20Sopenharmony_ci					goto done;
1668c2ecf20Sopenharmony_ci				c1 = be16_to_cpu(*ip) - Hangul_TBase;
1678c2ecf20Sopenharmony_ci				if (c1 > 0 && c1 < Hangul_TCount) {
1688c2ecf20Sopenharmony_ci					cc += c1;
1698c2ecf20Sopenharmony_ci					ip++;
1708c2ecf20Sopenharmony_ci					ustrlen--;
1718c2ecf20Sopenharmony_ci				}
1728c2ecf20Sopenharmony_ci				goto done;
1738c2ecf20Sopenharmony_ci			}
1748c2ecf20Sopenharmony_ci		}
1758c2ecf20Sopenharmony_ci		while (1) {
1768c2ecf20Sopenharmony_ci			/* main loop for common case of not composed chars */
1778c2ecf20Sopenharmony_ci			if (!ustrlen)
1788c2ecf20Sopenharmony_ci				goto same;
1798c2ecf20Sopenharmony_ci			c1 = be16_to_cpu(*ip);
1808c2ecf20Sopenharmony_ci			if (likely(compose))
1818c2ecf20Sopenharmony_ci				ce1 = hfsplus_compose_lookup(
1828c2ecf20Sopenharmony_ci					hfsplus_compose_table, c1);
1838c2ecf20Sopenharmony_ci			if (ce1)
1848c2ecf20Sopenharmony_ci				break;
1858c2ecf20Sopenharmony_ci			switch (c0) {
1868c2ecf20Sopenharmony_ci			case 0:
1878c2ecf20Sopenharmony_ci				c0 = 0x2400;
1888c2ecf20Sopenharmony_ci				break;
1898c2ecf20Sopenharmony_ci			case '/':
1908c2ecf20Sopenharmony_ci				c0 = ':';
1918c2ecf20Sopenharmony_ci				break;
1928c2ecf20Sopenharmony_ci			}
1938c2ecf20Sopenharmony_ci			res = nls->uni2char(c0, op, len);
1948c2ecf20Sopenharmony_ci			if (res < 0) {
1958c2ecf20Sopenharmony_ci				if (res == -ENAMETOOLONG)
1968c2ecf20Sopenharmony_ci					goto out;
1978c2ecf20Sopenharmony_ci				*op = '?';
1988c2ecf20Sopenharmony_ci				res = 1;
1998c2ecf20Sopenharmony_ci			}
2008c2ecf20Sopenharmony_ci			op += res;
2018c2ecf20Sopenharmony_ci			len -= res;
2028c2ecf20Sopenharmony_ci			c0 = c1;
2038c2ecf20Sopenharmony_ci			ip++;
2048c2ecf20Sopenharmony_ci			ustrlen--;
2058c2ecf20Sopenharmony_ci		}
2068c2ecf20Sopenharmony_ci		ce2 = hfsplus_compose_lookup(ce1, c0);
2078c2ecf20Sopenharmony_ci		if (ce2) {
2088c2ecf20Sopenharmony_ci			i = 1;
2098c2ecf20Sopenharmony_ci			while (i < ustrlen) {
2108c2ecf20Sopenharmony_ci				ce1 = hfsplus_compose_lookup(ce2,
2118c2ecf20Sopenharmony_ci					be16_to_cpu(ip[i]));
2128c2ecf20Sopenharmony_ci				if (!ce1)
2138c2ecf20Sopenharmony_ci					break;
2148c2ecf20Sopenharmony_ci				i++;
2158c2ecf20Sopenharmony_ci				ce2 = ce1;
2168c2ecf20Sopenharmony_ci			}
2178c2ecf20Sopenharmony_ci			cc = ce2[0];
2188c2ecf20Sopenharmony_ci			if (cc) {
2198c2ecf20Sopenharmony_ci				ip += i;
2208c2ecf20Sopenharmony_ci				ustrlen -= i;
2218c2ecf20Sopenharmony_ci				goto done;
2228c2ecf20Sopenharmony_ci			}
2238c2ecf20Sopenharmony_ci		}
2248c2ecf20Sopenharmony_cisame:
2258c2ecf20Sopenharmony_ci		switch (c0) {
2268c2ecf20Sopenharmony_ci		case 0:
2278c2ecf20Sopenharmony_ci			cc = 0x2400;
2288c2ecf20Sopenharmony_ci			break;
2298c2ecf20Sopenharmony_ci		case '/':
2308c2ecf20Sopenharmony_ci			cc = ':';
2318c2ecf20Sopenharmony_ci			break;
2328c2ecf20Sopenharmony_ci		default:
2338c2ecf20Sopenharmony_ci			cc = c0;
2348c2ecf20Sopenharmony_ci		}
2358c2ecf20Sopenharmony_cidone:
2368c2ecf20Sopenharmony_ci		res = nls->uni2char(cc, op, len);
2378c2ecf20Sopenharmony_ci		if (res < 0) {
2388c2ecf20Sopenharmony_ci			if (res == -ENAMETOOLONG)
2398c2ecf20Sopenharmony_ci				goto out;
2408c2ecf20Sopenharmony_ci			*op = '?';
2418c2ecf20Sopenharmony_ci			res = 1;
2428c2ecf20Sopenharmony_ci		}
2438c2ecf20Sopenharmony_ci		op += res;
2448c2ecf20Sopenharmony_ci		len -= res;
2458c2ecf20Sopenharmony_ci	}
2468c2ecf20Sopenharmony_ci	res = 0;
2478c2ecf20Sopenharmony_ciout:
2488c2ecf20Sopenharmony_ci	*len_p = (char *)op - astr;
2498c2ecf20Sopenharmony_ci	return res;
2508c2ecf20Sopenharmony_ci}
2518c2ecf20Sopenharmony_ci
2528c2ecf20Sopenharmony_ci/*
2538c2ecf20Sopenharmony_ci * Convert one or more ASCII characters into a single unicode character.
2548c2ecf20Sopenharmony_ci * Returns the number of ASCII characters corresponding to the unicode char.
2558c2ecf20Sopenharmony_ci */
2568c2ecf20Sopenharmony_cistatic inline int asc2unichar(struct super_block *sb, const char *astr, int len,
2578c2ecf20Sopenharmony_ci			      wchar_t *uc)
2588c2ecf20Sopenharmony_ci{
2598c2ecf20Sopenharmony_ci	int size = HFSPLUS_SB(sb)->nls->char2uni(astr, len, uc);
2608c2ecf20Sopenharmony_ci	if (size <= 0) {
2618c2ecf20Sopenharmony_ci		*uc = '?';
2628c2ecf20Sopenharmony_ci		size = 1;
2638c2ecf20Sopenharmony_ci	}
2648c2ecf20Sopenharmony_ci	switch (*uc) {
2658c2ecf20Sopenharmony_ci	case 0x2400:
2668c2ecf20Sopenharmony_ci		*uc = 0;
2678c2ecf20Sopenharmony_ci		break;
2688c2ecf20Sopenharmony_ci	case ':':
2698c2ecf20Sopenharmony_ci		*uc = '/';
2708c2ecf20Sopenharmony_ci		break;
2718c2ecf20Sopenharmony_ci	}
2728c2ecf20Sopenharmony_ci	return size;
2738c2ecf20Sopenharmony_ci}
2748c2ecf20Sopenharmony_ci
2758c2ecf20Sopenharmony_ci/* Decomposes a non-Hangul unicode character. */
2768c2ecf20Sopenharmony_cistatic u16 *hfsplus_decompose_nonhangul(wchar_t uc, int *size)
2778c2ecf20Sopenharmony_ci{
2788c2ecf20Sopenharmony_ci	int off;
2798c2ecf20Sopenharmony_ci
2808c2ecf20Sopenharmony_ci	off = hfsplus_decompose_table[(uc >> 12) & 0xf];
2818c2ecf20Sopenharmony_ci	if (off == 0 || off == 0xffff)
2828c2ecf20Sopenharmony_ci		return NULL;
2838c2ecf20Sopenharmony_ci
2848c2ecf20Sopenharmony_ci	off = hfsplus_decompose_table[off + ((uc >> 8) & 0xf)];
2858c2ecf20Sopenharmony_ci	if (!off)
2868c2ecf20Sopenharmony_ci		return NULL;
2878c2ecf20Sopenharmony_ci
2888c2ecf20Sopenharmony_ci	off = hfsplus_decompose_table[off + ((uc >> 4) & 0xf)];
2898c2ecf20Sopenharmony_ci	if (!off)
2908c2ecf20Sopenharmony_ci		return NULL;
2918c2ecf20Sopenharmony_ci
2928c2ecf20Sopenharmony_ci	off = hfsplus_decompose_table[off + (uc & 0xf)];
2938c2ecf20Sopenharmony_ci	*size = off & 3;
2948c2ecf20Sopenharmony_ci	if (*size == 0)
2958c2ecf20Sopenharmony_ci		return NULL;
2968c2ecf20Sopenharmony_ci	return hfsplus_decompose_table + (off / 4);
2978c2ecf20Sopenharmony_ci}
2988c2ecf20Sopenharmony_ci
2998c2ecf20Sopenharmony_ci/*
3008c2ecf20Sopenharmony_ci * Try to decompose a unicode character as Hangul. Return 0 if @uc is not
3018c2ecf20Sopenharmony_ci * precomposed Hangul, otherwise return the length of the decomposition.
3028c2ecf20Sopenharmony_ci *
3038c2ecf20Sopenharmony_ci * This function was adapted from sample code from the Unicode Standard
3048c2ecf20Sopenharmony_ci * Annex #15: Unicode Normalization Forms, version 3.2.0.
3058c2ecf20Sopenharmony_ci *
3068c2ecf20Sopenharmony_ci * Copyright (C) 1991-2018 Unicode, Inc.  All rights reserved.  Distributed
3078c2ecf20Sopenharmony_ci * under the Terms of Use in http://www.unicode.org/copyright.html.
3088c2ecf20Sopenharmony_ci */
3098c2ecf20Sopenharmony_cistatic int hfsplus_try_decompose_hangul(wchar_t uc, u16 *result)
3108c2ecf20Sopenharmony_ci{
3118c2ecf20Sopenharmony_ci	int index;
3128c2ecf20Sopenharmony_ci	int l, v, t;
3138c2ecf20Sopenharmony_ci
3148c2ecf20Sopenharmony_ci	index = uc - Hangul_SBase;
3158c2ecf20Sopenharmony_ci	if (index < 0 || index >= Hangul_SCount)
3168c2ecf20Sopenharmony_ci		return 0;
3178c2ecf20Sopenharmony_ci
3188c2ecf20Sopenharmony_ci	l = Hangul_LBase + index / Hangul_NCount;
3198c2ecf20Sopenharmony_ci	v = Hangul_VBase + (index % Hangul_NCount) / Hangul_TCount;
3208c2ecf20Sopenharmony_ci	t = Hangul_TBase + index % Hangul_TCount;
3218c2ecf20Sopenharmony_ci
3228c2ecf20Sopenharmony_ci	result[0] = l;
3238c2ecf20Sopenharmony_ci	result[1] = v;
3248c2ecf20Sopenharmony_ci	if (t != Hangul_TBase) {
3258c2ecf20Sopenharmony_ci		result[2] = t;
3268c2ecf20Sopenharmony_ci		return 3;
3278c2ecf20Sopenharmony_ci	}
3288c2ecf20Sopenharmony_ci	return 2;
3298c2ecf20Sopenharmony_ci}
3308c2ecf20Sopenharmony_ci
3318c2ecf20Sopenharmony_ci/* Decomposes a single unicode character. */
3328c2ecf20Sopenharmony_cistatic u16 *decompose_unichar(wchar_t uc, int *size, u16 *hangul_buffer)
3338c2ecf20Sopenharmony_ci{
3348c2ecf20Sopenharmony_ci	u16 *result;
3358c2ecf20Sopenharmony_ci
3368c2ecf20Sopenharmony_ci	/* Hangul is handled separately */
3378c2ecf20Sopenharmony_ci	result = hangul_buffer;
3388c2ecf20Sopenharmony_ci	*size = hfsplus_try_decompose_hangul(uc, result);
3398c2ecf20Sopenharmony_ci	if (*size == 0)
3408c2ecf20Sopenharmony_ci		result = hfsplus_decompose_nonhangul(uc, size);
3418c2ecf20Sopenharmony_ci	return result;
3428c2ecf20Sopenharmony_ci}
3438c2ecf20Sopenharmony_ci
3448c2ecf20Sopenharmony_ciint hfsplus_asc2uni(struct super_block *sb,
3458c2ecf20Sopenharmony_ci		    struct hfsplus_unistr *ustr, int max_unistr_len,
3468c2ecf20Sopenharmony_ci		    const char *astr, int len)
3478c2ecf20Sopenharmony_ci{
3488c2ecf20Sopenharmony_ci	int size, dsize, decompose;
3498c2ecf20Sopenharmony_ci	u16 *dstr, outlen = 0;
3508c2ecf20Sopenharmony_ci	wchar_t c;
3518c2ecf20Sopenharmony_ci	u16 dhangul[3];
3528c2ecf20Sopenharmony_ci
3538c2ecf20Sopenharmony_ci	decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags);
3548c2ecf20Sopenharmony_ci	while (outlen < max_unistr_len && len > 0) {
3558c2ecf20Sopenharmony_ci		size = asc2unichar(sb, astr, len, &c);
3568c2ecf20Sopenharmony_ci
3578c2ecf20Sopenharmony_ci		if (decompose)
3588c2ecf20Sopenharmony_ci			dstr = decompose_unichar(c, &dsize, dhangul);
3598c2ecf20Sopenharmony_ci		else
3608c2ecf20Sopenharmony_ci			dstr = NULL;
3618c2ecf20Sopenharmony_ci		if (dstr) {
3628c2ecf20Sopenharmony_ci			if (outlen + dsize > max_unistr_len)
3638c2ecf20Sopenharmony_ci				break;
3648c2ecf20Sopenharmony_ci			do {
3658c2ecf20Sopenharmony_ci				ustr->unicode[outlen++] = cpu_to_be16(*dstr++);
3668c2ecf20Sopenharmony_ci			} while (--dsize > 0);
3678c2ecf20Sopenharmony_ci		} else
3688c2ecf20Sopenharmony_ci			ustr->unicode[outlen++] = cpu_to_be16(c);
3698c2ecf20Sopenharmony_ci
3708c2ecf20Sopenharmony_ci		astr += size;
3718c2ecf20Sopenharmony_ci		len -= size;
3728c2ecf20Sopenharmony_ci	}
3738c2ecf20Sopenharmony_ci	ustr->length = cpu_to_be16(outlen);
3748c2ecf20Sopenharmony_ci	if (len > 0)
3758c2ecf20Sopenharmony_ci		return -ENAMETOOLONG;
3768c2ecf20Sopenharmony_ci	return 0;
3778c2ecf20Sopenharmony_ci}
3788c2ecf20Sopenharmony_ci
3798c2ecf20Sopenharmony_ci/*
3808c2ecf20Sopenharmony_ci * Hash a string to an integer as appropriate for the HFS+ filesystem.
3818c2ecf20Sopenharmony_ci * Composed unicode characters are decomposed and case-folding is performed
3828c2ecf20Sopenharmony_ci * if the appropriate bits are (un)set on the superblock.
3838c2ecf20Sopenharmony_ci */
3848c2ecf20Sopenharmony_ciint hfsplus_hash_dentry(const struct dentry *dentry, struct qstr *str)
3858c2ecf20Sopenharmony_ci{
3868c2ecf20Sopenharmony_ci	struct super_block *sb = dentry->d_sb;
3878c2ecf20Sopenharmony_ci	const char *astr;
3888c2ecf20Sopenharmony_ci	const u16 *dstr;
3898c2ecf20Sopenharmony_ci	int casefold, decompose, size, len;
3908c2ecf20Sopenharmony_ci	unsigned long hash;
3918c2ecf20Sopenharmony_ci	wchar_t c;
3928c2ecf20Sopenharmony_ci	u16 c2;
3938c2ecf20Sopenharmony_ci	u16 dhangul[3];
3948c2ecf20Sopenharmony_ci
3958c2ecf20Sopenharmony_ci	casefold = test_bit(HFSPLUS_SB_CASEFOLD, &HFSPLUS_SB(sb)->flags);
3968c2ecf20Sopenharmony_ci	decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags);
3978c2ecf20Sopenharmony_ci	hash = init_name_hash(dentry);
3988c2ecf20Sopenharmony_ci	astr = str->name;
3998c2ecf20Sopenharmony_ci	len = str->len;
4008c2ecf20Sopenharmony_ci	while (len > 0) {
4018c2ecf20Sopenharmony_ci		int dsize;
4028c2ecf20Sopenharmony_ci		size = asc2unichar(sb, astr, len, &c);
4038c2ecf20Sopenharmony_ci		astr += size;
4048c2ecf20Sopenharmony_ci		len -= size;
4058c2ecf20Sopenharmony_ci
4068c2ecf20Sopenharmony_ci		if (decompose)
4078c2ecf20Sopenharmony_ci			dstr = decompose_unichar(c, &dsize, dhangul);
4088c2ecf20Sopenharmony_ci		else
4098c2ecf20Sopenharmony_ci			dstr = NULL;
4108c2ecf20Sopenharmony_ci		if (dstr) {
4118c2ecf20Sopenharmony_ci			do {
4128c2ecf20Sopenharmony_ci				c2 = *dstr++;
4138c2ecf20Sopenharmony_ci				if (casefold)
4148c2ecf20Sopenharmony_ci					c2 = case_fold(c2);
4158c2ecf20Sopenharmony_ci				if (!casefold || c2)
4168c2ecf20Sopenharmony_ci					hash = partial_name_hash(c2, hash);
4178c2ecf20Sopenharmony_ci			} while (--dsize > 0);
4188c2ecf20Sopenharmony_ci		} else {
4198c2ecf20Sopenharmony_ci			c2 = c;
4208c2ecf20Sopenharmony_ci			if (casefold)
4218c2ecf20Sopenharmony_ci				c2 = case_fold(c2);
4228c2ecf20Sopenharmony_ci			if (!casefold || c2)
4238c2ecf20Sopenharmony_ci				hash = partial_name_hash(c2, hash);
4248c2ecf20Sopenharmony_ci		}
4258c2ecf20Sopenharmony_ci	}
4268c2ecf20Sopenharmony_ci	str->hash = end_name_hash(hash);
4278c2ecf20Sopenharmony_ci
4288c2ecf20Sopenharmony_ci	return 0;
4298c2ecf20Sopenharmony_ci}
4308c2ecf20Sopenharmony_ci
4318c2ecf20Sopenharmony_ci/*
4328c2ecf20Sopenharmony_ci * Compare strings with HFS+ filename ordering.
4338c2ecf20Sopenharmony_ci * Composed unicode characters are decomposed and case-folding is performed
4348c2ecf20Sopenharmony_ci * if the appropriate bits are (un)set on the superblock.
4358c2ecf20Sopenharmony_ci */
4368c2ecf20Sopenharmony_ciint hfsplus_compare_dentry(const struct dentry *dentry,
4378c2ecf20Sopenharmony_ci		unsigned int len, const char *str, const struct qstr *name)
4388c2ecf20Sopenharmony_ci{
4398c2ecf20Sopenharmony_ci	struct super_block *sb = dentry->d_sb;
4408c2ecf20Sopenharmony_ci	int casefold, decompose, size;
4418c2ecf20Sopenharmony_ci	int dsize1, dsize2, len1, len2;
4428c2ecf20Sopenharmony_ci	const u16 *dstr1, *dstr2;
4438c2ecf20Sopenharmony_ci	const char *astr1, *astr2;
4448c2ecf20Sopenharmony_ci	u16 c1, c2;
4458c2ecf20Sopenharmony_ci	wchar_t c;
4468c2ecf20Sopenharmony_ci	u16 dhangul_1[3], dhangul_2[3];
4478c2ecf20Sopenharmony_ci
4488c2ecf20Sopenharmony_ci	casefold = test_bit(HFSPLUS_SB_CASEFOLD, &HFSPLUS_SB(sb)->flags);
4498c2ecf20Sopenharmony_ci	decompose = !test_bit(HFSPLUS_SB_NODECOMPOSE, &HFSPLUS_SB(sb)->flags);
4508c2ecf20Sopenharmony_ci	astr1 = str;
4518c2ecf20Sopenharmony_ci	len1 = len;
4528c2ecf20Sopenharmony_ci	astr2 = name->name;
4538c2ecf20Sopenharmony_ci	len2 = name->len;
4548c2ecf20Sopenharmony_ci	dsize1 = dsize2 = 0;
4558c2ecf20Sopenharmony_ci	dstr1 = dstr2 = NULL;
4568c2ecf20Sopenharmony_ci
4578c2ecf20Sopenharmony_ci	while (len1 > 0 && len2 > 0) {
4588c2ecf20Sopenharmony_ci		if (!dsize1) {
4598c2ecf20Sopenharmony_ci			size = asc2unichar(sb, astr1, len1, &c);
4608c2ecf20Sopenharmony_ci			astr1 += size;
4618c2ecf20Sopenharmony_ci			len1 -= size;
4628c2ecf20Sopenharmony_ci
4638c2ecf20Sopenharmony_ci			if (decompose)
4648c2ecf20Sopenharmony_ci				dstr1 = decompose_unichar(c, &dsize1,
4658c2ecf20Sopenharmony_ci							  dhangul_1);
4668c2ecf20Sopenharmony_ci			if (!decompose || !dstr1) {
4678c2ecf20Sopenharmony_ci				c1 = c;
4688c2ecf20Sopenharmony_ci				dstr1 = &c1;
4698c2ecf20Sopenharmony_ci				dsize1 = 1;
4708c2ecf20Sopenharmony_ci			}
4718c2ecf20Sopenharmony_ci		}
4728c2ecf20Sopenharmony_ci
4738c2ecf20Sopenharmony_ci		if (!dsize2) {
4748c2ecf20Sopenharmony_ci			size = asc2unichar(sb, astr2, len2, &c);
4758c2ecf20Sopenharmony_ci			astr2 += size;
4768c2ecf20Sopenharmony_ci			len2 -= size;
4778c2ecf20Sopenharmony_ci
4788c2ecf20Sopenharmony_ci			if (decompose)
4798c2ecf20Sopenharmony_ci				dstr2 = decompose_unichar(c, &dsize2,
4808c2ecf20Sopenharmony_ci							  dhangul_2);
4818c2ecf20Sopenharmony_ci			if (!decompose || !dstr2) {
4828c2ecf20Sopenharmony_ci				c2 = c;
4838c2ecf20Sopenharmony_ci				dstr2 = &c2;
4848c2ecf20Sopenharmony_ci				dsize2 = 1;
4858c2ecf20Sopenharmony_ci			}
4868c2ecf20Sopenharmony_ci		}
4878c2ecf20Sopenharmony_ci
4888c2ecf20Sopenharmony_ci		c1 = *dstr1;
4898c2ecf20Sopenharmony_ci		c2 = *dstr2;
4908c2ecf20Sopenharmony_ci		if (casefold) {
4918c2ecf20Sopenharmony_ci			c1 = case_fold(c1);
4928c2ecf20Sopenharmony_ci			if (!c1) {
4938c2ecf20Sopenharmony_ci				dstr1++;
4948c2ecf20Sopenharmony_ci				dsize1--;
4958c2ecf20Sopenharmony_ci				continue;
4968c2ecf20Sopenharmony_ci			}
4978c2ecf20Sopenharmony_ci			c2 = case_fold(c2);
4988c2ecf20Sopenharmony_ci			if (!c2) {
4998c2ecf20Sopenharmony_ci				dstr2++;
5008c2ecf20Sopenharmony_ci				dsize2--;
5018c2ecf20Sopenharmony_ci				continue;
5028c2ecf20Sopenharmony_ci			}
5038c2ecf20Sopenharmony_ci		}
5048c2ecf20Sopenharmony_ci		if (c1 < c2)
5058c2ecf20Sopenharmony_ci			return -1;
5068c2ecf20Sopenharmony_ci		else if (c1 > c2)
5078c2ecf20Sopenharmony_ci			return 1;
5088c2ecf20Sopenharmony_ci
5098c2ecf20Sopenharmony_ci		dstr1++;
5108c2ecf20Sopenharmony_ci		dsize1--;
5118c2ecf20Sopenharmony_ci		dstr2++;
5128c2ecf20Sopenharmony_ci		dsize2--;
5138c2ecf20Sopenharmony_ci	}
5148c2ecf20Sopenharmony_ci
5158c2ecf20Sopenharmony_ci	if (len1 < len2)
5168c2ecf20Sopenharmony_ci		return -1;
5178c2ecf20Sopenharmony_ci	if (len1 > len2)
5188c2ecf20Sopenharmony_ci		return 1;
5198c2ecf20Sopenharmony_ci	return 0;
5208c2ecf20Sopenharmony_ci}
521