/* linux/fs/hfsplus/unicode.c */

/*
 *  linux/fs/hfsplus/unicode.c
 *
 * Copyright (C) 2001
 * Brad Boyer (flar@allandria.com)
 * (C) 2003 Ardis Technologies <roman@ardistech.com>
 *
 * Handler routines for unicode strings
 */

#include <linux/types.h>
#include <linux/nls.h>
#include "hfsplus_fs.h"
#include "hfsplus_raw.h"

/*
 * Case-fold one 16-bit unicode value using hfsplus_case_fold_table.
 *
 * The table is indexed in two steps: the high byte of c selects an entry
 * that is either 0 (every character with that high byte folds to itself)
 * or the offset of a sub-table, which is then indexed by the low byte.
 *
 * Returns the folded character, or 0 if the character is ignorable.
 */
static inline u16 case_fold(u16 c)
{
	u16 page = hfsplus_case_fold_table[c >> 8];

	if (!page)
		return c;
	return hfsplus_case_fold_table[page + (c & 0xff)];
}

/* Compare unicode strings, return values like normal strcmp */
int hfsplus_strcasecmp(const struct hfsplus_unistr *s1,
		       const struct hfsplus_unistr *s2)
{
	u16 len1, len2, c1, c2;
	const hfsplus_unichr *p1, *p2;

	len1 = be16_to_cpu(s1->length);
	len2 = be16_to_cpu(s2->length);
	p1 = s1->unicode;
	p2 = s2->unicode;

	while (1) {
		c1 = c2 = 0;

		while (len1 && !c1) {
			c1 = case_fold(be16_to_cpu(*p1));
			p1++;
			len1--;
		}
		while (len2 && !c2) {
			c2 = case_fold(be16_to_cpu(*p2));
			p2++;
			len2--;
		}

		if (c1 != c2)
			return (c1 < c2) ? -1 : 1;
		if (!c1 && !c2)
			return 0;
	}
}

/* Compare names as a sequence of 16-bit unsigned integers */
int hfsplus_strcmp(const struct hfsplus_unistr *s1,
		   const struct hfsplus_unistr *s2)
{
	u16 len1, len2, c1, c2;
	const hfsplus_unichr *p1, *p2;
	int len;

	len1 = be16_to_cpu(s1->length);
	len2 = be16_to_cpu(s2->length);
	p1 = s1->unicode;
	p2 = s2->unicode;

	for (len = min(len1, len2); len > 0; len--) {
		c1 = be16_to_cpu(*p1);
		c2 = be16_to_cpu(*p2);
		if (c1 != c2)
			return c1 < c2 ? -1 : 1;
		p1++;
		p2++;
	}

	return len1 < len2 ? -1 :
	       len1 > len2 ? 1 : 0;
}


/*
 * Constants for the arithmetic composition of Hangul syllables performed
 * in hfsplus_uni2asc(): a leading (L), vowel (V) and optional trailing (T)
 * jamo are combined into one precomposed syllable (S) as
 *   S = SBase + ((L - LBase) * VCount + (V - VBase)) * TCount + (T - TBase)
 * NOTE(review): the names and values appear to follow the Hangul syllable
 * composition algorithm of the Unicode standard -- confirm against it.
 * Hangul_SCount, Hangul_LCount and Hangul_NCount are not referenced in the
 * part of the file visible here.
 */
#define Hangul_SBase	0xac00
#define Hangul_LBase	0x1100
#define Hangul_VBase	0x1161
#define Hangul_TBase	0x11a7
#define Hangul_SCount	11172
#define Hangul_LCount	19
#define Hangul_VCount	21
#define Hangul_TCount	28
#define Hangul_NCount	(Hangul_VCount * Hangul_TCount)


/*
 * Binary-search one node of the composition table for the code unit cc.
 *
 * Layout of a node as used here: p[1] holds the number of entries; entry i
 * (1-based) stores its key at p[i * 2] and, at p[i * 2 + 1], the offset of
 * the matching child node relative to hfsplus_compose_table.  Keys are
 * expected to be sorted in ascending order.
 *
 * Returns a pointer to the child node, or NULL if cc is not in this node.
 */
static u16 *hfsplus_compose_lookup(u16 *p, u16 cc)
{
	int lo = 1;
	int hi = p[1];
	int mid;

	/* empty node, or cc outside the [first key, last key] range */
	if (!hi || cc < p[lo * 2] || cc > p[hi * 2])
		return NULL;

	while (lo <= hi) {
		mid = (lo + hi) / 2;
		if (cc == p[mid * 2])
			return hfsplus_compose_table + p[mid * 2 + 1];
		if (cc > p[mid * 2])
			lo = mid + 1;
		else
			hi = mid - 1;
	}
	return NULL;
}

int hfsplus_uni2asc(struct super_block *sb, const struct hfsplus_unistr *ustr, char *astr, int *len_p)
{
	const hfsplus_unichr *ip;
	struct nls_table *nls = HFSPLUS_SB(sb).nls;
	u8 *op;
	u16 cc, c0, c1;
	u16 *ce1, *ce2;
	int i, len, ustrlen, res, compose;

	op = astr;
	ip = ustr->unicode;
	ustrlen = be16_to_cpu(ustr->length);
	len = *len_p;
	ce1 = NULL;
	compose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);

	while (ustrlen > 0) {
		c0 = be16_to_cpu(*ip++);
		ustrlen--;
		/* search for single decomposed char */
		if (likely(compose))
			ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c0);
		if (ce1 && (cc = ce1[0])) {
			/* start of a possibly decomposed Hangul char */
			if (cc != 0xffff)
				goto done;
			if (!ustrlen)
				goto same;
			c1 = be16_to_cpu(*ip) - Hangul_VBase;
			if (c1 < Hangul_VCount) {
				/* compose the Hangul char */
				cc = (c0 - Hangul_LBase) * Hangul_VCount;
				cc = (cc + c1) * Hangul_TCount;
				cc += Hangul_SBase;
				ip++;
				ustrlen--;
				if (!ustrlen)
					goto done;
				c1 = be16_to_cpu(*ip) - Hangul_TBase;
				if (c1 > 0 && c1 < Hangul_TCount) {
					cc += c1;
					ip++;
					ustrlen--;
				}
				goto done;
			}
		}
		while (1) {
			/* main loop for common case of not composed chars */
			if (!ustrlen)
				goto same;
			c1 = be16_to_cpu(*ip);
			if (likely(compose))
				ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c1);
			if (ce1)
				break;
			switch (c0) {
			case 0:
				c0 = 0x2400;
				break;
			case '/':
				c0 = ':';
				break;
			}
			res = nls->uni2char(c0, op, len);
			if (res < 0) {
				if (res == -ENAMETOOLONG)
					goto out;
				*op = '?';
				res = 1;
			}
			op += res;
			len -= res;
			c0 = c1;
			ip++;
			ustrlen--;
		}
		ce2 = hfsplus_compose_lookup(ce1, c0);
		if (ce2) {
			i = 1;
			while (i < ustrlen) {
				ce1 = hfsplus_compose_lookup(ce2, be16_to_cpu(ip[i]));
				if (!ce1)
					break;
				i++;
				ce2 = ce1;
			}
			if ((cc = ce2[0])) {
				ip += i;
				ustrlen -= i;
				goto done;
			}
		}
	same:
		switch (c0) {
		case 0:
			cc = 0x2400;
			break;
		case '/':
			cc = ':';
			break;
		default:
			cc = c0;
		}
	done:
		res = nls->uni2char(cc, op, len);
		if (res < 0) {
			if (res == -ENAMETOOLONG)
				goto out;
			*op = '?';
			res = 1;
		}
		op += res;
		len -= res;
	}
	res = 0;
out:
	*len_p = (char *)op - astr;
	return res;
}

/*
 * Convert the leading character of an NLS-encoded byte string into one
 * unicode character using the mount's NLS table.
 *
 * If the NLS conversion fails (returns <= 0), exactly one input byte is
 * consumed and '?' is stored instead.  Afterwards U+2400 is mapped to NUL
 * and ':' to '/'.
 *
 * Returns the number of input bytes that correspond to the unicode char.
 */
static inline int asc2unichar(struct super_block *sb, const char *astr, int len,
			      wchar_t *uc)
{
	int consumed = HFSPLUS_SB(sb).nls->char2uni(astr, len, uc);

	if (consumed <= 0) {
		*uc = '?';
		consumed = 1;
	}

	if (*uc == 0x2400)
		*uc = 0;
	else if (*uc == ':')
		*uc = '/';

	return consumed;
}

/*
 * Look up the decomposition of a single unicode character.
 *
 * hfsplus_decompose_table is walked as a four-level trie keyed by the four
 * nibbles of uc, most significant first.  The final entry packs the number
 * of decomposed code units in its low two bits and the table offset of
 * those units in the remaining bits.
 *
 * Returns a pointer to the decomposed units and stores their count in
 * *size, or returns NULL if the character has no decomposition.  *size is
 * only written when the last trie level is reached.
 */
static inline u16 *decompose_unichar(wchar_t uc, int *size)
{
	int idx, shift;

	/* first level: both 0 and 0xffff mean "nothing below here" */
	idx = hfsplus_decompose_table[(uc >> 12) & 0xf];
	if (idx == 0 || idx == 0xffff)
		return NULL;

	/* second and third level */
	for (shift = 8; shift > 0; shift -= 4) {
		idx = hfsplus_decompose_table[idx + ((uc >> shift) & 0xf)];
		if (!idx)
			return NULL;
	}

	/* last level: length in the low two bits, offset above them */
	idx = hfsplus_decompose_table[idx + (uc & 0xf)];
	*size = idx & 3;
	if (!*size)
		return NULL;
	return hfsplus_decompose_table + (idx / 4);
}

int hfsplus_asc2uni(struct super_block *sb, struct hfsplus_unistr *ustr,
		    const char *astr, int len)
{
	int size, dsize, decompose;
	u16 *dstr, outlen = 0;
	wchar_t c;

	decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);
	while (outlen < HFSPLUS_MAX_STRLEN && len > 0) {
		size = asc2unichar(sb, astr, len, &c);

		if (decompose && (dstr = decompose_unichar(c, &dsize))) {
			if (outlen + dsize > HFSPLUS_MAX_STRLEN)
				break;
			do {
				ustr->unicode[outlen++] = cpu_to_be16(*dstr++);
			} while (--dsize > 0);
		} else
			ustr->unicode[outlen++] = cpu_to_be16(c);

		astr += size;
		len -= size;
	}
	ustr->length = cpu_to_be16(outlen);
	if (len > 0)
		return -ENAMETOOLONG;
	return 0;
}

/*
 * Hash a string to an integer as appropriate for the HFS+ filesystem.
 * Composed unicode characters are decomposed and case-folding is performed
 * if the appropriate bits are (un)set on the superblock.
 */
int hfsplus_hash_dentry(struct dentry *dentry, struct qstr *str)
{
	struct super_block *sb = dentry->d_sb;
	const char *astr;
	const u16 *dstr;
	int casefold, decompose, size, len;
	unsigned long hash;
	wchar_t c;
	u16 c2;

	casefold = (HFSPLUS_SB(sb).flags & HFSPLUS_SB_CASEFOLD);
	decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);
	hash = init_name_hash();
	astr = str->name;
	len = str->len;
	while (len > 0) {
		int uninitialized_var(dsize);
		size = asc2unichar(sb, astr, len, &c);
		astr += size;
		len -= size;

		if (decompose && (dstr = decompose_unichar(c, &dsize))) {
			do {
				c2 = *dstr++;
				if (!casefold || (c2 = case_fold(c2)))
					hash = partial_name_hash(c2, hash);
			} while (--dsize > 0);
		} else {
			c2 = c;
			if (!casefold || (c2 = case_fold(c2)))
				hash = partial_name_hash(c2, hash);
		}
	}
	str->hash = end_name_hash(hash);

	return 0;
}

/* Cursor over one name, yielding its code units after decomposition. */
struct hfsplus_dentry_cursor {
	const char *astr;	/* bytes of the name not yet converted */
	int len;		/* number of bytes left at astr */
	const u16 *dstr;	/* pending code units of the current character */
	int dsize;		/* number of pending code units at dstr */
	u16 single;		/* backing store for a non-decomposed character */
};

/*
 * Fetch the next significant code unit of a name.
 *
 * Characters are converted with asc2unichar() and decomposed when
 * decompose is set.  When casefold is set each unit is case-folded and
 * ignorable units (those folding to 0) are skipped.
 *
 * Returns 1 and stores the unit in *out, or 0 once the name is exhausted.
 */
static int hfsplus_dentry_next_unit(struct super_block *sb,
				    struct hfsplus_dentry_cursor *cur,
				    int casefold, int decompose, u16 *out)
{
	wchar_t c;
	u16 unit;
	int size;

	while (cur->dsize > 0 || cur->len > 0) {
		if (!cur->dsize) {
			/* current character used up: convert the next one */
			size = asc2unichar(sb, cur->astr, cur->len, &c);
			cur->astr += size;
			cur->len -= size;

			if (decompose)
				cur->dstr = decompose_unichar(c, &cur->dsize);
			else
				cur->dstr = NULL;
			if (!cur->dstr) {
				cur->single = c;
				cur->dstr = &cur->single;
				cur->dsize = 1;
			}
		}

		unit = *cur->dstr++;
		cur->dsize--;
		if (casefold) {
			unit = case_fold(unit);
			if (!unit)
				continue;	/* ignorable character */
		}
		*out = unit;
		return 1;
	}
	return 0;
}

/*
 * Compare strings with HFS+ filename ordering.
 * Composed unicode characters are decomposed and case-folding is performed
 * if the appropriate bits are (un)set on the superblock.
 *
 * Both names are compared as streams of significant code units, so that
 * units still pending from a decomposition and trailing ignorable
 * characters are taken into account even after all input bytes of a name
 * have been consumed.  Two names compare equal exactly when they produce
 * the same unit sequence, which is also the sequence that
 * hfsplus_hash_dentry() hashes.
 *
 * Returns 0 if the names are equivalent, -1 if s1 sorts before s2 and 1 if
 * it sorts after; a name that is a proper prefix of the other sorts first.
 */
int hfsplus_compare_dentry(struct dentry *dentry, struct qstr *s1, struct qstr *s2)
{
	struct super_block *sb = dentry->d_sb;
	struct hfsplus_dentry_cursor cur1, cur2;
	int casefold, decompose, more1, more2;
	u16 c1, c2;

	casefold = (HFSPLUS_SB(sb).flags & HFSPLUS_SB_CASEFOLD);
	decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);

	cur1.astr = s1->name;
	cur1.len = s1->len;
	cur1.dstr = NULL;
	cur1.dsize = 0;
	cur1.single = 0;

	cur2.astr = s2->name;
	cur2.len = s2->len;
	cur2.dstr = NULL;
	cur2.dsize = 0;
	cur2.single = 0;

	for (;;) {
		more1 = hfsplus_dentry_next_unit(sb, &cur1, casefold,
						 decompose, &c1);
		more2 = hfsplus_dentry_next_unit(sb, &cur2, casefold,
						 decompose, &c2);
		if (!more1 || !more2)
			break;

		if (c1 < c2)
			return -1;
		if (c1 > c2)
			return 1;
	}

	/* at least one name is exhausted; the one with units left is greater */
	if (more1 == more2)
		return 0;
	return more1 ? 1 : -1;
}
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`/*`
			`* linux/fs/hfsplus/unicode.c`
			`*`
			`* Copyright (C) 2001`
			`* Brad Boyer (flar@allandria.com)`
			`* (C) 2003 Ardis Technologies <roman@ardistech.com>`
			`*`
			`* Handler routines for unicode strings`
			`*/`

			`#include <linux/types.h>`
			`#include <linux/nls.h>`
			`#include "hfsplus_fs.h"`
			`#include "hfsplus_raw.h"`

			`/* Fold the case of a unicode char, given the 16 bit value */`
			`/* Returns folded char, or 0 if ignorable */`
			`static inline u16 case_fold(u16 c)`
			`{`
			`u16 tmp;`

			`tmp = hfsplus_case_fold_table[c >> 8];`
			`if (tmp)`
			`tmp = hfsplus_case_fold_table[tmp + (c & 0xff)];`
			`else`
			`tmp = c;`
			`return tmp;`
			`}`

			`/* Compare unicode strings, return values like normal strcmp */`
[PATCH] hfs: add HFSX support Add support for HFSX, which allows for case-sensitive filenames. Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@osdl.org> Signed-off-by: Linus Torvalds <torvalds@osdl.org> 2006-01-19 04:43:08 +03:00			`int hfsplus_strcasecmp(const struct hfsplus_unistr *s1,`
			`const struct hfsplus_unistr *s2)`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`{`
			`u16 len1, len2, c1, c2;`
			`const hfsplus_unichr *p1, *p2;`

			`len1 = be16_to_cpu(s1->length);`
			`len2 = be16_to_cpu(s2->length);`
			`p1 = s1->unicode;`
			`p2 = s2->unicode;`

			`while (1) {`
			`c1 = c2 = 0;`

			`while (len1 && !c1) {`
			`c1 = case_fold(be16_to_cpu(*p1));`
			`p1++;`
			`len1--;`
			`}`
			`while (len2 && !c2) {`
			`c2 = case_fold(be16_to_cpu(*p2));`
			`p2++;`
			`len2--;`
			`}`

			`if (c1 != c2)`
			`return (c1 < c2) ? -1 : 1;`
			`if (!c1 && !c2)`
			`return 0;`
			`}`
			`}`

[PATCH] hfs: add HFSX support Add support for HFSX, which allows for case-sensitive filenames. Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@osdl.org> Signed-off-by: Linus Torvalds <torvalds@osdl.org> 2006-01-19 04:43:08 +03:00			`/* Compare names as a sequence of 16-bit unsigned integers */`
			`int hfsplus_strcmp(const struct hfsplus_unistr *s1,`
			`const struct hfsplus_unistr *s2)`
			`{`
			`u16 len1, len2, c1, c2;`
			`const hfsplus_unichr *p1, *p2;`
			`int len;`

			`len1 = be16_to_cpu(s1->length);`
			`len2 = be16_to_cpu(s2->length);`
			`p1 = s1->unicode;`
			`p2 = s2->unicode;`

			`for (len = min(len1, len2); len > 0; len--) {`
			`c1 = be16_to_cpu(*p1);`
			`c2 = be16_to_cpu(*p2);`
			`if (c1 != c2)`
			`return c1 < c2 ? -1 : 1;`
			`p1++;`
			`p2++;`
			`}`

			`return len1 < len2 ? -1 :`
			`len1 > len2 ? 1 : 0;`
			`}`


Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`#define Hangul_SBase 0xac00`
			`#define Hangul_LBase 0x1100`
			`#define Hangul_VBase 0x1161`
			`#define Hangul_TBase 0x11a7`
			`#define Hangul_SCount 11172`
			`#define Hangul_LCount 19`
			`#define Hangul_VCount 21`
			`#define Hangul_TCount 28`
			`#define Hangul_NCount (Hangul_VCount * Hangul_TCount)`


			`static u16 *hfsplus_compose_lookup(u16 *p, u16 cc)`
			`{`
			`int i, s, e;`

			`s = 1;`
			`e = p[1];`
			`if (!e || cc < p[s * 2] || cc > p[e * 2])`
			`return NULL;`
			`do {`
			`i = (s + e) / 2;`
			`if (cc > p[i * 2])`
			`s = i + 1;`
			`else if (cc < p[i * 2])`
			`e = i - 1;`
			`else`
			`return hfsplus_compose_table + p[i * 2 + 1];`
			`} while (s <= e);`
			`return NULL;`
			`}`

			`int hfsplus_uni2asc(struct super_block *sb, const struct hfsplus_unistr *ustr, char *astr, int *len_p)`
			`{`
			`const hfsplus_unichr *ip;`
			`struct nls_table *nls = HFSPLUS_SB(sb).nls;`
			`u8 *op;`
			`u16 cc, c0, c1;`
			`u16 *ce1, *ce2;`
			`int i, len, ustrlen, res, compose;`

			`op = astr;`
			`ip = ustr->unicode;`
			`ustrlen = be16_to_cpu(ustr->length);`
			`len = *len_p;`
			`ce1 = NULL;`
			`compose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);`

			`while (ustrlen > 0) {`
			`c0 = be16_to_cpu(*ip++);`
			`ustrlen--;`
			`/* search for single decomposed char */`
			`if (likely(compose))`
			`ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c0);`
			`if (ce1 && (cc = ce1[0])) {`
			`/* start of a possibly decomposed Hangul char */`
			`if (cc != 0xffff)`
			`goto done;`
			`if (!ustrlen)`
			`goto same;`
			`c1 = be16_to_cpu(*ip) - Hangul_VBase;`
			`if (c1 < Hangul_VCount) {`
			`/* compose the Hangul char */`
			`cc = (c0 - Hangul_LBase) * Hangul_VCount;`
			`cc = (cc + c1) * Hangul_TCount;`
			`cc += Hangul_SBase;`
			`ip++;`
			`ustrlen--;`
			`if (!ustrlen)`
			`goto done;`
			`c1 = be16_to_cpu(*ip) - Hangul_TBase;`
			`if (c1 > 0 && c1 < Hangul_TCount) {`
			`cc += c1;`
			`ip++;`
			`ustrlen--;`
			`}`
			`goto done;`
			`}`
			`}`
			`while (1) {`
			`/* main loop for common case of not composed chars */`
			`if (!ustrlen)`
			`goto same;`
			`c1 = be16_to_cpu(*ip);`
			`if (likely(compose))`
			`ce1 = hfsplus_compose_lookup(hfsplus_compose_table, c1);`
			`if (ce1)`
			`break;`
			`switch (c0) {`
			`case 0:`
			`c0 = 0x2400;`
			`break;`
			`case '/':`
			`c0 = ':';`
			`break;`
			`}`
			`res = nls->uni2char(c0, op, len);`
			`if (res < 0) {`
			`if (res == -ENAMETOOLONG)`
			`goto out;`
			`*op = '?';`
			`res = 1;`
			`}`
			`op += res;`
			`len -= res;`
			`c0 = c1;`
			`ip++;`
			`ustrlen--;`
			`}`
			`ce2 = hfsplus_compose_lookup(ce1, c0);`
			`if (ce2) {`
			`i = 1;`
			`while (i < ustrlen) {`
			`ce1 = hfsplus_compose_lookup(ce2, be16_to_cpu(ip[i]));`
			`if (!ce1)`
			`break;`
			`i++;`
			`ce2 = ce1;`
			`}`
			`if ((cc = ce2[0])) {`
			`ip += i;`
			`ustrlen -= i;`
			`goto done;`
			`}`
			`}`
			`same:`
			`switch (c0) {`
			`case 0:`
			`cc = 0x2400;`
			`break;`
			`case '/':`
			`cc = ':';`
			`break;`
			`default:`
			`cc = c0;`
			`}`
			`done:`
			`res = nls->uni2char(cc, op, len);`
			`if (res < 0) {`
			`if (res == -ENAMETOOLONG)`
			`goto out;`
			`*op = '?';`
			`res = 1;`
			`}`
			`op += res;`
			`len -= res;`
			`}`
			`res = 0;`
			`out:`
			`*len_p = (char *)op - astr;`
			`return res;`
			`}`

HFS+: refactor ASCII to unicode conversion routine for later reuse The HFS+ filesystem is case-insensitive and does automatic unicode decomposition by default, but does not provide custom dentry operations. This can lead to multiple dentries being cached for lookups on a filename with varying case and/or character (de)composition. These patches add custom dentry hash and comparison operations for case-sensitive and/or automatically decomposing HFS+ filesystems. Unicode decomposition and case-folding are performed as required to ensure equivalent filenames are hashed to the same values and compare as equal. This patch: Refactor existing HFS+ ASCII to unicode string conversion routine to split out character conversion functionality. This will be reused by the custom dentry hash and comparison routines. This approach avoids unnecessary memory allocation compared to using the string conversion routine directly in the new functions. [akpm@linux-foundation.org: avoid use-of-uninitialised] Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:22 +04:00			`/*`
			`* Convert one or more ASCII characters into a single unicode character.`
			`* Returns the number of ASCII characters corresponding to the unicode char.`
			`*/`
			`static inline int asc2unichar(struct super_block *sb, const char *astr, int len,`
			`wchar_t *uc)`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`{`
HFS+: refactor ASCII to unicode conversion routine for later reuse The HFS+ filesystem is case-insensitive and does automatic unicode decomposition by default, but does not provide custom dentry operations. This can lead to multiple dentries being cached for lookups on a filename with varying case and/or character (de)composition. These patches add custom dentry hash and comparison operations for case-sensitive and/or automatically decomposing HFS+ filesystems. Unicode decomposition and case-folding are performed as required to ensure equivalent filenames are hashed to the same values and compare as equal. This patch: Refactor existing HFS+ ASCII to unicode string conversion routine to split out character conversion functionality. This will be reused by the custom dentry hash and comparison routines. This approach avoids unnecessary memory allocation compared to using the string conversion routine directly in the new functions. [akpm@linux-foundation.org: avoid use-of-uninitialised] Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:22 +04:00			`int size = HFSPLUS_SB(sb).nls->char2uni(astr, len, uc);`
			`if (size <= 0) {`
			`*uc = '?';`
			`size = 1;`
			`}`
			`switch (*uc) {`
			`case 0x2400:`
			`*uc = 0;`
			`break;`
			`case ':':`
			`*uc = '/';`
			`break;`
			`}`
			`return size;`
			`}`

			`/* Decomposes a single unicode character. */`
			`static inline u16 *decompose_unichar(wchar_t uc, int *size)`
			`{`
			`int off;`

			`off = hfsplus_decompose_table[(uc >> 12) & 0xf];`
			`if (off == 0 || off == 0xffff)`
			`return NULL;`

			`off = hfsplus_decompose_table[off + ((uc >> 8) & 0xf)];`
			`if (!off)`
			`return NULL;`

			`off = hfsplus_decompose_table[off + ((uc >> 4) & 0xf)];`
			`if (!off)`
			`return NULL;`

			`off = hfsplus_decompose_table[off + (uc & 0xf)];`
			`*size = off & 3;`
			`if (*size == 0)`
			`return NULL;`
			`return hfsplus_decompose_table + (off / 4);`
			`}`

			`int hfsplus_asc2uni(struct super_block *sb, struct hfsplus_unistr *ustr,`
			`const char *astr, int len)`
			`{`
			`int size, dsize, decompose;`
			`u16 *dstr, outlen = 0;`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`wchar_t c;`

			`decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);`
			`while (outlen < HFSPLUS_MAX_STRLEN && len > 0) {`
HFS+: refactor ASCII to unicode conversion routine for later reuse The HFS+ filesystem is case-insensitive and does automatic unicode decomposition by default, but does not provide custom dentry operations. This can lead to multiple dentries being cached for lookups on a filename with varying case and/or character (de)composition. These patches add custom dentry hash and comparison operations for case-sensitive and/or automatically decomposing HFS+ filesystems. Unicode decomposition and case-folding are performed as required to ensure equivalent filenames are hashed to the same values and compare as equal. This patch: Refactor existing HFS+ ASCII to unicode string conversion routine to split out character conversion functionality. This will be reused by the custom dentry hash and comparison routines. This approach avoids unnecessary memory allocation compared to using the string conversion routine directly in the new functions. [akpm@linux-foundation.org: avoid use-of-uninitialised] Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:22 +04:00			`size = asc2unichar(sb, astr, len, &c);`

			`if (decompose && (dstr = decompose_unichar(c, &dsize))) {`
			`if (outlen + dsize > HFSPLUS_MAX_STRLEN)`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`break;`
			`do {`
HFS+: refactor ASCII to unicode conversion routine for later reuse The HFS+ filesystem is case-insensitive and does automatic unicode decomposition by default, but does not provide custom dentry operations. This can lead to multiple dentries being cached for lookups on a filename with varying case and/or character (de)composition. These patches add custom dentry hash and comparison operations for case-sensitive and/or automatically decomposing HFS+ filesystems. Unicode decomposition and case-folding are performed as required to ensure equivalent filenames are hashed to the same values and compare as equal. This patch: Refactor existing HFS+ ASCII to unicode string conversion routine to split out character conversion functionality. This will be reused by the custom dentry hash and comparison routines. This approach avoids unnecessary memory allocation compared to using the string conversion routine directly in the new functions. [akpm@linux-foundation.org: avoid use-of-uninitialised] Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:22 +04:00			`ustr->unicode[outlen++] = cpu_to_be16(*dstr++);`
			`} while (--dsize > 0);`
			`} else`
			`ustr->unicode[outlen++] = cpu_to_be16(c);`

			`astr += size;`
			`len -= size;`
Linux-2.6.12-rc2 Initial git repository build. I'm not bothering with the full history, even though we have it. We can create a separate "historical" git archive of that later if we want to, and in the meantime it's about 3.2GB when imported into git - space that would just make the early git days unnecessarily complicated, when we don't have a lot of good infrastructure for it. Let it rip! 2005-04-17 02:20:36 +04:00			`}`
			`ustr->length = cpu_to_be16(outlen);`
			`if (len > 0)`
			`return -ENAMETOOLONG;`
			`return 0;`
			`}`
HFS+: add custom dentry hash and comparison operations Add custom dentry hash and comparison operations for HFS+ filesystems that are case-insensitive and/or do automatic unicode decomposition. The new operations reuse the existing HFS+ ASCII to unicode conversion, unicode decomposition and case folding functionality. Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:23 +04:00
			`/*`
			`* Hash a string to an integer as appropriate for the HFS+ filesystem.`
			`* Composed unicode characters are decomposed and case-folding is performed`
			`* if the appropriate bits are (un)set on the superblock.`
			`*/`
			`int hfsplus_hash_dentry(struct dentry *dentry, struct qstr *str)`
			`{`
			`struct super_block *sb = dentry->d_sb;`
			`const char *astr;`
			`const u16 *dstr;`
fs/hfsplus/unicode.c: fix uninitialized var warning fs/hfsplus/unicode.c: In function 'hfsplus_hash_dentry': fs/hfsplus/unicode.c:328: warning: 'dsize' may be used uninitialized in this function Cc: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2008-02-08 15:20:52 +03:00			`int casefold, decompose, size, len;`
HFS+: add custom dentry hash and comparison operations Add custom dentry hash and comparison operations for HFS+ filesystems that are case-insensitive and/or do automatic unicode decomposition. The new operations reuse the existing HFS+ ASCII to unicode conversion, unicode decomposition and case folding functionality. Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:23 +04:00			`unsigned long hash;`
			`wchar_t c;`
			`u16 c2;`

			`casefold = (HFSPLUS_SB(sb).flags & HFSPLUS_SB_CASEFOLD);`
			`decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);`
			`hash = init_name_hash();`
			`astr = str->name;`
			`len = str->len;`
			`while (len > 0) {`
fs/hfsplus/unicode.c: fix uninitialized var warning fs/hfsplus/unicode.c: In function 'hfsplus_hash_dentry': fs/hfsplus/unicode.c:328: warning: 'dsize' may be used uninitialized in this function Cc: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2008-02-08 15:20:52 +03:00			`int uninitialized_var(dsize);`
HFS+: add custom dentry hash and comparison operations Add custom dentry hash and comparison operations for HFS+ filesystems that are case-insensitive and/or do automatic unicode decomposition. The new operations reuse the existing HFS+ ASCII to unicode conversion, unicode decomposition and case folding functionality. Signed-off-by: Duane Griffin <duaneg@dghda.com> Signed-off-by: Roman Zippel <zippel@linux-m68k.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org> Signed-off-by: Linus Torvalds <torvalds@linux-foundation.org> 2007-07-16 10:41:23 +04:00			`size = asc2unichar(sb, astr, len, &c);`
			`astr += size;`
			`len -= size;`

			`if (decompose && (dstr = decompose_unichar(c, &dsize))) {`
			`do {`
			`c2 = *dstr++;`
			`if (!casefold || (c2 = case_fold(c2)))`
			`hash = partial_name_hash(c2, hash);`
			`} while (--dsize > 0);`
			`} else {`
			`c2 = c;`
			`if (!casefold || (c2 = case_fold(c2)))`
			`hash = partial_name_hash(c2, hash);`
			`}`
			`}`
			`str->hash = end_name_hash(hash);`

			`return 0;`
			`}`

			`/*`
			`* Compare strings with HFS+ filename ordering.`
			`* Composed unicode characters are decomposed and case-folding is performed`
			`* if the appropriate bits are (un)set on the superblock.`
			`*/`
			`int hfsplus_compare_dentry(struct dentry *dentry, struct qstr *s1, struct qstr *s2)`
			`{`
			`struct super_block *sb = dentry->d_sb;`
			`int casefold, decompose, size;`
			`int dsize1, dsize2, len1, len2;`
			`const u16 *dstr1, *dstr2;`
			`const char *astr1, *astr2;`
			`u16 c1, c2;`
			`wchar_t c;`

			`casefold = (HFSPLUS_SB(sb).flags & HFSPLUS_SB_CASEFOLD);`
			`decompose = !(HFSPLUS_SB(sb).flags & HFSPLUS_SB_NODECOMPOSE);`
			`astr1 = s1->name;`
			`len1 = s1->len;`
			`astr2 = s2->name;`
			`len2 = s2->len;`
			`dsize1 = dsize2 = 0;`
			`dstr1 = dstr2 = NULL;`

			`while (len1 > 0 && len2 > 0) {`
			`if (!dsize1) {`
			`size = asc2unichar(sb, astr1, len1, &c);`
			`astr1 += size;`
			`len1 -= size;`

			`if (!decompose || !(dstr1 = decompose_unichar(c, &dsize1))) {`
			`c1 = c;`
			`dstr1 = &c1;`
			`dsize1 = 1;`
			`}`
			`}`

			`if (!dsize2) {`
			`size = asc2unichar(sb, astr2, len2, &c);`
			`astr2 += size;`
			`len2 -= size;`

			`if (!decompose || !(dstr2 = decompose_unichar(c, &dsize2))) {`
			`c2 = c;`
			`dstr2 = &c2;`
			`dsize2 = 1;`
			`}`
			`}`

			`c1 = *dstr1;`
			`c2 = *dstr2;`
			`if (casefold) {`
			`if (!(c1 = case_fold(c1))) {`
			`dstr1++;`
			`dsize1--;`
			`continue;`
			`}`
			`if (!(c2 = case_fold(c2))) {`
			`dstr2++;`
			`dsize2--;`
			`continue;`
			`}`
			`}`
			`if (c1 < c2)`
			`return -1;`
			`else if (c1 > c2)`
			`return 1;`

			`dstr1++;`
			`dsize1--;`
			`dstr2++;`
			`dsize2--;`
			`}`

			`if (len1 < len2)`
			`return -1;`
			`if (len1 > len2)`
			`return 1;`
			`return 0;`
			`}`