/*  Copyright (C) 2002     Manuel Novoa III
 *
 *  This library is free software; you can redistribute it and/or
 *  modify it under the terms of the GNU Library General Public
 *  License as published by the Free Software Foundation; either
 *  version 2 of the License, or (at your option) any later version.
 *
 *  This library is distributed in the hope that it will be useful,
 *  but WITHOUT ANY WARRANTY; without even the implied warranty of
 *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 *  Library General Public License for more details.
 *
 *  You should have received a copy of the GNU Library General Public
 *  License along with this library; if not, write to the Free
 *  Software Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
 */

/*  ATTENTION!   ATTENTION!   ATTENTION!   ATTENTION!   ATTENTION!
 *
 *  Besides uClibc, I'm using this code in my libc for elks, which is
 *  a 16-bit environment with a fairly limited compiler.  It would make
 *  things much easier for me if this file isn't modified unnecessarily.
 *  In particular, please put any new or replacement functions somewhere
 *  else, and modify the makefile to use your version instead.
 *  Thanks.  Manuel
 *
 *  ATTENTION!   ATTENTION!   ATTENTION!   ATTENTION!   ATTENTION! */

#define _GNU_SOURCE
#define __NO_CTYPE
#include <wctype.h>
#include <assert.h>
#include <string.h>
#include <errno.h>
#include <locale.h>
#include <ctype.h>

/* We know wide char support is enabled.  We wouldn't be here otherwise. */

/* Define this if you want to unify the towupper and towlower code in the
 * towctrans function. */
/*  #define SMALL_UPLOW */

#ifndef __LOCALE_C_ONLY
#define __WCTYPE_WITH_LOCALE
#endif

/**********************************************************************/

#ifndef __PASTE
#define __PASTE(X,Y)		X ## Y
#endif

/* Both helpers expect a variable named 'wc' to be in scope at the point
 * of use:  C_MACRO(foo) -> __C_foo(wc),  CT_MACRO(foo) -> __ctype_foo(wc). */
#define C_MACRO(X)		__PASTE(__C_,X)(wc)
#define CT_MACRO(X)		__PASTE(__ctype_,X)(wc)

/**********************************************************************/

/* TODO: fix this! */
#ifdef __WCTYPE_WITH_LOCALE

#define WCctype			(__global_locale.tblwctype)
#define WCuplow			(__global_locale.tblwuplow)
#define WCcmob			(__global_locale.tblwcomb)
#define WCuplow_diff	(__global_locale.tblwuplow_diff)

#define ENCODING		(__global_locale.encoding)

/* ISW_FUNC_BODY(NAME) expands to the complete definition of the
 * classification function NAME.  With locale support the function simply
 * forwards to iswctype() using the descriptor _CTYPE_<NAME>. */
#define ISW_FUNC_BODY(NAME) \
int NAME (wint_t wc) \
{ \
	return iswctype(wc, __PASTE(_CTYPE_,NAME)); \
}

#else  /* __WCTYPE_WITH_LOCALE */

/* ISW_FUNC_BODY(NAME) expands to the complete definition of the
 * classification function NAME.  Without locale support the function
 * evaluates the macro __C_<NAME>(wc). */
#define ISW_FUNC_BODY(NAME) \
int NAME (wint_t wc) \
{ \
	return C_MACRO(NAME); \
}

#endif /* __WCTYPE_WITH_LOCALE */

/* NOTE: ISW_FUNC_BODY() already expands to a full function definition, so
 * its uses below are deliberately NOT followed by a ';' (a lone ';' at file
 * scope is not valid ISO C). */

/**********************************************************************/
#ifdef L_iswalnum

ISW_FUNC_BODY(iswalnum)

#endif
/**********************************************************************/
#ifdef L_iswalpha

ISW_FUNC_BODY(iswalpha)

#endif
/**********************************************************************/
#ifdef L_iswblank

ISW_FUNC_BODY(iswblank)

#endif
/**********************************************************************/
#ifdef L_iswcntrl

ISW_FUNC_BODY(iswcntrl)

#endif
/**********************************************************************/
#ifdef L_iswdigit

/* Digit test.  Uses the __C_iswdigit macro in every configuration; the
 * locale tables are never consulted. */
int iswdigit(wint_t wc)
{
	return __C_iswdigit(wc);
}

#endif
/**********************************************************************/
#ifdef L_iswgraph

ISW_FUNC_BODY(iswgraph)

#endif
/**********************************************************************/
#ifdef L_iswlower

ISW_FUNC_BODY(iswlower)

#endif
/**********************************************************************/
#ifdef L_iswprint

ISW_FUNC_BODY(iswprint)

#endif
/**********************************************************************/
#ifdef L_iswpunct

ISW_FUNC_BODY(iswpunct)

#endif
/**********************************************************************/
#ifdef L_iswspace

ISW_FUNC_BODY(iswspace)

#endif
/**********************************************************************/
#ifdef L_iswupper

ISW_FUNC_BODY(iswupper)

#endif
/**********************************************************************/
#ifdef L_iswxdigit

/* Hex digit test.  Uses the __C_iswxdigit macro in every configuration;
 * the locale tables are never consulted. */
int iswxdigit(wint_t wc)
{
	return __C_iswxdigit(wc);
}

#endif
/**********************************************************************/
#ifdef L_towlower

#ifdef __WCTYPE_WITH_LOCALE

#ifdef SMALL_UPLOW

/* Lower-case mapping, implemented on top of towctrans(). */
wint_t towlower(wint_t wc)
{
	return towctrans(wc, _CTYPE_tolower);
}

#else

/* Lower-case mapping.
 *
 * With a 7-bit encoding the __C_towlower macro is used.  Otherwise, for
 * values up to WC_TABLE_DOMAIN_MAX, the value is split into three bit
 * fields that drive a three-level lookup in WCuplow; the result selects a
 * pair in WCuplow_diff, whose second element is added to wc.  Values above
 * WC_TABLE_DOMAIN_MAX are returned unchanged. */
wint_t towlower(wint_t wc)
{
	unsigned int sc, n, i;
	__uwchar_t u = wc;

	if (ENCODING == __ctype_encoding_7_bit) {
		/* We're in the C/POSIX locale, so ignore the tables. */
		return __C_towlower(wc);
	}

	if (u <= WC_TABLE_DOMAIN_MAX) {
		/* sc: lowest WCuplow_TI_SHIFT bits, n: next WCuplow_II_SHIFT bits,
		 * u: whatever remains (index into the first table level). */
		sc = u & ((1 << WCuplow_TI_SHIFT) - 1);
		u >>= WCuplow_TI_SHIFT;
		n = u & ((1 << WCuplow_II_SHIFT) - 1);
		u >>= WCuplow_II_SHIFT;

		i = ((unsigned int) WCuplow[u]) << WCuplow_II_SHIFT;
		i = ((unsigned int) WCuplow[WCuplow_II_LEN + i + n])
			<< WCuplow_TI_SHIFT;
		i = ((unsigned int) WCuplow[WCuplow_II_LEN + WCuplow_TI_LEN
										+ i + sc]) << 1;
		/* Odd slot of the pair is the "to lower" difference. */
		wc += WCuplow_diff[i + 1];
	}
	return wc;
}

#endif

#else  /* __WCTYPE_WITH_LOCALE */

/* Lower-case mapping for the C-locale-only build. */
wint_t towlower(wint_t wc)
{
	return __C_towlower(wc);
}

#endif /* __WCTYPE_WITH_LOCALE */

#endif
/**********************************************************************/
#ifdef L_towupper

#ifdef __WCTYPE_WITH_LOCALE

#ifdef SMALL_UPLOW

/* Upper-case mapping, implemented on top of towctrans(). */
wint_t towupper(wint_t wc)
{
	return towctrans(wc, _CTYPE_toupper);
}

#else

/* Upper-case mapping.
 *
 * Same three-level WCuplow lookup as towlower(), except that the first
 * element of the selected WCuplow_diff pair is added to wc.  Values above
 * WC_TABLE_DOMAIN_MAX are returned unchanged. */
wint_t towupper(wint_t wc)
{
	unsigned int sc, n, i;
	__uwchar_t u = wc;

	if (ENCODING == __ctype_encoding_7_bit) {
		/* We're in the C/POSIX locale, so ignore the tables. */
		return __C_towupper(wc);
	}

	if (u <= WC_TABLE_DOMAIN_MAX) {
		/* sc: lowest WCuplow_TI_SHIFT bits, n: next WCuplow_II_SHIFT bits,
		 * u: whatever remains (index into the first table level). */
		sc = u & ((1 << WCuplow_TI_SHIFT) - 1);
		u >>= WCuplow_TI_SHIFT;
		n = u & ((1 << WCuplow_II_SHIFT) - 1);
		u >>= WCuplow_II_SHIFT;

		i = ((unsigned int) WCuplow[u]) << WCuplow_II_SHIFT;
		i = ((unsigned int) WCuplow[WCuplow_II_LEN + i + n])
			<< WCuplow_TI_SHIFT;
		i = ((unsigned int) WCuplow[WCuplow_II_LEN + WCuplow_TI_LEN
										+ i + sc]) << 1;
		/* Even slot of the pair is the "to upper" difference. */
		wc += WCuplow_diff[i];
	}
	return wc;
}

#endif

#else  /* __WCTYPE_WITH_LOCALE */

/* Upper-case mapping for the C-locale-only build. */
wint_t towupper(wint_t wc)
{
	return __C_towupper(wc);
}

#endif /* __WCTYPE_WITH_LOCALE */

#endif
/**********************************************************************/
#ifdef L_wctype

static const unsigned char typestring[] = __CTYPE_TYPESTRING;
/*  extern const unsigned char typestring[]; */

/* Look up a character class by name.
 *
 * typestring is walked as a sequence of entries, each consisting of one
 * leading byte followed by a name; the leading byte is the distance from
 * the start of the name to the next entry.  The walk stops at an entry
 * whose leading byte is 0.
 *
 * Returns the 1-based position of the matching entry, or 0 if 'property'
 * matches none of them. */
wctype_t wctype(const char *property)
{
	const unsigned char *p;
	int i;

	p = typestring;
	i = 1;
	do {
		/* Step over the leading byte; the cast only adjusts signedness
		 * for strcmp(). */
		if (!strcmp(property, (const char *) ++p)) {
			return i;
		}
		++i;
		p += p[-1];
	} while (*p);

	/* TODO - Add locale-specific classifications. */
	return 0;
}

#endif
/**********************************************************************/
#ifdef L_iswctype

#ifdef __UCLIBC_MJN3_ONLY__
#warning duh... replace the range-based classification with table lookup!
#endif

#ifdef __WCTYPE_WITH_LOCALE

#ifdef __UCLIBC_MJN3_ONLY__
#warning TODO: need to fix locale ctype table lookup stuff
#endif
#if 0
extern const char ctype_range[];
#else
static const char ctype_range[] = {
	__CTYPE_RANGES
};
#endif

#ifdef __UCLIBC_MJN3_ONLY__
#warning TODO: need to handle combining class!
#endif

#define WCctype_TI_MASK		((1 << WCctype_TI_SHIFT) - 1)
#define WCctype_II_MASK		((1 << WCctype_II_SHIFT) - 1)

/* Test whether wc belongs to the class described by desc.
 *
 * For descriptors below _CTYPE_iswxdigit a 4-bit class code d is obtained
 * for wc (three-level lookup in WCctype for values up to
 * WC_TABLE_DOMAIN_MAX, a few hard-coded ranges mapped to __CTYPE_punct
 * above that, __CTYPE_unclassified otherwise).  The result is nonzero when
 * d lies in the range [ctype_range[2*desc],
 * ctype_range[2*desc] + ctype_range[2*desc+1]]; for _CTYPE_iswblank d must
 * additionally be odd.
 *
 * _CTYPE_iswxdigit is answered by __C_iswxdigit(); any larger descriptor
 * yields 0.  With a 7-bit encoding, values above 0x7f always yield 0. */
int iswctype(wint_t wc, wctype_t desc)
{
	unsigned int sc, n, i0, i1;
	unsigned char d = __CTYPE_unclassified;

	if ((ENCODING != __ctype_encoding_7_bit) || (((__uwchar_t) wc) <= 0x7f)){
		if (desc < _CTYPE_iswxdigit) {
			if (((__uwchar_t) wc) <= WC_TABLE_DOMAIN_MAX) {
				/* From here on, we know wc > 0. */
				sc = wc & WCctype_TI_MASK;
				wc >>= WCctype_TI_SHIFT;
				n = wc & WCctype_II_MASK;
				wc >>= WCctype_II_SHIFT;

				i0 = WCctype[wc];
				i0 <<= WCctype_II_SHIFT;
				i1 = WCctype[WCctype_II_LEN + i0 + n];
				i1 <<= (WCctype_TI_SHIFT-1);
				d = WCctype[WCctype_II_LEN + WCctype_TI_LEN + i1 + (sc >> 1)];

				/* Two class codes are packed per byte: odd sc selects
				 * the high nibble, even sc the low nibble. */
				d = (sc & 1) ? (d >> 4) : (d & 0xf);
			} else if ( ((((__uwchar_t)(wc - 0xe0020UL)) <= 0x5f)
						 || (wc == 0xe0001UL))
						|| ( (((__uwchar_t)(wc - 0xf0000UL)) < 0x20000UL)
							 && ((wc & 0xffffU) <= 0xfffdU))
						) {
				d = __CTYPE_punct;
			}

			return ( ((unsigned char)(d - ctype_range[2*desc]))
					 <= ctype_range[2*desc + 1] )
				&& ((desc != _CTYPE_iswblank) || (d & 1));
		}

		/* TODO - Add locale-specific classifications. */
		return (desc == _CTYPE_iswxdigit) ? __C_iswxdigit(wc) : 0;
	}
	return 0;
}

#else

/* Class codes for the values 0x00..0x7f, two per byte: the low nibble
 * holds the code for the even value, the high nibble the code for the
 * following odd value. */
static const unsigned char WCctype[] = {
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_space_blank     << 4),
	__CTYPE_cntrl_space_nonblank | (__CTYPE_cntrl_space_nonblank  << 4),
	__CTYPE_cntrl_space_nonblank | (__CTYPE_cntrl_space_nonblank  << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_cntrl_nonspace       | (__CTYPE_cntrl_nonspace        << 4),
	__CTYPE_print_space_blank    | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_digit                | (__CTYPE_digit                 << 4),
	__CTYPE_digit                | (__CTYPE_digit                 << 4),
	__CTYPE_digit                | (__CTYPE_digit                 << 4),
	__CTYPE_digit                | (__CTYPE_digit                 << 4),
	__CTYPE_digit                | (__CTYPE_digit                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_alpha_upper           << 4),
	__CTYPE_alpha_upper          | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_alpha_lower           << 4),
	__CTYPE_alpha_lower          | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_punct                 << 4),
	__CTYPE_punct                | (__CTYPE_cntrl_nonspace        << 4),
};

static const char ctype_range[] = {
	__CTYPE_RANGES
};

/* Test whether wc belongs to the class described by desc (C-locale-only
 * build).
 *
 * Only values 0x00..0x7f can match.  For descriptors below
 * _CTYPE_iswxdigit the packed WCctype table supplies a class code d, which
 * is then checked against the ctype_range pair for desc (and must be odd
 * for _CTYPE_iswblank).  _CTYPE_iswxdigit is answered by __C_isxdigit().
 * Everything else yields 0. */
int iswctype(wint_t wc, wctype_t desc)
{
	unsigned char d = __CTYPE_unclassified;

	if (((__uwchar_t) wc) <= 0x7f) {
		if (desc < _CTYPE_iswxdigit) {
			d = WCctype[wc >> 1];
			d = (wc & 1) ? (d >> 4) : (d & 0xf);

			return ( ((unsigned char)(d - ctype_range[2*desc]))
					 <= ctype_range[2*desc + 1] )
				&& ((desc != _CTYPE_iswblank) || (d & 1));
		}

		if (desc == _CTYPE_iswxdigit) {
			return __C_isxdigit(((char) wc));
		}
	}
	return 0;
}

#endif

#endif
/**********************************************************************/
#ifdef L_towctrans

#ifdef __WCTYPE_WITH_LOCALE

#ifdef SMALL_UPLOW

/* Apply the mapping 'desc' to wc (unified tolower/toupper/totitle code).
 *
 * With a 7-bit encoding, values above 0x7f and descriptors other than
 * _CTYPE_tolower/_CTYPE_toupper leave wc unchanged.  Otherwise, for
 * descriptors in [_CTYPE_tolower, _CTYPE_totitle] and values up to
 * WC_TABLE_DOMAIN_MAX, the WCuplow/WCuplow_diff tables supply the
 * difference to add.  Any other descriptor sets errno to EINVAL and
 * returns wc unchanged. */
wint_t towctrans(wint_t wc, wctrans_t desc)
{
	unsigned int sc, n, i;
	__uwchar_t u = wc;

	/* TODO - clean up */
	if (ENCODING == __ctype_encoding_7_bit) {
		if ((((__uwchar_t) wc) > 0x7f)
			|| (((unsigned int)(desc - _CTYPE_tolower))
				> (_CTYPE_toupper - _CTYPE_tolower))
			){
			/* We're in the C/POSIX locale, so ignore non-ASCII values
			 * as well as any mappings other than toupper or tolower. */
			return wc;
		}
	}

	if (((unsigned int)(desc - _CTYPE_tolower))
		<= (_CTYPE_totitle - _CTYPE_tolower)
		) {
		if (u <= WC_TABLE_DOMAIN_MAX) {
			sc = u & ((1 << WCuplow_TI_SHIFT) - 1);
			u >>= WCuplow_TI_SHIFT;
			n = u & ((1 << WCuplow_II_SHIFT) - 1);
			u >>= WCuplow_II_SHIFT;

			i = ((unsigned int) WCuplow[u]) << WCuplow_II_SHIFT;
			i = ((unsigned int) WCuplow[WCuplow_II_LEN + i + n])
				<< WCuplow_TI_SHIFT;
			i = ((unsigned int) WCuplow[WCuplow_II_LEN + WCuplow_TI_LEN
											+ i + sc]) << 1;
			/* Even slot: "to upper" difference (also used for totitle);
			 * odd slot: "to lower" difference. */
			if (desc == _CTYPE_tolower) {
				++i;
			}
			wc += WCuplow_diff[i];
			if (desc == _CTYPE_totitle) {
				/* WARNING! These special cases work for glibc 2.2.4.  Changes
				 * may be needed if the glibc locale tables are updated. */
				if ( (((__uwchar_t)(wc - 0x1c4)) <= (0x1cc - 0x1c4))
					 || (wc == 0x1f1)
					 ) {
					++wc;
				}
			}
		}
	} else {
		/* TODO - Deal with other transliterations. */
		__set_errno(EINVAL);
	}

	return wc;
}

#else

/* Apply the mapping 'desc' to wc by delegating to towlower()/towupper().
 *
 * With a 7-bit encoding, values above 0x7f and descriptors other than
 * _CTYPE_tolower/_CTYPE_toupper leave wc unchanged.  _CTYPE_totitle is
 * towupper() followed by a +1 adjustment for a few hard-coded results.
 * Any other descriptor sets errno to EINVAL and returns wc unchanged. */
wint_t towctrans(wint_t wc, wctrans_t desc)
{
	if (ENCODING == __ctype_encoding_7_bit) {
		if ((((__uwchar_t) wc) > 0x7f)
			|| (((unsigned int)(desc - _CTYPE_tolower))
				> (_CTYPE_toupper - _CTYPE_tolower))
			){
			/* We're in the C/POSIX locale, so ignore non-ASCII values
			 * as well as any mappings other than toupper or tolower. */
			return wc;
		}
	}

	if (desc == _CTYPE_tolower) {
		return towlower(wc);
	} else if (((unsigned int)(desc - _CTYPE_toupper))
		<= (_CTYPE_totitle - _CTYPE_toupper)
		) {
		wc = towupper(wc);
		if (desc == _CTYPE_totitle) {
			/* WARNING! These special cases work for glibc 2.2.4.  Changes
			 * may be needed if the glibc locale tables are updated. */
			if ( (((__uwchar_t)(wc - 0x1c4)) <= (0x1cc - 0x1c4))
				 || (wc == 0x1f1)
				 ) {
				++wc;
			}
		}
	} else {
		/* TODO - Deal with other transliterations. */
		__set_errno(EINVAL);
	}
	return wc;
}

#endif

#else  /* __WCTYPE_WITH_LOCALE */

/* Minimal support for C/POSIX locale. */

/* Apply the mapping 'desc' to wc (C-locale-only build).
 *
 * Only _CTYPE_tolower and _CTYPE_toupper are accepted, and only values
 * 0x00..0x7f are ever changed.  Any other descriptor sets errno to EINVAL.
 * In every case where no mapping is applied, wc is returned unchanged. */
wint_t towctrans(wint_t wc, wctrans_t desc)
{
	if (((unsigned int)(desc - _CTYPE_tolower))
		<= (_CTYPE_toupper - _CTYPE_tolower)
		) {
		/* Transliteration is either tolower or toupper. */
		if (((__uwchar_t) wc) <= 0x7f) {
			/* Use the checked __C_tow* macros (the same ones towlower()
			 * and towupper() use).  _tolower()/_toupper() must not be
			 * used here: they are only specified for arguments that are
			 * already upper/lower case letters, so applying them to
			 * arbitrary ASCII values would corrupt non-letters. */
			return (desc == _CTYPE_tolower)
				? __C_towlower(wc) : __C_towupper(wc);
		}
	} else {
		__set_errno(EINVAL);	/* Invalid transliteration. */
	}
	return wc;
}

#endif /* __WCTYPE_WITH_LOCALE */

#endif
/**********************************************************************/
#ifdef L_wctrans

/* Declared unsigned char (like typestring in wctype()) because the walk
 * below reads the leading byte of each entry as an unsigned distance. */
static const unsigned char transstring[] = __CTYPE_TRANSTRING;

/* Look up a character mapping by name.
 *
 * transstring is walked as a sequence of entries, each consisting of one
 * leading byte followed by a name; the leading byte is the distance from
 * the start of the name to the next entry.  The walk stops at an entry
 * whose leading byte is 0.
 *
 * Returns the 1-based position of the matching entry, or 0 if 'property'
 * matches none of them. */
wctrans_t wctrans(const char *property)
{
	const unsigned char *p;
	int i;

	p = transstring;
	i = 1;
	do {
		/* Step over the leading byte; the cast only adjusts signedness
		 * for strcmp(). */
		if (!strcmp(property, (const char *) ++p)) {
			return i;
		}
		++i;
		p += p[-1];
	} while (*p);

	/* TODO - Add locale-specific translations. */
	return 0;
}

#endif
/**********************************************************************/