summaryrefslogtreecommitdiff
path: root/wctype
diff options
context:
space:
mode:
Diffstat (limited to 'wctype')
-rw-r--r--wctype/Makefile30
-rw-r--r--wctype/cname-lookup.h45
-rw-r--r--wctype/iswctype.c39
-rw-r--r--wctype/test_wctype.c75
-rw-r--r--wctype/towctrans.c36
-rw-r--r--wctype/wcfuncs.c52
-rw-r--r--wctype/wctrans.c59
-rw-r--r--wctype/wctype.c56
-rw-r--r--wctype/wctype.h215
9 files changed, 607 insertions, 0 deletions
diff --git a/wctype/Makefile b/wctype/Makefile
new file mode 100644
index 0000000000..e0c84c39f1
--- /dev/null
+++ b/wctype/Makefile
@@ -0,0 +1,30 @@
+# Copyright (C) 1996 Free Software Foundation, Inc.
+# This file is part of the GNU C Library.
+
+# The GNU C Library is free software; you can redistribute it and/or
+# modify it under the terms of the GNU Library General Public License as
+# published by the Free Software Foundation; either version 2 of the
+# License, or (at your option) any later version.
+
+# The GNU C Library is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+# Library General Public License for more details.
+
+# You should have received a copy of the GNU Library General Public
+# License along with the GNU C Library; see the file COPYING.LIB. If
+# not, write to the Free Software Foundation, Inc., 675 Mass Ave,
+# Cambridge, MA 02139, USA.
+
+#
+# Sub-makefile for wctype portion of the library.
+#
+subdir := wctype
+
+headers := wctype.h
+distribute := cname-lookup.h
+routines := wcfuncs wctype iswctype wctrans towctrans
+
+tests := test_wctype
+
+include ../Rules
diff --git a/wctype/cname-lookup.h b/wctype/cname-lookup.h
new file mode 100644
index 0000000000..bef38a12d3
--- /dev/null
+++ b/wctype/cname-lookup.h
@@ -0,0 +1,45 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+Contributed by Ulrich Drepper, <drepper@gnu.ai.mit.edu>.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include "localeinfo.h"
+
+/* Some words on the runtime of this functions. Although there is a
+ loop in the function the runtime is asymptotically quasi constant.
+ The reason is that even for the largest character sets HASH_LAYERS
+ will not grow beyond 15 (a guess!). */
+static __inline size_t
+cname_lookup (wint_t wc)
+{
+ extern unsigned int *__ctype_names;
+ unsigned int hash_size, hash_layers;
+ size_t result, cnt;
+
+ hash_size = _NL_CURRENT_WORD (LC_CTYPE, _NL_CTYPE_HASH_SIZE);
+ hash_layers = _NL_CURRENT_WORD (LC_CTYPE, _NL_CTYPE_HASH_LAYERS);
+
+ result = wc % hash_size;
+ for (cnt = 0; cnt < hash_layers; ++cnt)
+ {
+ if (__ctype_names[result] == wc)
+ break;
+ result += hash_size;
+ }
+
+ return cnt < hash_layers ? result : ~((size_t) 0);
+}
diff --git a/wctype/iswctype.c b/wctype/iswctype.c
new file mode 100644
index 0000000000..041548b2dc
--- /dev/null
+++ b/wctype/iswctype.c
@@ -0,0 +1,39 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+Contributed by Ulrich Drepper, <drepper@gnu.ai.mit.edu>.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include <ctype.h>
+#include <wctype.h>
+
+#include "cname-lookup.h"
+
+
+extern unsigned int *__ctype32_b;
+
+
+int
+iswctype (wint_t wc, wctype_t desc)
+{
+ size_t idx;
+
+ idx = cname_lookup (wc);
+ if (idx == ~((size_t) 0))
+ return 0;
+
+ return __ctype32_b[idx] & desc;
+}
diff --git a/wctype/test_wctype.c b/wctype/test_wctype.c
new file mode 100644
index 0000000000..bf3de172df
--- /dev/null
+++ b/wctype/test_wctype.c
@@ -0,0 +1,75 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include <ctype.h>
+#include <stdio.h>
+#include <stdlib.h>
+#include <wctype.h>
+
+int
+main (int argc, char *argv[])
+{
+ int result = 0;
+ wctype_t bit_alnum = wctype ("alnum");
+ wctype_t bit_alpha = wctype ("alpha");
+ wctype_t bit_cntrl = wctype ("cntrl");
+ wctype_t bit_digit = wctype ("digit");
+ wctype_t bit_graph = wctype ("graph");
+ wctype_t bit_lower = wctype ("lower");
+ wctype_t bit_print = wctype ("print");
+ wctype_t bit_punct = wctype ("punct");
+ wctype_t bit_space = wctype ("space");
+ wctype_t bit_upper = wctype ("upper");
+ wctype_t bit_xdigit = wctype ("xdigit");
+ int ch;
+
+ if (wctype ("does not exist") != 0)
+ {
+ puts ("wctype return value != 0 for non existing property");
+ result = 1;
+ }
+
+ for (ch = 0; ch < 256; ++ch)
+ {
+#define TEST(test) \
+ do \
+ if (is##test (ch) != iswctype ((wchar_t) ch, bit_##test)) \
+ { \
+ printf ("class `%s' test for character \\%o failed\n", \
+ #test, ch); \
+ result = 1; \
+ } \
+ while (0)
+
+ TEST (alnum);
+ TEST (alpha);
+ TEST (cntrl);
+ TEST (digit);
+ TEST (graph);
+ TEST (lower);
+ TEST (print);
+ TEST (punct);
+ TEST (space);
+ TEST (upper);
+ TEST (xdigit);
+ }
+
+ if (result == 0)
+ puts ("All test successful!");
+ exit (result);
+}
diff --git a/wctype/towctrans.c b/wctype/towctrans.c
new file mode 100644
index 0000000000..fd15599a6e
--- /dev/null
+++ b/wctype/towctrans.c
@@ -0,0 +1,36 @@
+/* towctrans - map wide character using given mapping.
+Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include <wctype.h>
+
+/* Define the lookup function. */
+#include "cname-lookup.h"
+
+wint_t
+towctrans (wint_t wc, wctrans_t desc)
+{
+ size_t idx;
+
+ idx = cname_lookup (wc);
+ if (idx == ~((size_t) 0))
+ /* Character is not known. Default action is to simply return it. */
+ return wc;
+
+ return (wint_t) desc[idx];
+}
diff --git a/wctype/wcfuncs.c b/wctype/wcfuncs.c
new file mode 100644
index 0000000000..b5ac890609
--- /dev/null
+++ b/wctype/wcfuncs.c
@@ -0,0 +1,52 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#define __NO_WCTYPE
+#include <wctype.h>
+#include <ctype.h> /* For __ctype_tolower and __ctype_toupper. */
+
+/* Provide real-function versions of all the wctype macros. */
+
+#define func(name, type) \
+ int name (wc) wint_t wc; { return iswctype (wc, type); }
+
+func (iswalnum, _ISalnum)
+func (iswalpha, _ISalpha)
+func (iswcntrl, _IScntrl)
+func (iswdigit, _ISdigit)
+func (iswlower, _ISlower)
+func (iswgraph, _ISgraph)
+func (iswprint, _ISprint)
+func (iswpunct, _ISpunct)
+func (iswspace, _ISspace)
+func (iswupper, _ISupper)
+func (iswxdigit, _ISxdigit)
+
+wint_t
+towlower (wc)
+ wint_t wc;
+{
+ return towctrans (wc, __ctype_tolower);
+}
+
+wint_t
+towupper (wc)
+ wint_t wc;
+{
+ return towctrans (wc, __ctype_toupper);
+}
diff --git a/wctype/wctrans.c b/wctype/wctrans.c
new file mode 100644
index 0000000000..afe47a915d
--- /dev/null
+++ b/wctype/wctrans.c
@@ -0,0 +1,59 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+Contributed by Ulrich Drepper, <drepper@gnu.ai.mit.edu>.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include <ctype.h>
+#include <string.h>
+#include <wctype.h>
+#include "localeinfo.h"
+
+wctrans_t
+wctrans (const char *property)
+{
+ const char *names;
+ size_t cnt;
+ unsigned int **result;
+
+ names = _NL_CURRENT (LC_CTYPE, _NL_CTYPE_MAP_NAMES);
+ cnt = 0;
+ while (names[0] != '\0')
+ {
+ if (strcmp (property, names) == 0)
+ break;
+
+ names = strchr (names, '\0') + 1;
+ ++cnt;
+ }
+
+ if (names[0] == '\0')
+ return 0;
+
+ if (cnt == 0)
+ return (wctrans_t) __ctype_toupper;
+ else if (cnt == 1)
+ return (wctrans_t) __ctype_tolower;
+
+ /* We have to search the table. */
+ result = (unsigned int **) &_NL_CURRENT (LC_CTYPE, _NL_CTYPE_WIDTH);
+
+#if __BYTE_ORDER == _BIG_ENDIAN
+ return (wctrans_t) result[1 + 2 * cnt];
+#else
+ return (wctrans_t) result[1 + 2 * cnt + 1];
+#endif
+}
diff --git a/wctype/wctype.c b/wctype/wctype.c
new file mode 100644
index 0000000000..36db3b95a4
--- /dev/null
+++ b/wctype/wctype.c
@@ -0,0 +1,56 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+Contributed by Ulrich Drepper, <drepper@gnu.ai.mit.edu>.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+#include <endian.h>
+#include <string.h>
+#include <wctype.h>
+#include "localeinfo.h"
+
+wctype_t
+wctype (const char *property)
+{
+ const char *names;
+ wctype_t result;
+
+ names = _NL_CURRENT (LC_CTYPE, _NL_CTYPE_CLASS_NAMES);
+ for (result = 1; result != 0; result <<= 1)
+ {
+ if (strcmp (property, names) == 0)
+ break;
+
+ names = strchr (names, '\0') + 1;
+ if (names[0] == '\0')
+ return 0;
+ }
+
+#if __BYTE_ORDER == __BIG_ENDIAN
+ return result;
+#else
+# define SWAPU32(w) \
+ (((w) << 24) | (((w) & 0xff00) << 8) | (((w) >> 8) & 0xff00) | ((w) >> 24))
+
+# define SWAPU16(w) \
+ (((w) >> 8) | ((w) << 8))
+
+ if (sizeof (wctype_t) == 4)
+ return SWAPU32 (result);
+ else
+ return SWAPU16 (result);
+#endif
+}
diff --git a/wctype/wctype.h b/wctype/wctype.h
new file mode 100644
index 0000000000..7e90e2bad5
--- /dev/null
+++ b/wctype/wctype.h
@@ -0,0 +1,215 @@
+/* Copyright (C) 1996 Free Software Foundation, Inc.
+This file is part of the GNU C Library.
+
+The GNU C Library is free software; you can redistribute it and/or
+modify it under the terms of the GNU Library General Public License as
+published by the Free Software Foundation; either version 2 of the
+License, or (at your option) any later version.
+
+The GNU C Library is distributed in the hope that it will be useful,
+but WITHOUT ANY WARRANTY; without even the implied warranty of
+MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
+Library General Public License for more details.
+
+You should have received a copy of the GNU Library General Public
+License along with the GNU C Library; see the file COPYING.LIB. If
+not, write to the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
+Boston, MA 02111-1307, USA. */
+
+/*
+ * ISO/IEC 9899:1990/Amendment 1:1995 7.15:
+ * Wide-character classification and mapping utilities <wctype.h>
+ */
+
+#ifndef _WCTYPE_H
+
+#define _WCTYPE_H 1
+#include <features.h>
+
+
+__BEGIN_DECLS
+
+/* FIXME: should this go into <stddef.h>??? */
+#if 0
+#define __need_wint_t
+#include <stddef.h>
+#else
+/* Integral type unchanged by default argument promotions that can
+ hold any value corresponding to members of the extended character
+ set, as well as at least one value that does not correspond to any
+ member of the extended character set. */
+typedef unsigned int wint_t;
+#endif
+
+/* Scalar type that can hold values which represent locale-specific
+ character mappings. */
+typedef const unsigned int *wctrans_t;
+
+/* Scalar type that can hold values which represent locale-specific
+ character classifications. */
+#if 0
+typedef unsigned long int wctype_t;
+#else
+/* For compatibility reasons we have to use shorts for now. */
+typedef unsigned short int wctype_t;
+#endif
+
+
+/* Constant expression of type `wint_t' whose value does not correspond
+ to any member of the extended character set. */
+#ifndef WEOF
+#define WEOF (0xffffffffu)
+#endif
+
+#ifndef _ISbit
+/* These are all the characteristics of characters.
+ If there get to be more than 16 distinct characteristics,
+ many things must be changed that use `unsigned short int's.
+
+ The characteristics are stored always in network byte order (big
+ endian). We define the bit value interpretations here dependent on the
+ machine's byte order. */
+
+#include <endian.h>
+#if __BYTE_ORDER == __BIG_ENDIAN
+#define _ISbit(bit) (1 << bit)
+#else /* __BYTE_ORDER == __LITTLE_ENDIAN */
+#define _ISbit(bit) (bit < 8 ? ((1 << bit) << 8) : ((1 << bit) >> 8))
+#endif
+
+enum
+{
+ _ISupper = _ISbit (0), /* UPPERCASE. */
+ _ISlower = _ISbit (1), /* lowercase. */
+ _ISalpha = _ISbit (2), /* Alphabetic. */
+ _ISdigit = _ISbit (3), /* Numeric. */
+ _ISxdigit = _ISbit (4), /* Hexadecimal numeric. */
+ _ISspace = _ISbit (5), /* Whitespace. */
+ _ISprint = _ISbit (6), /* Printing. */
+ _ISgraph = _ISbit (7), /* Graphical. */
+ _ISblank = _ISbit (8), /* Blank (usually SPC and TAB). */
+ _IScntrl = _ISbit (9), /* Control character. */
+ _ISpunct = _ISbit (10), /* Punctuation. */
+ _ISalnum = _ISbit (11) /* Alphanumeric. */
+};
+#endif /* Not _ISbit */
+
+
+/*
+ * Wide-character classification functions: 7.15.2.1.
+ */
+
+/* Test for any wide character for which `iswalpha' or `iswdigit' is
+ true. */
+int iswalnum __P ((wint_t __wc));
+
+/* Test for any wide character for which `iswupper' or 'iswlower' is
+ true, or any wide character that is one of a locale-specific set of
+ wide-characters for which none of `iswcntrl', `iswdigit',
+ `iswpunct', or `iswspace' is true. */
+int iswalpha __P ((wint_t __wc));
+
+/* Test for any control wide character. */
+int iswcntrl __P ((wint_t __wc));
+
+/* Test for any wide character that corresponds to a decimal-digit
+ character. */
+int iswdigit __P ((wint_t __wc));
+
+/* Test for any wide character for which `iswprint' is true and
+ `iswspace' is false. */
+int iswgraph __P ((wint_t __wc));
+
+/* Test for any wide character that corresponds to a lowercase letter
+ or is one of a locale-specific set of wide characters for which
+ none of `iswcntrl', `iswdigit', `iswpunct', or `iswspace' is true. */
+int iswlower __P ((wint_t __wc));
+
+/* Test for any printing wide character. */
+int iswprint __P ((wint_t __wc));
+
+/* Test for any printing wide character that is one of a
+ locale-specific et of wide characters for which neither `iswspace'
+ nor `iswalnum' is true. */
+int iswpunct __P ((wint_t __wc));
+
+/* Test for any wide character that corresponds to a locale-specific
+ set of wide characters for which none of `iswalnum', `iswgraph', or
+ `iswpunct' is true. */
+int iswspace __P ((wint_t __wc));
+
+/* Test for any wide character that corresponds to an uppercase letter
+ or is one of a locale-specific set of wide character for which none
+ of `iswcntrl', `iswdigit', `iswpunct', or `iswspace' is true. */
+int iswupper __P ((wint_t __wc));
+
+/* Test for any wide character that corresponds to a hexadecimal-digit
+ character equivalent to that performed be the functions described
+ in the previous subclause. */
+int iswxdigit __P ((wint_t __wc));
+
+/*
+ * Extensible wide-character classification functions: 7.15.2.2.
+ */
+
+/* Construct value that describes a class of wide characters identified
+ by the string argument PROPERTY. */
+wctype_t wctype __P ((__const char *__property));
+
+/* Determine whether the wide-character WC has the property described by
+ DESC. */
+int iswctype __P ((wint_t __wc, wctype_t __desc));
+
+
+/*
+ * Wide-character case-mapping functions: 7.15.3.1.
+ */
+
+/* Converts an uppercase letter to the corresponding lowercase letter. */
+wint_t towlower __P ((wint_t __wc));
+
+/* Converts an lowercase letter to the corresponding uppercase letter. */
+wint_t towupper __P ((wint_t __wc));
+
+/*
+ * Extensible wide-character mapping functions: 7.15.3.2.
+ */
+
+/* Construct value that describes a mapping between wide characters
+ identified by the string argument PROPERTY. */
+wctrans_t wctrans __P ((__const char *__property));
+
+/* Map the wide character WC using the mapping described by DESC. */
+wint_t towctrans __P ((wint_t __wc, wctrans_t __desc));
+
+
+
+#ifndef __NO_WCTYPE
+#define iswalnum(wc) iswctype ((wc), _ISalnum)
+#define iswalpha(wc) iswctype ((wc), _ISalpha)
+#define iswcntrl(wc) iswctype ((wc), _IScntrl)
+#define iswdigit(wc) iswctype ((wc), _ISdigit)
+#define iswlower(wc) iswctype ((wc), _ISlower)
+#define iswgraph(wc) iswctype ((wc), _ISgraph)
+#define iswprint(wc) iswctype ((wc), _ISprint)
+#define iswpunct(wc) iswctype ((wc), _ISpunct)
+#define iswspace(wc) iswctype ((wc), _ISspace)
+#define iswupper(wc) iswctype ((wc), _ISupper)
+#define iswxdigit(wc) iswctype ((wc), _ISxdigit)
+
+#ifdef __USE_GNU
+#define iswblank(wc) iswctype ((wc), _ISblank)
+#endif
+
+/* Pointer to conversion tables. */
+extern __const int *__ctype_tolower; /* Case conversions. */
+extern __const int *__ctype_toupper; /* Case conversions. */
+
+#define towlower(wc) towctrans (wc, __ctype_tolower)
+#define towupper(wc) towctrans (wc, __ctype_toupper)
+
+#endif /* Not __NO_WCTYPE. */
+
+__END_DECLS
+
+#endif /* wctype.h */