diff options
Diffstat (limited to 'gl/m4/regex.m4')
-rw-r--r-- | gl/m4/regex.m4 | 198 |
1 files changed, 198 insertions, 0 deletions
diff --git a/gl/m4/regex.m4 b/gl/m4/regex.m4 new file mode 100644 index 00000000..25da645e --- /dev/null +++ b/gl/m4/regex.m4 | |||
@@ -0,0 +1,198 @@ | |||
1 | #serial 42 | ||
2 | |||
3 | # Copyright (C) 1996, 1997, 1998, 1999, 2000, 2001, 2003, 2004, 2005, | ||
4 | # 2006, 2007 Free Software Foundation, Inc. | ||
5 | # | ||
6 | # This file is free software; the Free Software Foundation | ||
7 | # gives unlimited permission to copy and/or distribute it, | ||
8 | # with or without modifications, as long as this notice is preserved. | ||
9 | |||
10 | dnl Initially derived from code in GNU grep. | ||
11 | dnl Mostly written by Jim Meyering. | ||
12 | |||
13 | AC_PREREQ([2.50]) | ||
14 | |||
# gl_REGEX
# --------
# Decide whether to compile the bundled regex implementation.
#
# The user may force the choice with --with-included-regex or
# --without-included-regex.  When neither is given, a run-time test
# program exercises the system's GNU regex API; if any probe fails, or
# if cross compiling, the bundled implementation is selected.
#
# When the bundled implementation is selected, _REGEX_LARGE_OFFSETS is
# defined, every public regex entry point is renamed to an rpl_ variant,
# regex is added to the LIBOBJS list, and gl_PREREQ_REGEX is invoked.
AC_DEFUN([gl_REGEX],
[
  AC_CHECK_HEADERS_ONCE([locale.h])

  AC_ARG_WITH([included-regex],
    [AC_HELP_STRING([--without-included-regex],
                    [don't compile regex; this is the default on
                     systems with recent-enough versions of the GNU C
                     Library (use with caution on other systems)])])

  dnl An explicit yes or no from the user is taken as-is.  With no option
  dnl given, the run test below decides.  Any other value is an error.
  case $with_included_regex in #(
  yes|no) ac_use_included_regex=$with_included_regex
        ;;
  '')
    # If the system regex support is good enough that it passes the
    # following run test, then default to *not* using the included regex.c.
    # If cross compiling, assume the test would fail and use the included
    # regex.c.  The first failing regular expression is from `Spencer ere
    # test #75' in grep-2.3.
    AC_CACHE_CHECK([for working re_compile_pattern],
                   [gl_cv_func_re_compile_pattern_working],
      [AC_RUN_IFELSE(
        [AC_LANG_PROGRAM(
          [AC_INCLUDES_DEFAULT
           #if HAVE_LOCALE_H
            #include <locale.h>
           #endif
           #include <limits.h>
           #include <regex.h>
           ],
          [[static struct re_pattern_buffer regex;
            unsigned char folded_chars[UCHAR_MAX + 1];
            int i;
            const char *s;
            struct re_registers regs;

            #if HAVE_LOCALE_H
              /* http://sourceware.org/ml/libc-hacker/2006-09/msg00008.html
                 This test needs valgrind to catch the bug on Debian
                 GNU/Linux 3.1 x86, but it might catch the bug better
                 on other platforms and it shouldn't hurt to try the
                 test here.  */
              if (setlocale (LC_ALL, "en_US.UTF-8"))
                {
                  static char const pat[] = "insert into";
                  static char const data[] =
                    "\xFF\0\x12\xA2\xAA\xC4\xB1,K\x12\xC4\xB1*\xACK";
                  re_set_syntax (RE_SYNTAX_GREP | RE_HAT_LISTS_NOT_NEWLINE
                                 | RE_ICASE);
                  memset (&regex, 0, sizeof regex);
                  s = re_compile_pattern (pat, sizeof pat - 1, &regex);
                  if (s)
                    return 1;
                  if (re_search (&regex, data, sizeof data - 1,
                                 0, sizeof data - 1, &regs)
                      != -1)
                    return 1;
                  if (! setlocale (LC_ALL, "C"))
                    return 1;
                }
            #endif

            re_set_syntax (RE_SYNTAX_POSIX_EGREP);
            memset (&regex, 0, sizeof (regex));
            for (i = 0; i <= UCHAR_MAX; i++)
              folded_chars[i] = i;
            regex.translate = folded_chars;
            s = re_compile_pattern ("a[[:@:>@:]]b\n", 11, &regex);
            /* This should fail with _Invalid character class name_ error.  */
            if (!s)
              exit (1);

            /* This should succeed, but does not for e.g. glibc-2.1.3.  */
            memset (&regex, 0, sizeof (regex));
            s = re_compile_pattern ("{1", 2, &regex);

            if (s)
              exit (1);

            /* The following example is derived from a problem report
               against gawk from Jorge Stolfi <stolfi@ic.unicamp.br>.  */
            memset (&regex, 0, sizeof (regex));
            s = re_compile_pattern ("[an\371]*n", 7, &regex);
            if (s)
              exit (1);

            /* This should match, but does not for e.g. glibc-2.2.1.  */
            if (re_match (&regex, "an", 2, 0, &regs) != 2)
              exit (1);

            memset (&regex, 0, sizeof (regex));
            s = re_compile_pattern ("x", 1, &regex);
            if (s)
              exit (1);

            /* The version of regex.c in e.g. GNU libc-2.2.93 did not
               work with a negative RANGE argument.  */
            if (re_search (&regex, "wxy", 3, 2, -2, &regs) != 1)
              exit (1);

            /* The version of regex.c in older versions of gnulib
               ignored RE_ICASE.  Detect that problem too.  */
            memset (&regex, 0, sizeof (regex));
            re_set_syntax (RE_SYNTAX_EMACS | RE_ICASE);
            s = re_compile_pattern ("x", 1, &regex);
            if (s)
              exit (1);

            if (re_search (&regex, "WXY", 3, 0, 3, &regs) < 0)
              exit (1);

            /* REG_STARTEND was added to glibc on 2004-01-15.
               Reject older versions.  */
            if (! REG_STARTEND)
              exit (1);

            /* Reject hosts whose regoff_t values are too narrow.
               These include glibc 2.3.5 on hosts with 64-bit ptrdiff_t
               and 32-bit int.  */
            if (sizeof (regoff_t) < sizeof (ptrdiff_t)
                || sizeof (regoff_t) < sizeof (ssize_t))
              exit (1);

            exit (0);]])],
       [gl_cv_func_re_compile_pattern_working=yes],
       [gl_cv_func_re_compile_pattern_working=no],
       dnl When crosscompiling, assume it is not working.
       [gl_cv_func_re_compile_pattern_working=no])])
    dnl A working system regex means the bundled copy is not needed,
    dnl hence the inverted assignment.
    case $gl_cv_func_re_compile_pattern_working in #(
    yes) ac_use_included_regex=no;; #(
    no) ac_use_included_regex=yes;;
    esac
    ;;
  *) AC_MSG_ERROR([Invalid value for --with-included-regex: $with_included_regex])
    ;;
  esac

  dnl When the bundled regex is used, map each public entry point to its
  dnl rpl_ counterpart and arrange for regex to be built as a LIBOBJ.
  if test $ac_use_included_regex = yes; then
    AC_DEFINE([_REGEX_LARGE_OFFSETS], 1,
      [Define if you want regoff_t to be at least as wide POSIX requires.])
    AC_DEFINE([re_syntax_options], [rpl_re_syntax_options],
      [Define to rpl_re_syntax_options if the replacement should be used.])
    AC_DEFINE([re_set_syntax], [rpl_re_set_syntax],
      [Define to rpl_re_set_syntax if the replacement should be used.])
    AC_DEFINE([re_compile_pattern], [rpl_re_compile_pattern],
      [Define to rpl_re_compile_pattern if the replacement should be used.])
    AC_DEFINE([re_compile_fastmap], [rpl_re_compile_fastmap],
      [Define to rpl_re_compile_fastmap if the replacement should be used.])
    AC_DEFINE([re_search], [rpl_re_search],
      [Define to rpl_re_search if the replacement should be used.])
    AC_DEFINE([re_search_2], [rpl_re_search_2],
      [Define to rpl_re_search_2 if the replacement should be used.])
    AC_DEFINE([re_match], [rpl_re_match],
      [Define to rpl_re_match if the replacement should be used.])
    AC_DEFINE([re_match_2], [rpl_re_match_2],
      [Define to rpl_re_match_2 if the replacement should be used.])
    AC_DEFINE([re_set_registers], [rpl_re_set_registers],
      [Define to rpl_re_set_registers if the replacement should be used.])
    AC_DEFINE([re_comp], [rpl_re_comp],
      [Define to rpl_re_comp if the replacement should be used.])
    AC_DEFINE([re_exec], [rpl_re_exec],
      [Define to rpl_re_exec if the replacement should be used.])
    AC_DEFINE([regcomp], [rpl_regcomp],
      [Define to rpl_regcomp if the replacement should be used.])
    AC_DEFINE([regexec], [rpl_regexec],
      [Define to rpl_regexec if the replacement should be used.])
    AC_DEFINE([regerror], [rpl_regerror],
      [Define to rpl_regerror if the replacement should be used.])
    AC_DEFINE([regfree], [rpl_regfree],
      [Define to rpl_regfree if the replacement should be used.])
    AC_LIBOBJ([regex])
    gl_PREREQ_REGEX
  fi
])
189 | |||
# gl_PREREQ_REGEX
# ---------------
# Configure-time checks that lib/regex.c and lib/regex_internal.c
# depend on.
AC_DEFUN([gl_PREREQ_REGEX],
[
  dnl Macros that must have been expanded before this one.
  AC_REQUIRE([AC_GNU_SOURCE])
  AC_REQUIRE([AC_C_RESTRICT])
  AC_REQUIRE([AM_LANGINFO_CODESET])

  dnl Library functions and declarations probed for.
  AC_CHECK_FUNCS_ONCE([
    iswctype
    mbrtowc
    mempcpy
    wcrtomb
    wcscoll
  ])
  AC_CHECK_DECLS([isblank], [], [], [#include <ctype.h>])
])