]> git.proxmox.com Git - mirror_edk2.git/blame - MdeModulePkg/Universal/RegularExpressionDxe/Oniguruma/regerror.c
MdeModulePkg RegularExpressionDxe: Update Oniguruma to 6.9.0
[mirror_edk2.git] / MdeModulePkg / Universal / RegularExpressionDxe / Oniguruma / regerror.c
CommitLineData
14b0e578
CS
1/**********************************************************************\r
2 regerror.c - Oniguruma (regular expression library)\r
3**********************************************************************/\r
4/*-\r
b602265d 5 * Copyright (c) 2002-2018 K.Kosako <sndgk393 AT ybb DOT ne DOT jp>\r
14b0e578
CS
6 * All rights reserved.\r
7 *\r
14b0e578
CS
8 * Redistribution and use in source and binary forms, with or without\r
9 * modification, are permitted provided that the following conditions\r
10 * are met:\r
11 * 1. Redistributions of source code must retain the above copyright\r
12 * notice, this list of conditions and the following disclaimer.\r
13 * 2. Redistributions in binary form must reproduce the above copyright\r
14 * notice, this list of conditions and the following disclaimer in the\r
15 * documentation and/or other materials provided with the distribution.\r
16 *\r
17 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND\r
18 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE\r
19 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE\r
20 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE\r
21 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL\r
22 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS\r
23 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)\r
24 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT\r
25 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY\r
26 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF\r
27 * SUCH DAMAGE.\r
28 */\r
29\r
14b0e578 30#include "regint.h"\r
b602265d 31#define HAVE_STDARG_PROTOTYPES\r
14b0e578
CS
32#if 0\r
33#include <stdio.h> /* for vsnprintf() */\r
34\r
35#ifdef HAVE_STDARG_PROTOTYPES\r
36#include <stdarg.h>\r
37#define va_init_list(a,b) va_start(a,b)\r
38#else\r
39#include <varargs.h>\r
40#define va_init_list(a,b) va_start(a)\r
41#endif\r
42#endif\r
43\r
44extern UChar*\r
45onig_error_code_to_format(int code)\r
46{\r
47 char *p;\r
48\r
14b0e578
CS
49 switch (code) {\r
50 case ONIG_MISMATCH:\r
51 p = "mismatch"; break;\r
52 case ONIG_NO_SUPPORT_CONFIG:\r
53 p = "no support in this configuration"; break;\r
b602265d
DG
54 case ONIG_ABORT:\r
55 p = "abort"; break;\r
14b0e578
CS
56 case ONIGERR_MEMORY:\r
57 p = "fail to memory allocation"; break;\r
58 case ONIGERR_MATCH_STACK_LIMIT_OVER:\r
59 p = "match-stack limit over"; break;\r
b602265d
DG
60 case ONIGERR_PARSE_DEPTH_LIMIT_OVER:\r
61 p = "parse depth limit over"; break;\r
62 case ONIGERR_RETRY_LIMIT_IN_MATCH_OVER:\r
63 p = "retry-limit-in-match over"; break;\r
14b0e578
CS
64 case ONIGERR_TYPE_BUG:\r
65 p = "undefined type (bug)"; break;\r
66 case ONIGERR_PARSER_BUG:\r
67 p = "internal parser error (bug)"; break;\r
68 case ONIGERR_STACK_BUG:\r
69 p = "stack error (bug)"; break;\r
70 case ONIGERR_UNDEFINED_BYTECODE:\r
71 p = "undefined bytecode (bug)"; break;\r
72 case ONIGERR_UNEXPECTED_BYTECODE:\r
73 p = "unexpected bytecode (bug)"; break;\r
74 case ONIGERR_DEFAULT_ENCODING_IS_NOT_SETTED:\r
75 p = "default multibyte-encoding is not setted"; break;\r
76 case ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR:\r
77 p = "can't convert to wide-char on specified multibyte-encoding"; break;\r
b602265d
DG
78 case ONIGERR_FAIL_TO_INITIALIZE:\r
79 p = "fail to initialize"; break;\r
14b0e578
CS
80 case ONIGERR_INVALID_ARGUMENT:\r
81 p = "invalid argument"; break;\r
82 case ONIGERR_END_PATTERN_AT_LEFT_BRACE:\r
83 p = "end pattern at left brace"; break;\r
84 case ONIGERR_END_PATTERN_AT_LEFT_BRACKET:\r
85 p = "end pattern at left bracket"; break;\r
86 case ONIGERR_EMPTY_CHAR_CLASS:\r
87 p = "empty char-class"; break;\r
88 case ONIGERR_PREMATURE_END_OF_CHAR_CLASS:\r
89 p = "premature end of char-class"; break;\r
90 case ONIGERR_END_PATTERN_AT_ESCAPE:\r
91 p = "end pattern at escape"; break;\r
92 case ONIGERR_END_PATTERN_AT_META:\r
93 p = "end pattern at meta"; break;\r
94 case ONIGERR_END_PATTERN_AT_CONTROL:\r
95 p = "end pattern at control"; break;\r
96 case ONIGERR_META_CODE_SYNTAX:\r
97 p = "invalid meta-code syntax"; break;\r
98 case ONIGERR_CONTROL_CODE_SYNTAX:\r
99 p = "invalid control-code syntax"; break;\r
100 case ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE:\r
101 p = "char-class value at end of range"; break;\r
102 case ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE:\r
103 p = "char-class value at start of range"; break;\r
104 case ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS:\r
105 p = "unmatched range specifier in char-class"; break;\r
106 case ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED:\r
107 p = "target of repeat operator is not specified"; break;\r
108 case ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID:\r
109 p = "target of repeat operator is invalid"; break;\r
110 case ONIGERR_NESTED_REPEAT_OPERATOR:\r
111 p = "nested repeat operator"; break;\r
112 case ONIGERR_UNMATCHED_CLOSE_PARENTHESIS:\r
113 p = "unmatched close parenthesis"; break;\r
114 case ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS:\r
115 p = "end pattern with unmatched parenthesis"; break;\r
116 case ONIGERR_END_PATTERN_IN_GROUP:\r
117 p = "end pattern in group"; break;\r
118 case ONIGERR_UNDEFINED_GROUP_OPTION:\r
119 p = "undefined group option"; break;\r
120 case ONIGERR_INVALID_POSIX_BRACKET_TYPE:\r
121 p = "invalid POSIX bracket type"; break;\r
122 case ONIGERR_INVALID_LOOK_BEHIND_PATTERN:\r
123 p = "invalid pattern in look-behind"; break;\r
124 case ONIGERR_INVALID_REPEAT_RANGE_PATTERN:\r
125 p = "invalid repeat range {lower,upper}"; break;\r
126 case ONIGERR_TOO_BIG_NUMBER:\r
127 p = "too big number"; break;\r
128 case ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE:\r
129 p = "too big number for repeat range"; break;\r
130 case ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE:\r
131 p = "upper is smaller than lower in repeat range"; break;\r
132 case ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS:\r
133 p = "empty range in char class"; break;\r
134 case ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE:\r
135 p = "mismatch multibyte code length in char-class range"; break;\r
136 case ONIGERR_TOO_MANY_MULTI_BYTE_RANGES:\r
137 p = "too many multibyte code ranges are specified"; break;\r
138 case ONIGERR_TOO_SHORT_MULTI_BYTE_STRING:\r
139 p = "too short multibyte code string"; break;\r
140 case ONIGERR_TOO_BIG_BACKREF_NUMBER:\r
141 p = "too big backref number"; break;\r
142 case ONIGERR_INVALID_BACKREF:\r
14b0e578 143 p = "invalid backref number/name"; break;\r
14b0e578
CS
144 case ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED:\r
145 p = "numbered backref/call is not allowed. (use name)"; break;\r
b602265d
DG
146 case ONIGERR_TOO_MANY_CAPTURES:\r
147 p = "too many captures"; break;\r
14b0e578
CS
148 case ONIGERR_TOO_BIG_WIDE_CHAR_VALUE:\r
149 p = "too big wide-char value"; break;\r
150 case ONIGERR_TOO_LONG_WIDE_CHAR_VALUE:\r
151 p = "too long wide-char value"; break;\r
152 case ONIGERR_INVALID_CODE_POINT_VALUE:\r
153 p = "invalid code point value"; break;\r
154 case ONIGERR_EMPTY_GROUP_NAME:\r
155 p = "group name is empty"; break;\r
156 case ONIGERR_INVALID_GROUP_NAME:\r
157 p = "invalid group name <%n>"; break;\r
158 case ONIGERR_INVALID_CHAR_IN_GROUP_NAME:\r
14b0e578 159 p = "invalid char in group name <%n>"; break;\r
14b0e578
CS
160 case ONIGERR_UNDEFINED_NAME_REFERENCE:\r
161 p = "undefined name <%n> reference"; break;\r
162 case ONIGERR_UNDEFINED_GROUP_REFERENCE:\r
163 p = "undefined group <%n> reference"; break;\r
164 case ONIGERR_MULTIPLEX_DEFINED_NAME:\r
165 p = "multiplex defined name <%n>"; break;\r
166 case ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL:\r
167 p = "multiplex definition name <%n> call"; break;\r
168 case ONIGERR_NEVER_ENDING_RECURSION:\r
169 p = "never ending recursion"; break;\r
170 case ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY:\r
171 p = "group number is too big for capture history"; break;\r
172 case ONIGERR_INVALID_CHAR_PROPERTY_NAME:\r
173 p = "invalid character property name {%n}"; break;\r
b602265d
DG
174 case ONIGERR_INVALID_IF_ELSE_SYNTAX:\r
175 p = "invalid if-else syntax"; break;\r
176 case ONIGERR_INVALID_ABSENT_GROUP_PATTERN:\r
177 p = "invalid absent group pattern"; break;\r
178 case ONIGERR_INVALID_ABSENT_GROUP_GENERATOR_PATTERN:\r
179 p = "invalid absent group generator pattern"; break;\r
180 case ONIGERR_INVALID_CALLOUT_PATTERN:\r
181 p = "invalid callout pattern"; break;\r
182 case ONIGERR_INVALID_CALLOUT_NAME:\r
183 p = "invalid callout name"; break;\r
184 case ONIGERR_UNDEFINED_CALLOUT_NAME:\r
185 p = "undefined callout name"; break;\r
186 case ONIGERR_INVALID_CALLOUT_BODY:\r
187 p = "invalid callout body"; break;\r
188 case ONIGERR_INVALID_CALLOUT_TAG_NAME:\r
189 p = "invalid callout tag name"; break;\r
190 case ONIGERR_INVALID_CALLOUT_ARG:\r
191 p = "invalid callout arg"; break;\r
14b0e578
CS
192 case ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION:\r
193 p = "not supported encoding combination"; break;\r
194 case ONIGERR_INVALID_COMBINATION_OF_OPTIONS:\r
195 p = "invalid combination of options"; break;\r
b602265d
DG
196 case ONIGERR_LIBRARY_IS_NOT_INITIALIZED:\r
197 p = "library is not initialized"; break;\r
14b0e578
CS
198\r
199 default:\r
200 p = "undefined error code"; break;\r
201 }\r
202\r
203 return (UChar* )p;\r
204}\r
205\r
/*
 * Format the low 8 bits of v into s using "%02x" (two hex digits).
 * The size passed to sprintf_s is sizeof("00"), i.e. 3 bytes including
 * the terminator, so s must have room for at least 3 bytes.
 * NOTE(review): sprintf_s is not declared in this file; presumably it
 * comes from the port layer pulled in via regint.h -- confirm.
 */
static void sprint_byte(char* s, unsigned int v)
{
  unsigned int low_byte = v & 0377;

  sprintf_s(s, sizeof("00"), "%02x", low_byte);
}
210\r
/*
 * Format the low 8 bits of v into s as a backslash, the letter 'x' and
 * two hex digits (format "\\x%02x").
 * The size passed to sprintf_s is sizeof("\\x00"), i.e. 5 bytes
 * including the terminator, so s must have room for at least 5 bytes.
 */
static void sprint_byte_with_x(char* s, unsigned int v)
{
  unsigned int low_byte = v & 0377;

  sprintf_s(s, sizeof("\\x00"), "\\x%02x", low_byte);
}
215\r
216static int to_ascii(OnigEncoding enc, UChar *s, UChar *end,\r
217 UChar buf[], int buf_size, int *is_over)\r
218{\r
219 int len;\r
220 UChar *p;\r
221 OnigCodePoint code;\r
222\r
223 if (ONIGENC_MBC_MINLEN(enc) > 1) {\r
224 p = s;\r
225 len = 0;\r
226 while (p < end) {\r
227 code = ONIGENC_MBC_TO_CODE(enc, p, end);\r
228 if (code >= 0x80) {\r
b602265d
DG
229 if (code > 0xffff && len + 10 <= buf_size) {\r
230 sprint_byte_with_x((char*)(&(buf[len])), (unsigned int)(code >> 24));\r
231 sprint_byte((char*)(&(buf[len+4])), (unsigned int)(code >> 16));\r
232 sprint_byte((char*)(&(buf[len+6])), (unsigned int)(code >> 8));\r
233 sprint_byte((char*)(&(buf[len+8])), (unsigned int)code);\r
234 len += 10;\r
235 }\r
236 else if (len + 6 <= buf_size) {\r
237 sprint_byte_with_x((char*)(&(buf[len])), (unsigned int)(code >> 8));\r
238 sprint_byte((char*)(&(buf[len+4])), (unsigned int)code);\r
239 len += 6;\r
240 }\r
241 else {\r
242 break;\r
243 }\r
14b0e578
CS
244 }\r
245 else {\r
b602265d 246 buf[len++] = (UChar )code;\r
14b0e578
CS
247 }\r
248\r
249 p += enclen(enc, p);\r
250 if (len >= buf_size) break;\r
251 }\r
252\r
253 *is_over = ((p < end) ? 1 : 0);\r
254 }\r
255 else {\r
b602265d 256 len = MIN((int )(end - s), buf_size);\r
14b0e578
CS
257 xmemcpy(buf, s, (size_t )len);\r
258 *is_over = ((buf_size < (end - s)) ? 1 : 0);\r
259 }\r
260\r
261 return len;\r
262}\r
263\r
264\r
265/* for ONIG_MAX_ERROR_MESSAGE_LEN */\r
266#define MAX_ERROR_PAR_LEN 30\r
267\r
268extern int\r
a12b214e 269EFIAPI\r
14b0e578
CS
270#ifdef HAVE_STDARG_PROTOTYPES\r
271onig_error_code_to_str(UChar* s, int code, ...)\r
272#else\r
273onig_error_code_to_str(s, code, va_alist)\r
274 UChar* s;\r
275 int code;\r
276 va_dcl \r
277#endif\r
278{\r
279 UChar *p, *q;\r
280 OnigErrorInfo* einfo;\r
281 int len, is_over;\r
282 UChar parbuf[MAX_ERROR_PAR_LEN];\r
283 va_list vargs;\r
284\r
285 va_init_list(vargs, code);\r
286\r
287 switch (code) {\r
288 case ONIGERR_UNDEFINED_NAME_REFERENCE:\r
289 case ONIGERR_UNDEFINED_GROUP_REFERENCE:\r
290 case ONIGERR_MULTIPLEX_DEFINED_NAME:\r
291 case ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL:\r
292 case ONIGERR_INVALID_GROUP_NAME:\r
293 case ONIGERR_INVALID_CHAR_IN_GROUP_NAME:\r
294 case ONIGERR_INVALID_CHAR_PROPERTY_NAME:\r
295 einfo = va_arg(vargs, OnigErrorInfo*);\r
296 len = to_ascii(einfo->enc, einfo->par, einfo->par_end,\r
b602265d 297 parbuf, MAX_ERROR_PAR_LEN - 3, &is_over);\r
14b0e578
CS
298 q = onig_error_code_to_format(code);\r
299 p = s;\r
300 while (*q != '\0') {\r
301 if (*q == '%') {\r
b602265d
DG
302 q++;\r
303 if (*q == 'n') { /* '%n': name */\r
304 xmemcpy(p, parbuf, len);\r
305 p += len;\r
306 if (is_over != 0) {\r
307 xmemcpy(p, "...", 3);\r
308 p += 3;\r
309 }\r
310 q++;\r
311 }\r
312 else\r
313 goto normal_char;\r
14b0e578
CS
314 }\r
315 else {\r
316 normal_char:\r
b602265d 317 *p++ = *q++;\r
14b0e578
CS
318 }\r
319 }\r
320 *p = '\0';\r
b602265d 321 len = (int )(p - s);\r
14b0e578
CS
322 break;\r
323\r
324 default:\r
325 q = onig_error_code_to_format(code);\r
326 len = onigenc_str_bytelen_null(ONIG_ENCODING_ASCII, q);\r
327 xmemcpy(s, q, len);\r
328 s[len] = '\0';\r
329 break;\r
330 }\r
331\r
332 va_end(vargs);\r
333 return len;\r
334}\r
335\r
336\r
337void\r
a12b214e 338EFIAPI\r
14b0e578
CS
339#ifdef HAVE_STDARG_PROTOTYPES\r
340onig_snprintf_with_pattern(UChar buf[], int bufsize, OnigEncoding enc,\r
341 UChar* pat, UChar* pat_end, const UChar *fmt, ...)\r
342#else\r
343onig_snprintf_with_pattern(buf, bufsize, enc, pat, pat_end, fmt, va_alist)\r
344 UChar buf[];\r
345 int bufsize;\r
346 OnigEncoding enc;\r
347 UChar* pat;\r
348 UChar* pat_end;\r
349 const UChar *fmt;\r
350 va_dcl\r
351#endif\r
352{\r
353 int n, need, len;\r
354 UChar *p, *s, *bp;\r
355 UChar bs[6];\r
356 va_list args;\r
357\r
358 va_init_list(args, fmt);\r
359 n = xvsnprintf((char* )buf, bufsize, (const char* )fmt, args);\r
360 va_end(args);\r
361\r
b602265d 362 need = (int )(pat_end - pat) * 4 + 4;\r
14b0e578
CS
363\r
364 if (n + need < bufsize) {\r
365 strcat_s((char* )buf, bufsize, ": /");\r
366 s = buf + onigenc_str_bytelen_null(ONIG_ENCODING_ASCII, buf);\r
367\r
368 p = pat;\r
369 while (p < pat_end) {\r
b602265d 370 if (ONIGENC_IS_MBC_HEAD(enc, p)) {\r
14b0e578
CS
371 len = enclen(enc, p);\r
372 if (ONIGENC_MBC_MINLEN(enc) == 1) {\r
373 while (len-- > 0) *s++ = *p++;\r
374 }\r
b602265d 375 else { /* for UTF16/32 */\r
14b0e578
CS
376 int blen;\r
377\r
378 while (len-- > 0) {\r
b602265d 379 sprint_byte_with_x((char* )bs, (unsigned int )(*p++));\r
14b0e578
CS
380 blen = onigenc_str_bytelen_null(ONIG_ENCODING_ASCII, bs);\r
381 bp = bs;\r
382 while (blen-- > 0) *s++ = *bp++;\r
383 }\r
384 }\r
385 }\r
b602265d
DG
386 else if (*p == '\\') {\r
387 *s++ = *p++;\r
388 len = enclen(enc, p);\r
389 while (len-- > 0) *s++ = *p++;\r
390 }\r
391 else if (*p == '/') {\r
392 *s++ = (unsigned char )'\\';\r
393 *s++ = *p++;\r
394 }\r
14b0e578 395 else if (!ONIGENC_IS_CODE_PRINT(enc, *p) &&\r
b602265d
DG
396 !ONIGENC_IS_CODE_SPACE(enc, *p)) {\r
397 sprint_byte_with_x((char* )bs, (unsigned int )(*p++));\r
398 len = onigenc_str_bytelen_null(ONIG_ENCODING_ASCII, bs);\r
14b0e578 399 bp = bs;\r
b602265d 400 while (len-- > 0) *s++ = *bp++;\r
14b0e578
CS
401 }\r
402 else {\r
b602265d 403 *s++ = *p++;\r
14b0e578
CS
404 }\r
405 }\r
406\r
407 *s++ = '/';\r
408 *s = '\0';\r
409 }\r
410}\r