pcre/pcretest.c

5774 lines
170 KiB
C

/*************************************************
* PCRE testing program *
*************************************************/
/* This program was hacked up as a tester for PCRE. I really should have
written it more tidily in the first place. Will I ever learn? It has grown and
been extended and consequently is now rather, er, *very* untidy in places. The
addition of 16-bit support has made it even worse. :-(
-----------------------------------------------------------------------------
Redistribution and use in source and binary forms, with or without
modification, are permitted provided that the following conditions are met:
* Redistributions of source code must retain the above copyright notice,
this list of conditions and the following disclaimer.
* Redistributions in binary form must reproduce the above copyright
notice, this list of conditions and the following disclaimer in the
documentation and/or other materials provided with the distribution.
* Neither the name of the University of Cambridge nor the names of its
contributors may be used to endorse or promote products derived from
this software without specific prior written permission.
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
POSSIBILITY OF SUCH DAMAGE.
-----------------------------------------------------------------------------
*/
/* This program now supports the testing of all of the 8-bit, 16-bit, and
32-bit PCRE libraries in a single program. This is different from the modules
such as pcre_compile.c in the library itself, which are compiled separately for
each mode. If two modes are enabled, for example, pcre_compile.c is compiled
twice. By contrast, pcretest.c is compiled only once. Therefore, it must not
make use of any of the macros from pcre_internal.h that depend on
COMPILE_PCRE8, COMPILE_PCRE16, or COMPILE_PCRE32. It does, however, make use of
SUPPORT_PCRE8, SUPPORT_PCRE16, and SUPPORT_PCRE32 to ensure that it calls only
supported library functions. */
#ifdef HAVE_CONFIG_H
#include "config.h"
#endif
#include <ctype.h>
#include <stdio.h>
#include <string.h>
#include <stdlib.h>
#include <time.h>
#include <locale.h>
#include <errno.h>
/* Both libreadline and libedit are optionally supported. The user-supplied
original patch uses readline/readline.h for libedit, but in at least one system
it is installed as editline/readline.h, so the configuration code now looks for
that first, falling back to readline/readline.h. */
#if defined(SUPPORT_LIBREADLINE) || defined(SUPPORT_LIBEDIT)
#ifdef HAVE_UNISTD_H
#include <unistd.h>
#endif
#if defined(SUPPORT_LIBREADLINE)
#include <readline/readline.h>
#include <readline/history.h>
#else
#if defined(HAVE_EDITLINE_READLINE_H)
#include <editline/readline.h>
#else
#include <readline/readline.h>
#endif
#endif
#endif
/* A number of things vary for Windows builds. Originally, pcretest opened its
input and output without "b"; then I was told that "b" was needed in some
environments, so it was added for release 5.0 to both the input and output. (It
makes no difference on Unix-like systems.) Later I was told that it is wrong
for the input on Windows. I've now abstracted the modes into two macros that
are set here, to make it easier to fiddle with them, and removed "b" from the
input mode under Windows. */
#if defined(_WIN32) || defined(WIN32)
#include <io.h> /* For _setmode() */
#include <fcntl.h> /* For _O_BINARY */
#define INPUT_MODE "r"
#define OUTPUT_MODE "wb"
#ifndef isatty
#define isatty _isatty /* This is what Windows calls them, I'm told, */
#endif /* though in some environments they seem to */
/* be already defined, hence the #ifndefs. */
#ifndef fileno
#define fileno _fileno
#endif
/* A user sent this fix for Borland Builder 5 under Windows. */
#ifdef __BORLANDC__
#define _setmode(handle, mode) setmode(handle, mode)
#endif
/* Not Windows */
#else
#include <sys/time.h> /* These two includes are needed */
#include <sys/resource.h> /* for setrlimit(). */
#if defined NATIVE_ZOS /* z/OS uses non-binary I/O */
#define INPUT_MODE "r"
#define OUTPUT_MODE "w"
#else
#define INPUT_MODE "rb"
#define OUTPUT_MODE "wb"
#endif
#endif
#ifdef __VMS
#include <ssdef.h>
void vms_setsymbol( char *, char *, int );
#endif
#define PRIV(name) name
/* We have to include pcre_internal.h because we need the internal info for
displaying the results of pcre_study() and we also need to know about the
internal macros, structures, and other internal data values; pcretest has
"inside information" compared to a program that strictly follows the PCRE API.
Although pcre_internal.h does itself include pcre.h, we explicitly include it
here before pcre_internal.h so that the PCRE_EXP_xxx macros get set
appropriately for an application, not for building PCRE. */
#include "pcre.h"
#include "pcre_internal.h"
/* The pcre_printint() function, which prints the internal form of a compiled
regex, is held in a separate file so that (a) it can be compiled in either
8-, 16- or 32-bit mode, and (b) it can be #included directly in pcre_compile.c
when that is compiled in debug mode. */
#ifdef SUPPORT_PCRE8
void pcre_printint(pcre *external_re, FILE *f, BOOL print_lengths);
#endif
#ifdef SUPPORT_PCRE16
void pcre16_printint(pcre *external_re, FILE *f, BOOL print_lengths);
#endif
#ifdef SUPPORT_PCRE32
void pcre32_printint(pcre *external_re, FILE *f, BOOL print_lengths);
#endif
/* We need access to some of the data tables that PCRE uses. So as not to have
to keep two copies, we include the source files here, changing the names of the
external symbols to prevent clashes. */
#define PCRE_INCLUDED
#include "pcre_tables.c"
#include "pcre_ucd.c"
/* The definition of the macro PRINTABLE, which determines whether to print an
output character as-is or as a hex value when showing compiled patterns, is
the same as in the printint.src file. We uses it here in cases when the locale
has not been explicitly changed, so as to get consistent output from systems
that differ in their output from isprint() even in the "C" locale. */
#ifdef EBCDIC
#define PRINTABLE(c) ((c) >= 64 && (c) < 255)
#else
#define PRINTABLE(c) ((c) >= 32 && (c) < 127)
#endif
#define PRINTOK(c) (locale_set? (((c) < 256) && isprint(c)) : PRINTABLE(c))
/* Posix support is disabled in 16 or 32 bit only mode. */
#if !defined SUPPORT_PCRE8 && !defined NOPOSIX
#define NOPOSIX
#endif
/* It is possible to compile this test program without including support for
testing the POSIX interface, though this is not available via the standard
Makefile. */
#if !defined NOPOSIX
#include "pcreposix.h"
#endif
/* It is also possible, originally for the benefit of a version that was
imported into Exim, to build pcretest without support for UTF8 or UTF16 (define
NOUTF), without the interface to the DFA matcher (NODFA). In fact, we
automatically cut out the UTF support if PCRE is built without it. */
#ifndef SUPPORT_UTF
#ifndef NOUTF
#define NOUTF
#endif
#endif
/* To make the code a bit tidier for 8/16/32-bit support, we define macros
for all the pcre[16]_xxx functions (except pcre16_fullinfo, which is called
only from one place and is handled differently). I couldn't dream up any way of
using a single macro to do this in a generic way, because of the many different
argument requirements. We know that at least one of SUPPORT_PCRE8 and
SUPPORT_PCRE16 must be set. First define macros for each individual mode; then
use these in the definitions of generic macros.
**** Special note about the PCHARSxxx macros: the address of the string to be
printed is always given as two arguments: a base address followed by an offset.
The base address is cast to the correct data size for 8 or 16 bit data; the
offset is in units of this size. If the string were given as base+offset in one
argument, the casting might be incorrectly applied. */
#ifdef SUPPORT_PCRE8
#define PCHARS8(lv, p, offset, len, f) \
lv = pchars((pcre_uint8 *)(p) + offset, len, f)
#define PCHARSV8(p, offset, len, f) \
(void)pchars((pcre_uint8 *)(p) + offset, len, f)
#define READ_CAPTURE_NAME8(p, cn8, cn16, cn32, re) \
p = read_capture_name8(p, cn8, re)
#define STRLEN8(p) ((int)strlen((char *)p))
#define SET_PCRE_CALLOUT8(callout) \
pcre_callout = callout
#define SET_PCRE_STACK_GUARD8(stack_guard) \
pcre_stack_guard = stack_guard
#define PCRE_ASSIGN_JIT_STACK8(extra, callback, userdata) \
pcre_assign_jit_stack(extra, callback, userdata)
#define PCRE_COMPILE8(re, pat, options, error, erroffset, tables) \
re = pcre_compile((char *)pat, options, error, erroffset, tables)
#define PCRE_COPY_NAMED_SUBSTRING8(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size) \
rc = pcre_copy_named_substring(re, (char *)bptr, offsets, count, \
(char *)namesptr, cbuffer, size)
#define PCRE_COPY_SUBSTRING8(rc, bptr, offsets, count, i, cbuffer, size) \
rc = pcre_copy_substring((char *)bptr, offsets, count, i, cbuffer, size)
#define PCRE_DFA_EXEC8(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace) \
count = pcre_dfa_exec(re, extra, (char *)bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace)
#define PCRE_EXEC8(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets) \
count = pcre_exec(re, extra, (char *)bptr, len, start_offset, options, \
offsets, size_offsets)
#define PCRE_FREE_STUDY8(extra) \
pcre_free_study(extra)
#define PCRE_FREE_SUBSTRING8(substring) \
pcre_free_substring(substring)
#define PCRE_FREE_SUBSTRING_LIST8(listptr) \
pcre_free_substring_list(listptr)
#define PCRE_GET_NAMED_SUBSTRING8(rc, re, bptr, offsets, count, \
getnamesptr, subsptr) \
rc = pcre_get_named_substring(re, (char *)bptr, offsets, count, \
(char *)getnamesptr, subsptr)
#define PCRE_GET_STRINGNUMBER8(n, rc, ptr) \
n = pcre_get_stringnumber(re, (char *)ptr)
#define PCRE_GET_SUBSTRING8(rc, bptr, offsets, count, i, subsptr) \
rc = pcre_get_substring((char *)bptr, offsets, count, i, subsptr)
#define PCRE_GET_SUBSTRING_LIST8(rc, bptr, offsets, count, listptr) \
rc = pcre_get_substring_list((const char *)bptr, offsets, count, listptr)
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER8(rc, re, extra, tables) \
rc = pcre_pattern_to_host_byte_order(re, extra, tables)
#define PCRE_PRINTINT8(re, outfile, debug_lengths) \
pcre_printint(re, outfile, debug_lengths)
#define PCRE_STUDY8(extra, re, options, error) \
extra = pcre_study(re, options, error)
#define PCRE_JIT_STACK_ALLOC8(startsize, maxsize) \
pcre_jit_stack_alloc(startsize, maxsize)
#define PCRE_JIT_STACK_FREE8(stack) \
pcre_jit_stack_free(stack)
#define pcre8_maketables pcre_maketables
#endif /* SUPPORT_PCRE8 */
/* -----------------------------------------------------------*/
#ifdef SUPPORT_PCRE16
#define PCHARS16(lv, p, offset, len, f) \
lv = pchars16((PCRE_SPTR16)(p) + offset, len, f)
#define PCHARSV16(p, offset, len, f) \
(void)pchars16((PCRE_SPTR16)(p) + offset, len, f)
#define READ_CAPTURE_NAME16(p, cn8, cn16, cn32, re) \
p = read_capture_name16(p, cn16, re)
#define STRLEN16(p) ((int)strlen16((PCRE_SPTR16)p))
#define SET_PCRE_CALLOUT16(callout) \
pcre16_callout = (int (*)(pcre16_callout_block *))callout
#define SET_PCRE_STACK_GUARD16(stack_guard) \
pcre16_stack_guard = (int (*)(void))stack_guard
#define PCRE_ASSIGN_JIT_STACK16(extra, callback, userdata) \
pcre16_assign_jit_stack((pcre16_extra *)extra, \
(pcre16_jit_callback)callback, userdata)
#define PCRE_COMPILE16(re, pat, options, error, erroffset, tables) \
re = (pcre *)pcre16_compile((PCRE_SPTR16)pat, options, error, erroffset, \
tables)
#define PCRE_COPY_NAMED_SUBSTRING16(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size) \
rc = pcre16_copy_named_substring((pcre16 *)re, (PCRE_SPTR16)bptr, offsets, \
count, (PCRE_SPTR16)namesptr, (PCRE_UCHAR16 *)cbuffer, size/2)
#define PCRE_COPY_SUBSTRING16(rc, bptr, offsets, count, i, cbuffer, size) \
rc = pcre16_copy_substring((PCRE_SPTR16)bptr, offsets, count, i, \
(PCRE_UCHAR16 *)cbuffer, size/2)
#define PCRE_DFA_EXEC16(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace) \
count = pcre16_dfa_exec((pcre16 *)re, (pcre16_extra *)extra, \
(PCRE_SPTR16)bptr, len, start_offset, options, offsets, size_offsets, \
workspace, size_workspace)
#define PCRE_EXEC16(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets) \
count = pcre16_exec((pcre16 *)re, (pcre16_extra *)extra, (PCRE_SPTR16)bptr, \
len, start_offset, options, offsets, size_offsets)
#define PCRE_FREE_STUDY16(extra) \
pcre16_free_study((pcre16_extra *)extra)
#define PCRE_FREE_SUBSTRING16(substring) \
pcre16_free_substring((PCRE_SPTR16)substring)
#define PCRE_FREE_SUBSTRING_LIST16(listptr) \
pcre16_free_substring_list((PCRE_SPTR16 *)listptr)
#define PCRE_GET_NAMED_SUBSTRING16(rc, re, bptr, offsets, count, \
getnamesptr, subsptr) \
rc = pcre16_get_named_substring((pcre16 *)re, (PCRE_SPTR16)bptr, offsets, \
count, (PCRE_SPTR16)getnamesptr, (PCRE_SPTR16 *)(void*)subsptr)
#define PCRE_GET_STRINGNUMBER16(n, rc, ptr) \
n = pcre16_get_stringnumber(re, (PCRE_SPTR16)ptr)
#define PCRE_GET_SUBSTRING16(rc, bptr, offsets, count, i, subsptr) \
rc = pcre16_get_substring((PCRE_SPTR16)bptr, offsets, count, i, \
(PCRE_SPTR16 *)(void*)subsptr)
#define PCRE_GET_SUBSTRING_LIST16(rc, bptr, offsets, count, listptr) \
rc = pcre16_get_substring_list((PCRE_SPTR16)bptr, offsets, count, \
(PCRE_SPTR16 **)(void*)listptr)
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER16(rc, re, extra, tables) \
rc = pcre16_pattern_to_host_byte_order((pcre16 *)re, (pcre16_extra *)extra, \
tables)
#define PCRE_PRINTINT16(re, outfile, debug_lengths) \
pcre16_printint(re, outfile, debug_lengths)
#define PCRE_STUDY16(extra, re, options, error) \
extra = (pcre_extra *)pcre16_study((pcre16 *)re, options, error)
#define PCRE_JIT_STACK_ALLOC16(startsize, maxsize) \
(pcre_jit_stack *)pcre16_jit_stack_alloc(startsize, maxsize)
#define PCRE_JIT_STACK_FREE16(stack) \
pcre16_jit_stack_free((pcre16_jit_stack *)stack)
#endif /* SUPPORT_PCRE16 */
/* -----------------------------------------------------------*/
#ifdef SUPPORT_PCRE32
#define PCHARS32(lv, p, offset, len, f) \
lv = pchars32((PCRE_SPTR32)(p) + offset, len, use_utf, f)
#define PCHARSV32(p, offset, len, f) \
(void)pchars32((PCRE_SPTR32)(p) + offset, len, use_utf, f)
#define READ_CAPTURE_NAME32(p, cn8, cn16, cn32, re) \
p = read_capture_name32(p, cn32, re)
#define STRLEN32(p) ((int)strlen32((PCRE_SPTR32)p))
#define SET_PCRE_CALLOUT32(callout) \
pcre32_callout = (int (*)(pcre32_callout_block *))callout
#define SET_PCRE_STACK_GUARD32(stack_guard) \
pcre32_stack_guard = (int (*)(void))stack_guard
#define PCRE_ASSIGN_JIT_STACK32(extra, callback, userdata) \
pcre32_assign_jit_stack((pcre32_extra *)extra, \
(pcre32_jit_callback)callback, userdata)
#define PCRE_COMPILE32(re, pat, options, error, erroffset, tables) \
re = (pcre *)pcre32_compile((PCRE_SPTR32)pat, options, error, erroffset, \
tables)
#define PCRE_COPY_NAMED_SUBSTRING32(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size) \
rc = pcre32_copy_named_substring((pcre32 *)re, (PCRE_SPTR32)bptr, offsets, \
count, (PCRE_SPTR32)namesptr, (PCRE_UCHAR32 *)cbuffer, size/4)
#define PCRE_COPY_SUBSTRING32(rc, bptr, offsets, count, i, cbuffer, size) \
rc = pcre32_copy_substring((PCRE_SPTR32)bptr, offsets, count, i, \
(PCRE_UCHAR32 *)cbuffer, size/4)
#define PCRE_DFA_EXEC32(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace) \
count = pcre32_dfa_exec((pcre32 *)re, (pcre32_extra *)extra, \
(PCRE_SPTR32)bptr, len, start_offset, options, offsets, size_offsets, \
workspace, size_workspace)
#define PCRE_EXEC32(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets) \
count = pcre32_exec((pcre32 *)re, (pcre32_extra *)extra, (PCRE_SPTR32)bptr, \
len, start_offset, options, offsets, size_offsets)
#define PCRE_FREE_STUDY32(extra) \
pcre32_free_study((pcre32_extra *)extra)
#define PCRE_FREE_SUBSTRING32(substring) \
pcre32_free_substring((PCRE_SPTR32)substring)
#define PCRE_FREE_SUBSTRING_LIST32(listptr) \
pcre32_free_substring_list((PCRE_SPTR32 *)listptr)
#define PCRE_GET_NAMED_SUBSTRING32(rc, re, bptr, offsets, count, \
getnamesptr, subsptr) \
rc = pcre32_get_named_substring((pcre32 *)re, (PCRE_SPTR32)bptr, offsets, \
count, (PCRE_SPTR32)getnamesptr, (PCRE_SPTR32 *)(void*)subsptr)
#define PCRE_GET_STRINGNUMBER32(n, rc, ptr) \
n = pcre32_get_stringnumber(re, (PCRE_SPTR32)ptr)
#define PCRE_GET_SUBSTRING32(rc, bptr, offsets, count, i, subsptr) \
rc = pcre32_get_substring((PCRE_SPTR32)bptr, offsets, count, i, \
(PCRE_SPTR32 *)(void*)subsptr)
#define PCRE_GET_SUBSTRING_LIST32(rc, bptr, offsets, count, listptr) \
rc = pcre32_get_substring_list((PCRE_SPTR32)bptr, offsets, count, \
(PCRE_SPTR32 **)(void*)listptr)
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER32(rc, re, extra, tables) \
rc = pcre32_pattern_to_host_byte_order((pcre32 *)re, (pcre32_extra *)extra, \
tables)
#define PCRE_PRINTINT32(re, outfile, debug_lengths) \
pcre32_printint(re, outfile, debug_lengths)
#define PCRE_STUDY32(extra, re, options, error) \
extra = (pcre_extra *)pcre32_study((pcre32 *)re, options, error)
#define PCRE_JIT_STACK_ALLOC32(startsize, maxsize) \
(pcre_jit_stack *)pcre32_jit_stack_alloc(startsize, maxsize)
#define PCRE_JIT_STACK_FREE32(stack) \
pcre32_jit_stack_free((pcre32_jit_stack *)stack)
#endif /* SUPPORT_PCRE32 */
/* ----- More than one mode is supported; a runtime test is needed, except for
pcre_config(), and the JIT stack functions, when it doesn't matter which
available version is called. ----- */
enum {
PCRE8_MODE,
PCRE16_MODE,
PCRE32_MODE
};
#if (defined (SUPPORT_PCRE8) + defined (SUPPORT_PCRE16) + \
defined (SUPPORT_PCRE32)) >= 2
#define CHAR_SIZE (1U << pcre_mode)
/* There doesn't seem to be an easy way of writing these macros that can cope
with the 3 pairs of bit sizes plus all three bit sizes. So just handle all the
cases separately. */
/* ----- All three modes supported ----- */
#if defined(SUPPORT_PCRE8) && defined(SUPPORT_PCRE16) && defined(SUPPORT_PCRE32)
#define PCHARS(lv, p, offset, len, f) \
if (pcre_mode == PCRE32_MODE) \
PCHARS32(lv, p, offset, len, f); \
else if (pcre_mode == PCRE16_MODE) \
PCHARS16(lv, p, offset, len, f); \
else \
PCHARS8(lv, p, offset, len, f)
#define PCHARSV(p, offset, len, f) \
if (pcre_mode == PCRE32_MODE) \
PCHARSV32(p, offset, len, f); \
else if (pcre_mode == PCRE16_MODE) \
PCHARSV16(p, offset, len, f); \
else \
PCHARSV8(p, offset, len, f)
#define READ_CAPTURE_NAME(p, cn8, cn16, cn32, re) \
if (pcre_mode == PCRE32_MODE) \
READ_CAPTURE_NAME32(p, cn8, cn16, cn32, re); \
else if (pcre_mode == PCRE16_MODE) \
READ_CAPTURE_NAME16(p, cn8, cn16, cn32, re); \
else \
READ_CAPTURE_NAME8(p, cn8, cn16, cn32, re)
#define SET_PCRE_CALLOUT(callout) \
if (pcre_mode == PCRE32_MODE) \
SET_PCRE_CALLOUT32(callout); \
else if (pcre_mode == PCRE16_MODE) \
SET_PCRE_CALLOUT16(callout); \
else \
SET_PCRE_CALLOUT8(callout)
#define SET_PCRE_STACK_GUARD(stack_guard) \
if (pcre_mode == PCRE32_MODE) \
SET_PCRE_STACK_GUARD32(stack_guard); \
else if (pcre_mode == PCRE16_MODE) \
SET_PCRE_STACK_GUARD16(stack_guard); \
else \
SET_PCRE_STACK_GUARD8(stack_guard)
#define STRLEN(p) (pcre_mode == PCRE32_MODE ? STRLEN32(p) : pcre_mode == PCRE16_MODE ? STRLEN16(p) : STRLEN8(p))
#define PCRE_ASSIGN_JIT_STACK(extra, callback, userdata) \
if (pcre_mode == PCRE32_MODE) \
PCRE_ASSIGN_JIT_STACK32(extra, callback, userdata); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_ASSIGN_JIT_STACK16(extra, callback, userdata); \
else \
PCRE_ASSIGN_JIT_STACK8(extra, callback, userdata)
#define PCRE_COMPILE(re, pat, options, error, erroffset, tables) \
if (pcre_mode == PCRE32_MODE) \
PCRE_COMPILE32(re, pat, options, error, erroffset, tables); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_COMPILE16(re, pat, options, error, erroffset, tables); \
else \
PCRE_COMPILE8(re, pat, options, error, erroffset, tables)
#define PCRE_CONFIG pcre_config
#define PCRE_COPY_NAMED_SUBSTRING(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size) \
if (pcre_mode == PCRE32_MODE) \
PCRE_COPY_NAMED_SUBSTRING32(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_COPY_NAMED_SUBSTRING16(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size); \
else \
PCRE_COPY_NAMED_SUBSTRING8(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size)
#define PCRE_COPY_SUBSTRING(rc, bptr, offsets, count, i, cbuffer, size) \
if (pcre_mode == PCRE32_MODE) \
PCRE_COPY_SUBSTRING32(rc, bptr, offsets, count, i, cbuffer, size); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_COPY_SUBSTRING16(rc, bptr, offsets, count, i, cbuffer, size); \
else \
PCRE_COPY_SUBSTRING8(rc, bptr, offsets, count, i, cbuffer, size)
#define PCRE_DFA_EXEC(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace) \
if (pcre_mode == PCRE32_MODE) \
PCRE_DFA_EXEC32(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_DFA_EXEC16(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace); \
else \
PCRE_DFA_EXEC8(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace)
#define PCRE_EXEC(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets) \
if (pcre_mode == PCRE32_MODE) \
PCRE_EXEC32(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_EXEC16(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets); \
else \
PCRE_EXEC8(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets)
#define PCRE_FREE_STUDY(extra) \
if (pcre_mode == PCRE32_MODE) \
PCRE_FREE_STUDY32(extra); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_FREE_STUDY16(extra); \
else \
PCRE_FREE_STUDY8(extra)
#define PCRE_FREE_SUBSTRING(substring) \
if (pcre_mode == PCRE32_MODE) \
PCRE_FREE_SUBSTRING32(substring); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_FREE_SUBSTRING16(substring); \
else \
PCRE_FREE_SUBSTRING8(substring)
#define PCRE_FREE_SUBSTRING_LIST(listptr) \
if (pcre_mode == PCRE32_MODE) \
PCRE_FREE_SUBSTRING_LIST32(listptr); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_FREE_SUBSTRING_LIST16(listptr); \
else \
PCRE_FREE_SUBSTRING_LIST8(listptr)
#define PCRE_GET_NAMED_SUBSTRING(rc, re, bptr, offsets, count, \
getnamesptr, subsptr) \
if (pcre_mode == PCRE32_MODE) \
PCRE_GET_NAMED_SUBSTRING32(rc, re, bptr, offsets, count, \
getnamesptr, subsptr); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_GET_NAMED_SUBSTRING16(rc, re, bptr, offsets, count, \
getnamesptr, subsptr); \
else \
PCRE_GET_NAMED_SUBSTRING8(rc, re, bptr, offsets, count, \
getnamesptr, subsptr)
#define PCRE_GET_STRINGNUMBER(n, rc, ptr) \
if (pcre_mode == PCRE32_MODE) \
PCRE_GET_STRINGNUMBER32(n, rc, ptr); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_GET_STRINGNUMBER16(n, rc, ptr); \
else \
PCRE_GET_STRINGNUMBER8(n, rc, ptr)
#define PCRE_GET_SUBSTRING(rc, bptr, use_offsets, count, i, subsptr) \
if (pcre_mode == PCRE32_MODE) \
PCRE_GET_SUBSTRING32(rc, bptr, use_offsets, count, i, subsptr); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_GET_SUBSTRING16(rc, bptr, use_offsets, count, i, subsptr); \
else \
PCRE_GET_SUBSTRING8(rc, bptr, use_offsets, count, i, subsptr)
#define PCRE_GET_SUBSTRING_LIST(rc, bptr, offsets, count, listptr) \
if (pcre_mode == PCRE32_MODE) \
PCRE_GET_SUBSTRING_LIST32(rc, bptr, offsets, count, listptr); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_GET_SUBSTRING_LIST16(rc, bptr, offsets, count, listptr); \
else \
PCRE_GET_SUBSTRING_LIST8(rc, bptr, offsets, count, listptr)
#define PCRE_JIT_STACK_ALLOC(startsize, maxsize) \
(pcre_mode == PCRE32_MODE ? \
PCRE_JIT_STACK_ALLOC32(startsize, maxsize) \
: pcre_mode == PCRE16_MODE ? \
PCRE_JIT_STACK_ALLOC16(startsize, maxsize) \
: PCRE_JIT_STACK_ALLOC8(startsize, maxsize))
#define PCRE_JIT_STACK_FREE(stack) \
if (pcre_mode == PCRE32_MODE) \
PCRE_JIT_STACK_FREE32(stack); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_JIT_STACK_FREE16(stack); \
else \
PCRE_JIT_STACK_FREE8(stack)
#define PCRE_MAKETABLES \
(pcre_mode == PCRE32_MODE ? pcre32_maketables() : pcre_mode == PCRE16_MODE ? pcre16_maketables() : pcre_maketables())
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER(rc, re, extra, tables) \
if (pcre_mode == PCRE32_MODE) \
PCRE_PATTERN_TO_HOST_BYTE_ORDER32(rc, re, extra, tables); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_PATTERN_TO_HOST_BYTE_ORDER16(rc, re, extra, tables); \
else \
PCRE_PATTERN_TO_HOST_BYTE_ORDER8(rc, re, extra, tables)
#define PCRE_PRINTINT(re, outfile, debug_lengths) \
if (pcre_mode == PCRE32_MODE) \
PCRE_PRINTINT32(re, outfile, debug_lengths); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_PRINTINT16(re, outfile, debug_lengths); \
else \
PCRE_PRINTINT8(re, outfile, debug_lengths)
#define PCRE_STUDY(extra, re, options, error) \
if (pcre_mode == PCRE32_MODE) \
PCRE_STUDY32(extra, re, options, error); \
else if (pcre_mode == PCRE16_MODE) \
PCRE_STUDY16(extra, re, options, error); \
else \
PCRE_STUDY8(extra, re, options, error)
/* ----- Two out of three modes are supported ----- */
#else
/* We can use some macro trickery to make a single set of definitions work in
the three different cases. */
/* ----- 32-bit and 16-bit but not 8-bit supported ----- */
#if defined(SUPPORT_PCRE32) && defined(SUPPORT_PCRE16)
#define BITONE 32
#define BITTWO 16
/* ----- 32-bit and 8-bit but not 16-bit supported ----- */
#elif defined(SUPPORT_PCRE32) && defined(SUPPORT_PCRE8)
#define BITONE 32
#define BITTWO 8
/* ----- 16-bit and 8-bit but not 32-bit supported ----- */
#else
#define BITONE 16
#define BITTWO 8
#endif
#define glue(a,b) a##b
#define G(a,b) glue(a,b)
/* ----- Common macros for two-mode cases ----- */
#define PCHARS(lv, p, offset, len, f) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCHARS,BITONE)(lv, p, offset, len, f); \
else \
G(PCHARS,BITTWO)(lv, p, offset, len, f)
#define PCHARSV(p, offset, len, f) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCHARSV,BITONE)(p, offset, len, f); \
else \
G(PCHARSV,BITTWO)(p, offset, len, f)
#define READ_CAPTURE_NAME(p, cn8, cn16, cn32, re) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(READ_CAPTURE_NAME,BITONE)(p, cn8, cn16, cn32, re); \
else \
G(READ_CAPTURE_NAME,BITTWO)(p, cn8, cn16, cn32, re)
#define SET_PCRE_CALLOUT(callout) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(SET_PCRE_CALLOUT,BITONE)(callout); \
else \
G(SET_PCRE_CALLOUT,BITTWO)(callout)
#define SET_PCRE_STACK_GUARD(stack_guard) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(SET_PCRE_STACK_GUARD,BITONE)(stack_guard); \
else \
G(SET_PCRE_STACK_GUARD,BITTWO)(stack_guard)
#define STRLEN(p) ((pcre_mode == G(G(PCRE,BITONE),_MODE)) ? \
G(STRLEN,BITONE)(p) : G(STRLEN,BITTWO)(p))
#define PCRE_ASSIGN_JIT_STACK(extra, callback, userdata) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_ASSIGN_JIT_STACK,BITONE)(extra, callback, userdata); \
else \
G(PCRE_ASSIGN_JIT_STACK,BITTWO)(extra, callback, userdata)
#define PCRE_COMPILE(re, pat, options, error, erroffset, tables) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_COMPILE,BITONE)(re, pat, options, error, erroffset, tables); \
else \
G(PCRE_COMPILE,BITTWO)(re, pat, options, error, erroffset, tables)
#define PCRE_CONFIG G(G(pcre,BITONE),_config)
#define PCRE_COPY_NAMED_SUBSTRING(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_COPY_NAMED_SUBSTRING,BITONE)(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size); \
else \
G(PCRE_COPY_NAMED_SUBSTRING,BITTWO)(rc, re, bptr, offsets, count, \
namesptr, cbuffer, size)
#define PCRE_COPY_SUBSTRING(rc, bptr, offsets, count, i, cbuffer, size) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_COPY_SUBSTRING,BITONE)(rc, bptr, offsets, count, i, cbuffer, size); \
else \
G(PCRE_COPY_SUBSTRING,BITTWO)(rc, bptr, offsets, count, i, cbuffer, size)
#define PCRE_DFA_EXEC(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_DFA_EXEC,BITONE)(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace); \
else \
G(PCRE_DFA_EXEC,BITTWO)(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets, workspace, size_workspace)
#define PCRE_EXEC(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_EXEC,BITONE)(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets); \
else \
G(PCRE_EXEC,BITTWO)(count, re, extra, bptr, len, start_offset, options, \
offsets, size_offsets)
#define PCRE_FREE_STUDY(extra) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_FREE_STUDY,BITONE)(extra); \
else \
G(PCRE_FREE_STUDY,BITTWO)(extra)
#define PCRE_FREE_SUBSTRING(substring) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_FREE_SUBSTRING,BITONE)(substring); \
else \
G(PCRE_FREE_SUBSTRING,BITTWO)(substring)
#define PCRE_FREE_SUBSTRING_LIST(listptr) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_FREE_SUBSTRING_LIST,BITONE)(listptr); \
else \
G(PCRE_FREE_SUBSTRING_LIST,BITTWO)(listptr)
#define PCRE_GET_NAMED_SUBSTRING(rc, re, bptr, offsets, count, \
getnamesptr, subsptr) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_GET_NAMED_SUBSTRING,BITONE)(rc, re, bptr, offsets, count, \
getnamesptr, subsptr); \
else \
G(PCRE_GET_NAMED_SUBSTRING,BITTWO)(rc, re, bptr, offsets, count, \
getnamesptr, subsptr)
#define PCRE_GET_STRINGNUMBER(n, rc, ptr) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_GET_STRINGNUMBER,BITONE)(n, rc, ptr); \
else \
G(PCRE_GET_STRINGNUMBER,BITTWO)(n, rc, ptr)
#define PCRE_GET_SUBSTRING(rc, bptr, use_offsets, count, i, subsptr) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_GET_SUBSTRING,BITONE)(rc, bptr, use_offsets, count, i, subsptr); \
else \
G(PCRE_GET_SUBSTRING,BITTWO)(rc, bptr, use_offsets, count, i, subsptr)
#define PCRE_GET_SUBSTRING_LIST(rc, bptr, offsets, count, listptr) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_GET_SUBSTRING_LIST,BITONE)(rc, bptr, offsets, count, listptr); \
else \
G(PCRE_GET_SUBSTRING_LIST,BITTWO)(rc, bptr, offsets, count, listptr)
#define PCRE_JIT_STACK_ALLOC(startsize, maxsize) \
(pcre_mode == G(G(PCRE,BITONE),_MODE)) ? \
G(PCRE_JIT_STACK_ALLOC,BITONE)(startsize, maxsize) \
: G(PCRE_JIT_STACK_ALLOC,BITTWO)(startsize, maxsize)
#define PCRE_JIT_STACK_FREE(stack) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_JIT_STACK_FREE,BITONE)(stack); \
else \
G(PCRE_JIT_STACK_FREE,BITTWO)(stack)
#define PCRE_MAKETABLES \
(pcre_mode == G(G(PCRE,BITONE),_MODE)) ? \
G(G(pcre,BITONE),_maketables)() : G(G(pcre,BITTWO),_maketables)()
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER(rc, re, extra, tables) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_PATTERN_TO_HOST_BYTE_ORDER,BITONE)(rc, re, extra, tables); \
else \
G(PCRE_PATTERN_TO_HOST_BYTE_ORDER,BITTWO)(rc, re, extra, tables)
#define PCRE_PRINTINT(re, outfile, debug_lengths) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_PRINTINT,BITONE)(re, outfile, debug_lengths); \
else \
G(PCRE_PRINTINT,BITTWO)(re, outfile, debug_lengths)
#define PCRE_STUDY(extra, re, options, error) \
if (pcre_mode == G(G(PCRE,BITONE),_MODE)) \
G(PCRE_STUDY,BITONE)(extra, re, options, error); \
else \
G(PCRE_STUDY,BITTWO)(extra, re, options, error)
#endif /* Two out of three modes */
/* ----- End of cases where more than one mode is supported ----- */
/* ----- Only 8-bit mode is supported ----- */
#elif defined SUPPORT_PCRE8
#define CHAR_SIZE 1
#define PCHARS PCHARS8
#define PCHARSV PCHARSV8
#define READ_CAPTURE_NAME READ_CAPTURE_NAME8
#define SET_PCRE_CALLOUT SET_PCRE_CALLOUT8
#define SET_PCRE_STACK_GUARD SET_PCRE_STACK_GUARD8
#define STRLEN STRLEN8
#define PCRE_ASSIGN_JIT_STACK PCRE_ASSIGN_JIT_STACK8
#define PCRE_COMPILE PCRE_COMPILE8
#define PCRE_CONFIG pcre_config
#define PCRE_COPY_NAMED_SUBSTRING PCRE_COPY_NAMED_SUBSTRING8
#define PCRE_COPY_SUBSTRING PCRE_COPY_SUBSTRING8
#define PCRE_DFA_EXEC PCRE_DFA_EXEC8
#define PCRE_EXEC PCRE_EXEC8
#define PCRE_FREE_STUDY PCRE_FREE_STUDY8
#define PCRE_FREE_SUBSTRING PCRE_FREE_SUBSTRING8
#define PCRE_FREE_SUBSTRING_LIST PCRE_FREE_SUBSTRING_LIST8
#define PCRE_GET_NAMED_SUBSTRING PCRE_GET_NAMED_SUBSTRING8
#define PCRE_GET_STRINGNUMBER PCRE_GET_STRINGNUMBER8
#define PCRE_GET_SUBSTRING PCRE_GET_SUBSTRING8
#define PCRE_GET_SUBSTRING_LIST PCRE_GET_SUBSTRING_LIST8
#define PCRE_JIT_STACK_ALLOC PCRE_JIT_STACK_ALLOC8
#define PCRE_JIT_STACK_FREE PCRE_JIT_STACK_FREE8
#define PCRE_MAKETABLES pcre_maketables()
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER PCRE_PATTERN_TO_HOST_BYTE_ORDER8
#define PCRE_PRINTINT PCRE_PRINTINT8
#define PCRE_STUDY PCRE_STUDY8
/* ----- Only 16-bit mode is supported ----- */
#elif defined SUPPORT_PCRE16
#define CHAR_SIZE 2
#define PCHARS PCHARS16
#define PCHARSV PCHARSV16
#define READ_CAPTURE_NAME READ_CAPTURE_NAME16
#define SET_PCRE_CALLOUT SET_PCRE_CALLOUT16
#define SET_PCRE_STACK_GUARD SET_PCRE_STACK_GUARD16
#define STRLEN STRLEN16
#define PCRE_ASSIGN_JIT_STACK PCRE_ASSIGN_JIT_STACK16
#define PCRE_COMPILE PCRE_COMPILE16
#define PCRE_CONFIG pcre16_config
#define PCRE_COPY_NAMED_SUBSTRING PCRE_COPY_NAMED_SUBSTRING16
#define PCRE_COPY_SUBSTRING PCRE_COPY_SUBSTRING16
#define PCRE_DFA_EXEC PCRE_DFA_EXEC16
#define PCRE_EXEC PCRE_EXEC16
#define PCRE_FREE_STUDY PCRE_FREE_STUDY16
#define PCRE_FREE_SUBSTRING PCRE_FREE_SUBSTRING16
#define PCRE_FREE_SUBSTRING_LIST PCRE_FREE_SUBSTRING_LIST16
#define PCRE_GET_NAMED_SUBSTRING PCRE_GET_NAMED_SUBSTRING16
#define PCRE_GET_STRINGNUMBER PCRE_GET_STRINGNUMBER16
#define PCRE_GET_SUBSTRING PCRE_GET_SUBSTRING16
#define PCRE_GET_SUBSTRING_LIST PCRE_GET_SUBSTRING_LIST16
#define PCRE_JIT_STACK_ALLOC PCRE_JIT_STACK_ALLOC16
#define PCRE_JIT_STACK_FREE PCRE_JIT_STACK_FREE16
#define PCRE_MAKETABLES pcre16_maketables()
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER PCRE_PATTERN_TO_HOST_BYTE_ORDER16
#define PCRE_PRINTINT PCRE_PRINTINT16
#define PCRE_STUDY PCRE_STUDY16
/* ----- Only 32-bit mode is supported ----- */
#elif defined SUPPORT_PCRE32
#define CHAR_SIZE 4
#define PCHARS PCHARS32
#define PCHARSV PCHARSV32
#define READ_CAPTURE_NAME READ_CAPTURE_NAME32
#define SET_PCRE_CALLOUT SET_PCRE_CALLOUT32
#define SET_PCRE_STACK_GUARD SET_PCRE_STACK_GUARD32
#define STRLEN STRLEN32
#define PCRE_ASSIGN_JIT_STACK PCRE_ASSIGN_JIT_STACK32
#define PCRE_COMPILE PCRE_COMPILE32
#define PCRE_CONFIG pcre32_config
#define PCRE_COPY_NAMED_SUBSTRING PCRE_COPY_NAMED_SUBSTRING32
#define PCRE_COPY_SUBSTRING PCRE_COPY_SUBSTRING32
#define PCRE_DFA_EXEC PCRE_DFA_EXEC32
#define PCRE_EXEC PCRE_EXEC32
#define PCRE_FREE_STUDY PCRE_FREE_STUDY32
#define PCRE_FREE_SUBSTRING PCRE_FREE_SUBSTRING32
#define PCRE_FREE_SUBSTRING_LIST PCRE_FREE_SUBSTRING_LIST32
#define PCRE_GET_NAMED_SUBSTRING PCRE_GET_NAMED_SUBSTRING32
#define PCRE_GET_STRINGNUMBER PCRE_GET_STRINGNUMBER32
#define PCRE_GET_SUBSTRING PCRE_GET_SUBSTRING32
#define PCRE_GET_SUBSTRING_LIST PCRE_GET_SUBSTRING_LIST32
#define PCRE_JIT_STACK_ALLOC PCRE_JIT_STACK_ALLOC32
#define PCRE_JIT_STACK_FREE PCRE_JIT_STACK_FREE32
#define PCRE_MAKETABLES pcre32_maketables()
#define PCRE_PATTERN_TO_HOST_BYTE_ORDER PCRE_PATTERN_TO_HOST_BYTE_ORDER32
#define PCRE_PRINTINT PCRE_PRINTINT32
#define PCRE_STUDY PCRE_STUDY32
#endif
/* ----- End of mode-specific function call macros ----- */
/* Other parameters */
#ifndef CLOCKS_PER_SEC
#ifdef CLK_TCK
#define CLOCKS_PER_SEC CLK_TCK
#else
#define CLOCKS_PER_SEC 100
#endif
#endif
#if !defined NODFA
#define DFA_WS_DIMENSION 1000
#endif
/* This is the default loop count for timing. */
#define LOOPREPEAT 500000
/* Static variables */
static FILE *outfile;
static int log_store = 0;
static int callout_count;
static int callout_extra;
static int callout_fail_count;
static int callout_fail_id;
static int debug_lengths;
static int first_callout;
static int jit_was_used;
static int locale_set = 0;
static int show_malloc;
static int stack_guard_return;
static int use_utf;
static const unsigned char *last_callout_mark = NULL;
/* The buffers grow automatically if very long input lines are encountered. */
static int buffer_size = 50000;
static pcre_uint8 *buffer = NULL;
static pcre_uint8 *pbuffer = NULL;
/* Just as a safety check, make sure that COMPILE_PCRE[16|32] are *not* set. */
#ifdef COMPILE_PCRE16
#error COMPILE_PCRE16 must not be set when compiling pcretest.c
#endif
#ifdef COMPILE_PCRE32
#error COMPILE_PCRE32 must not be set when compiling pcretest.c
#endif
/* We need buffers for building 16/32-bit strings, and the tables of operator
lengths that are used for 16/32-bit compiling, in order to swap bytes in a
pattern for saving/reloading testing. Luckily, the data for these tables is
defined as a macro. However, we must ensure that LINK_SIZE and IMM2_SIZE (which
are used in the tables) are adjusted appropriately for the 16/32-bit world.
LINK_SIZE is also used later in this program. */
#ifdef SUPPORT_PCRE16
#undef IMM2_SIZE
#define IMM2_SIZE 1
#if LINK_SIZE == 2
#undef LINK_SIZE
#define LINK_SIZE 1
#elif LINK_SIZE == 3 || LINK_SIZE == 4
#undef LINK_SIZE
#define LINK_SIZE 2
#else
#error LINK_SIZE must be either 2, 3, or 4
#endif
static int buffer16_size = 0;
static pcre_uint16 *buffer16 = NULL;
static const pcre_uint16 OP_lengths16[] = { OP_LENGTHS };
#endif /* SUPPORT_PCRE16 */
#ifdef SUPPORT_PCRE32
#undef IMM2_SIZE
#define IMM2_SIZE 1
#undef LINK_SIZE
#define LINK_SIZE 1
static int buffer32_size = 0;
static pcre_uint32 *buffer32 = NULL;
static const pcre_uint32 OP_lengths32[] = { OP_LENGTHS };
#endif /* SUPPORT_PCRE32 */
/* If we have 8-bit support, default to it; if there is also 16-or 32-bit
support, it can be changed by an option. If there is no 8-bit support, there
must be 16-or 32-bit support, so default it to 1. */
#if defined SUPPORT_PCRE8
static int pcre_mode = PCRE8_MODE;
#elif defined SUPPORT_PCRE16
static int pcre_mode = PCRE16_MODE;
#elif defined SUPPORT_PCRE32
static int pcre_mode = PCRE32_MODE;
#endif
/* JIT study options for -s+n and /S+n where '1' <= n <= '7'. */
static int jit_study_bits[] =
{
PCRE_STUDY_JIT_COMPILE,
PCRE_STUDY_JIT_PARTIAL_SOFT_COMPILE,
PCRE_STUDY_JIT_COMPILE + PCRE_STUDY_JIT_PARTIAL_SOFT_COMPILE,
PCRE_STUDY_JIT_PARTIAL_HARD_COMPILE,
PCRE_STUDY_JIT_COMPILE + PCRE_STUDY_JIT_PARTIAL_HARD_COMPILE,
PCRE_STUDY_JIT_PARTIAL_SOFT_COMPILE + PCRE_STUDY_JIT_PARTIAL_HARD_COMPILE,
PCRE_STUDY_JIT_COMPILE + PCRE_STUDY_JIT_PARTIAL_SOFT_COMPILE +
PCRE_STUDY_JIT_PARTIAL_HARD_COMPILE
};
#define PCRE_STUDY_ALLJIT (PCRE_STUDY_JIT_COMPILE | \
PCRE_STUDY_JIT_PARTIAL_SOFT_COMPILE | PCRE_STUDY_JIT_PARTIAL_HARD_COMPILE)
/* Textual explanations for runtime error codes */
static const char *errtexts[] = {
NULL, /* 0 is no error */
NULL, /* NOMATCH is handled specially */
"NULL argument passed",
"bad option value",
"magic number missing",
"unknown opcode - pattern overwritten?",
"no more memory",
NULL, /* never returned by pcre_exec() or pcre_dfa_exec() */
"match limit exceeded",
"callout error code",
NULL, /* BADUTF8/16 is handled specially */
NULL, /* BADUTF8/16 offset is handled specially */
NULL, /* PARTIAL is handled specially */
"not used - internal error",
"internal error - pattern overwritten?",
"bad count value",
"item unsupported for DFA matching",
"backreference condition or recursion test not supported for DFA matching",
"match limit not supported for DFA matching",
"workspace size exceeded in DFA matching",
"too much recursion for DFA matching",
"recursion limit exceeded",
"not used - internal error",
"invalid combination of newline options",
"bad offset value",
NULL, /* SHORTUTF8/16 is handled specially */
"nested recursion at the same subject position",
"JIT stack limit reached",
"pattern compiled in wrong mode: 8-bit/16-bit error",
"pattern compiled with other endianness",
"invalid data in workspace for DFA restart",
"bad JIT option",
"bad length"
};
/*************************************************
* Alternate character tables *
*************************************************/
/* By default, the "tables" pointer when calling PCRE is set to NULL, thereby
using the default tables of the library. However, the T option can be used to
select alternate sets of tables, for different kinds of testing. Note also that
the L (locale) option also adjusts the tables. */
/* This is the set of tables distributed as default with PCRE. It recognizes
only ASCII characters. */
static const pcre_uint8 tables0[] = {
/* This table is a lower casing table. */
0, 1, 2, 3, 4, 5, 6, 7,
8, 9, 10, 11, 12, 13, 14, 15,
16, 17, 18, 19, 20, 21, 22, 23,
24, 25, 26, 27, 28, 29, 30, 31,
32, 33, 34, 35, 36, 37, 38, 39,
40, 41, 42, 43, 44, 45, 46, 47,
48, 49, 50, 51, 52, 53, 54, 55,
56, 57, 58, 59, 60, 61, 62, 63,
64, 97, 98, 99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122, 91, 92, 93, 94, 95,
96, 97, 98, 99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122,123,124,125,126,127,
128,129,130,131,132,133,134,135,
136,137,138,139,140,141,142,143,
144,145,146,147,148,149,150,151,
152,153,154,155,156,157,158,159,
160,161,162,163,164,165,166,167,
168,169,170,171,172,173,174,175,
176,177,178,179,180,181,182,183,
184,185,186,187,188,189,190,191,
192,193,194,195,196,197,198,199,
200,201,202,203,204,205,206,207,
208,209,210,211,212,213,214,215,
216,217,218,219,220,221,222,223,
224,225,226,227,228,229,230,231,
232,233,234,235,236,237,238,239,
240,241,242,243,244,245,246,247,
248,249,250,251,252,253,254,255,
/* This table is a case flipping table. */
0, 1, 2, 3, 4, 5, 6, 7,
8, 9, 10, 11, 12, 13, 14, 15,
16, 17, 18, 19, 20, 21, 22, 23,
24, 25, 26, 27, 28, 29, 30, 31,
32, 33, 34, 35, 36, 37, 38, 39,
40, 41, 42, 43, 44, 45, 46, 47,
48, 49, 50, 51, 52, 53, 54, 55,
56, 57, 58, 59, 60, 61, 62, 63,
64, 97, 98, 99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122, 91, 92, 93, 94, 95,
96, 65, 66, 67, 68, 69, 70, 71,
72, 73, 74, 75, 76, 77, 78, 79,
80, 81, 82, 83, 84, 85, 86, 87,
88, 89, 90,123,124,125,126,127,
128,129,130,131,132,133,134,135,
136,137,138,139,140,141,142,143,
144,145,146,147,148,149,150,151,
152,153,154,155,156,157,158,159,
160,161,162,163,164,165,166,167,
168,169,170,171,172,173,174,175,
176,177,178,179,180,181,182,183,
184,185,186,187,188,189,190,191,
192,193,194,195,196,197,198,199,
200,201,202,203,204,205,206,207,
208,209,210,211,212,213,214,215,
216,217,218,219,220,221,222,223,
224,225,226,227,228,229,230,231,
232,233,234,235,236,237,238,239,
240,241,242,243,244,245,246,247,
248,249,250,251,252,253,254,255,
/* This table contains bit maps for various character classes. Each map is 32
bytes long and the bits run from the least significant end of each byte. The
classes that have their own maps are: space, xdigit, digit, upper, lower, word,
graph, print, punct, and cntrl. Other classes are built from combinations. */
0x00,0x3e,0x00,0x00,0x01,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0xff,0x03,
0x7e,0x00,0x00,0x00,0x7e,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0xff,0x03,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0xfe,0xff,0xff,0x07,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0xfe,0xff,0xff,0x07,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0xff,0x03,
0xfe,0xff,0xff,0x87,0xfe,0xff,0xff,0x07,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0xfe,0xff,0xff,0xff,
0xff,0xff,0xff,0xff,0xff,0xff,0xff,0x7f,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0xff,0xff,0xff,0xff,
0xff,0xff,0xff,0xff,0xff,0xff,0xff,0x7f,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0xfe,0xff,0x00,0xfc,
0x01,0x00,0x00,0xf8,0x01,0x00,0x00,0x78,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0xff,0xff,0xff,0xff,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x80,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00,
/* This table identifies various classes of character by individual bits:
0x01 white space character
0x02 letter
0x04 decimal digit
0x08 hexadecimal digit
0x10 alphanumeric or '_'
0x80 regular expression metacharacter or binary zero
*/
0x80,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 0- 7 */
0x00,0x01,0x01,0x01,0x01,0x01,0x00,0x00, /* 8- 15 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 16- 23 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 24- 31 */
0x01,0x00,0x00,0x00,0x80,0x00,0x00,0x00, /* - ' */
0x80,0x80,0x80,0x80,0x00,0x00,0x80,0x00, /* ( - / */
0x1c,0x1c,0x1c,0x1c,0x1c,0x1c,0x1c,0x1c, /* 0 - 7 */
0x1c,0x1c,0x00,0x00,0x00,0x00,0x00,0x80, /* 8 - ? */
0x00,0x1a,0x1a,0x1a,0x1a,0x1a,0x1a,0x12, /* @ - G */
0x12,0x12,0x12,0x12,0x12,0x12,0x12,0x12, /* H - O */
0x12,0x12,0x12,0x12,0x12,0x12,0x12,0x12, /* P - W */
0x12,0x12,0x12,0x80,0x80,0x00,0x80,0x10, /* X - _ */
0x00,0x1a,0x1a,0x1a,0x1a,0x1a,0x1a,0x12, /* ` - g */
0x12,0x12,0x12,0x12,0x12,0x12,0x12,0x12, /* h - o */
0x12,0x12,0x12,0x12,0x12,0x12,0x12,0x12, /* p - w */
0x12,0x12,0x12,0x80,0x80,0x00,0x00,0x00, /* x -127 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 128-135 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 136-143 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 144-151 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 152-159 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 160-167 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 168-175 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 176-183 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 184-191 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 192-199 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 200-207 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 208-215 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 216-223 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 224-231 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 232-239 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00, /* 240-247 */
0x00,0x00,0x00,0x00,0x00,0x00,0x00,0x00};/* 248-255 */
/* This is a set of tables that came originally from a Windows user. It seems
to be at least an approximation of ISO 8859. In particular, there are
characters greater than 128 that are marked as spaces, letters, etc. */
static const pcre_uint8 tables1[] = {
0,1,2,3,4,5,6,7,
8,9,10,11,12,13,14,15,
16,17,18,19,20,21,22,23,
24,25,26,27,28,29,30,31,
32,33,34,35,36,37,38,39,
40,41,42,43,44,45,46,47,
48,49,50,51,52,53,54,55,
56,57,58,59,60,61,62,63,
64,97,98,99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122,91,92,93,94,95,
96,97,98,99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122,123,124,125,126,127,
128,129,130,131,132,133,134,135,
136,137,138,139,140,141,142,143,
144,145,146,147,148,149,150,151,
152,153,154,155,156,157,158,159,
160,161,162,163,164,165,166,167,
168,169,170,171,172,173,174,175,
176,177,178,179,180,181,182,183,
184,185,186,187,188,189,190,191,
224,225,226,227,228,229,230,231,
232,233,234,235,236,237,238,239,
240,241,242,243,244,245,246,215,
248,249,250,251,252,253,254,223,
224,225,226,227,228,229,230,231,
232,233,234,235,236,237,238,239,
240,241,242,243,244,245,246,247,
248,249,250,251,252,253,254,255,
0,1,2,3,4,5,6,7,
8,9,10,11,12,13,14,15,
16,17,18,19,20,21,22,23,
24,25,26,27,28,29,30,31,
32,33,34,35,36,37,38,39,
40,41,42,43,44,45,46,47,
48,49,50,51,52,53,54,55,
56,57,58,59,60,61,62,63,
64,97,98,99,100,101,102,103,
104,105,106,107,108,109,110,111,
112,113,114,115,116,117,118,119,
120,121,122,91,92,93,94,95,
96,65,66,67,68,69,70,71,
72,73,74,75,76,77,78,79,
80,81,82,83,84,85,86,87,
88,89,90,123,124,125,126,127,
128,129,130,131,132,133,134,135,
136,137,138,139,140,141,142,143,
144,145,146,147,148,149,150,151,
152,153,154,155,156,157,158,159,
160,161,162,163,164,165,166,167,
168,169,170,171,172,173,174,175,
176,177,178,179,180,181,182,183,
184,185,186,187,188,189,190,191,
224,225,226,227,228,229,230,231,
232,233,234,235,236,237,238,239,
240,241,242,243,244,245,246,215,
248,249,250,251,252,253,254,223,
192,193,194,195,196,197,198,199,
200,201,202,203,204,205,206,207,
208,209,210,211,212,213,214,247,
216,217,218,219,220,221,222,255,
0,62,0,0,1,0,0,0,
0,0,0,0,0,0,0,0,
32,0,0,0,1,0,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,255,3,
126,0,0,0,126,0,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,255,3,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,12,2,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,
254,255,255,7,0,0,0,0,
0,0,0,0,0,0,0,0,
255,255,127,127,0,0,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,254,255,255,7,
0,0,0,0,0,4,32,4,
0,0,0,128,255,255,127,255,
0,0,0,0,0,0,255,3,
254,255,255,135,254,255,255,7,
0,0,0,0,0,4,44,6,
255,255,127,255,255,255,127,255,
0,0,0,0,254,255,255,255,
255,255,255,255,255,255,255,127,
0,0,0,0,254,255,255,255,
255,255,255,255,255,255,255,255,
0,2,0,0,255,255,255,255,
255,255,255,255,255,255,255,127,
0,0,0,0,255,255,255,255,
255,255,255,255,255,255,255,255,
0,0,0,0,254,255,0,252,
1,0,0,248,1,0,0,120,
0,0,0,0,254,255,255,255,
0,0,128,0,0,0,128,0,
255,255,255,255,0,0,0,0,
0,0,0,0,0,0,0,128,
255,255,255,255,0,0,0,0,
0,0,0,0,0,0,0,0,
128,0,0,0,0,0,0,0,
0,1,1,0,1,1,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,
1,0,0,0,128,0,0,0,
128,128,128,128,0,0,128,0,
28,28,28,28,28,28,28,28,
28,28,0,0,0,0,0,128,
0,26,26,26,26,26,26,18,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,18,
18,18,18,128,128,0,128,16,
0,26,26,26,26,26,26,18,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,18,
18,18,18,128,128,0,0,0,
0,0,0,0,0,1,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,
0,0,0,0,0,0,0,0,
1,0,0,0,0,0,0,0,
0,0,18,0,0,0,0,0,
0,0,20,20,0,18,0,0,
0,20,18,0,0,0,0,0,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,0,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,18,
18,18,18,18,18,18,18,0,
18,18,18,18,18,18,18,18
};
#ifndef HAVE_STRERROR
/*************************************************
* Provide strerror() for non-ANSI libraries *
*************************************************/
/* Some old-fashioned systems still around (e.g. SunOS4) don't have strerror()
in their libraries, but can provide the same facility by this simple
alternative function. */
extern int sys_nerr;
extern char *sys_errlist[];
char *
strerror(int n)
{
if (n < 0 || n >= sys_nerr) return "unknown error number";
return sys_errlist[n];
}
#endif /* HAVE_STRERROR */
/*************************************************
* Print newline configuration *
*************************************************/
/*
Arguments:
rc the return code from PCRE_CONFIG_NEWLINE
isc TRUE if called from "-C newline"
Returns: nothing
*/
static void
print_newline_config(int rc, BOOL isc)
{
const char *s = NULL;
if (!isc) printf(" Newline sequence is ");
switch(rc)
{
case CHAR_CR: s = "CR"; break;
case CHAR_LF: s = "LF"; break;
case (CHAR_CR<<8 | CHAR_LF): s = "CRLF"; break;
case -1: s = "ANY"; break;
case -2: s = "ANYCRLF"; break;
default:
printf("a non-standard value: 0x%04x\n", rc);
return;
}
printf("%s\n", s);
}
/*************************************************
* JIT memory callback *
*************************************************/
static pcre_jit_stack* jit_callback(void *arg)
{
jit_was_used = TRUE;
return (pcre_jit_stack *)arg;
}
#if !defined NOUTF || defined SUPPORT_PCRE16 || defined SUPPORT_PCRE32
/*************************************************
* Convert UTF-8 string to value *
*************************************************/
/* This function takes one or more bytes that represents a UTF-8 character,
and returns the value of the character.
Argument:
utf8bytes a pointer to the byte vector
vptr a pointer to an int to receive the value
Returns: > 0 => the number of bytes consumed
-6 to 0 => malformed UTF-8 character at offset = (-return)
*/
static int
utf82ord(pcre_uint8 *utf8bytes, pcre_uint32 *vptr)
{
pcre_uint32 c = *utf8bytes++;
pcre_uint32 d = c;
int i, j, s;
for (i = -1; i < 6; i++) /* i is number of additional bytes */
{
if ((d & 0x80) == 0) break;
d <<= 1;
}
if (i == -1) { *vptr = c; return 1; } /* ascii character */
if (i == 0 || i == 6) return 0; /* invalid UTF-8 */
/* i now has a value in the range 1-5 */
s = 6*i;
d = (c & utf8_table3[i]) << s;
for (j = 0; j < i; j++)
{
c = *utf8bytes++;
if ((c & 0xc0) != 0x80) return -(j+1);
s -= 6;
d |= (c & 0x3f) << s;
}
/* Check that encoding was the correct unique one */
for (j = 0; j < utf8_table1_size; j++)
if (d <= (pcre_uint32)utf8_table1[j]) break;
if (j != i) return -(i+1);
/* Valid value */
*vptr = d;
return i+1;
}
#endif /* NOUTF || SUPPORT_PCRE16 */
#if defined SUPPORT_PCRE8 && !defined NOUTF
/*************************************************
* Convert character value to UTF-8 *
*************************************************/
/* This function takes an integer value in the range 0 - 0x7fffffff
and encodes it as a UTF-8 character in 0 to 6 bytes.
Arguments:
cvalue the character value
utf8bytes pointer to buffer for result - at least 6 bytes long
Returns: number of characters placed in the buffer
*/
static int
ord2utf8(pcre_uint32 cvalue, pcre_uint8 *utf8bytes)
{
register int i, j;
if (cvalue > 0x7fffffffu)
return -1;
for (i = 0; i < utf8_table1_size; i++)
if (cvalue <= (pcre_uint32)utf8_table1[i]) break;
utf8bytes += i;
for (j = i; j > 0; j--)
{
*utf8bytes-- = 0x80 | (cvalue & 0x3f);
cvalue >>= 6;
}
*utf8bytes = utf8_table2[i] | cvalue;
return i + 1;
}
#endif
#ifdef SUPPORT_PCRE16
/*************************************************
* Convert a string to 16-bit *
*************************************************/
/* In non-UTF mode, the space needed for a 16-bit string is exactly double the
8-bit size. For a UTF-8 string, the size needed for UTF-16 is no more than
double, because up to 0xffff uses no more than 3 bytes in UTF-8 but possibly 4
in UTF-16. Higher values use 4 bytes in UTF-8 and up to 4 bytes in UTF-16. The
result is always left in buffer16.
Note that this function does not object to surrogate values. This is
deliberate; it makes it possible to construct UTF-16 strings that are invalid,
for the purpose of testing that they are correctly faulted.
Patterns to be converted are either plain ASCII or UTF-8; data lines are always
in UTF-8 so that values greater than 255 can be handled.
Arguments:
data TRUE if converting a data line; FALSE for a regex
p points to a byte string
utf true if UTF-8 (to be converted to UTF-16)
len number of bytes in the string (excluding trailing zero)
Returns: number of 16-bit data items used (excluding trailing zero)
OR -1 if a UTF-8 string is malformed
OR -2 if a value > 0x10ffff is encountered
OR -3 if a value > 0xffff is encountered when not in UTF mode
*/
static int
to16(int data, pcre_uint8 *p, int utf, int len)
{
pcre_uint16 *pp;
if (buffer16_size < 2*len + 2)
{
if (buffer16 != NULL) free(buffer16);
buffer16_size = 2*len + 2;
buffer16 = (pcre_uint16 *)malloc(buffer16_size);
if (buffer16 == NULL)
{
fprintf(stderr, "pcretest: malloc(%d) failed for buffer16\n", buffer16_size);
exit(1);
}
}
pp = buffer16;
if (!utf && !data)
{
while (len-- > 0) *pp++ = *p++;
}
else
{
pcre_uint32 c = 0;
while (len > 0)
{
int chlen = utf82ord(p, &c);
if (chlen <= 0) return -1;
if (c > 0x10ffff) return -2;
p += chlen;
len -= chlen;
if (c < 0x10000) *pp++ = c; else
{
if (!utf) return -3;
c -= 0x10000;
*pp++ = 0xD800 | (c >> 10);
*pp++ = 0xDC00 | (c & 0x3ff);
}
}
}
*pp = 0;
return pp - buffer16;
}
#endif
#ifdef SUPPORT_PCRE32
/*************************************************
* Convert a string to 32-bit *
*************************************************/
/* In non-UTF mode, the space needed for a 32-bit string is exactly four times the
8-bit size. For a UTF-8 string, the size needed for UTF-32 is no more than four
times, because up to 0xffff uses no more than 3 bytes in UTF-8 but possibly 4
in UTF-32. Higher values use 4 bytes in UTF-8 and up to 4 bytes in UTF-32. The
result is always left in buffer32.
Note that this function does not object to surrogate values. This is
deliberate; it makes it possible to construct UTF-32 strings that are invalid,
for the purpose of testing that they are correctly faulted.
Patterns to be converted are either plain ASCII or UTF-8; data lines are always
in UTF-8 so that values greater than 255 can be handled.
Arguments:
data TRUE if converting a data line; FALSE for a regex
p points to a byte string
utf true if UTF-8 (to be converted to UTF-32)
len number of bytes in the string (excluding trailing zero)
Returns: number of 32-bit data items used (excluding trailing zero)
OR -1 if a UTF-8 string is malformed
OR -2 if a value > 0x10ffff is encountered
OR -3 if an ill-formed value is encountered (i.e. a surrogate)
*/
static int
to32(int data, pcre_uint8 *p, int utf, int len)
{
pcre_uint32 *pp;
if (buffer32_size < 4*len + 4)
{
if (buffer32 != NULL) free(buffer32);
buffer32_size = 4*len + 4;
buffer32 = (pcre_uint32 *)malloc(buffer32_size);
if (buffer32 == NULL)
{
fprintf(stderr, "pcretest: malloc(%d) failed for buffer32\n", buffer32_size);
exit(1);
}
}
pp = buffer32;
if (!utf && !data)
{
while (len-- > 0) *pp++ = *p++;
}
else
{
pcre_uint32 c = 0;
while (len > 0)
{
int chlen = utf82ord(p, &c);
if (chlen <= 0) return -1;
if (utf)
{
if (c > 0x10ffff) return -2;
if (!data && (c & 0xfffff800u) == 0xd800u) return -3;
}
p += chlen;
len -= chlen;
*pp++ = c;
}
}
*pp = 0;
return pp - buffer32;
}
/* Check that a 32-bit character string is valid UTF-32.
Arguments:
string points to the string
length length of string, or -1 if the string is zero-terminated
Returns: TRUE if the string is a valid UTF-32 string
FALSE otherwise
*/
#ifdef NEVER /* Not used */
#ifdef SUPPORT_UTF
static BOOL
valid_utf32(pcre_uint32 *string, int length)
{
register pcre_uint32 *p;
register pcre_uint32 c;
for (p = string; length-- > 0; p++)
{
c = *p;
if (c > 0x10ffffu) return FALSE; /* Too big */
if ((c & 0xfffff800u) == 0xd800u) return FALSE; /* Surrogate */
}
return TRUE;
}
#endif /* SUPPORT_UTF */
#endif /* NEVER */
#endif /* SUPPORT_PCRE32 */
/*************************************************
* Read or extend an input line *
*************************************************/
/* Input lines are read into buffer, but both patterns and data lines can be
continued over multiple input lines. In addition, if the buffer fills up, we
want to automatically expand it so as to be able to handle extremely large
lines that are needed for certain stress tests. When the input buffer is
expanded, the other two buffers must also be expanded likewise, and the
contents of pbuffer, which are a copy of the input for callouts, must be
preserved (for when expansion happens for a data line). This is not the most
optimal way of handling this, but hey, this is just a test program!
Arguments:
f the file to read
start where in buffer to start (this *must* be within buffer)
prompt for stdin or readline()
Returns: pointer to the start of new data
could be a copy of start, or could be moved
NULL if no data read and EOF reached
*/
static pcre_uint8 *
extend_inputline(FILE *f, pcre_uint8 *start, const char *prompt)
{
pcre_uint8 *here = start;
for (;;)
{
size_t rlen = (size_t)(buffer_size - (here - buffer));
if (rlen > 1000)
{
int dlen;
/* If libreadline or libedit support is required, use readline() to read a
line if the input is a terminal. Note that readline() removes the trailing
newline, so we must put it back again, to be compatible with fgets(). */
#if defined(SUPPORT_LIBREADLINE) || defined(SUPPORT_LIBEDIT)
if (isatty(fileno(f)))
{
size_t len;
char *s = readline(prompt);
if (s == NULL) return (here == start)? NULL : start;
len = strlen(s);
if (len > 0) add_history(s);
if (len > rlen - 1) len = rlen - 1;
memcpy(here, s, len);
here[len] = '\n';
here[len+1] = 0;
free(s);
}
else
#endif
/* Read the next line by normal means, prompting if the file is stdin. */
{
if (f == stdin) printf("%s", prompt);
if (fgets((char *)here, rlen, f) == NULL)
return (here == start)? NULL : start;
}
dlen = (int)strlen((char *)here);
if (dlen > 0 && here[dlen - 1] == '\n') return start;
here += dlen;
}
else
{
int new_buffer_size = 2*buffer_size;
pcre_uint8 *new_buffer = (pcre_uint8 *)malloc(new_buffer_size);
pcre_uint8 *new_pbuffer = (pcre_uint8 *)malloc(new_buffer_size);
if (new_buffer == NULL || new_pbuffer == NULL)
{
fprintf(stderr, "pcretest: malloc(%d) failed\n", new_buffer_size);
exit(1);
}
memcpy(new_buffer, buffer, buffer_size);
memcpy(new_pbuffer, pbuffer, buffer_size);
buffer_size = new_buffer_size;
start = new_buffer + (start - buffer);
here = new_buffer + (here - buffer);
free(buffer);
free(pbuffer);
buffer = new_buffer;
pbuffer = new_pbuffer;
}
}
/* Control never gets here */
}
/*************************************************
* Read number from string *
*************************************************/
/* We don't use strtoul() because SunOS4 doesn't have it. Rather than mess
around with conditional compilation, just do the job by hand. It is only used
for unpicking arguments, so just keep it simple.
Arguments:
str string to be converted
endptr where to put the end pointer
Returns: the unsigned long
*/
static int
get_value(pcre_uint8 *str, pcre_uint8 **endptr)
{
int result = 0;
while(*str != 0 && isspace(*str)) str++;
while (isdigit(*str)) result = result * 10 + (int)(*str++ - '0');
*endptr = str;
return(result);
}
/*************************************************
* Print one character *
*************************************************/
/* Print a single character either literally, or as a hex escape. */
static int pchar(pcre_uint32 c, FILE *f)
{
int n = 0;
char tempbuffer[16];
if (PRINTOK(c))
{
if (f != NULL) fprintf(f, "%c", c);
return 1;
}
if (c < 0x100)
{
if (use_utf)
{
if (f != NULL) fprintf(f, "\\x{%02x}", c);
return 6;
}
else
{
if (f != NULL) fprintf(f, "\\x%02x", c);
return 4;
}
}
if (f != NULL) n = fprintf(f, "\\x{%02x}", c);
else n = sprintf(tempbuffer, "\\x{%02x}", c);
return n >= 0 ? n : 0;
}
#ifdef SUPPORT_PCRE8
/*************************************************
* Print 8-bit character string *
*************************************************/
/* Must handle UTF-8 strings in utf8 mode. Yields number of characters printed.
If handed a NULL file, just counts chars without printing. */
static int pchars(pcre_uint8 *p, int length, FILE *f)
{
pcre_uint32 c = 0;
int yield = 0;
if (length < 0)
length = strlen((char *)p);
while (length-- > 0)
{
#if !defined NOUTF
if (use_utf)
{
int rc = utf82ord(p, &c);
if (rc > 0 && rc <= length + 1) /* Mustn't run over the end */
{
length -= rc - 1;
p += rc;
yield += pchar(c, f);
continue;
}
}
#endif
c = *p++;
yield += pchar(c, f);
}
return yield;
}
#endif
#ifdef SUPPORT_PCRE16
/*************************************************
* Find length of 0-terminated 16-bit string *
*************************************************/
static int strlen16(PCRE_SPTR16 p)
{
PCRE_SPTR16 pp = p;
while (*pp != 0) pp++;
return (int)(pp - p);
}
#endif /* SUPPORT_PCRE16 */
#ifdef SUPPORT_PCRE32
/*************************************************
* Find length of 0-terminated 32-bit string *
*************************************************/
static int strlen32(PCRE_SPTR32 p)
{
PCRE_SPTR32 pp = p;
while (*pp != 0) pp++;
return (int)(pp - p);
}
#endif /* SUPPORT_PCRE32 */
#ifdef SUPPORT_PCRE16
/*************************************************
* Print 16-bit character string *
*************************************************/
/* Must handle UTF-16 strings in utf mode. Yields number of characters printed.
If handed a NULL file, just counts chars without printing. */
static int pchars16(PCRE_SPTR16 p, int length, FILE *f)
{
int yield = 0;
if (length < 0)
length = strlen16(p);
while (length-- > 0)
{
pcre_uint32 c = *p++ & 0xffff;
#if !defined NOUTF
if (use_utf && c >= 0xD800 && c < 0xDC00 && length > 0)
{
int d = *p & 0xffff;
if (d >= 0xDC00 && d <= 0xDFFF)
{
c = ((c & 0x3ff) << 10) + (d & 0x3ff) + 0x10000;
length--;
p++;
}
}
#endif
yield += pchar(c, f);
}
return yield;
}
#endif /* SUPPORT_PCRE16 */
#ifdef SUPPORT_PCRE32
/*************************************************
* Print 32-bit character string *
*************************************************/
/* Must handle UTF-32 strings in utf mode. Yields number of characters printed.
If handed a NULL file, just counts chars without printing. */
static int pchars32(PCRE_SPTR32 p, int length, BOOL utf, FILE *f)
{
int yield = 0;
(void)(utf); /* Avoid compiler warning */
if (length < 0)
length = strlen32(p);
while (length-- > 0)
{
pcre_uint32 c = *p++;
yield += pchar(c, f);
}
return yield;
}
#endif /* SUPPORT_PCRE32 */
#ifdef SUPPORT_PCRE8
/*************************************************
* Read a capture name (8-bit) and check it *
*************************************************/
static pcre_uint8 *
read_capture_name8(pcre_uint8 *p, pcre_uint8 **pp, pcre *re)
{
pcre_uint8 *npp = *pp;
while (isalnum(*p)) *npp++ = *p++;
*npp++ = 0;
*npp = 0;
if (pcre_get_stringnumber(re, (char *)(*pp)) < 0)
{
fprintf(outfile, "no parentheses with name \"");
PCHARSV(*pp, 0, -1, outfile);
fprintf(outfile, "\"\n");
}
*pp = npp;
return p;
}
#endif /* SUPPORT_PCRE8 */
#ifdef SUPPORT_PCRE16
/*************************************************
* Read a capture name (16-bit) and check it *
*************************************************/
/* Note that the text being read is 8-bit. */
static pcre_uint8 *
read_capture_name16(pcre_uint8 *p, pcre_uint16 **pp, pcre *re)
{
pcre_uint16 *npp = *pp;
while (isalnum(*p)) *npp++ = *p++;
*npp++ = 0;
*npp = 0;
if (pcre16_get_stringnumber((pcre16 *)re, (PCRE_SPTR16)(*pp)) < 0)
{
fprintf(outfile, "no parentheses with name \"");
PCHARSV(*pp, 0, -1, outfile);
fprintf(outfile, "\"\n");
}
*pp = npp;
return p;
}
#endif /* SUPPORT_PCRE16 */
#ifdef SUPPORT_PCRE32
/*************************************************
* Read a capture name (32-bit) and check it *
*************************************************/
/* Note that the text being read is 8-bit. */
static pcre_uint8 *
read_capture_name32(pcre_uint8 *p, pcre_uint32 **pp, pcre *re)
{
pcre_uint32 *npp = *pp;
while (isalnum(*p)) *npp++ = *p++;
*npp++ = 0;
*npp = 0;
if (pcre32_get_stringnumber((pcre32 *)re, (PCRE_SPTR32)(*pp)) < 0)
{
fprintf(outfile, "no parentheses with name \"");
PCHARSV(*pp, 0, -1, outfile);
fprintf(outfile, "\"\n");
}
*pp = npp;
return p;
}
#endif /* SUPPORT_PCRE32 */
/*************************************************
* Stack guard function *
*************************************************/
/* Called from PCRE when set in pcre_stack_guard. We give an error (non-zero)
return when a count overflows. */
static int stack_guard(void)
{
return stack_guard_return;
}
/*************************************************
* Callout function *
*************************************************/
/* Called from PCRE as a result of the (?C) item. We print out where we are in
the match. Yield zero unless more callouts than the fail count, or the callout
data is not zero. */
static int callout(pcre_callout_block *cb)
{
FILE *f = (first_callout | callout_extra)? outfile : NULL;
int i, current_position, pre_start, post_start, subject_length;
if (callout_extra)
{
fprintf(f, "Callout %d: last capture = %d\n",
cb->callout_number, cb->capture_last);
if (cb->offset_vector != NULL)
{
for (i = 0; i < cb->capture_top * 2; i += 2)
{
if (cb->offset_vector[i] < 0)
fprintf(f, "%2d: <unset>\n", i/2);
else
{
fprintf(f, "%2d: ", i/2);
PCHARSV(cb->subject, cb->offset_vector[i],
cb->offset_vector[i+1] - cb->offset_vector[i], f);
fprintf(f, "\n");
}
}
}
}
/* Re-print the subject in canonical form, the first time or if giving full
datails. On subsequent calls in the same match, we use pchars just to find the
printed lengths of the substrings. */
if (f != NULL) fprintf(f, "--->");
/* If a lookbehind is involved, the current position may be earlier than the
match start. If so, use the match start instead. */
current_position = (cb->current_position >= cb->start_match)?
cb->current_position : cb->start_match;
PCHARS(pre_start, cb->subject, 0, cb->start_match, f);
PCHARS(post_start, cb->subject, cb->start_match,
current_position - cb->start_match, f);
PCHARS(subject_length, cb->subject, 0, cb->subject_length, NULL);
PCHARSV(cb->subject, current_position, cb->subject_length - current_position, f);
if (f != NULL) fprintf(f, "\n");
/* Always print appropriate indicators, with callout number if not already
shown. For automatic callouts, show the pattern offset. */
if (cb->callout_number == 255)
{
fprintf(outfile, "%+3d ", cb->pattern_position);
if (cb->pattern_position > 99) fprintf(outfile, "\n ");
}
else
{
if (callout_extra) fprintf(outfile, " ");
else fprintf(outfile, "%3d ", cb->callout_number);
}
for (i = 0; i < pre_start; i++) fprintf(outfile, " ");
fprintf(outfile, "^");
if (post_start > 0)
{
for (i = 0; i < post_start - 1; i++) fprintf(outfile, " ");
fprintf(outfile, "^");
}
for (i = 0; i < subject_length - pre_start - post_start + 4; i++)
fprintf(outfile, " ");
fprintf(outfile, "%.*s", (cb->next_item_length == 0)? 1 : cb->next_item_length,
pbuffer + cb->pattern_position);
fprintf(outfile, "\n");
first_callout = 0;
if (cb->mark != last_callout_mark)
{
if (cb->mark == NULL)
fprintf(outfile, "Latest Mark: <unset>\n");
else
{
fprintf(outfile, "Latest Mark: ");
PCHARSV(cb->mark, 0, -1, outfile);
putc('\n', outfile);
}
last_callout_mark = cb->mark;
}
if (cb->callout_data != NULL)
{
int callout_data = *((int *)(cb->callout_data));
if (callout_data != 0)
{
fprintf(outfile, "Callout data = %d\n", callout_data);
return callout_data;
}
}
return (cb->callout_number != callout_fail_id)? 0 :
(++callout_count >= callout_fail_count)? 1 : 0;
}
/*************************************************
* Local malloc functions *
*************************************************/
/* Alternative malloc function, to test functionality and save the size of a
compiled re, which is the first store request that pcre_compile() makes. The
show_malloc variable is set only during matching. */
static void *new_malloc(size_t size)
{
void *block = malloc(size);
if (show_malloc)
fprintf(outfile, "malloc %3d %p\n", (int)size, block);
return block;
}
static void new_free(void *block)
{
if (show_malloc)
fprintf(outfile, "free %p\n", block);
free(block);
}
/* For recursion malloc/free, to test stacking calls */
static void *stack_malloc(size_t size)
{
void *block = malloc(size);
if (show_malloc)
fprintf(outfile, "stack_malloc %3d %p\n", (int)size, block);
return block;
}
static void stack_free(void *block)
{
if (show_malloc)
fprintf(outfile, "stack_free %p\n", block);
free(block);
}
/*************************************************
* Call pcre_fullinfo() *
*************************************************/
/* Get one piece of information from the pcre_fullinfo() function. When only
one of 8-, 16- or 32-bit is supported, pcre_mode should always have the correct
value, but the code is defensive.
Arguments:
re compiled regex
study study data
option PCRE_INFO_xxx option
ptr where to put the data
Returns: 0 when OK, < 0 on error
*/
static int
new_info(pcre *re, pcre_extra *study, int option, void *ptr)
{
int rc;
if (pcre_mode == PCRE32_MODE)
#ifdef SUPPORT_PCRE32
rc = pcre32_fullinfo((pcre32 *)re, (pcre32_extra *)study, option, ptr);
#else
rc = PCRE_ERROR_BADMODE;
#endif
else if (pcre_mode == PCRE16_MODE)
#ifdef SUPPORT_PCRE16
rc = pcre16_fullinfo((pcre16 *)re, (pcre16_extra *)study, option, ptr);
#else
rc = PCRE_ERROR_BADMODE;
#endif
else
#ifdef SUPPORT_PCRE8
rc = pcre_fullinfo(re, study, option, ptr);
#else
rc = PCRE_ERROR_BADMODE;
#endif
if (rc < 0 && rc != PCRE_ERROR_UNSET)
{
fprintf(outfile, "Error %d from pcre%s_fullinfo(%d)\n", rc,
pcre_mode == PCRE32_MODE ? "32" : pcre_mode == PCRE16_MODE ? "16" : "", option);
if (rc == PCRE_ERROR_BADMODE)
fprintf(outfile, "Running in %d-bit mode but pattern was compiled in "
"%d-bit mode\n", 8 * CHAR_SIZE,
8 * (REAL_PCRE_FLAGS(re) & PCRE_MODE_MASK));
}
return rc;
}
/*************************************************
* Swap byte functions *
*************************************************/
/* The following functions swap the bytes of a pcre_uint16 and pcre_uint32
value, respectively.
Arguments:
value any number
Returns: the byte swapped value
*/
static pcre_uint32
swap_uint32(pcre_uint32 value)
{
return ((value & 0x000000ff) << 24) |
((value & 0x0000ff00) << 8) |
((value & 0x00ff0000) >> 8) |
(value >> 24);
}
static pcre_uint16
swap_uint16(pcre_uint16 value)
{
return (value >> 8) | (value << 8);
}
/*************************************************
* Flip bytes in a compiled pattern *
*************************************************/
/* This function is called if the 'F' option was present on a pattern that is
to be written to a file. We flip the bytes of all the integer fields in the
regex data block and the study block. In 16-bit mode this also flips relevant
bytes in the pattern itself. This is to make it possible to test PCRE's
ability to reload byte-flipped patterns, e.g. those compiled on a different
architecture. */
#if defined SUPPORT_PCRE8 || defined SUPPORT_PCRE16
static void
regexflip8_or_16(pcre *ere, pcre_extra *extra)
{
real_pcre8_or_16 *re = (real_pcre8_or_16 *)ere;
#ifdef SUPPORT_PCRE16
int op;
pcre_uint16 *ptr = (pcre_uint16 *)re + re->name_table_offset;
int length = re->name_count * re->name_entry_size;
#ifdef SUPPORT_UTF
BOOL utf = (re->options & PCRE_UTF16) != 0;
BOOL utf16_char = FALSE;
#endif /* SUPPORT_UTF */
#endif /* SUPPORT_PCRE16 */
/* Always flip the bytes in the main data block and study blocks. */
re->magic_number = REVERSED_MAGIC_NUMBER;
re->size = swap_uint32(re->size);
re->options = swap_uint32(re->options);
re->flags = swap_uint32(re->flags);
re->limit_match = swap_uint32(re->limit_match);
re->limit_recursion = swap_uint32(re->limit_recursion);
re->first_char = swap_uint16(re->first_char);
re->req_char = swap_uint16(re->req_char);
re->max_lookbehind = swap_uint16(re->max_lookbehind);
re->top_bracket = swap_uint16(re->top_bracket);
re->top_backref = swap_uint16(re->top_backref);
re->name_table_offset = swap_uint16(re->name_table_offset);
re->name_entry_size = swap_uint16(re->name_entry_size);
re->name_count = swap_uint16(re->name_count);
re->ref_count = swap_uint16(re->ref_count);
if (extra != NULL && (extra->flags & PCRE_EXTRA_STUDY_DATA) != 0)
{
pcre_study_data *rsd = (pcre_study_data *)(extra->study_data);
rsd->size = swap_uint32(rsd->size);
rsd->flags = swap_uint32(rsd->flags);
rsd->minlength = swap_uint32(rsd->minlength);
}
/* In 8-bit mode, that is all we need to do. In 16-bit mode we must swap bytes
in the name table, if present, and then in the pattern itself. */
#ifdef SUPPORT_PCRE16
if (pcre_mode != PCRE16_MODE) return;
while(TRUE)
{
/* Swap previous characters. */
while (length-- > 0)
{
*ptr = swap_uint16(*ptr);
ptr++;
}
#ifdef SUPPORT_UTF
if (utf16_char)
{
if ((ptr[-1] & 0xfc00) == 0xd800)
{
/* We know that there is only one extra character in UTF-16. */
*ptr = swap_uint16(*ptr);
ptr++;
}
}
utf16_char = FALSE;
#endif /* SUPPORT_UTF */
/* Get next opcode. */
length = 0;
op = *ptr;
*ptr++ = swap_uint16(op);
switch (op)
{
case OP_END:
return;
#ifdef SUPPORT_UTF
case OP_CHAR:
case OP_CHARI:
case OP_NOT:
case OP_NOTI:
case OP_STAR:
case OP_MINSTAR:
case OP_PLUS:
case OP_MINPLUS:
case OP_QUERY:
case OP_MINQUERY:
case OP_UPTO:
case OP_MINUPTO:
case OP_EXACT:
case OP_POSSTAR:
case OP_POSPLUS:
case OP_POSQUERY:
case OP_POSUPTO:
case OP_STARI:
case OP_MINSTARI:
case OP_PLUSI:
case OP_MINPLUSI:
case OP_QUERYI:
case OP_MINQUERYI:
case OP_UPTOI:
case OP_MINUPTOI:
case OP_EXACTI:
case OP_POSSTARI:
case OP_POSPLUSI:
case OP_POSQUERYI:
case OP_POSUPTOI:
case OP_NOTSTAR:
case OP_NOTMINSTAR:
case OP_NOTPLUS:
case OP_NOTMINPLUS:
case OP_NOTQUERY:
case OP_NOTMINQUERY:
case OP_NOTUPTO:
case OP_NOTMINUPTO:
case OP_NOTEXACT:
case OP_NOTPOSSTAR:
case OP_NOTPOSPLUS:
case OP_NOTPOSQUERY:
case OP_NOTPOSUPTO:
case OP_NOTSTARI:
case OP_NOTMINSTARI:
case OP_NOTPLUSI:
case OP_NOTMINPLUSI:
case OP_NOTQUERYI:
case OP_NOTMINQUERYI:
case OP_NOTUPTOI:
case OP_NOTMINUPTOI:
case OP_NOTEXACTI:
case OP_NOTPOSSTARI:
case OP_NOTPOSPLUSI:
case OP_NOTPOSQUERYI:
case OP_NOTPOSUPTOI:
if (utf) utf16_char = TRUE;
#endif
/* Fall through. */
default:
length = OP_lengths16[op] - 1;
break;
case OP_CLASS:
case OP_NCLASS:
/* Skip the character bit map. */
ptr += 32/sizeof(pcre_uint16);
length = 0;
break;
case OP_XCLASS:
/* LINK_SIZE can be 1 or 2 in 16 bit mode. */
if (LINK_SIZE > 1)
length = (int)((((unsigned int)(ptr[0]) << 16) | (unsigned int)(ptr[1]))
- (1 + LINK_SIZE + 1));
else
length = (int)((unsigned int)(ptr[0]) - (1 + LINK_SIZE + 1));
/* Reverse the size of the XCLASS instance. */
*ptr = swap_uint16(*ptr);
ptr++;
if (LINK_SIZE > 1)
{
*ptr = swap_uint16(*ptr);
ptr++;
}
op = *ptr;
*ptr = swap_uint16(op);
ptr++;
if ((op & XCL_MAP) != 0)
{
/* Skip the character bit map. */
ptr += 32/sizeof(pcre_uint16);
length -= 32/sizeof(pcre_uint16);
}
break;
}
}
/* Control should never reach here in 16 bit mode. */
#endif /* SUPPORT_PCRE16 */
}
#endif /* SUPPORT_PCRE[8|16] */
#if defined SUPPORT_PCRE32
static void
regexflip_32(pcre *ere, pcre_extra *extra)
{
real_pcre32 *re = (real_pcre32 *)ere;
int op;
pcre_uint32 *ptr = (pcre_uint32 *)re + re->name_table_offset;
int length = re->name_count * re->name_entry_size;
/* Always flip the bytes in the main data block and study blocks. */
re->magic_number = REVERSED_MAGIC_NUMBER;
re->size = swap_uint32(re->size);
re->options = swap_uint32(re->options);
re->flags = swap_uint32(re->flags);
re->limit_match = swap_uint32(re->limit_match);
re->limit_recursion = swap_uint32(re->limit_recursion);
re->first_char = swap_uint32(re->first_char);
re->req_char = swap_uint32(re->req_char);
re->max_lookbehind = swap_uint16(re->max_lookbehind);
re->top_bracket = swap_uint16(re->top_bracket);
re->top_backref = swap_uint16(re->top_backref);
re->name_table_offset = swap_uint16(re->name_table_offset);
re->name_entry_size = swap_uint16(re->name_entry_size);
re->name_count = swap_uint16(re->name_count);
re->ref_count = swap_uint16(re->ref_count);
if (extra != NULL && (extra->flags & PCRE_EXTRA_STUDY_DATA) != 0)
{
pcre_study_data *rsd = (pcre_study_data *)(extra->study_data);
rsd->size = swap_uint32(rsd->size);
rsd->flags = swap_uint32(rsd->flags);
rsd->minlength = swap_uint32(rsd->minlength);
}
/* In 32-bit mode we must swap bytes in the name table, if present, and then in
the pattern itself. */
while(TRUE)
{
/* Swap previous characters. */
while (length-- > 0)
{
*ptr = swap_uint32(*ptr);
ptr++;
}
/* Get next opcode. */
length = 0;
op = *ptr;
*ptr++ = swap_uint32(op);
switch (op)
{
case OP_END:
return;
default:
length = OP_lengths32[op] - 1;
break;
case OP_CLASS:
case OP_NCLASS:
/* Skip the character bit map. */
ptr += 32/sizeof(pcre_uint32);
length = 0;
break;
case OP_XCLASS:
/* LINK_SIZE can only be 1 in 32-bit mode. */
length = (int)((unsigned int)(ptr[0]) - (1 + LINK_SIZE + 1));
/* Reverse the size of the XCLASS instance. */
*ptr = swap_uint32(*ptr);
ptr++;
op = *ptr;
*ptr = swap_uint32(op);
ptr++;
if ((op & XCL_MAP) != 0)
{
/* Skip the character bit map. */
ptr += 32/sizeof(pcre_uint32);
length -= 32/sizeof(pcre_uint32);
}
break;
}
}
/* Control should never reach here in 32 bit mode. */
}
#endif /* SUPPORT_PCRE32 */
static void
regexflip(pcre *ere, pcre_extra *extra)
{
#if defined SUPPORT_PCRE32
if (REAL_PCRE_FLAGS(ere) & PCRE_MODE32)
regexflip_32(ere, extra);
#endif
#if defined SUPPORT_PCRE8 || defined SUPPORT_PCRE16
if (REAL_PCRE_FLAGS(ere) & (PCRE_MODE8 | PCRE_MODE16))
regexflip8_or_16(ere, extra);
#endif
}
/*************************************************
* Check match or recursion limit *
*************************************************/
static int
check_match_limit(pcre *re, pcre_extra *extra, pcre_uint8 *bptr, int len,
int start_offset, int options, int *use_offsets, int use_size_offsets,
int flag, unsigned long int *limit, int errnumber, const char *msg)
{
int count;