2014-03-07 18:28:52 +01:00
|
|
|
/*************************************************
|
|
|
|
* Perl-Compatible Regular Expressions *
|
|
|
|
*************************************************/
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
/* PCRE2 is a library of functions to support regular expressions whose syntax
|
2014-03-07 18:28:52 +01:00
|
|
|
and semantics are as close as possible to those of the Perl 5 language.
|
|
|
|
|
|
|
|
Written by Philip Hazel
|
|
|
|
Original API code Copyright (c) 1997-2012 University of Cambridge
|
|
|
|
New API code Copyright (c) 2014 University of Cambridge
|
|
|
|
|
|
|
|
-----------------------------------------------------------------------------
|
|
|
|
Redistribution and use in source and binary forms, with or without
|
|
|
|
modification, are permitted provided that the following conditions are met:
|
|
|
|
|
|
|
|
* Redistributions of source code must retain the above copyright notice,
|
|
|
|
this list of conditions and the following disclaimer.
|
|
|
|
|
|
|
|
* Redistributions in binary form must reproduce the above copyright
|
|
|
|
notice, this list of conditions and the following disclaimer in the
|
|
|
|
documentation and/or other materials provided with the distribution.
|
|
|
|
|
|
|
|
* Neither the name of the University of Cambridge nor the names of its
|
|
|
|
contributors may be used to endorse or promote products derived from
|
|
|
|
this software without specific prior written permission.
|
|
|
|
|
|
|
|
THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
-----------------------------------------------------------------------------
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
/* Have to include stdlib.h in order to ensure that size_t is defined. */
|
|
|
|
|
|
|
|
#include <stdlib.h>
|
|
|
|
|
|
|
|
/* Allow for C++ users */
|
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
extern "C" {
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/* Options, mostly defined by POSIX, but with some extras. */
|
|
|
|
|
|
|
|
#define REG_ICASE 0x0001 /* Maps to PCRE2_CASELESS */
|
|
|
|
#define REG_NEWLINE 0x0002 /* Maps to PCRE2_MULTILINE */
|
|
|
|
#define REG_NOTBOL 0x0004 /* Maps to PCRE2_NOTBOL */
|
|
|
|
#define REG_NOTEOL 0x0008 /* Maps to PCRE2_NOTEOL */
|
|
|
|
#define REG_DOTALL 0x0010 /* NOT defined by POSIX; maps to PCRE2_DOTALL */
|
|
|
|
#define REG_NOSUB 0x0020 /* Maps to PCRE2_NO_AUTO_CAPTURE */
|
|
|
|
#define REG_UTF 0x0040 /* NOT defined by POSIX; maps to PCRE2_UTF */
|
|
|
|
#define REG_STARTEND 0x0080 /* BSD feature: pass subject string by so,eo */
|
|
|
|
#define REG_NOTEMPTY 0x0100 /* NOT defined by POSIX; maps to PCRE2_NOTEMPTY */
|
|
|
|
#define REG_UNGREEDY 0x0200 /* NOT defined by POSIX; maps to PCRE2_UNGREEDY */
|
|
|
|
#define REG_UCP 0x0400 /* NOT defined by POSIX; maps to PCRE2_UCP */
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
/* This is not used by PCRE2, but by defining it we make it easier
|
|
|
|
to slot PCRE2 into existing programs that make POSIX calls. */
|
2014-03-07 18:28:52 +01:00
|
|
|
|
|
|
|
#define REG_EXTENDED 0
|
|
|
|
|
|
|
|
/* Error values. Not all these are relevant or used by the wrapper. */
|
|
|
|
|
|
|
|
enum {
|
|
|
|
REG_ASSERT = 1, /* internal error ? */
|
|
|
|
REG_BADBR, /* invalid repeat counts in {} */
|
|
|
|
REG_BADPAT, /* pattern error */
|
|
|
|
REG_BADRPT, /* ? * + invalid */
|
|
|
|
REG_EBRACE, /* unbalanced {} */
|
|
|
|
REG_EBRACK, /* unbalanced [] */
|
|
|
|
REG_ECOLLATE, /* collation error - not relevant */
|
|
|
|
REG_ECTYPE, /* bad class */
|
|
|
|
REG_EESCAPE, /* bad escape sequence */
|
|
|
|
REG_EMPTY, /* empty expression */
|
|
|
|
REG_EPAREN, /* unbalanced () */
|
|
|
|
REG_ERANGE, /* bad range inside [] */
|
|
|
|
REG_ESIZE, /* expression too big */
|
|
|
|
REG_ESPACE, /* failed to get memory */
|
|
|
|
REG_ESUBREG, /* bad back reference */
|
|
|
|
REG_INVARG, /* bad argument */
|
|
|
|
REG_NOMATCH /* match failed */
|
|
|
|
};
|
|
|
|
|
|
|
|
|
|
|
|
/* The structure representing a compiled regular expression. */
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
void *re_pcre2_code;
|
2014-10-20 19:28:49 +02:00
|
|
|
void *re_match_data;
|
2014-03-07 18:28:52 +01:00
|
|
|
size_t re_nsub;
|
|
|
|
size_t re_erroffset;
|
|
|
|
} regex_t;
|
|
|
|
|
|
|
|
/* The structure in which a captured offset is returned. */
|
|
|
|
|
|
|
|
typedef int regoff_t;
|
|
|
|
|
|
|
|
typedef struct {
|
|
|
|
regoff_t rm_so;
|
|
|
|
regoff_t rm_eo;
|
|
|
|
} regmatch_t;
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
/* When an application links to a PCRE2 DLL in Windows, the symbols that are
|
|
|
|
imported have to be identified as such. When building PCRE2, the appropriate
|
2014-03-07 18:28:52 +01:00
|
|
|
export settings are needed, and are set in pcre2posix.c before including this
|
|
|
|
file. */
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
#if defined(_WIN32) && !defined(PCRE2_STATIC) && !defined(PCRE2POSIX_EXP_DECL)
|
|
|
|
# define PCRE2POSIX_EXP_DECL extern __declspec(dllimport)
|
|
|
|
# define PCRE2POSIX_EXP_DEFN __declspec(dllimport)
|
2014-03-07 18:28:52 +01:00
|
|
|
#endif
|
|
|
|
|
|
|
|
/* By default, we use the standard "extern" declarations. */
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
#ifndef PCRE2POSIX_EXP_DECL
|
2014-03-07 18:28:52 +01:00
|
|
|
# ifdef __cplusplus
|
2014-08-30 10:52:32 +02:00
|
|
|
# define PCRE2POSIX_EXP_DECL extern "C"
|
|
|
|
# define PCRE2POSIX_EXP_DEFN extern "C"
|
2014-03-07 18:28:52 +01:00
|
|
|
# else
|
2014-08-30 10:52:32 +02:00
|
|
|
# define PCRE2POSIX_EXP_DECL extern
|
|
|
|
# define PCRE2POSIX_EXP_DEFN extern
|
2014-03-07 18:28:52 +01:00
|
|
|
# endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/* The functions */
|
|
|
|
|
2014-08-30 10:52:32 +02:00
|
|
|
PCRE2POSIX_EXP_DECL int regcomp(regex_t *, const char *, int);
|
|
|
|
PCRE2POSIX_EXP_DECL int regexec(const regex_t *, const char *, size_t,
|
2014-03-07 18:28:52 +01:00
|
|
|
regmatch_t *, int);
|
2014-08-30 10:52:32 +02:00
|
|
|
PCRE2POSIX_EXP_DECL size_t regerror(int, const regex_t *, char *, size_t);
|
|
|
|
PCRE2POSIX_EXP_DECL void regfree(regex_t *);
|
2014-03-07 18:28:52 +01:00
|
|
|
|
|
|
|
#ifdef __cplusplus
|
|
|
|
} /* extern "C" */
|
|
|
|
#endif
|
|
|
|
|
|
|
|
/* End of pcre2posix.h */
|