• Main Page
  • Related Pages
  • Modules
  • Namespaces
  • Classes
  • Files
  • File List
  • File Members

src/pcre/pcre.h

00001 /*************************************************
00002 *       Perl-Compatible Regular Expressions      *
00003 *************************************************/
00004 
00005 /* This is the public header file for the PCRE library, to be #included by
00006 applications that call the PCRE functions.
00007 
00008            Copyright (c) 1997-2009 University of Cambridge
00009 
00010 -----------------------------------------------------------------------------
00011 Redistribution and use in source and binary forms, with or without
00012 modification, are permitted provided that the following conditions are met:
00013 
00014     * Redistributions of source code must retain the above copyright notice,
00015       this list of conditions and the following disclaimer.
00016 
00017     * Redistributions in binary form must reproduce the above copyright
00018       notice, this list of conditions and the following disclaimer in the
00019       documentation and/or other materials provided with the distribution.
00020 
00021     * Neither the name of the University of Cambridge nor the names of its
00022       contributors may be used to endorse or promote products derived from
00023       this software without specific prior written permission.
00024 
00025 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
00026 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
00027 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
00028 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
00029 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
00030 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
00031 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
00032 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
00033 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
00034 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
00035 POSSIBILITY OF SUCH DAMAGE.
00036 -----------------------------------------------------------------------------
00037 */
00038 
00039 #ifndef _PCRE_H
00040 #define _PCRE_H
00041 
00042 /* The current PCRE version information. */
00043 
00044 #define PCRE_MAJOR          8
00045 #define PCRE_MINOR          00
00046 #define PCRE_PRERELEASE     
00047 #define PCRE_DATE           2009-10-19
00048 
00049 /* When an application links to a PCRE DLL in Windows, the symbols that are
00050 imported have to be identified as such. When building PCRE, the appropriate
00051 export setting is defined in pcre_internal.h, which includes this file. So we
00052 don't change existing definitions of PCRE_EXP_DECL and PCRECPP_EXP_DECL. */
00053 
00054 //#if defined(_WIN32) && !defined(PCRE_STATIC)
00055 //#  ifndef PCRE_EXP_DECL
00056 //#    define PCRE_EXP_DECL  extern __declspec(dllimport)
00057 //#  endif
00058 //#  ifdef __cplusplus
00059 //#    ifndef PCRECPP_EXP_DECL
00060 //#      define PCRECPP_EXP_DECL  extern __declspec(dllimport)
00061 //#    endif
00062 //#    ifndef PCRECPP_EXP_DEFN
00063 //#      define PCRECPP_EXP_DEFN  __declspec(dllimport)
00064 //#    endif
00065 //#  endif
00066 //#endif
00067 
00068 /* By default, we use the standard "extern" declarations. */
00069 
00070 #ifndef PCRE_EXP_DECL
00071 #  ifdef __cplusplus
00072 #    define PCRE_EXP_DECL  extern "C"
00073 #  else
00074 #    define PCRE_EXP_DECL  extern
00075 #  endif
00076 #endif
00077 
00078 #ifdef __cplusplus
00079 #  ifndef PCRECPP_EXP_DECL
00080 #    define PCRECPP_EXP_DECL  extern
00081 #  endif
00082 #  ifndef PCRECPP_EXP_DEFN
00083 #    define PCRECPP_EXP_DEFN
00084 #  endif
00085 #endif
00086 
00087 /* Have to include stdlib.h in order to ensure that size_t is defined;
00088 it is needed here for malloc. */
00089 
00090 #include <stdlib.h>
00091 
00092 /* Allow for C++ users */
00093 
00094 #ifdef __cplusplus
00095 extern "C" {
00096 #endif
00097 
00098 /* Options. Some are compile-time only, some are run-time only, and some are
00099 both, so we keep them all distinct. */
00100 
00101 #define PCRE_CASELESS           0x00000001
00102 #define PCRE_MULTILINE          0x00000002
00103 #define PCRE_DOTALL             0x00000004
00104 #define PCRE_EXTENDED           0x00000008
00105 #define PCRE_ANCHORED           0x00000010
00106 #define PCRE_DOLLAR_ENDONLY     0x00000020
00107 #define PCRE_EXTRA              0x00000040
00108 #define PCRE_NOTBOL             0x00000080
00109 #define PCRE_NOTEOL             0x00000100
00110 #define PCRE_UNGREEDY           0x00000200
00111 #define PCRE_NOTEMPTY           0x00000400
00112 #define PCRE_UTF8               0x00000800
00113 #define PCRE_NO_AUTO_CAPTURE    0x00001000
00114 #define PCRE_NO_UTF8_CHECK      0x00002000
00115 #define PCRE_AUTO_CALLOUT       0x00004000
00116 #define PCRE_PARTIAL_SOFT       0x00008000
00117 #define PCRE_PARTIAL            0x00008000  /* Backwards compatible synonym */
00118 #define PCRE_DFA_SHORTEST       0x00010000
00119 #define PCRE_DFA_RESTART        0x00020000
00120 #define PCRE_FIRSTLINE          0x00040000
00121 #define PCRE_DUPNAMES           0x00080000
00122 #define PCRE_NEWLINE_CR         0x00100000
00123 #define PCRE_NEWLINE_LF         0x00200000
00124 #define PCRE_NEWLINE_CRLF       0x00300000
00125 #define PCRE_NEWLINE_ANY        0x00400000
00126 #define PCRE_NEWLINE_ANYCRLF    0x00500000
00127 #define PCRE_BSR_ANYCRLF        0x00800000
00128 #define PCRE_BSR_UNICODE        0x01000000
00129 #define PCRE_JAVASCRIPT_COMPAT  0x02000000
00130 #define PCRE_NO_START_OPTIMIZE  0x04000000
00131 #define PCRE_NO_START_OPTIMISE  0x04000000
00132 #define PCRE_PARTIAL_HARD       0x08000000
00133 #define PCRE_NOTEMPTY_ATSTART   0x10000000
00134 
00135 /* Exec-time and get/set-time error codes */
00136 
00137 #define PCRE_ERROR_NOMATCH         (-1)
00138 #define PCRE_ERROR_NULL            (-2)
00139 #define PCRE_ERROR_BADOPTION       (-3)
00140 #define PCRE_ERROR_BADMAGIC        (-4)
00141 #define PCRE_ERROR_UNKNOWN_OPCODE  (-5)
00142 #define PCRE_ERROR_UNKNOWN_NODE    (-5)  /* For backward compatibility */
00143 #define PCRE_ERROR_NOMEMORY        (-6)
00144 #define PCRE_ERROR_NOSUBSTRING     (-7)
00145 #define PCRE_ERROR_MATCHLIMIT      (-8)
00146 #define PCRE_ERROR_CALLOUT         (-9)  /* Never used by PCRE itself */
00147 #define PCRE_ERROR_BADUTF8        (-10)
00148 #define PCRE_ERROR_BADUTF8_OFFSET (-11)
00149 #define PCRE_ERROR_PARTIAL        (-12)
00150 #define PCRE_ERROR_BADPARTIAL     (-13)
00151 #define PCRE_ERROR_INTERNAL       (-14)
00152 #define PCRE_ERROR_BADCOUNT       (-15)
00153 #define PCRE_ERROR_DFA_UITEM      (-16)
00154 #define PCRE_ERROR_DFA_UCOND      (-17)
00155 #define PCRE_ERROR_DFA_UMLIMIT    (-18)
00156 #define PCRE_ERROR_DFA_WSSIZE     (-19)
00157 #define PCRE_ERROR_DFA_RECURSE    (-20)
00158 #define PCRE_ERROR_RECURSIONLIMIT (-21)
00159 #define PCRE_ERROR_NULLWSLIMIT    (-22)  /* No longer actually used */
00160 #define PCRE_ERROR_BADNEWLINE     (-23)
00161 
00162 /* Request types for pcre_fullinfo() */
00163 
00164 #define PCRE_INFO_OPTIONS            0
00165 #define PCRE_INFO_SIZE               1
00166 #define PCRE_INFO_CAPTURECOUNT       2
00167 #define PCRE_INFO_BACKREFMAX         3
00168 #define PCRE_INFO_FIRSTBYTE          4
00169 #define PCRE_INFO_FIRSTCHAR          4  /* For backwards compatibility */
00170 #define PCRE_INFO_FIRSTTABLE         5
00171 #define PCRE_INFO_LASTLITERAL        6
00172 #define PCRE_INFO_NAMEENTRYSIZE      7
00173 #define PCRE_INFO_NAMECOUNT          8
00174 #define PCRE_INFO_NAMETABLE          9
00175 #define PCRE_INFO_STUDYSIZE         10
00176 #define PCRE_INFO_DEFAULT_TABLES    11
00177 #define PCRE_INFO_OKPARTIAL         12
00178 #define PCRE_INFO_JCHANGED          13
00179 #define PCRE_INFO_HASCRORLF         14
00180 #define PCRE_INFO_MINLENGTH         15
00181 
00182 /* Request types for pcre_config(). Do not re-arrange, in order to remain
00183 compatible. */
00184 
00185 #define PCRE_CONFIG_UTF8                    0
00186 #define PCRE_CONFIG_NEWLINE                 1
00187 #define PCRE_CONFIG_LINK_SIZE               2
00188 #define PCRE_CONFIG_POSIX_MALLOC_THRESHOLD  3
00189 #define PCRE_CONFIG_MATCH_LIMIT             4
00190 #define PCRE_CONFIG_STACKRECURSE            5
00191 #define PCRE_CONFIG_UNICODE_PROPERTIES      6
00192 #define PCRE_CONFIG_MATCH_LIMIT_RECURSION   7
00193 #define PCRE_CONFIG_BSR                     8
00194 
00195 /* Bit flags for the pcre_extra structure. Do not re-arrange or redefine
00196 these bits, just add new ones on the end, in order to remain compatible. */
00197 
00198 #define PCRE_EXTRA_STUDY_DATA             0x0001
00199 #define PCRE_EXTRA_MATCH_LIMIT            0x0002
00200 #define PCRE_EXTRA_CALLOUT_DATA           0x0004
00201 #define PCRE_EXTRA_TABLES                 0x0008
00202 #define PCRE_EXTRA_MATCH_LIMIT_RECURSION  0x0010
00203 
00204 /* Types */
00205 
00206 struct real_pcre;                 /* declaration; the definition is private  */
00207 typedef struct real_pcre pcre;
00208 
00209 /* When PCRE is compiled as a C++ library, the subject pointer type can be
00210 replaced with a custom type. For conventional use, the public interface is a
00211 const char *. */
00212 
00213 #ifndef PCRE_SPTR
00214 #define PCRE_SPTR const char *
00215 #endif
00216 
00217 /* The structure for passing additional data to pcre_exec(). This is defined in
00218 such a way as to be extensible. Always add new fields at the end, in order to
00219 remain compatible. */
00220 
00221 typedef struct pcre_extra {
00222   unsigned long int flags;        /* PCRE_EXTRA_* bits for which fields are set */
00223   void *study_data;               /* Opaque data from pcre_study() */
00224   unsigned long int match_limit;  /* Maximum number of calls to match() */
00225   void *callout_data;             /* Data passed back in callouts */
00226   const unsigned char *tables;    /* Pointer to character tables */
00227   unsigned long int match_limit_recursion; /* Max recursive calls to match() */
00228 } pcre_extra;
00229 
00230 /* The structure for passing out data via the pcre_callout_function. We use a
00231 structure so that new fields can be added on the end in future versions,
00232 without changing the API of the function, thereby allowing old clients to work
00233 without modification. */
00234 
00235 typedef struct pcre_callout_block {
00236   int          version;           /* Identifies version of block (see sections below) */
00237   /* ------------------------ Version 0 ------------------------------- */
00238   int          callout_number;    /* Number compiled into pattern */
00239   int         *offset_vector;     /* The offset vector */
00240   PCRE_SPTR    subject;           /* The subject being matched (const char * by default) */
00241   int          subject_length;    /* The length of the subject */
00242   int          start_match;       /* Offset to start of this match attempt */
00243   int          current_position;  /* Where we currently are in the subject */
00244   int          capture_top;       /* Max current capture */
00245   int          capture_last;      /* Most recently closed capture */
00246   void        *callout_data;      /* Data passed in with the call */
00247   /* ------------------- Added for Version 1 -------------------------- */
00248   int          pattern_position;  /* Offset to next item in the pattern */
00249   int          next_item_length;  /* Length of next item in the pattern */
00250   /* ------------------------------------------------------------------ */
00251 } pcre_callout_block;
00252 
00253 /* Indirection for store get and free functions. These can be set to
00254 alternative malloc/free functions if required. Special ones are used in the
00255 non-recursive case for "frames". There is also an optional callout function
00256 that is triggered by the (?C) regex item. For Virtual Pascal, these definitions
00257 have to take another form. */
00258 
00259 #ifndef VPCOMPAT
00260 PCRE_EXP_DECL void *(*pcre_malloc)(size_t);
00261 PCRE_EXP_DECL void  (*pcre_free)(void *);
00262 PCRE_EXP_DECL void *(*pcre_stack_malloc)(size_t);
00263 PCRE_EXP_DECL void  (*pcre_stack_free)(void *);
00264 PCRE_EXP_DECL int   (*pcre_callout)(pcre_callout_block *);
00265 #else   /* VPCOMPAT */
00266 PCRE_EXP_DECL void *pcre_malloc(size_t);
00267 PCRE_EXP_DECL void  pcre_free(void *);
00268 PCRE_EXP_DECL void *pcre_stack_malloc(size_t);
00269 PCRE_EXP_DECL void  pcre_stack_free(void *);
00270 PCRE_EXP_DECL int   pcre_callout(pcre_callout_block *);
00271 #endif  /* VPCOMPAT */
00272 
00273 /* Exported PCRE functions */
00274 
00275 PCRE_EXP_DECL pcre *pcre_compile(const char *, int, const char **, int *,
00276                   const unsigned char *);
00277 PCRE_EXP_DECL pcre *pcre_compile2(const char *, int, int *, const char **,
00278                   int *, const unsigned char *);
00279 PCRE_EXP_DECL int  pcre_config(int, void *);
00280 PCRE_EXP_DECL int  pcre_copy_named_substring(const pcre *, const char *,
00281                   int *, int, const char *, char *, int);
00282 PCRE_EXP_DECL int  pcre_copy_substring(const char *, int *, int, int, char *,
00283                   int);
00284 PCRE_EXP_DECL int  pcre_dfa_exec(const pcre *, const pcre_extra *,
00285                   const char *, int, int, int, int *, int , int *, int);
00286 PCRE_EXP_DECL int  pcre_exec(const pcre *, const pcre_extra *, PCRE_SPTR,
00287                    int, int, int, int *, int);
00288 PCRE_EXP_DECL void pcre_free_substring(const char *);
00289 PCRE_EXP_DECL void pcre_free_substring_list(const char **);
00290 PCRE_EXP_DECL int  pcre_fullinfo(const pcre *, const pcre_extra *, int,
00291                   void *);
00292 PCRE_EXP_DECL int  pcre_get_named_substring(const pcre *, const char *,
00293                   int *, int, const char *, const char **);
00294 PCRE_EXP_DECL int  pcre_get_stringnumber(const pcre *, const char *);
00295 PCRE_EXP_DECL int  pcre_get_stringtable_entries(const pcre *, const char *,
00296                   char **, char **);
00297 PCRE_EXP_DECL int  pcre_get_substring(const char *, int *, int, int,
00298                   const char **);
00299 PCRE_EXP_DECL int  pcre_get_substring_list(const char *, int *, int,
00300                   const char ***);
00301 PCRE_EXP_DECL int  pcre_info(const pcre *, int *, int *);
00302 PCRE_EXP_DECL const unsigned char *pcre_maketables(void);
00303 PCRE_EXP_DECL int  pcre_refcount(pcre *, int);
00304 PCRE_EXP_DECL pcre_extra *pcre_study(const pcre *, int, const char **);
00305 PCRE_EXP_DECL const char *pcre_version(void);
00306 
00307 #ifdef __cplusplus
00308 }  /* extern "C" */
00309 #endif
00310 
00311 #endif /* End of pcre.h */