mirror of
https://github.com/nim-lang/Nim.git
synced 2026-01-04 20:17:42 +00:00
Merge pull request #2506 from BlaXpirit/update-pcre
Update and improve PCRE wrapper
This commit is contained in:
@@ -44,11 +44,11 @@ type
|
||||
reExtended = 3, ## ignore whitespace and ``#`` comments
|
||||
reStudy = 4 ## study the expression (may be omitted if the
|
||||
## expression will be used only once)
|
||||
|
||||
RegexDesc = object
|
||||
h: PPcre
|
||||
e: ptr TExtra
|
||||
|
||||
|
||||
RegexDesc = object
|
||||
h: ptr Pcre
|
||||
e: ptr ExtraData
|
||||
|
||||
Regex* = ref RegexDesc ## a compiled regular expression
|
||||
|
||||
RegexError* = object of ValueError
|
||||
@@ -63,7 +63,7 @@ proc raiseInvalidRegex(msg: string) {.noinline, noreturn.} =
|
||||
e.msg = msg
|
||||
raise e
|
||||
|
||||
proc rawCompile(pattern: string, flags: cint): PPcre =
|
||||
proc rawCompile(pattern: string, flags: cint): ptr Pcre =
|
||||
var
|
||||
msg: cstring
|
||||
offset: cint
|
||||
@@ -87,7 +87,7 @@ proc re*(s: string, flags = {reExtended, reStudy}): Regex =
|
||||
result.h = rawCompile(s, cast[cint](flags - {reStudy}))
|
||||
if reStudy in flags:
|
||||
var msg: cstring
|
||||
result.e = pcre.study(result.h, 0, msg)
|
||||
result.e = pcre.study(result.h, 0, addr msg)
|
||||
if not isNil(msg): raiseInvalidRegex($msg)
|
||||
|
||||
proc matchOrFind(s: string, pattern: Regex, matches: var openArray[string],
|
||||
|
||||
@@ -1,158 +1,190 @@
|
||||
#************************************************
|
||||
# Perl-Compatible Regular Expressions *
|
||||
#***********************************************
|
||||
# Perl-Compatible Regular Expressions *
|
||||
#************************************************
|
||||
# This is the public header file for the PCRE library, to be #included by
|
||||
#applications that call the PCRE functions.
|
||||
# applications that call the PCRE functions.
|
||||
#
|
||||
# Copyright (c) 1997-2010 University of Cambridge
|
||||
# Copyright (c) 1997-2014 University of Cambridge
|
||||
#
|
||||
#-----------------------------------------------------------------------------
|
||||
#Redistribution and use in source and binary forms, with or without
|
||||
#modification, are permitted provided that the following conditions are met:
|
||||
# Redistribution and use in source and binary forms, with or without
|
||||
# modification, are permitted provided that the following conditions are met:
|
||||
#
|
||||
# Redistributions of source code must retain the above copyright notice,
|
||||
# * Redistributions of source code must retain the above copyright notice,
|
||||
# this list of conditions and the following disclaimer.
|
||||
#
|
||||
# Redistributions in binary form must reproduce the above copyright
|
||||
# * Redistributions in binary form must reproduce the above copyright
|
||||
# notice, this list of conditions and the following disclaimer in the
|
||||
# documentation and/or other materials provided with the distribution.
|
||||
#
|
||||
# Neither the name of the University of Cambridge nor the names of its
|
||||
# * Neither the name of the University of Cambridge nor the names of its
|
||||
# contributors may be used to endorse or promote products derived from
|
||||
# this software without specific prior written permission.
|
||||
#
|
||||
#THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
||||
#AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
#IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
||||
#ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
||||
#LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
||||
#CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
||||
#SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||
#INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
||||
#CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||||
#ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
#POSSIBILITY OF SUCH DAMAGE.
|
||||
# THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
||||
# AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
||||
# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
||||
# ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
||||
# LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
||||
# CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
||||
# SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
||||
# INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
||||
# CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
||||
# ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
||||
# POSSIBILITY OF SUCH DAMAGE.
|
||||
#-----------------------------------------------------------------------------
|
||||
#
|
||||
|
||||
{.deadcodeElim: on.}
|
||||
{.deadCodeElim: on.}
|
||||
|
||||
when not defined(pcreDll):
|
||||
when hostOS == "windows":
|
||||
const pcreDll = "pcre.dll"
|
||||
elif hostOS == "macosx":
|
||||
const pcreDll = "libpcre(.3|.1|).dylib"
|
||||
else:
|
||||
const pcreDll = "libpcre.so(.3|.1|)"
|
||||
{.pragma: pcreImport, dynlib: pcreDll.}
|
||||
else:
|
||||
{.pragma: pcreImport, header: "<pcre.h>".}
|
||||
# The current PCRE version information.
|
||||
|
||||
# The current PCRE version information.
|
||||
|
||||
const
|
||||
MAJOR* = 8
|
||||
MINOR* = 31
|
||||
PRERELEASE* = true
|
||||
DATE* = "2012-07-06"
|
||||
const
|
||||
PCRE_MAJOR* = 8
|
||||
PCRE_MINOR* = 36
|
||||
PCRE_PRERELEASE* = true
|
||||
PCRE_DATE* = "2014-09-26"
|
||||
|
||||
# When an application links to a PCRE DLL in Windows, the symbols that are
|
||||
# imported have to be identified as such. When building PCRE, the appropriate
|
||||
# export setting is defined in pcre_internal.h, which includes this file. So we
|
||||
# don't change existing definitions of PCRE_EXP_DECL and PCRECPP_EXP_DECL.
|
||||
# don't change existing definitions of PCRE_EXP_DECL and PCRECPP_EXP_DECL.
|
||||
|
||||
# Have to include stdlib.h in order to ensure that size_t is defined;
|
||||
# it is needed here for malloc.
|
||||
# By default, we use the standard "extern" declarations.
|
||||
|
||||
# Allow for C++ users
|
||||
# Allow for C++ users
|
||||
|
||||
# Options. Some are compile-time only, some are run-time only, and some are
|
||||
# both, so we keep them all distinct.
|
||||
|
||||
const
|
||||
CASELESS* = 0x00000001
|
||||
MULTILINE* = 0x00000002
|
||||
DOTALL* = 0x00000004
|
||||
EXTENDED* = 0x00000008
|
||||
ANCHORED* = 0x00000010
|
||||
DOLLAR_ENDONLY* = 0x00000020
|
||||
EXTRA* = 0x00000040
|
||||
NOTBOL* = 0x00000080
|
||||
NOTEOL* = 0x00000100
|
||||
UNGREEDY* = 0x00000200
|
||||
NOTEMPTY* = 0x00000400
|
||||
UTF8* = 0x00000800
|
||||
NO_AUTO_CAPTURE* = 0x00001000
|
||||
NO_UTF8_CHECK* = 0x00002000
|
||||
AUTO_CALLOUT* = 0x00004000
|
||||
PARTIAL_SOFT* = 0x00008000
|
||||
PARTIAL* = 0x00008000 # Backwards compatible synonym
|
||||
DFA_SHORTEST* = 0x00010000
|
||||
DFA_RESTART* = 0x00020000
|
||||
FIRSTLINE* = 0x00040000
|
||||
DUPNAMES* = 0x00080000
|
||||
NEWLINE_CR* = 0x00100000
|
||||
NEWLINE_LF* = 0x00200000
|
||||
NEWLINE_CRLF* = 0x00300000
|
||||
NEWLINE_ANY* = 0x00400000
|
||||
NEWLINE_ANYCRLF* = 0x00500000
|
||||
BSR_ANYCRLF* = 0x00800000
|
||||
BSR_UNICODE* = 0x01000000
|
||||
JAVASCRIPT_COMPAT* = 0x02000000
|
||||
NO_START_OPTIMIZE* = 0x04000000
|
||||
NO_START_OPTIMISE* = 0x04000000
|
||||
PARTIAL_HARD* = 0x08000000
|
||||
NOTEMPTY_ATSTART* = 0x10000000
|
||||
UCP* = 0x20000000
|
||||
|
||||
# Exec-time and get/set-time error codes
|
||||
|
||||
const
|
||||
ERROR_NOMATCH* = (- 1)
|
||||
ERROR_NULL* = (- 2)
|
||||
ERROR_BADOPTION* = (- 3)
|
||||
ERROR_BADMAGIC* = (- 4)
|
||||
ERROR_UNKNOWN_OPCODE* = (- 5)
|
||||
ERROR_UNKNOWN_NODE* = (- 5) # For backward compatibility
|
||||
ERROR_NOMEMORY* = (- 6)
|
||||
ERROR_NOSUBSTRING* = (- 7)
|
||||
ERROR_MATCHLIMIT* = (- 8)
|
||||
ERROR_CALLOUT* = (- 9) # Never used by PCRE itself
|
||||
ERROR_BADUTF8* = (- 10)
|
||||
ERROR_BADUTF8_OFFSET* = (- 11)
|
||||
ERROR_PARTIAL* = (- 12)
|
||||
ERROR_BADPARTIAL* = (- 13)
|
||||
ERROR_INTERNAL* = (- 14)
|
||||
ERROR_BADCOUNT* = (- 15)
|
||||
ERROR_DFA_UITEM* = (- 16)
|
||||
ERROR_DFA_UCOND* = (- 17)
|
||||
ERROR_DFA_UMLIMIT* = (- 18)
|
||||
ERROR_DFA_WSSIZE* = (- 19)
|
||||
ERROR_DFA_RECURSE* = (- 20)
|
||||
ERROR_RECURSIONLIMIT* = (- 21)
|
||||
ERROR_NULLWSLIMIT* = (- 22) # No longer actually used
|
||||
ERROR_BADNEWLINE* = (- 23)
|
||||
ERROR_BADOFFSET* = (- 24)
|
||||
ERROR_SHORTUTF8* = (- 25)
|
||||
ERROR_RECURSELOOP* = (- 26)
|
||||
ERROR_JIT_STACKLIMIT* = (- 27)
|
||||
ERROR_BADMODE* = (- 28)
|
||||
ERROR_BADENDIANNESS* = (- 29)
|
||||
ERROR_DFA_BADRESTART* = (- 30)
|
||||
|
||||
# Specific error codes for UTF-8 validity checks
|
||||
# Public options. Some are compile-time only, some are run-time only, and some
|
||||
# are both. Most of the compile-time options are saved with the compiled regex
|
||||
# so that they can be inspected during studying (and therefore JIT compiling).
|
||||
# Note that pcre_study() has its own set of options. Originally, all the options
|
||||
# defined here used distinct bits. However, almost all the bits in a 32-bit word
|
||||
# are now used, so in order to conserve them, option bits that were previously
|
||||
# only recognized at matching time (i.e. by pcre_exec() or pcre_dfa_exec()) may
|
||||
# also be used for compile-time options that affect only compiling and are not
|
||||
# relevant for studying or JIT compiling.
|
||||
#
|
||||
# Some options for pcre_compile() change its behaviour but do not affect the
|
||||
# behaviour of the execution functions. Other options are passed through to the
|
||||
# execution functions and affect their behaviour, with or without affecting the
|
||||
# behaviour of pcre_compile().
|
||||
#
|
||||
# Options that can be passed to pcre_compile() are tagged Cx below, with these
|
||||
# variants:
|
||||
#
|
||||
# C1 Affects compile only
|
||||
# C2 Does not affect compile; affects exec, dfa_exec
|
||||
# C3 Affects compile, exec, dfa_exec
|
||||
# C4 Affects compile, exec, dfa_exec, study
|
||||
# C5 Affects compile, exec, study
|
||||
#
|
||||
# Options that can be set for pcre_exec() and/or pcre_dfa_exec() are flagged
|
||||
# with E and D, respectively. They take precedence over C3, C4, and C5 settings
|
||||
# passed from pcre_compile(). Those that are compatible with JIT execution are
|
||||
# flagged with J.
|
||||
|
||||
const
|
||||
UTF8_ERR0* = 0
|
||||
UTF8_ERR1* = 1
|
||||
UTF8_ERR2* = 2
|
||||
UTF8_ERR3* = 3
|
||||
UTF8_ERR4* = 4
|
||||
UTF8_ERR5* = 5
|
||||
UTF8_ERR6* = 6
|
||||
UTF8_ERR7* = 7
|
||||
UTF8_ERR8* = 8
|
||||
UTF8_ERR9* = 9
|
||||
CASELESS* = 0x00000001 # C1
|
||||
MULTILINE* = 0x00000002 # C1
|
||||
DOTALL* = 0x00000004 # C1
|
||||
EXTENDED* = 0x00000008 # C1
|
||||
ANCHORED* = 0x00000010 # C4 E D
|
||||
DOLLAR_ENDONLY* = 0x00000020 # C2
|
||||
EXTRA* = 0x00000040 # C1
|
||||
NOTBOL* = 0x00000080 # E D J
|
||||
NOTEOL* = 0x00000100 # E D J
|
||||
UNGREEDY* = 0x00000200 # C1
|
||||
NOTEMPTY* = 0x00000400 # E D J
|
||||
UTF8* = 0x00000800 # C4 )
|
||||
UTF16* = 0x00000800 # C4 ) Synonyms
|
||||
UTF32* = 0x00000800 # C4 )
|
||||
NO_AUTO_CAPTURE* = 0x00001000 # C1
|
||||
NO_UTF8_CHECK* = 0x00002000 # C1 E D J )
|
||||
NO_UTF16_CHECK* = 0x00002000 # C1 E D J ) Synonyms
|
||||
NO_UTF32_CHECK* = 0x00002000 # C1 E D J )
|
||||
AUTO_CALLOUT* = 0x00004000 # C1
|
||||
PARTIAL_SOFT* = 0x00008000 # E D J ) Synonyms
|
||||
PARTIAL* = 0x00008000 # E D J )
|
||||
|
||||
# This pair use the same bit.
|
||||
const
|
||||
NEVER_UTF* = 0x00010000 # C1 ) Overlaid
|
||||
DFA_SHORTEST* = 0x00010000 # D ) Overlaid
|
||||
|
||||
# This pair use the same bit.
|
||||
const
|
||||
NO_AUTO_POSSESS* = 0x00020000 # C1 ) Overlaid
|
||||
DFA_RESTART* = 0x00020000 # D ) Overlaid
|
||||
|
||||
const
|
||||
FIRSTLINE* = 0x00040000 # C3
|
||||
DUPNAMES* = 0x00080000 # C1
|
||||
NEWLINE_CR* = 0x00100000 # C3 E D
|
||||
NEWLINE_LF* = 0x00200000 # C3 E D
|
||||
NEWLINE_CRLF* = 0x00300000 # C3 E D
|
||||
NEWLINE_ANY* = 0x00400000 # C3 E D
|
||||
NEWLINE_ANYCRLF* = 0x00500000 # C3 E D
|
||||
BSR_ANYCRLF* = 0x00800000 # C3 E D
|
||||
BSR_UNICODE* = 0x01000000 # C3 E D
|
||||
JAVASCRIPT_COMPAT* = 0x02000000 # C5
|
||||
NO_START_OPTIMIZE* = 0x04000000 # C2 E D ) Synonyms
|
||||
NO_START_OPTIMISE* = 0x04000000 # C2 E D )
|
||||
PARTIAL_HARD* = 0x08000000 # E D J
|
||||
NOTEMPTY_ATSTART* = 0x10000000 # E D J
|
||||
UCP* = 0x20000000 # C3
|
||||
|
||||
## Exec-time and get/set-time error codes
|
||||
const
|
||||
ERROR_NOMATCH* = -1
|
||||
ERROR_NULL* = -2
|
||||
ERROR_BADOPTION* = -3
|
||||
ERROR_BADMAGIC* = -4
|
||||
ERROR_UNKNOWN_OPCODE* = -5
|
||||
ERROR_UNKNOWN_NODE* = -5 ## For backward compatibility
|
||||
ERROR_NOMEMORY* = -6
|
||||
ERROR_NOSUBSTRING* = -7
|
||||
ERROR_MATCHLIMIT* = -8
|
||||
ERROR_CALLOUT* = -9 ## Never used by PCRE itself
|
||||
ERROR_BADUTF8* = -10 ## Same for 8/16/32
|
||||
ERROR_BADUTF16* = -10 ## Same for 8/16/32
|
||||
ERROR_BADUTF32* = -10 ## Same for 8/16/32
|
||||
ERROR_BADUTF8_OFFSET* = -11 ## Same for 8/16
|
||||
ERROR_BADUTF16_OFFSET* = -11 ## Same for 8/16
|
||||
ERROR_PARTIAL* = -12
|
||||
ERROR_BADPARTIAL* = -13
|
||||
ERROR_INTERNAL* = -14
|
||||
ERROR_BADCOUNT* = -15
|
||||
ERROR_DFA_UITEM* = -16
|
||||
ERROR_DFA_UCOND* = -17
|
||||
ERROR_DFA_UMLIMIT* = -18
|
||||
ERROR_DFA_WSSIZE* = -19
|
||||
ERROR_DFA_RECURSE* = -20
|
||||
ERROR_RECURSIONLIMIT* = -21
|
||||
ERROR_NULLWSLIMIT* = -22 ## No longer actually used
|
||||
ERROR_BADNEWLINE* = -23
|
||||
ERROR_BADOFFSET* = -24
|
||||
ERROR_SHORTUTF8* = -25
|
||||
ERROR_SHORTUTF16* = -25 ## Same for 8/16
|
||||
ERROR_RECURSELOOP* = -26
|
||||
ERROR_JIT_STACKLIMIT* = -27
|
||||
ERROR_BADMODE* = -28
|
||||
ERROR_BADENDIANNESS* = -29
|
||||
ERROR_DFA_BADRESTART* = -30
|
||||
ERROR_JIT_BADOPTION* = -31
|
||||
ERROR_BADLENGTH* = -32
|
||||
ERROR_UNSET* = -33
|
||||
|
||||
## Specific error codes for UTF-8 validity checks
|
||||
const
|
||||
UTF8_ERR0* = 0
|
||||
UTF8_ERR1* = 1
|
||||
UTF8_ERR2* = 2
|
||||
UTF8_ERR3* = 3
|
||||
UTF8_ERR4* = 4
|
||||
UTF8_ERR5* = 5
|
||||
UTF8_ERR6* = 6
|
||||
UTF8_ERR7* = 7
|
||||
UTF8_ERR8* = 8
|
||||
UTF8_ERR9* = 9
|
||||
UTF8_ERR10* = 10
|
||||
UTF8_ERR11* = 11
|
||||
UTF8_ERR12* = 12
|
||||
@@ -165,193 +197,305 @@ const
|
||||
UTF8_ERR19* = 19
|
||||
UTF8_ERR20* = 20
|
||||
UTF8_ERR21* = 21
|
||||
UTF8_ERR22* = 22 # Unused (was non-character)
|
||||
|
||||
# Request types for pcre_fullinfo()
|
||||
|
||||
const
|
||||
INFO_OPTIONS* = 0
|
||||
INFO_SIZE* = 1
|
||||
INFO_CAPTURECOUNT* = 2
|
||||
INFO_BACKREFMAX* = 3
|
||||
INFO_FIRSTBYTE* = 4
|
||||
INFO_FIRSTCHAR* = 4 # For backwards compatibility
|
||||
INFO_FIRSTTABLE* = 5
|
||||
INFO_LASTLITERAL* = 6
|
||||
INFO_NAMEENTRYSIZE* = 7
|
||||
INFO_NAMECOUNT* = 8
|
||||
INFO_NAMETABLE* = 9
|
||||
INFO_STUDYSIZE* = 10
|
||||
INFO_DEFAULT_TABLES* = 11
|
||||
INFO_OKPARTIAL* = 12
|
||||
INFO_JCHANGED* = 13
|
||||
INFO_HASCRORLF* = 14
|
||||
INFO_MINLENGTH* = 15
|
||||
INFO_JIT* = 16
|
||||
INFO_JITSIZE* = 17
|
||||
INFO_MAXLOOKBEHIND* = 18
|
||||
|
||||
# Request types for pcre_config(). Do not re-arrange, in order to remain
|
||||
# compatible.
|
||||
|
||||
const
|
||||
CONFIG_UTF8* = 0
|
||||
CONFIG_NEWLINE* = 1
|
||||
CONFIG_LINK_SIZE* = 2
|
||||
CONFIG_POSIX_MALLOC_THRESHOLD* = 3
|
||||
CONFIG_MATCH_LIMIT* = 4
|
||||
CONFIG_STACKRECURSE* = 5
|
||||
CONFIG_UNICODE_PROPERTIES* = 6
|
||||
CONFIG_MATCH_LIMIT_RECURSION* = 7
|
||||
CONFIG_BSR* = 8
|
||||
CONFIG_JIT* = 9
|
||||
CONFIG_JITTARGET* = 11
|
||||
|
||||
# Request types for pcre_study(). Do not re-arrange, in order to remain
|
||||
# compatible.
|
||||
|
||||
## Specific error codes for UTF-16 validity checks
|
||||
const
|
||||
STUDY_JIT_COMPILE* = 0x00000001
|
||||
STUDY_JIT_PARTIAL_SOFT_COMPILE* = 0x00000002
|
||||
STUDY_JIT_PARTIAL_HARD_COMPILE* = 0x00000004
|
||||
UTF16_ERR0* = 0
|
||||
UTF16_ERR1* = 1
|
||||
UTF16_ERR2* = 2
|
||||
UTF16_ERR3* = 3
|
||||
UTF16_ERR4* = 4 # Unused (was non-character)
|
||||
|
||||
# Bit flags for the pcre_extra structure. Do not re-arrange or redefine
|
||||
# these bits, just add new ones on the end, in order to remain compatible.
|
||||
## Specific error codes for UTF-32 validity checks
|
||||
const
|
||||
UTF32_ERR0* = 0
|
||||
UTF32_ERR1* = 1
|
||||
UTF32_ERR2* = 2 # Unused (was non-character)
|
||||
UTF32_ERR3* = 3
|
||||
|
||||
const
|
||||
EXTRA_STUDY_DATA* = 0x00000001
|
||||
EXTRA_MATCH_LIMIT* = 0x00000002
|
||||
EXTRA_CALLOUT_DATA* = 0x00000004
|
||||
EXTRA_TABLES* = 0x00000008
|
||||
EXTRA_MATCH_LIMIT_RECURSION* = 0x00000010
|
||||
EXTRA_MARK* = 0x00000020
|
||||
EXTRA_EXECUTABLE_JIT* = 0x00000040
|
||||
## Request types for pcre_fullinfo()
|
||||
const
|
||||
INFO_OPTIONS* = 0
|
||||
INFO_SIZE* = 1
|
||||
INFO_CAPTURECOUNT* = 2
|
||||
INFO_BACKREFMAX* = 3
|
||||
INFO_FIRSTBYTE* = 4
|
||||
INFO_FIRSTCHAR* = 4 ## For backwards compatibility
|
||||
INFO_FIRSTTABLE* = 5
|
||||
INFO_LASTLITERAL* = 6
|
||||
INFO_NAMEENTRYSIZE* = 7
|
||||
INFO_NAMECOUNT* = 8
|
||||
INFO_NAMETABLE* = 9
|
||||
INFO_STUDYSIZE* = 10
|
||||
INFO_DEFAULT_TABLES* = 11
|
||||
INFO_OKPARTIAL* = 12
|
||||
INFO_JCHANGED* = 13
|
||||
INFO_HASCRORLF* = 14
|
||||
INFO_MINLENGTH* = 15
|
||||
INFO_JIT* = 16
|
||||
INFO_JITSIZE* = 17
|
||||
INFO_MAXLOOKBEHIND* = 18
|
||||
INFO_FIRSTCHARACTER* = 19
|
||||
INFO_FIRSTCHARACTERFLAGS* = 20
|
||||
INFO_REQUIREDCHAR* = 21
|
||||
INFO_REQUIREDCHARFLAGS* = 22
|
||||
INFO_MATCHLIMIT* = 23
|
||||
INFO_RECURSIONLIMIT* = 24
|
||||
INFO_MATCH_EMPTY* = 25
|
||||
|
||||
# Types
|
||||
## Request types for pcre_config(). Do not re-arrange, in order to remain
|
||||
## compatible.
|
||||
const
|
||||
CONFIG_UTF8* = 0
|
||||
CONFIG_NEWLINE* = 1
|
||||
CONFIG_LINK_SIZE* = 2
|
||||
CONFIG_POSIX_MALLOC_THRESHOLD* = 3
|
||||
CONFIG_MATCH_LIMIT* = 4
|
||||
CONFIG_STACKRECURSE* = 5
|
||||
CONFIG_UNICODE_PROPERTIES* = 6
|
||||
CONFIG_MATCH_LIMIT_RECURSION* = 7
|
||||
CONFIG_BSR* = 8
|
||||
CONFIG_JIT* = 9
|
||||
CONFIG_UTF16* = 10
|
||||
CONFIG_JITTARGET* = 11
|
||||
CONFIG_UTF32* = 12
|
||||
CONFIG_PARENS_LIMIT* = 13
|
||||
|
||||
type
|
||||
TPcre*{.pure, final.} = object
|
||||
PPcre* = ptr TPcre
|
||||
Tjit_stack*{.pure, final.} = object
|
||||
Pjit_stack* = ptr Tjit_stack
|
||||
## Request types for pcre_study(). Do not re-arrange, in order to remain
|
||||
## compatible.
|
||||
const
|
||||
STUDY_JIT_COMPILE* = 0x0001
|
||||
STUDY_JIT_PARTIAL_SOFT_COMPILE* = 0x0002
|
||||
STUDY_JIT_PARTIAL_HARD_COMPILE* = 0x0004
|
||||
STUDY_EXTRA_NEEDED* = 0x0008
|
||||
|
||||
# When PCRE is compiled as a C++ library, the subject pointer type can be
|
||||
# replaced with a custom type. For conventional use, the public interface is a
|
||||
# const char *.
|
||||
|
||||
# The structure for passing additional data to pcre_exec(). This is defined in
|
||||
# such as way as to be extensible. Always add new fields at the end, in order to
|
||||
# remain compatible.
|
||||
|
||||
type
|
||||
TExtra*{.pure, final.} = object
|
||||
flags*: int ## Bits for which fields are set
|
||||
study_data*: pointer ## Opaque data from pcre_study()
|
||||
match_limit*: int ## Maximum number of calls to match()
|
||||
callout_data*: pointer ## Data passed back in callouts
|
||||
tables*: cstring ## Pointer to character tables
|
||||
match_limit_recursion*: int ## Max recursive calls to match()
|
||||
mark*: ptr cstring ## For passing back a mark pointer
|
||||
executable_jit*: pointer ## Contains a pointer to a compiled jit code
|
||||
|
||||
|
||||
# The structure for passing out data via the pcre_callout_function. We use a
|
||||
# structure so that new fields can be added on the end in future versions,
|
||||
# without changing the API of the function, thereby allowing old clients to work
|
||||
# without modification.
|
||||
|
||||
type
|
||||
TCalloutBlock*{.pure, final.} = object
|
||||
version*: cint ## Identifies version of block
|
||||
callout_number*: cint ## Number compiled into pattern
|
||||
offset_vector*: ptr cint ## The offset vector
|
||||
subject*: cstring ## The subject being matched
|
||||
subject_length*: cint ## The length of the subject
|
||||
start_match*: cint ## Offset to start of this match attempt
|
||||
current_position*: cint ## Where we currently are in the subject
|
||||
capture_top*: cint ## Max current capture
|
||||
capture_last*: cint ## Most recently closed capture
|
||||
callout_data*: pointer ## Data passed in with the call
|
||||
pattern_position*: cint ## Offset to next item in the pattern
|
||||
next_item_length*: cint ## Length of next item in the pattern
|
||||
mark*: cstring ## Pointer to current mark or NULL
|
||||
|
||||
# Indirection for store get and free functions. These can be set to
|
||||
#alternative malloc/free functions if required. Special ones are used in the
|
||||
#non-recursive case for "frames". There is also an optional callout function
|
||||
#that is triggered by the (?) regex item. For Virtual Pascal, these definitions
|
||||
#have to take another form.
|
||||
|
||||
# User defined callback which provides a stack just before the match starts.
|
||||
## Bit flags for the pcre[16|32]_extra structure. Do not re-arrange or redefine
|
||||
## these bits, just add new ones on the end, in order to remain compatible.
|
||||
const
|
||||
EXTRA_STUDY_DATA* = 0x0001
|
||||
EXTRA_MATCH_LIMIT* = 0x0002
|
||||
EXTRA_CALLOUT_DATA* = 0x0004
|
||||
EXTRA_TABLES* = 0x0008
|
||||
EXTRA_MATCH_LIMIT_RECURSION* = 0x0010
|
||||
EXTRA_MARK* = 0x0020
|
||||
EXTRA_EXECUTABLE_JIT* = 0x0040
|
||||
|
||||
## Types
|
||||
type
|
||||
TJitCallback* = proc(p: pointer): ptr Tjit_stack{.cdecl.}
|
||||
Pcre* = object
|
||||
Pcre16* = object
|
||||
Pcre32* = object
|
||||
JitStack* = object
|
||||
JitStack16* = object
|
||||
JitStack32* = object
|
||||
|
||||
# Exported PCRE functions
|
||||
|
||||
proc compile*(a2: cstring, a3: cint, a4: ptr cstring, a5: ptr cint,
|
||||
a6: ptr char): ptr TPcre{.cdecl, importc: "pcre_compile",
|
||||
pcreImport.}
|
||||
proc compile2*(a2: cstring, a3: cint, a4: ptr cint, a5: ptr cstring,
|
||||
a6: ptr cint, a7: ptr char): ptr TPcre{.cdecl,
|
||||
importc: "pcre_compile2", pcreImport.}
|
||||
proc config*(a2: cint, a3: pointer): cint{.cdecl, importc: "pcre_config",
|
||||
pcreImport.}
|
||||
proc copy_named_substring*(a2: ptr TPcre, a3: cstring, a4: ptr cint, a5: cint,
|
||||
a6: cstring, a7: cstring, a8: cint): cint{.cdecl,
|
||||
importc: "pcre_copy_named_substring", pcreImport.}
|
||||
proc copy_substring*(a2: cstring, a3: ptr cint, a4: cint, a5: cint,
|
||||
a6: cstring,
|
||||
a7: cint): cint{.cdecl, importc: "pcre_copy_substring",
|
||||
pcreImport.}
|
||||
proc dfa_exec*(a2: ptr TPcre, a3: ptr TExtra, a4: cstring, a5: cint,
|
||||
a6: cint, a7: cint, a8: ptr cint, a9: cint, a10: ptr cint,
|
||||
a11: cint): cint{.cdecl, importc: "pcre_dfa_exec",
|
||||
pcreImport.}
|
||||
proc exec*(a2: ptr TPcre, a3: ptr TExtra, a4: cstring, a5: cint, a6: cint,
|
||||
a7: cint, a8: ptr cint, a9: cint): cint {.
|
||||
cdecl, importc: "pcre_exec", pcreImport.}
|
||||
proc free_substring*(a2: cstring){.cdecl, importc: "pcre_free_substring",
|
||||
pcreImport.}
|
||||
proc free_substring_list*(a2: cstringArray){.cdecl,
|
||||
importc: "pcre_free_substring_list", pcreImport.}
|
||||
proc fullinfo*(a2: ptr TPcre, a3: ptr TExtra, a4: cint, a5: pointer): cint{.
|
||||
cdecl, importc: "pcre_fullinfo", pcreImport.}
|
||||
proc get_named_substring*(a2: ptr TPcre, a3: cstring, a4: ptr cint, a5: cint,
|
||||
a6: cstring, a7: cstringArray): cint{.cdecl,
|
||||
importc: "pcre_get_named_substring", pcreImport.}
|
||||
proc get_stringnumber*(a2: ptr TPcre, a3: cstring): cint{.cdecl,
|
||||
importc: "pcre_get_stringnumber", pcreImport.}
|
||||
proc get_stringtable_entries*(a2: ptr TPcre, a3: cstring, a4: cstringArray,
|
||||
a5: cstringArray): cint{.cdecl,
|
||||
importc: "pcre_get_stringtable_entries", pcreImport.}
|
||||
proc get_substring*(a2: cstring, a3: ptr cint, a4: cint, a5: cint,
|
||||
a6: cstringArray): cint{.cdecl,
|
||||
importc: "pcre_get_substring", pcreImport.}
|
||||
proc get_substring_list*(a2: cstring, a3: ptr cint, a4: cint,
|
||||
a5: ptr cstringArray): cint{.cdecl,
|
||||
importc: "pcre_get_substring_list", pcreImport.}
|
||||
proc maketables*(): ptr char{.cdecl, importc: "pcre_maketables",
|
||||
pcreImport.}
|
||||
proc refcount*(a2: ptr TPcre, a3: cint): cint{.cdecl, importc: "pcre_refcount",
|
||||
pcreImport.}
|
||||
proc study*(a2: ptr TPcre, a3: cint, a4: var cstring): ptr TExtra{.cdecl,
|
||||
importc: "pcre_study", pcreImport.}
|
||||
proc version*(): cstring{.cdecl, importc: "pcre_version", pcreImport.}
|
||||
## The structure for passing additional data to pcre_exec(). This is defined in
|
||||
## such as way as to be extensible. Always add new fields at the end, in order
|
||||
## to remain compatible.
|
||||
type
|
||||
ExtraData* = object
|
||||
flags*: clong ## Bits for which fields are set
|
||||
study_data*: pointer ## Opaque data from pcre_study()
|
||||
match_limit*: clong ## Maximum number of calls to match()
|
||||
callout_data*: pointer ## Data passed back in callouts
|
||||
tables*: pointer ## Pointer to character tables
|
||||
match_limit_recursion*: clong ## Max recursive calls to match()
|
||||
mark*: pointer ## For passing back a mark pointer
|
||||
executable_jit*: pointer ## Contains a pointer to a compiled jit code
|
||||
|
||||
## The structure for passing out data via the pcre_callout_function. We use a
|
||||
## structure so that new fields can be added on the end in future versions,
|
||||
## without changing the API of the function, thereby allowing old clients to
|
||||
## work without modification.
|
||||
type
|
||||
CalloutBlock* = object
|
||||
version* : cint ## Identifies version of block
|
||||
# ------------------------ Version 0 -------------------------------
|
||||
callout_number* : cint ## Number compiled into pattern
|
||||
offset_vector* : ptr cint ## The offset vector
|
||||
subject* : cstring ## The subject being matched
|
||||
subject_length* : cint ## The length of the subject
|
||||
start_match* : cint ## Offset to start of this match attempt
|
||||
current_position*: cint ## Where we currently are in the subject
|
||||
capture_top* : cint ## Max current capture
|
||||
capture_last* : cint ## Most recently closed capture
|
||||
callout_data* : pointer ## Data passed in with the call
|
||||
# ------------------- Added for Version 1 --------------------------
|
||||
pattern_position*: cint ## Offset to next item in the pattern
|
||||
next_item_length*: cint ## Length of next item in the pattern
|
||||
# ------------------- Added for Version 2 --------------------------
|
||||
mark* : pointer ## Pointer to current mark or NULL
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
|
||||
## User defined callback which provides a stack just before the match starts.
|
||||
type
|
||||
JitCallback* = proc (a: pointer): ptr JitStack {.cdecl.}
|
||||
|
||||
|
||||
when not defined(usePcreHeader):
|
||||
when hostOS == "windows":
|
||||
const pcreDll = "pcre.dll"
|
||||
elif hostOS == "macosx":
|
||||
const pcreDll = "libpcre(.3|.1|).dylib"
|
||||
else:
|
||||
const pcreDll = "libpcre.so(.3|.1|)"
|
||||
{.push dynlib: pcreDll.}
|
||||
else:
|
||||
{.push header: "<pcre.h>".}
|
||||
|
||||
{.push cdecl, importc: "pcre_$1".}
|
||||
|
||||
# Exported PCRE functions
|
||||
|
||||
proc compile*(pattern: cstring,
|
||||
options: cint,
|
||||
errptr: ptr cstring,
|
||||
erroffset: ptr cint,
|
||||
tableptr: pointer): ptr Pcre
|
||||
|
||||
proc compile2*(pattern: cstring,
|
||||
options: cint,
|
||||
errorcodeptr: ptr cint,
|
||||
errptr: ptr cstring,
|
||||
erroffset: ptr cint,
|
||||
tableptr: pointer): ptr Pcre
|
||||
|
||||
proc config*(what: cint,
|
||||
where: pointer): cint
|
||||
|
||||
proc copy_named_substring*(code: ptr Pcre,
|
||||
subject: cstring,
|
||||
ovector: ptr cint,
|
||||
stringcount: cint,
|
||||
stringname: cstring,
|
||||
buffer: cstring,
|
||||
buffersize: cint): cint
|
||||
|
||||
proc copy_substring*(subject: cstring,
|
||||
ovector: ptr cint,
|
||||
stringcount: cint,
|
||||
stringnumber: cint,
|
||||
buffer: cstring,
|
||||
buffersize: cint): cint
|
||||
|
||||
proc dfa_exec*(code: ptr Pcre,
|
||||
extra: ptr ExtraData,
|
||||
subject: cstring,
|
||||
length: cint,
|
||||
startoffset: cint,
|
||||
options: cint,
|
||||
ovector: ptr cint,
|
||||
ovecsize: cint,
|
||||
workspace: ptr cint,
|
||||
wscount: cint): cint
|
||||
|
||||
proc exec*(code: ptr Pcre,
|
||||
extra: ptr ExtraData,
|
||||
subject: cstring,
|
||||
length: cint,
|
||||
startoffset: cint,
|
||||
options: cint,
|
||||
ovector: ptr cint,
|
||||
ovecsize: cint): cint
|
||||
|
||||
proc jit_exec*(code: ptr Pcre,
|
||||
extra: ptr ExtraData,
|
||||
subject: cstring,
|
||||
length: cint,
|
||||
startoffset: cint,
|
||||
options: cint,
|
||||
ovector: ptr cint,
|
||||
ovecsize: cint,
|
||||
jstack: ptr JitStack): cint
|
||||
|
||||
proc free_substring*(stringptr: cstring)
|
||||
|
||||
proc free_substring_list*(stringptr: cstringArray)
|
||||
|
||||
proc fullinfo*(code: ptr Pcre,
|
||||
extra: ptr ExtraData,
|
||||
what: cint,
|
||||
where: pointer): cint
|
||||
|
||||
proc get_named_substring*(code: ptr Pcre,
|
||||
subject: cstring,
|
||||
ovector: ptr cint,
|
||||
stringcount: cint,
|
||||
stringname: cstring,
|
||||
stringptr: cstringArray): cint
|
||||
|
||||
proc get_stringnumber*(code: ptr Pcre,
|
||||
name: cstring): cint
|
||||
|
||||
proc get_stringtable_entries*(code: ptr Pcre,
|
||||
name: cstring,
|
||||
first: cstringArray,
|
||||
last: cstringArray): cint
|
||||
|
||||
proc get_substring*(subject: cstring,
|
||||
ovector: ptr cint,
|
||||
stringcount: cint,
|
||||
stringnumber: cint,
|
||||
stringptr: cstringArray): cint
|
||||
|
||||
proc get_substring_list*(subject: cstring,
|
||||
ovector: ptr cint,
|
||||
stringcount: cint,
|
||||
listptr: ptr cstringArray): cint
|
||||
|
||||
proc maketables*(): pointer
|
||||
|
||||
proc refcount*(code: ptr Pcre,
|
||||
adjust: cint): cint
|
||||
|
||||
proc study*(code: ptr Pcre,
|
||||
options: cint,
|
||||
errptr: ptr cstring): ptr ExtraData
|
||||
|
||||
proc free_study*(extra: ptr ExtraData)
|
||||
|
||||
proc version*(): cstring
|
||||
|
||||
# Utility functions for byte order swaps.
|
||||
|
||||
proc pattern_to_host_byte_order*(a2: ptr TPcre, a3: ptr TExtra,
|
||||
a4: ptr char): cint{.cdecl, importc: "pcre_pattern_to_host_byte_order",
|
||||
pcreImport.}
|
||||
proc pattern_to_host_byte_order*(code: ptr Pcre,
|
||||
extra: ptr ExtraData,
|
||||
tables: pointer): cint
|
||||
|
||||
# JIT compiler related functions.
|
||||
|
||||
proc jit_stack_alloc*(a2: cint, a3: cint): ptr Tjit_stack{.cdecl,
|
||||
importc: "pcre_jit_stack_alloc", pcreImport.}
|
||||
proc jit_stack_free*(a2: ptr Tjit_stack){.cdecl, importc: "pcre_jit_stack_free",
|
||||
pcreImport.}
|
||||
proc assign_jit_stack*(a2: ptr TExtra, a3: TJitCallback, a4: pointer){.cdecl,
|
||||
importc: "pcre_assign_jit_stack", pcreImport.}
|
||||
proc jit_stack_alloc*(startsize: cint,
|
||||
maxsize: cint): ptr JitStack
|
||||
|
||||
var
|
||||
pcre_free*: proc (p: ptr TPcre) {.cdecl.}
|
||||
proc jit_stack_free*(stack: ptr JitStack)
|
||||
|
||||
proc assign_jit_stack*(extra: ptr ExtraData,
|
||||
callback: JitCallback,
|
||||
data: pointer)
|
||||
|
||||
proc jit_free_unused_memory*()
|
||||
|
||||
|
||||
# There was an odd function with `var cstring` instead of `ptr`
|
||||
proc study*(code: ptr Pcre,
|
||||
options: cint,
|
||||
errptr: var cstring): ptr ExtraData {.deprecated.}
|
||||
|
||||
{.pop.}
|
||||
{.pop.}
|
||||
|
||||
|
||||
{.deprecated: [MAJOR: PCRE_MAJOR, MINOR: PCRE_MINOR,
|
||||
PRERELEASE: PCRE_PRERELEASE, DATE: PCRE_DATE].}
|
||||
|
||||
{.deprecated: [TPcre: Pcre, TJitStack: JitStack].}
|
||||
type
|
||||
PPcre* {.deprecated.} = ptr Pcre
|
||||
PJitStack* {.deprecated.} = ptr JitStack
|
||||
|
||||
{.deprecated: [TExtra: ExtraData].}
|
||||
{.deprecated: [TCalloutBlock: CalloutBlock].}
|
||||
{.deprecated: [TJitCallback: JitCallback].}
|
||||
|
||||
Reference in New Issue
Block a user