1*22dc650dSSadaf Ebrahimi /*************************************************
2*22dc650dSSadaf Ebrahimi * Perl-Compatible Regular Expressions *
3*22dc650dSSadaf Ebrahimi *************************************************/
4*22dc650dSSadaf Ebrahimi
5*22dc650dSSadaf Ebrahimi /* PCRE is a library of functions to support regular expressions whose syntax
6*22dc650dSSadaf Ebrahimi and semantics are as close as possible to those of the Perl 5 language.
7*22dc650dSSadaf Ebrahimi
8*22dc650dSSadaf Ebrahimi Written by Philip Hazel
9*22dc650dSSadaf Ebrahimi Original API code Copyright (c) 1997-2012 University of Cambridge
10*22dc650dSSadaf Ebrahimi New API code Copyright (c) 2016-2020 University of Cambridge
11*22dc650dSSadaf Ebrahimi
12*22dc650dSSadaf Ebrahimi -----------------------------------------------------------------------------
13*22dc650dSSadaf Ebrahimi Redistribution and use in source and binary forms, with or without
14*22dc650dSSadaf Ebrahimi modification, are permitted provided that the following conditions are met:
15*22dc650dSSadaf Ebrahimi
16*22dc650dSSadaf Ebrahimi * Redistributions of source code must retain the above copyright notice,
17*22dc650dSSadaf Ebrahimi this list of conditions and the following disclaimer.
18*22dc650dSSadaf Ebrahimi
19*22dc650dSSadaf Ebrahimi * Redistributions in binary form must reproduce the above copyright
20*22dc650dSSadaf Ebrahimi notice, this list of conditions and the following disclaimer in the
21*22dc650dSSadaf Ebrahimi documentation and/or other materials provided with the distribution.
22*22dc650dSSadaf Ebrahimi
23*22dc650dSSadaf Ebrahimi * Neither the name of the University of Cambridge nor the names of its
24*22dc650dSSadaf Ebrahimi contributors may be used to endorse or promote products derived from
25*22dc650dSSadaf Ebrahimi this software without specific prior written permission.
26*22dc650dSSadaf Ebrahimi
27*22dc650dSSadaf Ebrahimi THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
28*22dc650dSSadaf Ebrahimi AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29*22dc650dSSadaf Ebrahimi IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30*22dc650dSSadaf Ebrahimi ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
31*22dc650dSSadaf Ebrahimi LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32*22dc650dSSadaf Ebrahimi CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33*22dc650dSSadaf Ebrahimi SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34*22dc650dSSadaf Ebrahimi INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35*22dc650dSSadaf Ebrahimi CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36*22dc650dSSadaf Ebrahimi ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37*22dc650dSSadaf Ebrahimi POSSIBILITY OF SUCH DAMAGE.
38*22dc650dSSadaf Ebrahimi -----------------------------------------------------------------------------
39*22dc650dSSadaf Ebrahimi */
40*22dc650dSSadaf Ebrahimi
41*22dc650dSSadaf Ebrahimi #ifdef HAVE_CONFIG_H
42*22dc650dSSadaf Ebrahimi #include "config.h"
43*22dc650dSSadaf Ebrahimi #endif
44*22dc650dSSadaf Ebrahimi
45*22dc650dSSadaf Ebrahimi /* Save the configured link size, which is in bytes. In 16-bit and 32-bit modes
46*22dc650dSSadaf Ebrahimi its value gets changed by pcre2_intmodedep.h (included by pcre2_internal.h) to
47*22dc650dSSadaf Ebrahimi be in code units. */
48*22dc650dSSadaf Ebrahimi
49*22dc650dSSadaf Ebrahimi static int configured_link_size = LINK_SIZE;
50*22dc650dSSadaf Ebrahimi
51*22dc650dSSadaf Ebrahimi #include "pcre2_internal.h"
52*22dc650dSSadaf Ebrahimi
53*22dc650dSSadaf Ebrahimi /* These macros are the standard way of turning unquoted text into C strings.
54*22dc650dSSadaf Ebrahimi They allow macros like PCRE2_MAJOR to be defined without quotes, which is
55*22dc650dSSadaf Ebrahimi convenient for user programs that want to test their values. */
56*22dc650dSSadaf Ebrahimi
57*22dc650dSSadaf Ebrahimi #define STRING(a) # a
58*22dc650dSSadaf Ebrahimi #define XSTRING(s) STRING(s)
59*22dc650dSSadaf Ebrahimi
60*22dc650dSSadaf Ebrahimi
61*22dc650dSSadaf Ebrahimi /*************************************************
62*22dc650dSSadaf Ebrahimi * Return info about what features are configured *
63*22dc650dSSadaf Ebrahimi *************************************************/
64*22dc650dSSadaf Ebrahimi
65*22dc650dSSadaf Ebrahimi /* If where is NULL, the length of memory required is returned.
66*22dc650dSSadaf Ebrahimi
67*22dc650dSSadaf Ebrahimi Arguments:
68*22dc650dSSadaf Ebrahimi what what information is required
69*22dc650dSSadaf Ebrahimi where where to put the information
70*22dc650dSSadaf Ebrahimi
71*22dc650dSSadaf Ebrahimi Returns: 0 if a numerical value is returned
72*22dc650dSSadaf Ebrahimi >= 0 if a string value
73*22dc650dSSadaf Ebrahimi PCRE2_ERROR_BADOPTION if "where" not recognized
74*22dc650dSSadaf Ebrahimi or JIT target requested when JIT not enabled
75*22dc650dSSadaf Ebrahimi */
76*22dc650dSSadaf Ebrahimi
77*22dc650dSSadaf Ebrahimi PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_config(uint32_t what,void * where)78*22dc650dSSadaf Ebrahimi pcre2_config(uint32_t what, void *where)
79*22dc650dSSadaf Ebrahimi {
80*22dc650dSSadaf Ebrahimi if (where == NULL) /* Requests a length */
81*22dc650dSSadaf Ebrahimi {
82*22dc650dSSadaf Ebrahimi switch(what)
83*22dc650dSSadaf Ebrahimi {
84*22dc650dSSadaf Ebrahimi default:
85*22dc650dSSadaf Ebrahimi return PCRE2_ERROR_BADOPTION;
86*22dc650dSSadaf Ebrahimi
87*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_BSR:
88*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_COMPILED_WIDTHS:
89*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_DEPTHLIMIT:
90*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_HEAPLIMIT:
91*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_JIT:
92*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_LINKSIZE:
93*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_MATCHLIMIT:
94*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_NEVER_BACKSLASH_C:
95*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_NEWLINE:
96*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_PARENSLIMIT:
97*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_STACKRECURSE: /* Obsolete */
98*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_TABLES_LENGTH:
99*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_UNICODE:
100*22dc650dSSadaf Ebrahimi return sizeof(uint32_t);
101*22dc650dSSadaf Ebrahimi
102*22dc650dSSadaf Ebrahimi /* These are handled below */
103*22dc650dSSadaf Ebrahimi
104*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_JITTARGET:
105*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_UNICODE_VERSION:
106*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_VERSION:
107*22dc650dSSadaf Ebrahimi break;
108*22dc650dSSadaf Ebrahimi }
109*22dc650dSSadaf Ebrahimi }
110*22dc650dSSadaf Ebrahimi
111*22dc650dSSadaf Ebrahimi switch (what)
112*22dc650dSSadaf Ebrahimi {
113*22dc650dSSadaf Ebrahimi default:
114*22dc650dSSadaf Ebrahimi return PCRE2_ERROR_BADOPTION;
115*22dc650dSSadaf Ebrahimi
116*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_BSR:
117*22dc650dSSadaf Ebrahimi #ifdef BSR_ANYCRLF
118*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = PCRE2_BSR_ANYCRLF;
119*22dc650dSSadaf Ebrahimi #else
120*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = PCRE2_BSR_UNICODE;
121*22dc650dSSadaf Ebrahimi #endif
122*22dc650dSSadaf Ebrahimi break;
123*22dc650dSSadaf Ebrahimi
124*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_COMPILED_WIDTHS:
125*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 0
126*22dc650dSSadaf Ebrahimi #ifdef SUPPORT_PCRE2_8
127*22dc650dSSadaf Ebrahimi + 1
128*22dc650dSSadaf Ebrahimi #endif
129*22dc650dSSadaf Ebrahimi #ifdef SUPPORT_PCRE2_16
130*22dc650dSSadaf Ebrahimi + 2
131*22dc650dSSadaf Ebrahimi #endif
132*22dc650dSSadaf Ebrahimi #ifdef SUPPORT_PCRE2_32
133*22dc650dSSadaf Ebrahimi + 4
134*22dc650dSSadaf Ebrahimi #endif
135*22dc650dSSadaf Ebrahimi ;
136*22dc650dSSadaf Ebrahimi break;
137*22dc650dSSadaf Ebrahimi
138*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_DEPTHLIMIT:
139*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = MATCH_LIMIT_DEPTH;
140*22dc650dSSadaf Ebrahimi break;
141*22dc650dSSadaf Ebrahimi
142*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_HEAPLIMIT:
143*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = HEAP_LIMIT;
144*22dc650dSSadaf Ebrahimi break;
145*22dc650dSSadaf Ebrahimi
146*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_JIT:
147*22dc650dSSadaf Ebrahimi #ifdef SUPPORT_JIT
148*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 1;
149*22dc650dSSadaf Ebrahimi #else
150*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 0;
151*22dc650dSSadaf Ebrahimi #endif
152*22dc650dSSadaf Ebrahimi break;
153*22dc650dSSadaf Ebrahimi
154*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_JITTARGET:
155*22dc650dSSadaf Ebrahimi #ifdef SUPPORT_JIT
156*22dc650dSSadaf Ebrahimi {
157*22dc650dSSadaf Ebrahimi const char *v = PRIV(jit_get_target)();
158*22dc650dSSadaf Ebrahimi return (int)(1 + ((where == NULL)?
159*22dc650dSSadaf Ebrahimi strlen(v) : PRIV(strcpy_c8)((PCRE2_UCHAR *)where, v)));
160*22dc650dSSadaf Ebrahimi }
161*22dc650dSSadaf Ebrahimi #else
162*22dc650dSSadaf Ebrahimi return PCRE2_ERROR_BADOPTION;
163*22dc650dSSadaf Ebrahimi #endif
164*22dc650dSSadaf Ebrahimi
165*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_LINKSIZE:
166*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = (uint32_t)configured_link_size;
167*22dc650dSSadaf Ebrahimi break;
168*22dc650dSSadaf Ebrahimi
169*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_MATCHLIMIT:
170*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = MATCH_LIMIT;
171*22dc650dSSadaf Ebrahimi break;
172*22dc650dSSadaf Ebrahimi
173*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_NEWLINE:
174*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = NEWLINE_DEFAULT;
175*22dc650dSSadaf Ebrahimi break;
176*22dc650dSSadaf Ebrahimi
177*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_NEVER_BACKSLASH_C:
178*22dc650dSSadaf Ebrahimi #ifdef NEVER_BACKSLASH_C
179*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 1;
180*22dc650dSSadaf Ebrahimi #else
181*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 0;
182*22dc650dSSadaf Ebrahimi #endif
183*22dc650dSSadaf Ebrahimi break;
184*22dc650dSSadaf Ebrahimi
185*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_PARENSLIMIT:
186*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = PARENS_NEST_LIMIT;
187*22dc650dSSadaf Ebrahimi break;
188*22dc650dSSadaf Ebrahimi
189*22dc650dSSadaf Ebrahimi /* This is now obsolete. The stack is no longer used via recursion for
190*22dc650dSSadaf Ebrahimi handling backtracking in pcre2_match(). */
191*22dc650dSSadaf Ebrahimi
192*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_STACKRECURSE:
193*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 0;
194*22dc650dSSadaf Ebrahimi break;
195*22dc650dSSadaf Ebrahimi
196*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_TABLES_LENGTH:
197*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = TABLES_LENGTH;
198*22dc650dSSadaf Ebrahimi break;
199*22dc650dSSadaf Ebrahimi
200*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_UNICODE_VERSION:
201*22dc650dSSadaf Ebrahimi {
202*22dc650dSSadaf Ebrahimi #if defined SUPPORT_UNICODE
203*22dc650dSSadaf Ebrahimi const char *v = PRIV(unicode_version);
204*22dc650dSSadaf Ebrahimi #else
205*22dc650dSSadaf Ebrahimi const char *v = "Unicode not supported";
206*22dc650dSSadaf Ebrahimi #endif
207*22dc650dSSadaf Ebrahimi return (int)(1 + ((where == NULL)?
208*22dc650dSSadaf Ebrahimi strlen(v) : PRIV(strcpy_c8)((PCRE2_UCHAR *)where, v)));
209*22dc650dSSadaf Ebrahimi }
210*22dc650dSSadaf Ebrahimi break;
211*22dc650dSSadaf Ebrahimi
212*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_UNICODE:
213*22dc650dSSadaf Ebrahimi #if defined SUPPORT_UNICODE
214*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 1;
215*22dc650dSSadaf Ebrahimi #else
216*22dc650dSSadaf Ebrahimi *((uint32_t *)where) = 0;
217*22dc650dSSadaf Ebrahimi #endif
218*22dc650dSSadaf Ebrahimi break;
219*22dc650dSSadaf Ebrahimi
220*22dc650dSSadaf Ebrahimi /* The hackery in setting "v" below is to cope with the case when
221*22dc650dSSadaf Ebrahimi PCRE2_PRERELEASE is set to an empty string (which it is for real releases).
222*22dc650dSSadaf Ebrahimi If the second alternative is used in this case, it does not leave a space
223*22dc650dSSadaf Ebrahimi before the date. On the other hand, if all four macros are put into a single
224*22dc650dSSadaf Ebrahimi XSTRING when PCRE2_PRERELEASE is not empty, an unwanted space is inserted.
225*22dc650dSSadaf Ebrahimi There are problems using an "obvious" approach like this:
226*22dc650dSSadaf Ebrahimi
227*22dc650dSSadaf Ebrahimi XSTRING(PCRE2_MAJOR) "." XSTRING(PCRE_MINOR)
228*22dc650dSSadaf Ebrahimi XSTRING(PCRE2_PRERELEASE) " " XSTRING(PCRE_DATE)
229*22dc650dSSadaf Ebrahimi
230*22dc650dSSadaf Ebrahimi because, when PCRE2_PRERELEASE is empty, this leads to an attempted expansion
231*22dc650dSSadaf Ebrahimi of STRING(). The C standard states: "If (before argument substitution) any
232*22dc650dSSadaf Ebrahimi argument consists of no preprocessing tokens, the behavior is undefined." It
233*22dc650dSSadaf Ebrahimi turns out the gcc treats this case as a single empty string - which is what
234*22dc650dSSadaf Ebrahimi we really want - but Visual C grumbles about the lack of an argument for the
235*22dc650dSSadaf Ebrahimi macro. Unfortunately, both are within their rights. As there seems to be no
236*22dc650dSSadaf Ebrahimi way to test for a macro's value being empty at compile time, we have to
237*22dc650dSSadaf Ebrahimi resort to a runtime test. */
238*22dc650dSSadaf Ebrahimi
239*22dc650dSSadaf Ebrahimi case PCRE2_CONFIG_VERSION:
240*22dc650dSSadaf Ebrahimi {
241*22dc650dSSadaf Ebrahimi const char *v = (XSTRING(Z PCRE2_PRERELEASE)[1] == 0)?
242*22dc650dSSadaf Ebrahimi XSTRING(PCRE2_MAJOR.PCRE2_MINOR PCRE2_DATE) :
243*22dc650dSSadaf Ebrahimi XSTRING(PCRE2_MAJOR.PCRE2_MINOR) XSTRING(PCRE2_PRERELEASE PCRE2_DATE);
244*22dc650dSSadaf Ebrahimi return (int)(1 + ((where == NULL)?
245*22dc650dSSadaf Ebrahimi strlen(v) : PRIV(strcpy_c8)((PCRE2_UCHAR *)where, v)));
246*22dc650dSSadaf Ebrahimi }
247*22dc650dSSadaf Ebrahimi }
248*22dc650dSSadaf Ebrahimi
249*22dc650dSSadaf Ebrahimi return 0;
250*22dc650dSSadaf Ebrahimi }
251*22dc650dSSadaf Ebrahimi
252*22dc650dSSadaf Ebrahimi /* End of pcre2_config.c */
253