1 /*************************************************
2 * Perl-Compatible Regular Expressions *
3 *************************************************/
4
5 /* PCRE is a library of functions to support regular expressions whose syntax
6 and semantics are as close as possible to those of the Perl 5 language.
7
8 Written by Philip Hazel
9 Original API code Copyright (c) 1997-2012 University of Cambridge
10 New API code Copyright (c) 2016-2024 University of Cambridge
11
12 -----------------------------------------------------------------------------
13 Redistribution and use in source and binary forms, with or without
14 modification, are permitted provided that the following conditions are met:
15
16 * Redistributions of source code must retain the above copyright notice,
17 this list of conditions and the following disclaimer.
18
19 * Redistributions in binary form must reproduce the above copyright
20 notice, this list of conditions and the following disclaimer in the
21 documentation and/or other materials provided with the distribution.
22
23 * Neither the name of the University of Cambridge nor the names of its
24 contributors may be used to endorse or promote products derived from
25 this software without specific prior written permission.
26
27 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
28 AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
29 IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
30 ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
31 LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
32 CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
33 SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
34 INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
35 CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
36 ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
37 POSSIBILITY OF SUCH DAMAGE.
38 -----------------------------------------------------------------------------
39 */
40
41
42 #ifdef HAVE_CONFIG_H
43 #include "config.h"
44 #endif
45
46 #include "pcre2_internal.h"
47
48
49
50 /*************************************************
51 * Default malloc/free functions *
52 *************************************************/
53
54 /* Ignore the "user data" argument in each case. */
55
/* Default allocator: hands the request straight to the C library. The second
argument is accepted only so that the function has the same shape as a
caller-supplied allocator; it is never looked at. */

static void *default_malloc(size_t size, void *data)
{
void *block = malloc(size);
(void)data;
return block;
}
61
62
/* Default release function: hands the block straight to the C library. The
second argument is accepted only so that the function has the same shape as a
caller-supplied release function; it is never looked at. */

static void default_free(void *block, void *data)
{
free(block);
(void)data;
}
68
69
70
71 /*************************************************
72 * Get a block and save memory control *
73 *************************************************/
74
75 /* This internal function is called to get a block of memory in which the
76 memory control data is to be stored at the start for future use.
77
78 Arguments:
79 size amount of memory required
80 memctl pointer to a memctl block or NULL
81
82 Returns: pointer to memory or NULL on failure
83 */
84
85 extern void *
PRIV(memctl_malloc)86 PRIV(memctl_malloc)(size_t size, pcre2_memctl *memctl)
87 {
88 pcre2_memctl *newmemctl;
89 void *yield = (memctl == NULL)? malloc(size) :
90 memctl->malloc(size, memctl->memory_data);
91 if (yield == NULL) return NULL;
92 newmemctl = (pcre2_memctl *)yield;
93 if (memctl == NULL)
94 {
95 newmemctl->malloc = default_malloc;
96 newmemctl->free = default_free;
97 newmemctl->memory_data = NULL;
98 }
99 else *newmemctl = *memctl;
100 return yield;
101 }
102
103
104
105 /*************************************************
106 * Create and initialize contexts *
107 *************************************************/
108
109 /* Initializing for compile and match contexts is done in separate, private
110 functions so that these can be called from functions such as pcre2_compile()
111 when an external context is not supplied. The initializing functions have an
112 option to set up default memory management. */
113
114 PCRE2_EXP_DEFN pcre2_general_context * PCRE2_CALL_CONVENTION
pcre2_general_context_create(void * (* private_malloc)(size_t,void *),void (* private_free)(void *,void *),void * memory_data)115 pcre2_general_context_create(void *(*private_malloc)(size_t, void *),
116 void (*private_free)(void *, void *), void *memory_data)
117 {
118 pcre2_general_context *gcontext;
119 if (private_malloc == NULL) private_malloc = default_malloc;
120 if (private_free == NULL) private_free = default_free;
121 gcontext = private_malloc(sizeof(pcre2_real_general_context), memory_data);
122 if (gcontext == NULL) return NULL;
123 gcontext->memctl.malloc = private_malloc;
124 gcontext->memctl.free = private_free;
125 gcontext->memctl.memory_data = memory_data;
126 return gcontext;
127 }
128
129
/* A default compile context is set up to save having to initialize at run time
when no context is supplied to the compile function. It is also the template
that pcre2_compile_context_create() copies into each new context. The
initializers are positional, so they must stay in the same order as the fields
of the structure, which is declared outside this file. */

const pcre2_compile_context PRIV(default_compile_context) = {
  { default_malloc, default_free, NULL },    /* Default memory handling */
  NULL,                                      /* Stack guard */
  NULL,                                      /* Stack guard data */
  PRIV(default_tables),                      /* Character tables */
  PCRE2_UNSET,                               /* Max pattern length */
  PCRE2_UNSET,                               /* Max pattern compiled length */
  BSR_DEFAULT,                               /* Backslash R default */
  NEWLINE_DEFAULT,                           /* Newline convention */
  PARENS_NEST_LIMIT,                         /* Parentheses nesting limit */
  0,                                         /* Extra options */
  MAX_VARLOOKBEHIND                          /* Variable lookbehind limit */
  };
146
147 /* The create function copies the default into the new memory, but must
148 override the default memory handling functions if a gcontext was provided. */
149
150 PCRE2_EXP_DEFN pcre2_compile_context * PCRE2_CALL_CONVENTION
pcre2_compile_context_create(pcre2_general_context * gcontext)151 pcre2_compile_context_create(pcre2_general_context *gcontext)
152 {
153 pcre2_compile_context *ccontext = PRIV(memctl_malloc)(
154 sizeof(pcre2_real_compile_context), (pcre2_memctl *)gcontext);
155 if (ccontext == NULL) return NULL;
156 *ccontext = PRIV(default_compile_context);
157 if (gcontext != NULL)
158 *((pcre2_memctl *)ccontext) = *((pcre2_memctl *)gcontext);
159 return ccontext;
160 }
161
162
/* A default match context is set up to save having to initialize at run time
when no context is supplied to a match function. It is also the template that
pcre2_match_context_create() copies into each new context. The initializers
are positional, so they must stay in the same order as the fields of the
structure, which is declared outside this file; the two JIT entries are only
present when SUPPORT_JIT is defined. */

const pcre2_match_context PRIV(default_match_context) = {
  { default_malloc, default_free, NULL },    /* Default memory handling */
#ifdef SUPPORT_JIT
  NULL,                                      /* JIT callback */
  NULL,                                      /* JIT callback data */
#endif
  NULL,                                      /* Callout function */
  NULL,                                      /* Callout data */
  NULL,                                      /* Substitute callout function */
  NULL,                                      /* Substitute callout data */
  PCRE2_UNSET,                               /* Offset limit */
  HEAP_LIMIT,                                /* Default heap limit */
  MATCH_LIMIT,                               /* Default match limit */
  MATCH_LIMIT_DEPTH };                       /* Default match depth limit */
180
181 /* The create function copies the default into the new memory, but must
182 override the default memory handling functions if a gcontext was provided. */
183
184 PCRE2_EXP_DEFN pcre2_match_context * PCRE2_CALL_CONVENTION
pcre2_match_context_create(pcre2_general_context * gcontext)185 pcre2_match_context_create(pcre2_general_context *gcontext)
186 {
187 pcre2_match_context *mcontext = PRIV(memctl_malloc)(
188 sizeof(pcre2_real_match_context), (pcre2_memctl *)gcontext);
189 if (mcontext == NULL) return NULL;
190 *mcontext = PRIV(default_match_context);
191 if (gcontext != NULL)
192 *((pcre2_memctl *)mcontext) = *((pcre2_memctl *)gcontext);
193 return mcontext;
194 }
195
196
/* A default convert context is set up to save having to initialize at run time
when no context is supplied to the convert function. It is also the template
that pcre2_convert_context_create() copies into each new context. The
separator and escape defaults differ between Windows and other systems. The
initializers are positional, so they must stay in the same order as the fields
of the structure, which is declared outside this file. */

const pcre2_convert_context PRIV(default_convert_context) = {
  { default_malloc, default_free, NULL },    /* Default memory handling */
#ifdef _WIN32
  CHAR_BACKSLASH,                            /* Default path separator */
  CHAR_GRAVE_ACCENT                          /* Default escape character */
#else  /* Not Windows */
  CHAR_SLASH,                                /* Default path separator */
  CHAR_BACKSLASH                             /* Default escape character */
#endif
  };
210
211 /* The create function copies the default into the new memory, but must
212 override the default memory handling functions if a gcontext was provided. */
213
214 PCRE2_EXP_DEFN pcre2_convert_context * PCRE2_CALL_CONVENTION
pcre2_convert_context_create(pcre2_general_context * gcontext)215 pcre2_convert_context_create(pcre2_general_context *gcontext)
216 {
217 pcre2_convert_context *ccontext = PRIV(memctl_malloc)(
218 sizeof(pcre2_real_convert_context), (pcre2_memctl *)gcontext);
219 if (ccontext == NULL) return NULL;
220 *ccontext = PRIV(default_convert_context);
221 if (gcontext != NULL)
222 *((pcre2_memctl *)ccontext) = *((pcre2_memctl *)gcontext);
223 return ccontext;
224 }
225
226
227 /*************************************************
228 * Context copy functions *
229 *************************************************/
230
231 PCRE2_EXP_DEFN pcre2_general_context * PCRE2_CALL_CONVENTION
pcre2_general_context_copy(pcre2_general_context * gcontext)232 pcre2_general_context_copy(pcre2_general_context *gcontext)
233 {
234 pcre2_general_context *newcontext =
235 gcontext->memctl.malloc(sizeof(pcre2_real_general_context),
236 gcontext->memctl.memory_data);
237 if (newcontext == NULL) return NULL;
238 memcpy(newcontext, gcontext, sizeof(pcre2_real_general_context));
239 return newcontext;
240 }
241
242
243 PCRE2_EXP_DEFN pcre2_compile_context * PCRE2_CALL_CONVENTION
pcre2_compile_context_copy(pcre2_compile_context * ccontext)244 pcre2_compile_context_copy(pcre2_compile_context *ccontext)
245 {
246 pcre2_compile_context *newcontext =
247 ccontext->memctl.malloc(sizeof(pcre2_real_compile_context),
248 ccontext->memctl.memory_data);
249 if (newcontext == NULL) return NULL;
250 memcpy(newcontext, ccontext, sizeof(pcre2_real_compile_context));
251 return newcontext;
252 }
253
254
255 PCRE2_EXP_DEFN pcre2_match_context * PCRE2_CALL_CONVENTION
pcre2_match_context_copy(pcre2_match_context * mcontext)256 pcre2_match_context_copy(pcre2_match_context *mcontext)
257 {
258 pcre2_match_context *newcontext =
259 mcontext->memctl.malloc(sizeof(pcre2_real_match_context),
260 mcontext->memctl.memory_data);
261 if (newcontext == NULL) return NULL;
262 memcpy(newcontext, mcontext, sizeof(pcre2_real_match_context));
263 return newcontext;
264 }
265
266
267 PCRE2_EXP_DEFN pcre2_convert_context * PCRE2_CALL_CONVENTION
pcre2_convert_context_copy(pcre2_convert_context * ccontext)268 pcre2_convert_context_copy(pcre2_convert_context *ccontext)
269 {
270 pcre2_convert_context *newcontext =
271 ccontext->memctl.malloc(sizeof(pcre2_real_convert_context),
272 ccontext->memctl.memory_data);
273 if (newcontext == NULL) return NULL;
274 memcpy(newcontext, ccontext, sizeof(pcre2_real_convert_context));
275 return newcontext;
276 }
277
278
279 /*************************************************
280 * Context free functions *
281 *************************************************/
282
283 PCRE2_EXP_DEFN void PCRE2_CALL_CONVENTION
pcre2_general_context_free(pcre2_general_context * gcontext)284 pcre2_general_context_free(pcre2_general_context *gcontext)
285 {
286 if (gcontext != NULL)
287 gcontext->memctl.free(gcontext, gcontext->memctl.memory_data);
288 }
289
290
291 PCRE2_EXP_DEFN void PCRE2_CALL_CONVENTION
pcre2_compile_context_free(pcre2_compile_context * ccontext)292 pcre2_compile_context_free(pcre2_compile_context *ccontext)
293 {
294 if (ccontext != NULL)
295 ccontext->memctl.free(ccontext, ccontext->memctl.memory_data);
296 }
297
298
299 PCRE2_EXP_DEFN void PCRE2_CALL_CONVENTION
pcre2_match_context_free(pcre2_match_context * mcontext)300 pcre2_match_context_free(pcre2_match_context *mcontext)
301 {
302 if (mcontext != NULL)
303 mcontext->memctl.free(mcontext, mcontext->memctl.memory_data);
304 }
305
306
307 PCRE2_EXP_DEFN void PCRE2_CALL_CONVENTION
pcre2_convert_context_free(pcre2_convert_context * ccontext)308 pcre2_convert_context_free(pcre2_convert_context *ccontext)
309 {
310 if (ccontext != NULL)
311 ccontext->memctl.free(ccontext, ccontext->memctl.memory_data);
312 }
313
314
315 /*************************************************
316 * Set values in contexts *
317 *************************************************/
318
319 /* All these functions return 0 for success or PCRE2_ERROR_BADDATA if invalid
320 data is given. Only some of the functions are able to test the validity of the
321 data. */
322
323
324 /* ------------ Compile context ------------ */
325
326 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_character_tables(pcre2_compile_context * ccontext,const uint8_t * tables)327 pcre2_set_character_tables(pcre2_compile_context *ccontext,
328 const uint8_t *tables)
329 {
330 ccontext->tables = tables;
331 return 0;
332 }
333
334 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_bsr(pcre2_compile_context * ccontext,uint32_t value)335 pcre2_set_bsr(pcre2_compile_context *ccontext, uint32_t value)
336 {
337 switch(value)
338 {
339 case PCRE2_BSR_ANYCRLF:
340 case PCRE2_BSR_UNICODE:
341 ccontext->bsr_convention = value;
342 return 0;
343
344 default:
345 return PCRE2_ERROR_BADDATA;
346 }
347 }
348
349 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_max_pattern_length(pcre2_compile_context * ccontext,PCRE2_SIZE length)350 pcre2_set_max_pattern_length(pcre2_compile_context *ccontext, PCRE2_SIZE length)
351 {
352 ccontext->max_pattern_length = length;
353 return 0;
354 }
355
356 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_max_pattern_compiled_length(pcre2_compile_context * ccontext,PCRE2_SIZE length)357 pcre2_set_max_pattern_compiled_length(pcre2_compile_context *ccontext, PCRE2_SIZE length)
358 {
359 ccontext->max_pattern_compiled_length = length;
360 return 0;
361 }
362
363 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_newline(pcre2_compile_context * ccontext,uint32_t newline)364 pcre2_set_newline(pcre2_compile_context *ccontext, uint32_t newline)
365 {
366 switch(newline)
367 {
368 case PCRE2_NEWLINE_CR:
369 case PCRE2_NEWLINE_LF:
370 case PCRE2_NEWLINE_CRLF:
371 case PCRE2_NEWLINE_ANY:
372 case PCRE2_NEWLINE_ANYCRLF:
373 case PCRE2_NEWLINE_NUL:
374 ccontext->newline_convention = newline;
375 return 0;
376
377 default:
378 return PCRE2_ERROR_BADDATA;
379 }
380 }
381
382 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_max_varlookbehind(pcre2_compile_context * ccontext,uint32_t limit)383 pcre2_set_max_varlookbehind(pcre2_compile_context *ccontext, uint32_t limit)
384 {
385 ccontext->max_varlookbehind = limit;
386 return 0;
387 }
388
389 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_parens_nest_limit(pcre2_compile_context * ccontext,uint32_t limit)390 pcre2_set_parens_nest_limit(pcre2_compile_context *ccontext, uint32_t limit)
391 {
392 ccontext->parens_nest_limit = limit;
393 return 0;
394 }
395
396 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_compile_extra_options(pcre2_compile_context * ccontext,uint32_t options)397 pcre2_set_compile_extra_options(pcre2_compile_context *ccontext, uint32_t options)
398 {
399 ccontext->extra_options = options;
400 return 0;
401 }
402
403 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_compile_recursion_guard(pcre2_compile_context * ccontext,int (* guard)(uint32_t,void *),void * user_data)404 pcre2_set_compile_recursion_guard(pcre2_compile_context *ccontext,
405 int (*guard)(uint32_t, void *), void *user_data)
406 {
407 ccontext->stack_guard = guard;
408 ccontext->stack_guard_data = user_data;
409 return 0;
410 }
411
412
413 /* ------------ Match context ------------ */
414
415 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_callout(pcre2_match_context * mcontext,int (* callout)(pcre2_callout_block *,void *),void * callout_data)416 pcre2_set_callout(pcre2_match_context *mcontext,
417 int (*callout)(pcre2_callout_block *, void *), void *callout_data)
418 {
419 mcontext->callout = callout;
420 mcontext->callout_data = callout_data;
421 return 0;
422 }
423
424 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_substitute_callout(pcre2_match_context * mcontext,int (* substitute_callout)(pcre2_substitute_callout_block *,void *),void * substitute_callout_data)425 pcre2_set_substitute_callout(pcre2_match_context *mcontext,
426 int (*substitute_callout)(pcre2_substitute_callout_block *, void *),
427 void *substitute_callout_data)
428 {
429 mcontext->substitute_callout = substitute_callout;
430 mcontext->substitute_callout_data = substitute_callout_data;
431 return 0;
432 }
433
434 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_heap_limit(pcre2_match_context * mcontext,uint32_t limit)435 pcre2_set_heap_limit(pcre2_match_context *mcontext, uint32_t limit)
436 {
437 mcontext->heap_limit = limit;
438 return 0;
439 }
440
441 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_match_limit(pcre2_match_context * mcontext,uint32_t limit)442 pcre2_set_match_limit(pcre2_match_context *mcontext, uint32_t limit)
443 {
444 mcontext->match_limit = limit;
445 return 0;
446 }
447
448 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_depth_limit(pcre2_match_context * mcontext,uint32_t limit)449 pcre2_set_depth_limit(pcre2_match_context *mcontext, uint32_t limit)
450 {
451 mcontext->depth_limit = limit;
452 return 0;
453 }
454
455 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_offset_limit(pcre2_match_context * mcontext,PCRE2_SIZE limit)456 pcre2_set_offset_limit(pcre2_match_context *mcontext, PCRE2_SIZE limit)
457 {
458 mcontext->offset_limit = limit;
459 return 0;
460 }
461
462 /* These functions became obsolete at release 10.30. The first is kept as a
463 synonym for backwards compatibility. The second now does nothing. Exclude both
464 from coverage reports. */
465
466 /* LCOV_EXCL_START */
467
468 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_recursion_limit(pcre2_match_context * mcontext,uint32_t limit)469 pcre2_set_recursion_limit(pcre2_match_context *mcontext, uint32_t limit)
470 {
471 return pcre2_set_depth_limit(mcontext, limit);
472 }
473
474 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_recursion_memory_management(pcre2_match_context * mcontext,void * (* mymalloc)(size_t,void *),void (* myfree)(void *,void *),void * mydata)475 pcre2_set_recursion_memory_management(pcre2_match_context *mcontext,
476 void *(*mymalloc)(size_t, void *), void (*myfree)(void *, void *),
477 void *mydata)
478 {
479 (void)mcontext;
480 (void)mymalloc;
481 (void)myfree;
482 (void)mydata;
483 return 0;
484 }
485
486 /* LCOV_EXCL_STOP */
487
488
489 /* ------------ Convert context ------------ */
490
491 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_glob_separator(pcre2_convert_context * ccontext,uint32_t separator)492 pcre2_set_glob_separator(pcre2_convert_context *ccontext, uint32_t separator)
493 {
494 if (separator != CHAR_SLASH && separator != CHAR_BACKSLASH &&
495 separator != CHAR_DOT) return PCRE2_ERROR_BADDATA;
496 ccontext->glob_separator = separator;
497 return 0;
498 }
499
500 PCRE2_EXP_DEFN int PCRE2_CALL_CONVENTION
pcre2_set_glob_escape(pcre2_convert_context * ccontext,uint32_t escape)501 pcre2_set_glob_escape(pcre2_convert_context *ccontext, uint32_t escape)
502 {
503 if (escape > 255 || (escape != 0 && !ispunct(escape)))
504 return PCRE2_ERROR_BADDATA;
505 ccontext->glob_escape = escape;
506 return 0;
507 }
508
509 /* End of pcre2_context.c */
510
511