@@ -267,6 +267,85 @@ data_stack_grow(SRE_STATE* state, Py_ssize_t size)
267
267
return 0 ;
268
268
}
269
269
270
+ /* memory pool functions for SRE_REPEAT, this can avoid memory
271
+ leak when SRE(match) function terminates abruptly.
272
+ state->repeat_pool_used is a doubly-linked list, so that we
273
+ can remove a SRE_REPEAT node from it.
274
+ state->repeat_pool_unused is a singly-linked list, we put/get
275
+ node at the head. */
276
+ static SRE_REPEAT *
277
+ repeat_pool_malloc (SRE_STATE * state )
278
+ {
279
+ SRE_REPEAT * repeat ;
280
+
281
+ if (state -> repeat_pool_unused ) {
282
+ /* remove from unused pool (singly-linked list) */
283
+ repeat = state -> repeat_pool_unused ;
284
+ state -> repeat_pool_unused = repeat -> pool_next ;
285
+ }
286
+ else {
287
+ repeat = PyMem_Malloc (sizeof (SRE_REPEAT ));
288
+ if (!repeat ) {
289
+ return NULL ;
290
+ }
291
+ }
292
+
293
+ /* add to used pool (doubly-linked list) */
294
+ SRE_REPEAT * temp = state -> repeat_pool_used ;
295
+ if (temp ) {
296
+ temp -> pool_prev = repeat ;
297
+ }
298
+ repeat -> pool_prev = NULL ;
299
+ repeat -> pool_next = temp ;
300
+ state -> repeat_pool_used = repeat ;
301
+
302
+ return repeat ;
303
+ }
304
+
305
+ static void
306
+ repeat_pool_free (SRE_STATE * state , SRE_REPEAT * repeat )
307
+ {
308
+ SRE_REPEAT * prev = repeat -> pool_prev ;
309
+ SRE_REPEAT * next = repeat -> pool_next ;
310
+
311
+ /* remove from used pool (doubly-linked list) */
312
+ if (prev ) {
313
+ prev -> pool_next = next ;
314
+ }
315
+ else {
316
+ state -> repeat_pool_used = next ;
317
+ }
318
+ if (next ) {
319
+ next -> pool_prev = prev ;
320
+ }
321
+
322
+ /* add to unused pool (singly-linked list) */
323
+ repeat -> pool_next = state -> repeat_pool_unused ;
324
+ state -> repeat_pool_unused = repeat ;
325
+ }
326
+
327
+ static void
328
+ repeat_pool_clear (SRE_STATE * state )
329
+ {
330
+ /* clear used pool */
331
+ SRE_REPEAT * next = state -> repeat_pool_used ;
332
+ state -> repeat_pool_used = NULL ;
333
+ while (next ) {
334
+ SRE_REPEAT * temp = next ;
335
+ next = temp -> pool_next ;
336
+ PyMem_Free (temp );
337
+ }
338
+
339
+ /* clear unused pool */
340
+ next = state -> repeat_pool_unused ;
341
+ state -> repeat_pool_unused = NULL ;
342
+ while (next ) {
343
+ SRE_REPEAT * temp = next ;
344
+ next = temp -> pool_next ;
345
+ PyMem_Free (temp );
346
+ }
347
+ }
348
+
270
349
/* generate 8-bit version */
271
350
272
351
#define SRE_CHAR Py_UCS1
@@ -511,6 +590,11 @@ state_init(SRE_STATE* state, PatternObject* pattern, PyObject* string,
511
590
state -> pos = start ;
512
591
state -> endpos = end ;
513
592
593
+ #ifdef Py_DEBUG
594
+ state -> fail_after_count = pattern -> fail_after_count ;
595
+ state -> fail_after_exc = pattern -> fail_after_exc ; // borrowed ref
596
+ #endif
597
+
514
598
return string ;
515
599
err :
516
600
/* We add an explicit cast here because MSVC has a bug when
@@ -533,6 +617,8 @@ state_fini(SRE_STATE* state)
533
617
/* See above PyMem_Del for why we explicitly cast here. */
534
618
PyMem_Free ((void * ) state -> mark );
535
619
state -> mark = NULL ;
620
+ /* SRE_REPEAT pool */
621
+ repeat_pool_clear (state );
536
622
}
537
623
538
624
/* calculate offset from start of string */
@@ -619,6 +705,9 @@ pattern_traverse(PatternObject *self, visitproc visit, void *arg)
619
705
Py_VISIT (self -> groupindex );
620
706
Py_VISIT (self -> indexgroup );
621
707
Py_VISIT (self -> pattern );
708
+ #ifdef Py_DEBUG
709
+ Py_VISIT (self -> fail_after_exc );
710
+ #endif
622
711
return 0 ;
623
712
}
624
713
@@ -628,6 +717,9 @@ pattern_clear(PatternObject *self)
628
717
Py_CLEAR (self -> groupindex );
629
718
Py_CLEAR (self -> indexgroup );
630
719
Py_CLEAR (self -> pattern );
720
+ #ifdef Py_DEBUG
721
+ Py_CLEAR (self -> fail_after_exc );
722
+ #endif
631
723
return 0 ;
632
724
}
633
725
@@ -690,7 +782,7 @@ _sre_SRE_Pattern_match_impl(PatternObject *self, PyTypeObject *cls,
690
782
Py_ssize_t status ;
691
783
PyObject * match ;
692
784
693
- if (!state_init (& state , ( PatternObject * ) self , string , pos , endpos ))
785
+ if (!state_init (& state , self , string , pos , endpos ))
694
786
return NULL ;
695
787
696
788
INIT_TRACE (& state );
@@ -1381,6 +1473,29 @@ _sre_SRE_Pattern___deepcopy__(PatternObject *self, PyObject *memo)
1381
1473
return Py_NewRef (self );
1382
1474
}
1383
1475
1476
+ #ifdef Py_DEBUG
1477
+ /*[clinic input]
1478
+ _sre.SRE_Pattern._fail_after
1479
+
1480
+ count: int
1481
+ exception: object
1482
+ /
1483
+
1484
+ For debugging.
1485
+ [clinic start generated code]*/
1486
+
1487
+ static PyObject *
1488
+ _sre_SRE_Pattern__fail_after_impl (PatternObject * self , int count ,
1489
+ PyObject * exception )
1490
+ /*[clinic end generated code: output=9a6bf12135ac50c2 input=ef80a45c66c5499d]*/
1491
+ {
1492
+ self -> fail_after_count = count ;
1493
+ Py_INCREF (exception );
1494
+ Py_XSETREF (self -> fail_after_exc , exception );
1495
+ Py_RETURN_NONE ;
1496
+ }
1497
+ #endif /* Py_DEBUG */
1498
+
1384
1499
static PyObject *
1385
1500
pattern_repr (PatternObject * obj )
1386
1501
{
@@ -1506,6 +1621,10 @@ _sre_compile_impl(PyObject *module, PyObject *pattern, int flags,
1506
1621
self -> pattern = NULL ;
1507
1622
self -> groupindex = NULL ;
1508
1623
self -> indexgroup = NULL ;
1624
+ #ifdef Py_DEBUG
1625
+ self -> fail_after_count = -1 ;
1626
+ self -> fail_after_exc = NULL ;
1627
+ #endif
1509
1628
1510
1629
self -> codesize = n ;
1511
1630
@@ -2604,7 +2723,8 @@ pattern_new_match(_sremodulestate* module_state,
2604
2723
if (!match )
2605
2724
return NULL ;
2606
2725
2607
- match -> pattern = (PatternObject * )Py_NewRef (pattern );
2726
+ Py_INCREF (pattern );
2727
+ match -> pattern = pattern ;
2608
2728
2609
2729
match -> string = Py_NewRef (state -> string );
2610
2730
@@ -2740,7 +2860,7 @@ _sre_SRE_Scanner_match_impl(ScannerObject *self, PyTypeObject *cls)
2740
2860
return NULL ;
2741
2861
}
2742
2862
2743
- match = pattern_new_match (module_state , ( PatternObject * ) self -> pattern ,
2863
+ match = pattern_new_match (module_state , self -> pattern ,
2744
2864
state , status );
2745
2865
2746
2866
if (status == 0 )
@@ -2790,7 +2910,7 @@ _sre_SRE_Scanner_search_impl(ScannerObject *self, PyTypeObject *cls)
2790
2910
return NULL ;
2791
2911
}
2792
2912
2793
- match = pattern_new_match (module_state , ( PatternObject * ) self -> pattern ,
2913
+ match = pattern_new_match (module_state , self -> pattern ,
2794
2914
state , status );
2795
2915
2796
2916
if (status == 0 )
@@ -2826,7 +2946,8 @@ pattern_scanner(_sremodulestate *module_state,
2826
2946
return NULL ;
2827
2947
}
2828
2948
2829
- scanner -> pattern = Py_NewRef (self );
2949
+ Py_INCREF (self );
2950
+ scanner -> pattern = self ;
2830
2951
2831
2952
PyObject_GC_Track (scanner );
2832
2953
return (PyObject * ) scanner ;
@@ -3020,6 +3141,7 @@ static PyMethodDef pattern_methods[] = {
3020
3141
_SRE_SRE_PATTERN_SCANNER_METHODDEF
3021
3142
_SRE_SRE_PATTERN___COPY___METHODDEF
3022
3143
_SRE_SRE_PATTERN___DEEPCOPY___METHODDEF
3144
+ _SRE_SRE_PATTERN__FAIL_AFTER_METHODDEF
3023
3145
{"__class_getitem__" , Py_GenericAlias , METH_O |METH_CLASS ,
3024
3146
PyDoc_STR ("See PEP 585" )},
3025
3147
{NULL , NULL }
0 commit comments