205 lines
6.5 KiB
Diff
205 lines
6.5 KiB
Diff
diff -up onig-6.8.2/src/regexec.c.orig onig-6.8.2/src/regexec.c
|
|
--- onig-6.8.2/src/regexec.c.orig 2018-04-17 02:08:37.000000000 +0200
|
|
+++ onig-6.8.2/src/regexec.c 2023-12-07 15:39:01.502781873 +0100
|
|
@@ -4384,14 +4384,14 @@ forward_search_range(regex_t* reg, const
|
|
#endif
|
|
|
|
p = s;
|
|
- if (reg->dmin > 0) {
|
|
+ if (reg->dmin != 0) {
|
|
+ if (end - p <= reg->dmin)
|
|
+ return 0; /* fail */
|
|
if (ONIGENC_IS_SINGLEBYTE(reg->enc)) {
|
|
p += reg->dmin;
|
|
}
|
|
else {
|
|
UChar *q = p + reg->dmin;
|
|
-
|
|
- if (q >= end) return 0; /* fail */
|
|
while (p < q) p += enclen(reg->enc, p);
|
|
}
|
|
}
|
|
@@ -4420,7 +4420,7 @@ forward_search_range(regex_t* reg, const
|
|
}
|
|
|
|
if (p && p < range) {
|
|
- if (p - reg->dmin < s) {
|
|
+ if (p - s < reg->dmin) {
|
|
retry_gate:
|
|
pprev = p;
|
|
p += enclen(reg->enc, p);
|
|
@@ -4468,6 +4468,7 @@ forward_search_range(regex_t* reg, const
|
|
*low_prev = onigenc_get_prev_char_head(reg->enc,
|
|
(pprev ? pprev : str), p);
|
|
}
|
|
+ *high = p;
|
|
}
|
|
else {
|
|
if (reg->dmax != INFINITE_LEN) {
|
|
@@ -4492,9 +4493,12 @@ forward_search_range(regex_t* reg, const
|
|
}
|
|
}
|
|
}
|
|
+ /* no needs to adjust *high, *high is used as range check only */
|
|
+ if (p - str < reg->dmin)
|
|
+ *high = (UChar* )str;
|
|
+ else
|
|
+ *high = p - reg->dmin;
|
|
}
|
|
- /* no needs to adjust *high, *high is used as range check only */
|
|
- *high = p - reg->dmin;
|
|
|
|
#ifdef ONIG_DEBUG_SEARCH
|
|
fprintf(stderr,
|
|
@@ -4517,7 +4521,6 @@ backward_search_range(regex_t* reg, cons
|
|
{
|
|
UChar *p;
|
|
|
|
- range += reg->dmin;
|
|
p = s;
|
|
|
|
retry:
|
|
@@ -4598,10 +4601,22 @@ backward_search_range(regex_t* reg, cons
|
|
}
|
|
}
|
|
|
|
- /* no needs to adjust *high, *high is used as range check only */
|
|
if (reg->dmax != INFINITE_LEN) {
|
|
- *low = p - reg->dmax;
|
|
- *high = p - reg->dmin;
|
|
+ if (p - str < reg->dmax)
|
|
+ *low = (UChar* )str;
|
|
+ else
|
|
+ *low = p - reg->dmax;
|
|
+
|
|
+ if (reg->dmin != 0) {
|
|
+ if (p - str < reg->dmin)
|
|
+ *high = (UChar* )str;
|
|
+ else
|
|
+ *high = p - reg->dmin;
|
|
+ }
|
|
+ else {
|
|
+ *high = p;
|
|
+ }
|
|
+
|
|
*high = onigenc_get_right_adjust_char_head(reg->enc, adjrange, *high);
|
|
}
|
|
|
|
@@ -4731,13 +4746,16 @@ onig_search_with_param(regex_t* reg, con
|
|
goto mismatch_no_msa;
|
|
|
|
if (range > start) {
|
|
- if ((OnigLen )(min_semi_end - start) > reg->anchor_dmax) {
|
|
+ if (min_semi_end - start > reg->anchor_dmax) {
|
|
start = min_semi_end - reg->anchor_dmax;
|
|
if (start < end)
|
|
start = onigenc_get_right_adjust_char_head(reg->enc, str, start);
|
|
}
|
|
- if ((OnigLen )(max_semi_end - (range - 1)) < reg->anchor_dmin) {
|
|
- range = max_semi_end - reg->anchor_dmin + 1;
|
|
+ if (max_semi_end - (range - 1) < reg->anchor_dmin) {
|
|
+ if (max_semi_end - str + 1 < reg->anchor_dmin)
|
|
+ goto mismatch_no_msa;
|
|
+ else
|
|
+ range = max_semi_end - reg->anchor_dmin + 1;
|
|
}
|
|
|
|
if (start > range) goto mismatch_no_msa;
|
|
@@ -4745,12 +4763,16 @@ onig_search_with_param(regex_t* reg, con
|
|
Backward search is used. */
|
|
}
|
|
else {
|
|
- if ((OnigLen )(min_semi_end - range) > reg->anchor_dmax) {
|
|
+ if (min_semi_end - range > reg->anchor_dmax) {
|
|
range = min_semi_end - reg->anchor_dmax;
|
|
}
|
|
- if ((OnigLen )(max_semi_end - start) < reg->anchor_dmin) {
|
|
- start = max_semi_end - reg->anchor_dmin;
|
|
- start = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, str, start);
|
|
+ if (max_semi_end - start < reg->anchor_dmin) {
|
|
+ if (max_semi_end - str < reg->anchor_dmin)
|
|
+ goto mismatch_no_msa;
|
|
+ else {
|
|
+ start = max_semi_end - reg->anchor_dmin;
|
|
+ start = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, str, start);
|
|
+ }
|
|
}
|
|
if (range > start) goto mismatch_no_msa;
|
|
}
|
|
@@ -4818,15 +4840,19 @@ onig_search_with_param(regex_t* reg, con
|
|
if (reg->optimize != OPTIMIZE_NONE) {
|
|
UChar *sch_range, *low, *high, *low_prev;
|
|
|
|
- sch_range = (UChar* )range;
|
|
if (reg->dmax != 0) {
|
|
if (reg->dmax == INFINITE_LEN)
|
|
sch_range = (UChar* )end;
|
|
else {
|
|
- sch_range += reg->dmax;
|
|
- if (sch_range > end) sch_range = (UChar* )end;
|
|
+ if ((end - range) < reg->dmax)
|
|
+ sch_range = (UChar* )end;
|
|
+ else {
|
|
+ sch_range = (UChar* )range + reg->dmax;
|
|
+ }
|
|
}
|
|
}
|
|
+ else
|
|
+ sch_range = (UChar* )range;
|
|
|
|
if ((end - start) < reg->threshold_len)
|
|
goto mismatch;
|
|
@@ -4885,18 +4911,28 @@ onig_search_with_param(regex_t* reg, con
|
|
|
|
if (reg->optimize != OPTIMIZE_NONE) {
|
|
UChar *low, *high, *adjrange, *sch_start;
|
|
+ const UChar *min_range;
|
|
|
|
if (range < end)
|
|
adjrange = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc, str, range);
|
|
else
|
|
adjrange = (UChar* )end;
|
|
|
|
+ if (end - range > reg->dmin)
|
|
+ min_range = range + reg->dmin;
|
|
+ else
|
|
+ min_range = end;
|
|
+
|
|
if (reg->dmax != INFINITE_LEN &&
|
|
(end - range) >= reg->threshold_len) {
|
|
do {
|
|
- sch_start = s + reg->dmax;
|
|
- if (sch_start > end) sch_start = (UChar* )end;
|
|
- if (backward_search_range(reg, str, end, sch_start, range, adjrange,
|
|
+ if (end - s > reg->dmax)
|
|
+ sch_start = s + reg->dmax;
|
|
+ else {
|
|
+ sch_start = (UChar* )end;
|
|
+ }
|
|
+
|
|
+ if (backward_search_range(reg, str, end, sch_start, min_range, adjrange,
|
|
&low, &high) <= 0)
|
|
goto mismatch;
|
|
|
|
@@ -4914,19 +4950,7 @@ onig_search_with_param(regex_t* reg, con
|
|
else { /* check only. */
|
|
if ((end - range) < reg->threshold_len) goto mismatch;
|
|
|
|
- sch_start = s;
|
|
- if (reg->dmax != 0) {
|
|
- if (reg->dmax == INFINITE_LEN)
|
|
- sch_start = (UChar* )end;
|
|
- else {
|
|
- sch_start += reg->dmax;
|
|
- if (sch_start > end) sch_start = (UChar* )end;
|
|
- else
|
|
- sch_start = ONIGENC_LEFT_ADJUST_CHAR_HEAD(reg->enc,
|
|
- start, sch_start);
|
|
- }
|
|
- }
|
|
- if (backward_search_range(reg, str, end, sch_start, range, adjrange,
|
|
+ if (backward_search_range(reg, str, end, sch_start, min_range, adjrange,
|
|
&low, &high) <= 0) goto mismatch;
|
|
}
|
|
}
|