Compare commits
No commits in common. 'i8c' and 'c9' have entirely different histories.
@ -1 +1 @@
|
|||||||
SOURCES/pcre-8.42.tar.bz2
|
SOURCES/pcre-8.44.tar.bz2
|
||||||
|
@ -1 +1 @@
|
|||||||
df0d1c2ff04c359220cb902539a6e134af4497f4 SOURCES/pcre-8.42.tar.bz2
|
8179b083053fce9b4a766513fa1f14807aabee42 SOURCES/pcre-8.44.tar.bz2
|
||||||
|
@ -0,0 +1,39 @@
|
|||||||
|
This is Philip Hazel's public GPG key.
|
||||||
|
|
||||||
|
-----BEGIN PGP PUBLIC KEY BLOCK-----
|
||||||
|
Version: GnuPG v1.2.0 (SunOS)
|
||||||
|
|
||||||
|
mQEMBD2z9g0BCACpGWJ4K2mjR6K9nv7/K+HLjJtDO0E0ckudeNjg2JvnuUU7m1bK
|
||||||
|
87nSklHTSMNiqmuVU5hFAuGiMGBMj31GPpce3VbABdm6TmAJB8ZndvJXyf8lC7Ko
|
||||||
|
5iZX/gCYU6817UI5pFwYR3MTIUSSxTGqk1y62pYLKUq9keSU5Cew4q1KMwl46Bn3
|
||||||
|
SwlfQeST4WGwL2w9b8mWNltBBY23bgzwYu7vFBD4GQnfzJsvMC9lj825wob2nKy5
|
||||||
|
CL4bY6tiYUqALzDYaIVCBqJ1Ky1rpPzRcDZUeeF8Ta3njh18Y0KzPEj+Xu5Ksexg
|
||||||
|
7LUy/2wFzVRtJgqvAFZo43KIOptsj/63zxJjAAkBAbQhUGhpbGlwIEhhemVsIDxw
|
||||||
|
aDEwQGN1cy5jYW0uYWMudWs+iQEyBBMBAgAcBQI9s/YNAhsDBAsHAwIDFQIDAxYC
|
||||||
|
AQIeAQIXgAAKCRCXZuCE+w9D2JbrCACBHrxybV+9t3TGR3+uk2QnUuct90a+udcB
|
||||||
|
cbWgKQgX345ZgwIfyoPKAbG84mN/+SFUN/Ie4ZHZxVsbN//l2P/Osx0CNQBfem4e
|
||||||
|
HUWegkFGzC5DxQhN5nsJ/GR6pnxG1l/DbNhupNY73oTajWFdi7K8jYfamU/zS/Da
|
||||||
|
VCwUKxWtGqyEqOxvbdqcjsnTMmLVfXtefx7CbKyhaClPP8Pe4FL+eqyfHJF7uywK
|
||||||
|
VWlUNmQa4E+ZAK8tkoK9sZAc0ImWwZMumiKZDEpr2D8Ty+Gg2umTS2OMIcbY8QF1
|
||||||
|
r6DeubFabdPIe1kn0BGXtdAurhbdJCIbcAEQS0eEeWC4A4LiDprntB1QaGlsaXAg
|
||||||
|
SGF6ZWwgPHBoMTBAY2FtLmFjLnVrPokBMgQTAQIAHAUCPbaC8QIbAwQLBwMCAxUC
|
||||||
|
AwMWAgECHgECF4AACgkQl2bghPsPQ9ho5Qf+I2HUhZeXOUneeqSa+cITsIELJMrZ
|
||||||
|
UWcydY1z+L68yOqURVHB1jF4aC6QSlq0pLjozwF6KfZO5AfN9FvkRQ0DzCEXH48W
|
||||||
|
OXqzbjzgNxRMdaP5+49Axl0UQuhupGJg66T4FiGnSVBhK8kTURPCSpLLgkCJqNcY
|
||||||
|
t5zuNwk3e7JvleT59EVpk/kw3a5p9oeKYBln57pHwq+HdPLSCdkedQBKdsbNrazy
|
||||||
|
qduYEXen4ogsIoTpA9lLH1Xsi9wL+soLAlWXtl/GNa1h7Jpwn41zp1hqIZe1ebIM
|
||||||
|
dSGbtMEaGJlqgDauYJSl0lkVgaPtZCTmfAf57TsGfD0IckN2XNGLuwb6DLkBCwQ9
|
||||||
|
s/eJAQgAuXq2I1VTDB108O0NAB6QKfA2gMHafoj3OcwEUHnJgXrHqjYOpFr0r5lC
|
||||||
|
YjwMRMvHO7r4jgtwKjGACI/1IE2hiGXkKFOWZFkCf7Qjoi13a78myC/VRwe4uEIs
|
||||||
|
xdz++w8WfzuC1sYw8d/rlybVzHTfTsKfmFOQamuyLCTm3Kdx/wZyGM7JMmgVn2zF
|
||||||
|
HWasdID0n7QJFZGR3yEfqis5zq1t3w28AaXlTZG7QtFj9V0cWIhZRjjjVe1biPA8
|
||||||
|
Btp+eFkmcat79N9hHbiEiAY3u2qmQCcn1fiBBC0Og09cY4dRyX0/bXUo4n8lHysp
|
||||||
|
JcL/sIZ7Ahd1LOfg9h+yQfoaey78LQAGKYkBHwQYAQIACQUCPbP3iQIbDAAKCRCX
|
||||||
|
ZuCE+w9D2P0BCACXsbwFerd4wlnt8PxxQlRGXi1t4EGBFf2zSdgQvIXJ3ntPzcDU
|
||||||
|
+8hnIWQJhCTZ3PfVmoqB6ZOM1RWI/IcP6b4qVb6vJGI/VxRICraAczw+4bdFxFiB
|
||||||
|
n2+SyD4MxZg8t66FcH3fHugQqsApHTmtKmahv5BXB+0dPmP/BRUmzxYUv8hdnhHl
|
||||||
|
91S4R4BDu84DvKYyJK9jlqUl06pvqXrBSNsbWKgAJnmnDe8FaLUk+p0IXeMSavUn
|
||||||
|
T5E26MRIioxAz/G4FZI8IdO92GHTz82O7/mQMhveAdpspDvpV3M4wnldU425GlxZ
|
||||||
|
nmq1bbjAU4QVuIS9nkk2GrGx5+N6cYMy8JqG
|
||||||
|
=EHsz
|
||||||
|
-----END PGP PUBLIC KEY BLOCK-----
|
@ -0,0 +1,161 @@
|
|||||||
|
From f1e9a32ee7fad2263636a51536ce0f9f13f09949 Mon Sep 17 00:00:00 2001
|
||||||
|
From: =?UTF-8?q?Petr=20P=C3=ADsa=C5=99?= <ppisar@redhat.com>
|
||||||
|
Date: Wed, 23 Jan 2019 10:16:20 +0100
|
||||||
|
Subject: [PATCH] Declare POSIX regex function names as macros to PCRE
|
||||||
|
functions
|
||||||
|
MIME-Version: 1.0
|
||||||
|
Content-Type: text/plain; charset=UTF-8
|
||||||
|
Content-Transfer-Encoding: 8bit
|
||||||
|
|
||||||
|
POSIX regex libraries differ in regex_t size. If a program includes
|
||||||
|
<pcreposix.h>, but is not linked to pcreposix library at run-time
|
||||||
|
(either as a result of --as-needed or of lazy binding in dlopen),
|
||||||
|
another implementation touches memory outside of the structure and the
|
||||||
|
program can crash.
|
||||||
|
|
||||||
|
That means once a program includes <pcreposix.h>, it must link to the
|
||||||
|
pcreposix library.
|
||||||
|
|
||||||
|
This patch replaces the POSIX regex declaration with macros to the
|
||||||
|
PCRE uniquely-named functions. This ensures that the PCRE's regex_t
|
||||||
|
structure is always handled by the PCRE functions.
|
||||||
|
|
||||||
|
This patch still preserves the POSIX regex definitions in order to
|
||||||
|
preserve ABI with applications compiled before this change. The
|
||||||
|
definition can be removed in the future.
|
||||||
|
|
||||||
|
Signed-off-by: Petr Písař <ppisar@redhat.com>
|
||||||
|
---
|
||||||
|
pcreposix.c | 50 +++++++++++++++++++++++++++++++++++++++++++++-----
|
||||||
|
pcreposix.h | 20 ++++++++++++++------
|
||||||
|
2 files changed, 59 insertions(+), 11 deletions(-)
|
||||||
|
|
||||||
|
diff --git a/pcreposix.c b/pcreposix.c
|
||||||
|
index a76d6bf..3f2f3ef 100644
|
||||||
|
--- a/pcreposix.c
|
||||||
|
+++ b/pcreposix.c
|
||||||
|
@@ -39,7 +39,10 @@ POSSIBILITY OF SUCH DAMAGE.
|
||||||
|
|
||||||
|
|
||||||
|
/* This module is a wrapper that provides a POSIX API to the underlying PCRE
|
||||||
|
-functions. */
|
||||||
|
+functions. The operative functions are called pcre_regcomp(), etc., with
|
||||||
|
+wrappers that use the plain POSIX names. This makes it easier for an
|
||||||
|
+application to be sure it gets the PCRE versions in the presence of other
|
||||||
|
+POSIX regex libraries. */
|
||||||
|
|
||||||
|
|
||||||
|
#ifdef HAVE_CONFIG_H
|
||||||
|
@@ -204,12 +207,49 @@ static const char *const pstring[] = {
|
||||||
|
|
||||||
|
|
||||||
|
/*************************************************
|
||||||
|
-* Translate error code to string *
|
||||||
|
+* Wrappers with traditional POSIX names *
|
||||||
|
*************************************************/
|
||||||
|
|
||||||
|
+/* Keep defining them to preserve ABI with applications linked to pcreposix
|
||||||
|
+ * library before they were changed into macros. */
|
||||||
|
+
|
||||||
|
+#undef regerror
|
||||||
|
PCREPOSIX_EXP_DEFN size_t PCRE_CALL_CONVENTION
|
||||||
|
regerror(int errcode, const regex_t *preg, char *errbuf, size_t errbuf_size)
|
||||||
|
{
|
||||||
|
+return pcre_regerror(errcode, preg, errbuf, errbuf_size);
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+#undef regfree
|
||||||
|
+PCREPOSIX_EXP_DEFN void PCRE_CALL_CONVENTION
|
||||||
|
+regfree(regex_t *preg)
|
||||||
|
+{
|
||||||
|
+pcre_regfree(preg);
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+#undef regcomp
|
||||||
|
+PCREPOSIX_EXP_DEFN int PCRE_CALL_CONVENTION
|
||||||
|
+regcomp(regex_t *preg, const char *pattern, int cflags)
|
||||||
|
+{
|
||||||
|
+return pcre_regcomp(preg, pattern, cflags);
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+#undef regexec
|
||||||
|
+PCREPOSIX_EXP_DEFN int PCRE_CALL_CONVENTION
|
||||||
|
+regexec(const regex_t *preg, const char *string, size_t nmatch,
|
||||||
|
+ regmatch_t pmatch[], int eflags)
|
||||||
|
+{
|
||||||
|
+return pcre_regexec(preg, string, nmatch, pmatch, eflags);
|
||||||
|
+}
|
||||||
|
+
|
||||||
|
+
|
||||||
|
+/*************************************************
|
||||||
|
+* Translate error code to string *
|
||||||
|
+*************************************************/
|
||||||
|
+
|
||||||
|
+PCREPOSIX_EXP_DEFN size_t PCRE_CALL_CONVENTION
|
||||||
|
+pcre_regerror(int errcode, const regex_t *preg, char *errbuf, size_t errbuf_size)
|
||||||
|
+{
|
||||||
|
const char *message, *addmessage;
|
||||||
|
size_t length, addlength;
|
||||||
|
|
||||||
|
@@ -243,7 +283,7 @@ return length + addlength;
|
||||||
|
*************************************************/
|
||||||
|
|
||||||
|
PCREPOSIX_EXP_DEFN void PCRE_CALL_CONVENTION
|
||||||
|
-regfree(regex_t *preg)
|
||||||
|
+pcre_regfree(regex_t *preg)
|
||||||
|
{
|
||||||
|
(PUBL(free))(preg->re_pcre);
|
||||||
|
}
|
||||||
|
@@ -266,7 +306,7 @@ Returns: 0 on success
|
||||||
|
*/
|
||||||
|
|
||||||
|
PCREPOSIX_EXP_DEFN int PCRE_CALL_CONVENTION
|
||||||
|
-regcomp(regex_t *preg, const char *pattern, int cflags)
|
||||||
|
+pcre_regcomp(regex_t *preg, const char *pattern, int cflags)
|
||||||
|
{
|
||||||
|
const char *errorptr;
|
||||||
|
int erroffset;
|
||||||
|
@@ -320,7 +360,7 @@ be set. When this is the case, the nmatch and pmatch arguments are ignored, and
|
||||||
|
the only result is yes/no/error. */
|
||||||
|
|
||||||
|
PCREPOSIX_EXP_DEFN int PCRE_CALL_CONVENTION
|
||||||
|
-regexec(const regex_t *preg, const char *string, size_t nmatch,
|
||||||
|
+pcre_regexec(const regex_t *preg, const char *string, size_t nmatch,
|
||||||
|
regmatch_t pmatch[], int eflags)
|
||||||
|
{
|
||||||
|
int rc, so, eo;
|
||||||
|
diff --git a/pcreposix.h b/pcreposix.h
|
||||||
|
index c77c0b0..6f108b8 100644
|
||||||
|
--- a/pcreposix.h
|
||||||
|
+++ b/pcreposix.h
|
||||||
|
@@ -131,13 +131,21 @@ file. */
|
||||||
|
# endif
|
||||||
|
#endif
|
||||||
|
|
||||||
|
-/* The functions */
|
||||||
|
-
|
||||||
|
-PCREPOSIX_EXP_DECL int regcomp(regex_t *, const char *, int);
|
||||||
|
-PCREPOSIX_EXP_DECL int regexec(const regex_t *, const char *, size_t,
|
||||||
|
+/* The functions. The actual code is in functions with pcre_xxx names for
|
||||||
|
+uniqueness. POSIX names are provided for API compatibility with POSIX regex
|
||||||
|
+functions. It's done this way to ensure that they are always taken from the
|
||||||
|
+PCRE library and not by accident from elsewhere. (regex_t differs in size
|
||||||
|
+elsewhere.) */
|
||||||
|
+
|
||||||
|
+PCREPOSIX_EXP_DECL int pcre_regcomp(regex_t *, const char *, int);
|
||||||
|
+#define regcomp pcre_regcomp
|
||||||
|
+PCREPOSIX_EXP_DECL int pcre_regexec(const regex_t *, const char *, size_t,
|
||||||
|
regmatch_t *, int);
|
||||||
|
-PCREPOSIX_EXP_DECL size_t regerror(int, const regex_t *, char *, size_t);
|
||||||
|
-PCREPOSIX_EXP_DECL void regfree(regex_t *);
|
||||||
|
+#define regexec pcre_regexec
|
||||||
|
+PCREPOSIX_EXP_DECL size_t pcre_regerror(int, const regex_t *, char *, size_t);
|
||||||
|
+#define regerror pcre_regerror
|
||||||
|
+PCREPOSIX_EXP_DECL void pcre_regfree(regex_t *);
|
||||||
|
+#define regfree pcre_regfree
|
||||||
|
|
||||||
|
#ifdef __cplusplus
|
||||||
|
} /* extern "C" */
|
||||||
|
--
|
||||||
|
2.17.2
|
||||||
|
|
@ -1,70 +0,0 @@
|
|||||||
From 7abc4de8303e8908eeb96714dac53ae10ff465e3 Mon Sep 17 00:00:00 2001
|
|
||||||
From: ph10 <ph10@2f5784b3-3f2a-0410-8824-cb99058d5e15>
|
|
||||||
Date: Sun, 2 Sep 2018 17:05:38 +0000
|
|
||||||
Subject: [PATCH] Fix anchoring bug in conditional subexpression.
|
|
||||||
MIME-Version: 1.0
|
|
||||||
Content-Type: text/plain; charset=UTF-8
|
|
||||||
Content-Transfer-Encoding: 8bit
|
|
||||||
|
|
||||||
git-svn-id: svn://vcs.exim.org/pcre/code/trunk@1739 2f5784b3-3f2a-0410-8824-cb99058d5e15
|
|
||||||
Petr Písař: Ported to 8.42
|
|
||||||
---
|
|
||||||
pcre_compile.c | 12 ++++++++++--
|
|
||||||
testdata/testinput2 | 3 +++
|
|
||||||
testdata/testoutput2 | 4 ++++
|
|
||||||
|
|
||||||
Version 8.42 20-March-2018
|
|
||||||
--------------------------
|
|
||||||
diff --git a/pcre_compile.c b/pcre_compile.c
|
|
||||||
index 3991d6c..6141fb3 100644
|
|
||||||
--- a/pcre_compile.c
|
|
||||||
+++ b/pcre_compile.c
|
|
||||||
@@ -8682,10 +8682,18 @@ do {
|
|
||||||
if (!is_anchored(scode, new_map, cd, atomcount)) return FALSE;
|
|
||||||
}
|
|
||||||
|
|
||||||
- /* Positive forward assertions and conditions */
|
|
||||||
+ /* Positive forward assertion */
|
|
||||||
|
|
||||||
- else if (op == OP_ASSERT || op == OP_COND)
|
|
||||||
+ else if (op == OP_ASSERT)
|
|
||||||
+ {
|
|
||||||
+ if (!is_anchored(scode, bracket_map, cd, atomcount)) return FALSE;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ /* Condition; not anchored if no second branch */
|
|
||||||
+
|
|
||||||
+ else if (op == OP_COND)
|
|
||||||
{
|
|
||||||
+ if (scode[GET(scode,1)] != OP_ALT) return FALSE;
|
|
||||||
if (!is_anchored(scode, bracket_map, cd, atomcount)) return FALSE;
|
|
||||||
}
|
|
||||||
|
|
||||||
diff --git a/testdata/testinput2 b/testdata/testinput2
|
|
||||||
index 8ba4dc4..3528de1 100644
|
|
||||||
--- a/testdata/testinput2
|
|
||||||
+++ b/testdata/testinput2
|
|
||||||
@@ -4257,4 +4257,7 @@ backtracking verbs. --/
|
|
||||||
ab
|
|
||||||
aaab
|
|
||||||
|
|
||||||
+/(?(?=^))b/
|
|
||||||
+ abc
|
|
||||||
+
|
|
||||||
/-- End of testinput2 --/
|
|
||||||
diff --git a/testdata/testoutput2 b/testdata/testoutput2
|
|
||||||
index 61ed8d9..4ccda27 100644
|
|
||||||
--- a/testdata/testoutput2
|
|
||||||
+++ b/testdata/testoutput2
|
|
||||||
@@ -14721,4 +14721,8 @@ No need char
|
|
||||||
0: ab
|
|
||||||
1: a
|
|
||||||
|
|
||||||
+/(?(?=^))b/
|
|
||||||
+ abc
|
|
||||||
+ 0: b
|
|
||||||
+
|
|
||||||
/-- End of testinput2 --/
|
|
||||||
--
|
|
||||||
2.14.4
|
|
||||||
|
|
@ -1,29 +0,0 @@
|
|||||||
From 1aa76cb33f04fcea3127a0859450e5d18369e5e2 Mon Sep 17 00:00:00 2001
|
|
||||||
From: zherczeg <zherczeg@2f5784b3-3f2a-0410-8824-cb99058d5e15>
|
|
||||||
Date: Fri, 21 Sep 2018 07:34:10 +0000
|
|
||||||
Subject: [PATCH] Fix subject buffer overread in JIT.
|
|
||||||
MIME-Version: 1.0
|
|
||||||
Content-Type: text/plain; charset=UTF-8
|
|
||||||
Content-Transfer-Encoding: 8bit
|
|
||||||
|
|
||||||
git-svn-id: svn://vcs.exim.org/pcre/code/trunk@1740 2f5784b3-3f2a-0410-8824-cb99058d5e15
|
|
||||||
Petr Písař: Ported to 8.42.
|
|
||||||
---
|
|
||||||
pcre_jit_compile.c | 2 +-
|
|
||||||
|
|
||||||
diff --git a/pcre_jit_compile.c b/pcre_jit_compile.c
|
|
||||||
index 2bad74b..bc5f9c0 100644
|
|
||||||
--- a/pcre_jit_compile.c
|
|
||||||
+++ b/pcre_jit_compile.c
|
|
||||||
@@ -9002,7 +9002,7 @@ if (exact > 1)
|
|
||||||
#ifdef SUPPORT_UTF
|
|
||||||
&& !common->utf
|
|
||||||
#endif
|
|
||||||
- )
|
|
||||||
+ && type != OP_ANYNL && type != OP_EXTUNI)
|
|
||||||
{
|
|
||||||
OP2(SLJIT_ADD, TMP1, 0, STR_PTR, 0, SLJIT_IMM, IN_UCHARS(exact));
|
|
||||||
add_jump(compiler, &backtrack->topbacktracks, CMP(SLJIT_GREATER, TMP1, 0, STR_END, 0));
|
|
||||||
--
|
|
||||||
2.17.2
|
|
||||||
|
|
@ -1,178 +0,0 @@
|
|||||||
From 2ede5a4b4a98add3bbf982f5805e015e8c61c565 Mon Sep 17 00:00:00 2001
|
|
||||||
From: ph10 <ph10@2f5784b3-3f2a-0410-8824-cb99058d5e15>
|
|
||||||
Date: Tue, 26 Jun 2018 16:51:43 +0000
|
|
||||||
Subject: [PATCH] Fix two C++ wrapper bugs, unnoticed for years.
|
|
||||||
MIME-Version: 1.0
|
|
||||||
Content-Type: text/plain; charset=UTF-8
|
|
||||||
Content-Transfer-Encoding: 8bit
|
|
||||||
|
|
||||||
git-svn-id: svn://vcs.exim.org/pcre/code/trunk@1735 2f5784b3-3f2a-0410-8824-cb99058d5e15
|
|
||||||
|
|
||||||
Petr Písař: Ported to 8.42.
|
|
||||||
|
|
||||||
diff --git a/pcrecpp.cc b/pcrecpp.cc
|
|
||||||
index d09c9ab..77a2fed 100644
|
|
||||||
--- a/pcrecpp.cc
|
|
||||||
+++ b/pcrecpp.cc
|
|
||||||
@@ -80,6 +80,24 @@ static const string empty_string;
|
|
||||||
// If the user doesn't ask for any options, we just use this one
|
|
||||||
static RE_Options default_options;
|
|
||||||
|
|
||||||
+// Specials for the start of patterns. See comments where start_options is used
|
|
||||||
+// below. (PH June 2018)
|
|
||||||
+static const char *start_options[] = {
|
|
||||||
+ "(*UTF8)",
|
|
||||||
+ "(*UTF)",
|
|
||||||
+ "(*UCP)",
|
|
||||||
+ "(*NO_START_OPT)",
|
|
||||||
+ "(*NO_AUTO_POSSESS)",
|
|
||||||
+ "(*LIMIT_RECURSION=",
|
|
||||||
+ "(*LIMIT_MATCH=",
|
|
||||||
+ "(*CRLF)",
|
|
||||||
+ "(*CR)",
|
|
||||||
+ "(*BSR_UNICODE)",
|
|
||||||
+ "(*BSR_ANYCRLF)",
|
|
||||||
+ "(*ANYCRLF)",
|
|
||||||
+ "(*ANY)",
|
|
||||||
+ "" };
|
|
||||||
+
|
|
||||||
void RE::Init(const string& pat, const RE_Options* options) {
|
|
||||||
pattern_ = pat;
|
|
||||||
if (options == NULL) {
|
|
||||||
@@ -135,7 +153,49 @@ pcre* RE::Compile(Anchor anchor) {
|
|
||||||
} else {
|
|
||||||
// Tack a '\z' at the end of RE. Parenthesize it first so that
|
|
||||||
// the '\z' applies to all top-level alternatives in the regexp.
|
|
||||||
- string wrapped = "(?:"; // A non-counting grouping operator
|
|
||||||
+
|
|
||||||
+ /* When this code was written (for PCRE 6.0) it was enough just to
|
|
||||||
+ parenthesize the entire pattern. Unfortunately, when the feature of
|
|
||||||
+ starting patterns with (*UTF8) or (*CR) etc. was added to PCRE patterns,
|
|
||||||
+ this code was never updated. This bug was not noticed till 2018, long after
|
|
||||||
+ PCRE became obsolescent and its maintainer no longer around. Since PCRE is
|
|
||||||
+ frozen, I have added a hack to check for all the existing "start of
|
|
||||||
+ pattern" specials - knowing that no new ones will ever be added. I am not a
|
|
||||||
+ C++ programmer, so the code style is no doubt crude. It is also
|
|
||||||
+ inefficient, but is only run when the pattern starts with "(*".
|
|
||||||
+ PH June 2018. */
|
|
||||||
+
|
|
||||||
+ string wrapped = "";
|
|
||||||
+
|
|
||||||
+ if (pattern_.c_str()[0] == '(' && pattern_.c_str()[1] == '*') {
|
|
||||||
+ int kk, klen, kmat;
|
|
||||||
+ for (;;) { // Loop for any number of leading items
|
|
||||||
+
|
|
||||||
+ for (kk = 0; start_options[kk][0] != 0; kk++) {
|
|
||||||
+ klen = strlen(start_options[kk]);
|
|
||||||
+ kmat = strncmp(pattern_.c_str(), start_options[kk], klen);
|
|
||||||
+ if (kmat >= 0) break;
|
|
||||||
+ }
|
|
||||||
+ if (kmat != 0) break; // Not found
|
|
||||||
+
|
|
||||||
+ // If the item ended in "=" we must copy digits up to ")".
|
|
||||||
+
|
|
||||||
+ if (start_options[kk][klen-1] == '=') {
|
|
||||||
+ while (isdigit(pattern_.c_str()[klen])) klen++;
|
|
||||||
+ if (pattern_.c_str()[klen] != ')') break; // Syntax error
|
|
||||||
+ klen++;
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ // Move the item from the pattern to the start of the wrapped string.
|
|
||||||
+
|
|
||||||
+ wrapped += pattern_.substr(0, klen);
|
|
||||||
+ pattern_.erase(0, klen);
|
|
||||||
+ }
|
|
||||||
+ }
|
|
||||||
+
|
|
||||||
+ // Wrap the rest of the pattern.
|
|
||||||
+
|
|
||||||
+ wrapped += "(?:"; // A non-counting grouping operator
|
|
||||||
wrapped += pattern_;
|
|
||||||
wrapped += ")\\z";
|
|
||||||
re = pcre_compile(wrapped.c_str(), pcre_options,
|
|
||||||
@@ -415,7 +475,7 @@ int RE::GlobalReplace(const StringPiece& rewrite,
|
|
||||||
matchend++;
|
|
||||||
}
|
|
||||||
// We also need to advance more than one char if we're in utf8 mode.
|
|
||||||
-#ifdef SUPPORT_UTF8
|
|
||||||
+#ifdef SUPPORT_UTF
|
|
||||||
if (options_.utf8()) {
|
|
||||||
while (matchend < static_cast<int>(str->length()) &&
|
|
||||||
((*str)[matchend] & 0xc0) == 0x80)
|
|
||||||
diff --git a/pcrecpp_unittest.cc b/pcrecpp_unittest.cc
|
|
||||||
index 4b15fbe..255066f 100644
|
|
||||||
--- a/pcrecpp_unittest.cc
|
|
||||||
+++ b/pcrecpp_unittest.cc
|
|
||||||
@@ -309,7 +309,7 @@ static void TestReplace() {
|
|
||||||
"@aa",
|
|
||||||
"@@@",
|
|
||||||
3 },
|
|
||||||
-#ifdef SUPPORT_UTF8
|
|
||||||
+#ifdef SUPPORT_UTF
|
|
||||||
{ "b*",
|
|
||||||
"bb",
|
|
||||||
"\xE3\x83\x9B\xE3\x83\xBC\xE3\x83\xA0\xE3\x81\xB8", // utf8
|
|
||||||
@@ -327,7 +327,7 @@ static void TestReplace() {
|
|
||||||
{ "", NULL, NULL, NULL, NULL, 0 }
|
|
||||||
};
|
|
||||||
|
|
||||||
-#ifdef SUPPORT_UTF8
|
|
||||||
+#ifdef SUPPORT_UTF
|
|
||||||
const bool support_utf8 = true;
|
|
||||||
#else
|
|
||||||
const bool support_utf8 = false;
|
|
||||||
@@ -535,7 +535,7 @@ static void TestQuoteMetaLatin1() {
|
|
||||||
}
|
|
||||||
|
|
||||||
static void TestQuoteMetaUtf8() {
|
|
||||||
-#ifdef SUPPORT_UTF8
|
|
||||||
+#ifdef SUPPORT_UTF
|
|
||||||
TestQuoteMeta("Pl\xc3\xa1\x63ido Domingo", pcrecpp::UTF8());
|
|
||||||
TestQuoteMeta("xyz", pcrecpp::UTF8()); // No fancy utf8
|
|
||||||
TestQuoteMeta("\xc2\xb0", pcrecpp::UTF8()); // 2-byte utf8 (degree symbol)
|
|
||||||
@@ -1178,7 +1178,7 @@ int main(int argc, char** argv) {
|
|
||||||
CHECK(re.error().empty()); // Must have no error
|
|
||||||
}
|
|
||||||
|
|
||||||
-#ifdef SUPPORT_UTF8
|
|
||||||
+#ifdef SUPPORT_UTF
|
|
||||||
// Check UTF-8 handling
|
|
||||||
{
|
|
||||||
printf("Testing UTF-8 handling\n");
|
|
||||||
@@ -1202,6 +1202,24 @@ int main(int argc, char** argv) {
|
|
||||||
CHECK(re_test1.FullMatch(utf8_string));
|
|
||||||
RE re_test2("...", pcrecpp::UTF8());
|
|
||||||
CHECK(re_test2.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
+ // PH added these tests for leading option settings
|
|
||||||
+
|
|
||||||
+ RE re_testZ1("(*UTF8)...");
|
|
||||||
+ CHECK(re_testZ1.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
+ RE re_testZ2("(*UTF)...");
|
|
||||||
+ CHECK(re_testZ2.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
+ RE re_testZ3("(*UCP)(*UTF)...");
|
|
||||||
+ CHECK(re_testZ3.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
+ RE re_testZ4("(*UCP)(*LIMIT_MATCH=1000)(*UTF)...");
|
|
||||||
+ CHECK(re_testZ4.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
+ RE re_testZ5("(*UCP)(*LIMIT_MATCH=1000)(*ANY)(*UTF)...");
|
|
||||||
+ CHECK(re_testZ5.FullMatch(utf8_string));
|
|
||||||
+
|
|
||||||
|
|
||||||
// Check that '.' matches one byte or UTF-8 character
|
|
||||||
// according to the mode.
|
|
||||||
@@ -1248,7 +1266,7 @@ int main(int argc, char** argv) {
|
|
||||||
CHECK(!match_sentence.FullMatch(target));
|
|
||||||
CHECK(!match_sentence_re.FullMatch(target));
|
|
||||||
}
|
|
||||||
-#endif /* def SUPPORT_UTF8 */
|
|
||||||
+#endif /* def SUPPORT_UTF */
|
|
||||||
|
|
||||||
printf("Testing error reporting\n");
|
|
||||||
|
|
||||||
--
|
|
||||||
2.14.4
|
|
||||||
|
|
@ -1,36 +0,0 @@
|
|||||||
From 6d8fa98d5167bdd915ce1e32bcb6aaed078e5938 Mon Sep 17 00:00:00 2001
|
|
||||||
From: ph10 <ph10@2f5784b3-3f2a-0410-8824-cb99058d5e15>
|
|
||||||
Date: Tue, 26 Jun 2018 17:04:02 +0000
|
|
||||||
Subject: [PATCH] Fix typos in pcregrep.
|
|
||||||
MIME-Version: 1.0
|
|
||||||
Content-Type: text/plain; charset=UTF-8
|
|
||||||
Content-Transfer-Encoding: 8bit
|
|
||||||
|
|
||||||
git-svn-id: svn://vcs.exim.org/pcre/code/trunk@1736 2f5784b3-3f2a-0410-8824-cb99058d5e15
|
|
||||||
Petr Písař: Ported to 8.42.
|
|
||||||
|
|
||||||
diff --git a/pcregrep.c b/pcregrep.c
|
|
||||||
index a406be9..5982406 100644
|
|
||||||
--- a/pcregrep.c
|
|
||||||
+++ b/pcregrep.c
|
|
||||||
@@ -2252,7 +2252,7 @@ if (isdirectory(pathname))
|
|
||||||
int fnlength = strlen(pathname) + strlen(nextfile) + 2;
|
|
||||||
if (fnlength > 2048)
|
|
||||||
{
|
|
||||||
- fprintf(stderr, "pcre2grep: recursive filename is too long\n");
|
|
||||||
+ fprintf(stderr, "pcregrep: recursive filename is too long\n");
|
|
||||||
rc = 2;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
@@ -3034,7 +3034,7 @@ LC_ALL environment variable is set, and if so, use it. */
|
|
||||||
if (locale == NULL)
|
|
||||||
{
|
|
||||||
locale = getenv("LC_ALL");
|
|
||||||
- locale_from = "LCC_ALL";
|
|
||||||
+ locale_from = "LC_ALL";
|
|
||||||
}
|
|
||||||
|
|
||||||
if (locale == NULL)
|
|
||||||
--
|
|
||||||
2.14.4
|
|
||||||
|
|
@ -1,55 +0,0 @@
|
|||||||
From 3a9026509f9c1745f378595e55e5024361ad152d Mon Sep 17 00:00:00 2001
|
|
||||||
From: ph10 <ph10@2f5784b3-3f2a-0410-8824-cb99058d5e15>
|
|
||||||
Date: Mon, 10 Feb 2020 17:17:34 +0000
|
|
||||||
Subject: [PATCH] Check the size of the number after (?C as it is read, in
|
|
||||||
order to avoid integer overflow.
|
|
||||||
MIME-Version: 1.0
|
|
||||||
Content-Type: text/plain; charset=UTF-8
|
|
||||||
Content-Transfer-Encoding: 8bit
|
|
||||||
|
|
||||||
git-svn-id: svn://vcs.exim.org/pcre/code/trunk@1761 2f5784b3-3f2a-0410-8824-cb99058d5e15
|
|
||||||
Petr Písař: Ported to 8.43.
|
|
||||||
---
|
|
||||||
pcre_compile.c | 14 ++++++++------
|
|
||||||
|
|
||||||
diff --git a/pcre_compile.c b/pcre_compile.c
|
|
||||||
index 079d30a..1e3d6c3 100644
|
|
||||||
--- a/pcre_compile.c
|
|
||||||
+++ b/pcre_compile.c
|
|
||||||
@@ -6,7 +6,7 @@
|
|
||||||
and semantics are as close as possible to those of the Perl 5 language.
|
|
||||||
|
|
||||||
Written by Philip Hazel
|
|
||||||
- Copyright (c) 1997-2018 University of Cambridge
|
|
||||||
+ Copyright (c) 1997-2020 University of Cambridge
|
|
||||||
|
|
||||||
-----------------------------------------------------------------------------
|
|
||||||
Redistribution and use in source and binary forms, with or without
|
|
||||||
@@ -7130,17 +7130,19 @@ for (;; ptr++)
|
|
||||||
int n = 0;
|
|
||||||
ptr++;
|
|
||||||
while(IS_DIGIT(*ptr))
|
|
||||||
+ {
|
|
||||||
n = n * 10 + *ptr++ - CHAR_0;
|
|
||||||
+ if (n > 255)
|
|
||||||
+ {
|
|
||||||
+ *errorcodeptr = ERR38;
|
|
||||||
+ goto FAILED;
|
|
||||||
+ }
|
|
||||||
+ }
|
|
||||||
if (*ptr != CHAR_RIGHT_PARENTHESIS)
|
|
||||||
{
|
|
||||||
*errorcodeptr = ERR39;
|
|
||||||
goto FAILED;
|
|
||||||
}
|
|
||||||
- if (n > 255)
|
|
||||||
- {
|
|
||||||
- *errorcodeptr = ERR38;
|
|
||||||
- goto FAILED;
|
|
||||||
- }
|
|
||||||
*code++ = n;
|
|
||||||
PUT(code, 0, (int)(ptr - cd->start_pattern + 1)); /* Pattern offset */
|
|
||||||
PUT(code, LINK_SIZE, 0); /* Default length */
|
|
||||||
--
|
|
||||||
2.21.1
|
|
||||||
|
|
@ -0,0 +1,44 @@
|
|||||||
|
From f0bb9e8baf3157e0a84f484f194984295b2db23a Mon Sep 17 00:00:00 2001
|
||||||
|
From: =?UTF-8?q?Petr=20P=C3=ADsa=C5=99?= <ppisar@redhat.com>
|
||||||
|
Date: Mon, 19 Oct 2020 16:15:14 +0200
|
||||||
|
Subject: [PATCH] Initialize name table memory region
|
||||||
|
MIME-Version: 1.0
|
||||||
|
Content-Type: text/plain; charset=UTF-8
|
||||||
|
Content-Transfer-Encoding: 8bit
|
||||||
|
|
||||||
|
Name table entry values are accessed past their ends in add_name()
|
||||||
|
when comparing the values. Also, the size of the entries could grow
|
||||||
|
later. It's safer to initialize just after the allocation than to hunt
|
||||||
|
the gaps later.
|
||||||
|
|
||||||
|
Reproducer:
|
||||||
|
|
||||||
|
pcre_compile2("(?<f>)(?<fir>)", PCRE_NO_AUTO_CAPTURE | PCRE_CASELESS, &ec, &eb, &eo, NULL);
|
||||||
|
|
||||||
|
built with clang++ -fsanitize=memory -fsanitize=fuzzer-no-link.
|
||||||
|
|
||||||
|
https://bugs.exim.org/show_bug.cgi?id=2661
|
||||||
|
Signed-off-by: Petr Písař <ppisar@redhat.com>
|
||||||
|
---
|
||||||
|
pcre_compile.c | 5 +++++
|
||||||
|
1 file changed, 5 insertions(+)
|
||||||
|
|
||||||
|
diff --git a/pcre_compile.c b/pcre_compile.c
|
||||||
|
index 3be0fbf..75309e0 100644
|
||||||
|
--- a/pcre_compile.c
|
||||||
|
+++ b/pcre_compile.c
|
||||||
|
@@ -9423,6 +9423,11 @@ if (re == NULL)
|
||||||
|
goto PCRE_EARLY_ERROR_RETURN;
|
||||||
|
}
|
||||||
|
|
||||||
|
+/* Initialize the memory. Name table entry values are accessed past their ends
|
||||||
|
+ * (e.g. in add_name()) when comparing the values. Also a size of the entry can
|
||||||
|
+ * grow later. It's safer to initialize here than to hunt the gaps later. */
|
||||||
|
+memset(re, 0, size);
|
||||||
|
+
|
||||||
|
/* Put in the magic number, and save the sizes, initial options, internal
|
||||||
|
flags, and character table pointer. NULL is used for the default character
|
||||||
|
tables. The nullpad field is at the end; it's there to help in the case when a
|
||||||
|
--
|
||||||
|
2.25.4
|
||||||
|
|
File diff suppressed because it is too large
Load Diff
@ -0,0 +1,98 @@
|
|||||||
|
From 70fcff23652339438cabef86f2d3d9c645678687 Mon Sep 17 00:00:00 2001
|
||||||
|
From: "H.J. Lu" <hjl.tools@gmail.com>
|
||||||
|
Date: Sun, 20 Dec 2020 13:55:40 -0800
|
||||||
|
Subject: [PATCH 2/2] Pass -mshstk to the compiler when Intel CET is enabled
|
||||||
|
|
||||||
|
Copied from PCRE2.
|
||||||
|
---
|
||||||
|
CMakeLists.txt | 18 ++++++++++++++++++
|
||||||
|
Makefile.am | 3 +++
|
||||||
|
configure.ac | 15 +++++++++++++++
|
||||||
|
3 files changed, 36 insertions(+)
|
||||||
|
|
||||||
|
diff --git a/CMakeLists.txt b/CMakeLists.txt
|
||||||
|
index 858a34b..74c27e9 100644
|
||||||
|
--- a/CMakeLists.txt
|
||||||
|
+++ b/CMakeLists.txt
|
||||||
|
@@ -112,6 +112,24 @@ CHECK_FUNCTION_EXISTS(_strtoi64 HAVE__STRTOI64)
|
||||||
|
CHECK_TYPE_SIZE("long long" LONG_LONG)
|
||||||
|
CHECK_TYPE_SIZE("unsigned long long" UNSIGNED_LONG_LONG)
|
||||||
|
|
||||||
|
+# Check whether Intel CET is enabled, and if so, adjust compiler flags. This
|
||||||
|
+# code was written by PH, trying to imitate the logic from the autotools
|
||||||
|
+# configuration.
|
||||||
|
+
|
||||||
|
+CHECK_C_SOURCE_COMPILES(
|
||||||
|
+ "#ifndef __CET__
|
||||||
|
+ #error CET is not enabled
|
||||||
|
+ #endif
|
||||||
|
+ int main() { return 0; }"
|
||||||
|
+ INTEL_CET_ENABLED
|
||||||
|
+)
|
||||||
|
+
|
||||||
|
+IF (INTEL_CET_ENABLED)
|
||||||
|
+ SET(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} -mshstk")
|
||||||
|
+ENDIF(INTEL_CET_ENABLED)
|
||||||
|
+
|
||||||
|
+
|
||||||
|
+
|
||||||
|
# User-configurable options
|
||||||
|
#
|
||||||
|
# (Note: CMakeSetup displays these in alphabetical order, regardless of
|
||||||
|
diff --git a/Makefile.am b/Makefile.am
|
||||||
|
index 22b6947..984c686 100644
|
||||||
|
--- a/Makefile.am
|
||||||
|
+++ b/Makefile.am
|
||||||
|
@@ -250,6 +250,7 @@ libpcre_la_SOURCES = \
|
||||||
|
|
||||||
|
libpcre_la_CFLAGS = \
|
||||||
|
$(VISIBILITY_CFLAGS) \
|
||||||
|
+ $(CET_CFLAGS) \
|
||||||
|
$(AM_CFLAGS)
|
||||||
|
|
||||||
|
libpcre_la_LIBADD =
|
||||||
|
@@ -289,6 +290,7 @@ libpcre16_la_SOURCES = \
|
||||||
|
|
||||||
|
libpcre16_la_CFLAGS = \
|
||||||
|
$(VISIBILITY_CFLAGS) \
|
||||||
|
+ $(CET_CFLAGS) \
|
||||||
|
$(AM_CFLAGS)
|
||||||
|
|
||||||
|
libpcre16_la_LIBADD =
|
||||||
|
@@ -328,6 +330,7 @@ libpcre32_la_SOURCES = \
|
||||||
|
|
||||||
|
libpcre32_la_CFLAGS = \
|
||||||
|
$(VISIBILITY_CFLAGS) \
|
||||||
|
+ $(CET_CFLAGS) \
|
||||||
|
$(AM_CFLAGS)
|
||||||
|
|
||||||
|
libpcre32_la_LIBADD =
|
||||||
|
diff --git a/configure.ac b/configure.ac
|
||||||
|
index 6a3e5f3..15f37d1 100644
|
||||||
|
--- a/configure.ac
|
||||||
|
+++ b/configure.ac
|
||||||
|
@@ -1043,6 +1043,21 @@ fi # enable_coverage
|
||||||
|
|
||||||
|
AM_CONDITIONAL([WITH_GCOV],[test "x$enable_coverage" = "xyes"])
|
||||||
|
|
||||||
|
+AC_MSG_CHECKING([whether Intel CET is enabled])
|
||||||
|
+AC_LANG_PUSH([C])
|
||||||
|
+AC_COMPILE_IFELSE([AC_LANG_PROGRAM(,
|
||||||
|
+ [[#ifndef __CET__
|
||||||
|
+# error CET is not enabled
|
||||||
|
+#endif]])],
|
||||||
|
+ [intel_cet_enabled=yes],
|
||||||
|
+ [intel_cet_enabled=no])
|
||||||
|
+AC_MSG_RESULT([$intel_cet_enabled])
|
||||||
|
+if test "$intel_cet_enabled" = yes; then
|
||||||
|
+ CET_CFLAGS="-mshstk"
|
||||||
|
+ AC_SUBST([CET_CFLAGS])
|
||||||
|
+fi
|
||||||
|
+AC_LANG_POP([C])
|
||||||
|
+
|
||||||
|
# Produce these files, in addition to config.h.
|
||||||
|
AC_CONFIG_FILES(
|
||||||
|
Makefile
|
||||||
|
--
|
||||||
|
2.29.2
|
||||||
|
|
Binary file not shown.
Loading…
Reference in new issue