From f20b10ee7b0568ff800588579c7f74ca74f0c23f Mon Sep 17 00:00:00 2001 From: Rob Landley Date: Tue, 26 Jul 2016 13:35:56 -0500 Subject: Move regexec0 into lib (regexec that takes length and matches after NUL). --- lib/lib.c | 35 +++++++++++++++++++++++++++++++++++ lib/lib.h | 2 ++ toys/posix/sed.c | 41 +++-------------------------------------- 3 files changed, 40 insertions(+), 38 deletions(-) diff --git a/lib/lib.c b/lib/lib.c index 09264c95..5c7696d0 100644 --- a/lib/lib.c +++ b/lib/lib.c @@ -1149,3 +1149,38 @@ int readlink0(char *path, char *buf, int len) { return readlinkat0(AT_FDCWD, path, buf, len); } + +// Do regex matching handling embedded NUL bytes in string (hence extra len +// argument). Note that neither the pattern nor the match can currently include +// NUL bytes (even with wildcards) and string must be null terminated at +// string[len]. But this can find a match after the first NUL. +int regexec0(regex_t *preg, char *string, long len, int nmatch, + regmatch_t pmatch[], int eflags) +{ + char *s = string; + + for (;;) { + long ll = 0; + int rc; + + while (len && !*s) { + s++; + len--; + } + while (s[ll] && llrmatch[1]); // regex match end includes matching line, so defer deactivation - if (line && !regex_null(rm, line, len, 0, 0, 0)) miss = 1; + if (line && !regexec0(rm, line, len, 0, 0, 0)) miss = 1; } } else if (lm > 0 && lm < TT.count) command->hit = 0; @@ -339,7 +304,7 @@ static void process_line(char **pline, long plen) if (!(lm = *command->lmatch)) { void *rm = get_regex(command, *command->rmatch); - if (line && !regex_null(rm, line, len, 0, 0, 0)) command->hit++; + if (line && !regexec0(rm, line, len, 0, 0, 0)) command->hit++; } else if (lm == TT.count || (lm == -1 && !pline)) command->hit++; if (!command->lmatch[1] && !command->rmatch[1]) miss = 1; @@ -501,7 +466,7 @@ static void process_line(char **pline, long plen) int mflags = 0, count = 0, zmatch = 1, rlen = len, mlen, off, newlen; // Find match in remaining line (up to remaining len) - while (!regex_null(reg, rline, rlen, 10, match, mflags)) { + while (!regexec0(reg, rline, rlen, 10, match, mflags)) { mflags = REG_NOTBOL; // Zero length matches don't count immediately after a previous match -- cgit v1.2.3