diff options
author | Martijn van Duren <martijn@cvs.openbsd.org> | 2016-05-30 18:10:30 +0000 |
---|---|---|
committer | Martijn van Duren <martijn@cvs.openbsd.org> | 2016-05-30 18:10:30 +0000 |
commit | 16fd89111611e423bf1707e2be4b6091e4b2cfb4 (patch) | |
tree | dfa01e6b643295f572b65fba6737a9563720fafe /usr.bin/sed | |
parent | bf67d0eb4372846649ed5ce64dfb8df77b227d96 (diff) |
Make sed use the new REG_STARTEND | REG_NOTBOL combination. This fixes a begin
of word mismatch as reported by jsg@.
Discussed with otto@ and others early on, earlier version tested in ports build
by aja@
OK millert@
Few readability tweaks and OK schwarze@
Diffstat (limited to 'usr.bin/sed')
-rw-r--r-- | usr.bin/sed/process.c | 41 |
1 files changed, 24 insertions, 17 deletions
diff --git a/usr.bin/sed/process.c b/usr.bin/sed/process.c index f4d801b263c..6ccd51dc713 100644 --- a/usr.bin/sed/process.c +++ b/usr.bin/sed/process.c @@ -1,4 +1,4 @@ -/* $OpenBSD: process.c,v 1.27 2015/10/26 14:08:47 mmcc Exp $ */ +/* $OpenBSD: process.c,v 1.28 2016/05/30 18:10:29 martijn Exp $ */ /*- * Copyright (c) 1992 Diomidis Spinellis. @@ -61,7 +61,8 @@ static SPACE HS, PS, SS; static inline int applies(struct s_command *); static void flush_appends(void); static void lputs(char *); -static inline int regexec_e(regex_t *, const char *, int, int, size_t); +static inline int regexec_e(regex_t *, const char *, int, int, size_t, + size_t); static void regsub(SPACE *, char *, char *); static int substitute(struct s_command *); @@ -267,7 +268,7 @@ new: if (!nflag && !pd) * (lastline, linenumber, ps). */ #define MATCH(a) \ - (a)->type == AT_RE ? regexec_e((a)->u.r, ps, 0, 1, psl) : \ + (a)->type == AT_RE ? regexec_e((a)->u.r, ps, 0, 1, 0, psl) : \ (a)->type == AT_LINE ? linenum == (a)->u.l : lastline() /* @@ -335,6 +336,7 @@ substitute(struct s_command *cp) regex_t *re; regoff_t slen; int n, lastempty; + size_t le = 0; char *s; s = ps; @@ -346,7 +348,7 @@ substitute(struct s_command *cp) cp->u.s->maxbref); } } - if (!regexec_e(re, s, 0, 0, psl)) + if (!regexec_e(re, ps, 0, 0, 0, psl)) return (0); SS.len = 0; /* Clean substitute space. */ @@ -356,28 +358,30 @@ substitute(struct s_command *cp) do { /* Copy the leading retained string. */ - if (n <= 1 && match[0].rm_so) - cspace(&SS, s, match[0].rm_so, APPEND); + if (n <= 1 && (match[0].rm_so > le)) + cspace(&SS, s, match[0].rm_so - le, APPEND); /* Skip zero-length matches right after other matches. */ - if (lastempty || match[0].rm_so || + if (lastempty || (match[0].rm_so - le) || match[0].rm_so != match[0].rm_eo) { if (n <= 1) { /* Want this match: append replacement. */ - regsub(&SS, s, cp->u.s->new); + regsub(&SS, ps, cp->u.s->new); if (n == 1) n = -1; } else { /* Want a later match: append original. */ - if (match[0].rm_eo) - cspace(&SS, s, match[0].rm_eo, APPEND); + if (match[0].rm_eo - le) + cspace(&SS, s, match[0].rm_eo - le, + APPEND); n--; } } /* Move past this match. */ - s += match[0].rm_eo; - slen -= match[0].rm_eo; + s = ps + match[0].rm_eo; + slen = psl - match[0].rm_eo; + le = match[0].rm_eo; /* * After a zero-length match, advance one byte, @@ -388,13 +392,16 @@ substitute(struct s_command *cp) slen = -1; else slen--; - if (*s != '\0') + if (*s != '\0') { cspace(&SS, s++, 1, APPEND); + le++; + } lastempty = 1; } else lastempty = 0; - } while (n >= 0 && slen >= 0 && regexec_e(re, s, REG_NOTBOL, 0, slen)); + } while (n >= 0 && slen >= 0 && + regexec_e(re, ps, REG_NOTBOL, 0, le, psl)); /* Did not find the requested number of matches. */ if (n > 1) @@ -509,7 +516,7 @@ lputs(char *s) static inline int regexec_e(regex_t *preg, const char *string, int eflags, - int nomatch, size_t slen) + int nomatch, size_t start, size_t stop) { int eval; @@ -520,8 +527,8 @@ regexec_e(regex_t *preg, const char *string, int eflags, defpreg = preg; /* Set anchors */ - match[0].rm_so = 0; - match[0].rm_eo = slen; + match[0].rm_so = start; + match[0].rm_eo = stop; eval = regexec(defpreg, string, nomatch ? 0 : maxnsub + 1, match, eflags | REG_STARTEND); |