grep: skip UTF8 checks explicitly
18547aacf5
("grep/pcre: support utf-8", 2016-06-25) that was released
with git 2.10 added the PCRE_UTF8 flag to PCRE1 matching including a
call to has_non_ascii() to try to avoid breakage if there was non-utf8
encoded content in the haystack.
Usually PCRE is compiled with JIT support (even if is not the default),
and therefore the codepath used includes calling pcre_jit_exec, which
skips UTF-8 validation by design (which might result in crashes or hangs)
but when JIT support wasn't compiled we use pcre_exec instead with the
posibility that grep might be aborted if invalid UTF-8 is found in the
haystack.
PCRE1 provides a flag since Mar 5, 2007 that could be used to skip the
checks explicitly so use that to make both codepaths equivalent (the
flag is ignored by pcre1_jit_exec)
this fix is only implemented for PCRE1 because PCRE2 is likely to have
a better solution (without the risks) instead in the future
Helped-by: Johannes Schindelin <Johannes.Schindelin@gmx.de>
Helped-by: Eric Sunshine <sunshine@sunshineco.com>
Helped-by: Ævar Arnfjörð Bjarmason <avarab@gmail.com>
Suggested-by: Junio C Hamano <gitster@pobox.com>
Signed-off-by: Carlo Marcelo Arenas Belón <carenas@gmail.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
This commit is contained in:
parent
75b2f01a0f
commit
ad7c543e3b
2
grep.c
2
grep.c
@ -421,7 +421,7 @@ static void compile_pcre1_regexp(struct grep_pat *p, const struct grep_opt *opt)
|
|||||||
static int pcre1match(struct grep_pat *p, const char *line, const char *eol,
|
static int pcre1match(struct grep_pat *p, const char *line, const char *eol,
|
||||||
regmatch_t *match, int eflags)
|
regmatch_t *match, int eflags)
|
||||||
{
|
{
|
||||||
int ovector[30], ret, flags = 0;
|
int ovector[30], ret, flags = PCRE_NO_UTF8_CHECK;
|
||||||
|
|
||||||
if (eflags & REG_NOTBOL)
|
if (eflags & REG_NOTBOL)
|
||||||
flags |= PCRE_NOTBOL;
|
flags |= PCRE_NOTBOL;
|
||||||
|
3
grep.h
3
grep.h
@ -3,6 +3,9 @@
|
|||||||
#include "color.h"
|
#include "color.h"
|
||||||
#ifdef USE_LIBPCRE1
|
#ifdef USE_LIBPCRE1
|
||||||
#include <pcre.h>
|
#include <pcre.h>
|
||||||
|
#ifndef PCRE_NO_UTF8_CHECK
|
||||||
|
#define PCRE_NO_UTF8_CHECK 0
|
||||||
|
#endif
|
||||||
#ifdef PCRE_CONFIG_JIT
|
#ifdef PCRE_CONFIG_JIT
|
||||||
#if PCRE_MAJOR >= 8 && PCRE_MINOR >= 32
|
#if PCRE_MAJOR >= 8 && PCRE_MINOR >= 32
|
||||||
#ifndef NO_LIBPCRE1_JIT
|
#ifndef NO_LIBPCRE1_JIT
|
||||||
|
Loading…
Reference in New Issue
Block a user