Support for pickaxe matching regular expressions

git-diff-* --pickaxe-regex will change the -S pickaxe to match
POSIX extended regular expressions instead of fixed strings.

The regex.h library is a rather stupid interface and I like pcre too, but
with any luck it will be everywhere we will want to run Git on, it being
POSIX.2 and all. I'm not sure if we can expect platforms like AIX to
conform to POSIX.2 or if win32 has regex.h. We might add a flag to
Makefile if there is a portability trouble potential.

Signed-off-by: Petr Baudis <pasky@suse.cz>
This commit is contained in:
Petr Baudis 2006-03-29 02:16:33 +02:00 committed by Junio C Hamano
parent 810e152375
commit d01d8c6782
4 changed files with 57 additions and 16 deletions

View File

@ -69,6 +69,10 @@
changeset, not just the files that contain the change changeset, not just the files that contain the change
in <string>. in <string>.
--pickaxe-regex::
Make the <string> not a plain string but an extended POSIX
regex to match.
-O<orderfile>:: -O<orderfile>::
Output the patch in the order specified in the Output the patch in the order specified in the
<orderfile>, which has one shell glob pattern per line. <orderfile>, which has one shell glob pattern per line.

2
diff.c
View File

@ -883,6 +883,8 @@ int diff_opt_parse(struct diff_options *options, const char **av, int ac)
options->filter = arg + 14; options->filter = arg + 14;
else if (!strcmp(arg, "--pickaxe-all")) else if (!strcmp(arg, "--pickaxe-all"))
options->pickaxe_opts = DIFF_PICKAXE_ALL; options->pickaxe_opts = DIFF_PICKAXE_ALL;
else if (!strcmp(arg, "--pickaxe-regex"))
options->pickaxe_opts = DIFF_PICKAXE_REGEX;
else if (!strncmp(arg, "-B", 2)) { else if (!strncmp(arg, "-B", 2)) {
if ((options->break_opt = if ((options->break_opt =
diff_scoreopt_parse(arg)) == -1) diff_scoreopt_parse(arg)) == -1)

1
diff.h
View File

@ -102,6 +102,7 @@ extern int diff_setup_done(struct diff_options *);
#define DIFF_DETECT_COPY 2 #define DIFF_DETECT_COPY 2
#define DIFF_PICKAXE_ALL 1 #define DIFF_PICKAXE_ALL 1
#define DIFF_PICKAXE_REGEX 2
extern void diffcore_std(struct diff_options *); extern void diffcore_std(struct diff_options *);

View File

@ -1,12 +1,15 @@
/* /*
* Copyright (C) 2005 Junio C Hamano * Copyright (C) 2005 Junio C Hamano
*/ */
#include <regex.h>
#include "cache.h" #include "cache.h"
#include "diff.h" #include "diff.h"
#include "diffcore.h" #include "diffcore.h"
static unsigned int contains(struct diff_filespec *one, static unsigned int contains(struct diff_filespec *one,
const char *needle, unsigned long len) const char *needle, unsigned long len,
regex_t *regexp)
{ {
unsigned int cnt; unsigned int cnt;
unsigned long offset, sz; unsigned long offset, sz;
@ -18,15 +21,28 @@ static unsigned int contains(struct diff_filespec *one,
data = one->data; data = one->data;
cnt = 0; cnt = 0;
/* Yes, I've heard of strstr(), but the thing is *data may if (regexp) {
* not be NUL terminated. Sue me. regmatch_t regmatch;
*/ int flags = 0;
for (offset = 0; offset + len <= sz; offset++) {
/* we count non-overlapping occurrences of needle */ while (*data && !regexec(regexp, data, 1, &regmatch, flags)) {
if (!memcmp(needle, data + offset, len)) { flags |= REG_NOTBOL;
offset += len - 1; data += regmatch.rm_so;
if (*data) data++;
cnt++; cnt++;
} }
} else { /* Classic exact string match */
/* Yes, I've heard of strstr(), but the thing is *data may
* not be NUL terminated. Sue me.
*/
for (offset = 0; offset + len <= sz; offset++) {
/* we count non-overlapping occurrences of needle */
if (!memcmp(needle, data + offset, len)) {
offset += len - 1;
cnt++;
}
}
} }
return cnt; return cnt;
} }
@ -36,10 +52,24 @@ void diffcore_pickaxe(const char *needle, int opts)
struct diff_queue_struct *q = &diff_queued_diff; struct diff_queue_struct *q = &diff_queued_diff;
unsigned long len = strlen(needle); unsigned long len = strlen(needle);
int i, has_changes; int i, has_changes;
regex_t regex, *regexp = NULL;
struct diff_queue_struct outq; struct diff_queue_struct outq;
outq.queue = NULL; outq.queue = NULL;
outq.nr = outq.alloc = 0; outq.nr = outq.alloc = 0;
if (opts & DIFF_PICKAXE_REGEX) {
int err;
err = regcomp(&regex, needle, REG_EXTENDED | REG_NEWLINE);
if (err) {
/* The POSIX.2 people are surely sick */
char errbuf[1024];
regerror(err, &regex, errbuf, 1024);
regfree(&regex);
die("invalid pickaxe regex: %s", errbuf);
}
regexp = &regex;
}
if (opts & DIFF_PICKAXE_ALL) { if (opts & DIFF_PICKAXE_ALL) {
/* Showing the whole changeset if needle exists */ /* Showing the whole changeset if needle exists */
for (i = has_changes = 0; !has_changes && i < q->nr; i++) { for (i = has_changes = 0; !has_changes && i < q->nr; i++) {
@ -48,16 +78,16 @@ void diffcore_pickaxe(const char *needle, int opts)
if (!DIFF_FILE_VALID(p->two)) if (!DIFF_FILE_VALID(p->two))
continue; /* ignore unmerged */ continue; /* ignore unmerged */
/* created */ /* created */
if (contains(p->two, needle, len)) if (contains(p->two, needle, len, regexp))
has_changes++; has_changes++;
} }
else if (!DIFF_FILE_VALID(p->two)) { else if (!DIFF_FILE_VALID(p->two)) {
if (contains(p->one, needle, len)) if (contains(p->one, needle, len, regexp))
has_changes++; has_changes++;
} }
else if (!diff_unmodified_pair(p) && else if (!diff_unmodified_pair(p) &&
contains(p->one, needle, len) != contains(p->one, needle, len, regexp) !=
contains(p->two, needle, len)) contains(p->two, needle, len, regexp))
has_changes++; has_changes++;
} }
if (has_changes) if (has_changes)
@ -80,16 +110,16 @@ void diffcore_pickaxe(const char *needle, int opts)
if (!DIFF_FILE_VALID(p->two)) if (!DIFF_FILE_VALID(p->two))
; /* ignore unmerged */ ; /* ignore unmerged */
/* created */ /* created */
else if (contains(p->two, needle, len)) else if (contains(p->two, needle, len, regexp))
has_changes = 1; has_changes = 1;
} }
else if (!DIFF_FILE_VALID(p->two)) { else if (!DIFF_FILE_VALID(p->two)) {
if (contains(p->one, needle, len)) if (contains(p->one, needle, len, regexp))
has_changes = 1; has_changes = 1;
} }
else if (!diff_unmodified_pair(p) && else if (!diff_unmodified_pair(p) &&
contains(p->one, needle, len) != contains(p->one, needle, len, regexp) !=
contains(p->two, needle, len)) contains(p->two, needle, len, regexp))
has_changes = 1; has_changes = 1;
if (has_changes) if (has_changes)
@ -98,6 +128,10 @@ void diffcore_pickaxe(const char *needle, int opts)
diff_free_filepair(p); diff_free_filepair(p);
} }
if (opts & DIFF_PICKAXE_REGEX) {
regfree(&regex);
}
free(q->queue); free(q->queue);
*q = outq; *q = outq;
return; return;