git-svn: fix segfaults from accessing svn_log_changed_path_t

svn_log_changed_path_t structs were being used out of scope
outside of svn_ra_get_log (because I wanted to eventually be
able to use git-svn with only a single connection to the
repository).  So now we dup them into a hash.

This was fixed while making --follow-parent fetches more
efficient.  I've moved parsing of the command-line --revision
argument outside of the Git::SVN module so Git::SVN::fetch() can
be used in more places (such as find_parent_branch).

Signed-off-by: Eric Wong <normalperson@yhbt.net>
This commit is contained in:
Eric Wong 2007-01-25 17:35:40 -08:00
parent e5a0b240fc
commit 3ebe8df7f6
2 changed files with 68 additions and 37 deletions

View File

@ -283,7 +283,7 @@ sub cmd_fetch {
instead.\n"; instead.\n";
} }
my $gs = Git::SVN->new; my $gs = Git::SVN->new;
$gs->fetch; $gs->fetch(parse_revision_argument());
if ($gs->{last_commit} && !verify_ref('refs/heads/master^0')) { if ($gs->{last_commit} && !verify_ref('refs/heads/master^0')) {
command_noisy(qw(update-ref refs/heads/master), command_noisy(qw(update-ref refs/heads/master),
$gs->{last_commit}); $gs->{last_commit});
@ -482,6 +482,18 @@ sub cmd_commit_diff {
########################### utility functions ######################### ########################### utility functions #########################
sub parse_revision_argument {
if (!defined $_revision || $_revision eq 'BASE:HEAD') {
return (undef, undef);
}
return ($1, $2) if ($_revision =~ /^(\d+):(\d+)$/);
return ($_revision, $_revision) if ($_revision =~ /^\d+$/);
return (undef, $1) if ($_revision =~ /^BASE:(\d+)$/);
return ($1, undef) if ($_revision =~ /^(\d+):HEAD$/);
die "revision argument: $_revision not understood by git-svn\n",
"Try using the command-line svn client instead\n";
}
sub complete_svn_url { sub complete_svn_url {
my ($url, $path) = @_; my ($url, $path) = @_;
$path =~ s#/+$##; $path =~ s#/+$##;
@ -914,6 +926,9 @@ sub traverse_ignore {
} }
} }
sub last_rev { ($_[0]->last_rev_commit)[0] }
sub last_commit { ($_[0]->last_rev_commit)[1] }
# returns the newest SVN revision number and newest commit SHA1 # returns the newest SVN revision number and newest commit SHA1
sub last_rev_commit { sub last_rev_commit {
my ($self) = @_; my ($self) = @_;
@ -951,22 +966,11 @@ sub last_rev_commit {
return ($rev, $c); return ($rev, $c);
} }
sub parse_revision { sub get_fetch_range {
my ($self, $base) = @_; my ($self, $min, $max) = @_;
my $head = $self->ra->get_latest_revnum; $max ||= $self->ra->get_latest_revnum;
if (!defined $::_revision || $::_revision eq 'BASE:HEAD') { $min ||= $self->last_rev || 0;
return ($base + 1, $head) if (defined $base); (++$min, $max);
return (0, $head);
}
return ($1, $2) if ($::_revision =~ /^(\d+):(\d+)$/);
return ($::_revision, $::_revision) if ($::_revision =~ /^\d+$/);
if ($::_revision =~ /^BASE:(\d+)$/) {
return ($base + 1, $1) if (defined $base);
return (0, $head);
}
return ($1, $head) if ($::_revision =~ /^(\d+):HEAD$/);
die "revision argument: $::_revision not understood by git-svn\n",
"Try using the command-line svn client instead\n";
} }
sub tmp_index_do { sub tmp_index_do {
@ -1101,8 +1105,8 @@ sub find_parent_branch {
my ($self, $paths, $rev) = @_; my ($self, $paths, $rev) = @_;
return undef unless $::_follow_parent; return undef unless $::_follow_parent;
unless (defined $paths) { unless (defined $paths) {
$self->ra->get_log([''], $rev, $rev, 0, 1, 1, $self->ra->get_log([$self->{path}], $rev, $rev, 0, 1, 1,
sub { $paths = $_[0] }); sub { $paths = dup_changed_paths($_[0]) });
} }
return undef unless defined $paths; return undef unless defined $paths;
@ -1116,13 +1120,13 @@ sub find_parent_branch {
unshift(@a_path_components, pop(@b_path_components)); unshift(@a_path_components, pop(@b_path_components));
} }
goto not_found unless defined $i; goto not_found unless defined $i;
my $branch_from = $i->copyfrom_path or goto not_found; my $branch_from = $i->{copyfrom_path} or goto not_found;
if (@a_path_components) { if (@a_path_components) {
print STDERR "branch_from: $branch_from => "; print STDERR "branch_from: $branch_from => ";
$branch_from .= '/'.join('/', @a_path_components); $branch_from .= '/'.join('/', @a_path_components);
print STDERR $branch_from, "\n"; print STDERR $branch_from, "\n";
} }
my $r = $i->copyfrom_rev; my $r = $i->{copyfrom_rev};
my $repos_root = $self->ra->{repos_root}; my $repos_root = $self->ra->{repos_root};
my $url = $self->ra->{url}; my $url = $self->ra->{url};
my $new_url = $repos_root . $branch_from; my $new_url = $repos_root . $branch_from;
@ -1151,11 +1155,7 @@ sub find_parent_branch {
} }
my ($r0, $parent) = $gs->find_rev_before($r, 1); my ($r0, $parent) = $gs->find_rev_before($r, 1);
if ($::_follow_parent && (!defined $r0 || !defined $parent)) { if ($::_follow_parent && (!defined $r0 || !defined $parent)) {
foreach (1 .. $r) { $gs->fetch(0, $r);
if (my $log_entry = $gs->do_fetch(undef, $_)) {
$gs->do_git_commit($log_entry);
}
}
($r0, $parent) = $gs->last_rev_commit; ($r0, $parent) = $gs->last_rev_commit;
} }
if (defined $r0 && defined $parent && $gs->revisions_eq($r0, $r)) { if (defined $r0 && defined $parent && $gs->revisions_eq($r0, $r)) {
@ -1183,8 +1183,19 @@ sub find_parent_branch {
} }
not_found: not_found:
print STDERR "Branch parent for path: '/", print STDERR "Branch parent for path: '/",
$self->rel_path, "' @ $rev not found\n"; $self->rel_path, "' @ r$rev not found:\n";
print STDERR ' ', $_, "\n" foreach (sort keys %$paths); return undef unless $paths;
print STDERR "Changed paths:\n";
foreach my $x (sort keys %$paths) {
my $p = $paths->{$x};
print STDERR "\t$p->{action}\t$x";
if ($p->{copyfrom_path}) {
print STDERR "(from $p->{copyfrom_path}: ",
"$p->{copyfrom_rev})";
}
print STDERR "\n";
}
print STDERR '-'x72, "\n";
return undef; return undef;
} }
@ -1302,9 +1313,9 @@ sub make_log_entry {
} }
sub fetch { sub fetch {
my ($self, @parents) = @_; my ($self, $min_rev, $max_rev, @parents) = @_;
my ($last_rev, $last_commit) = $self->last_rev_commit; my ($last_rev, $last_commit) = $self->last_rev_commit;
my ($base, $head) = $self->parse_revision($last_rev); my ($base, $head) = $self->get_fetch_range($min_rev, $max_rev);
return if ($base > $head); return if ($base > $head);
if (defined $last_commit) { if (defined $last_commit) {
$self->assert_index_clean($last_commit); $self->assert_index_clean($last_commit);
@ -1316,13 +1327,16 @@ sub fetch {
$SVN::Error::handler = sub { ($err) = @_; skip_unknown_revs($err); } ; $SVN::Error::handler = sub { ($err) = @_; skip_unknown_revs($err); } ;
while (1) { while (1) {
my @revs; my @revs;
$self->ra->get_log([$self->{path}], $min, $max, 0, 1, 1, sub { $self->ra->get_log([$self->{path}], $min, $max, 0, 1, 1,
my ($paths, $rev, $author, $date, $log) = @_; sub {
push @revs, [ $paths, $rev ] }); my ($paths, $rev) = @_;
if (! @revs && $err) { push @revs, [ dup_changed_paths($paths), $rev ];
});
if (! @revs && $err && $max >= $head) {
print STDERR "Branch probably deleted:\n ", print STDERR "Branch probably deleted:\n ",
$err->expanded_message, $err->expanded_message,
"\nWill attempt to follow revisions ", "\nWill attempt to follow revisions ",
"r$min .. r$max",
"committed before the deletion\n"; "committed before the deletion\n";
@revs = map { [ undef, $_ ] } ($min .. $max); @revs = map { [ undef, $_ ] } ($min .. $max);
} }
@ -1331,7 +1345,7 @@ sub fetch {
$self->do_git_commit($log_entry, @parents); $self->do_git_commit($log_entry, @parents);
} }
} }
last if $max >= $head || $err; last if $max >= $head;
$min = $max + 1; $min = $max + 1;
$max += $inc; $max += $inc;
$max = $head if ($max > $head); $max = $head if ($max > $head);
@ -1347,7 +1361,7 @@ sub set_tree_cb {
$log_entry->{author} = $author; $log_entry->{author} = $author;
$self->do_git_commit($log_entry, "$rev=$tree"); $self->do_git_commit($log_entry, "$rev=$tree");
} else { } else {
$self->fetch("$rev=$tree"); $self->fetch(undef, undef, "$rev=$tree");
} }
} }
@ -1393,6 +1407,24 @@ sub skip_unknown_revs {
croak "Error from SVN, ($errno): ", $err->expanded_message,"\n"; croak "Error from SVN, ($errno): ", $err->expanded_message,"\n";
} }
# svn_log_changed_path_t objects passed to get_log are likely to be
# overwritten even if only the refs are copied to an external variable,
# so we should dup the structures in their entirety. Using an externally
# passed pool (instead of our temporary and quickly cleared pool in
# Git::SVN::Ra) does not help matters at all...
sub dup_changed_paths {
my ($paths) = @_;
return undef unless $paths;
my %ret;
foreach my $p (keys %$paths) {
my $i = $paths->{$p};
my %s = map { $_ => $i->$_ }
qw/copyfrom_path copyfrom_rev action/;
$ret{$p} = \%s;
}
\%ret;
}
# rev_db: # rev_db:
# Tie::File seems to be prone to offset errors if revisions get sparse, # Tie::File seems to be prone to offset errors if revisions get sparse,
# it's not that fast, either. Tie::File is also not in Perl 5.6. So # it's not that fast, either. Tie::File is also not in Perl 5.6. So

View File

@ -78,7 +78,6 @@ test_expect_success 'follow larger parent' "
true true
" "
# This seems to cause segfaults over HTTP...
test_expect_success 'follow higher-level parent' " test_expect_success 'follow higher-level parent' "
svn mkdir -m 'follow higher-level parent' $svnrepo/blob && svn mkdir -m 'follow higher-level parent' $svnrepo/blob &&
svn co $svnrepo/blob blob && svn co $svnrepo/blob blob &&