]>
Commit | Line | Data |
---|---|---|
c65e8987 RA |
1 | #!/usr/bin/perl |
2 | # Copyright 2006, Ryan Anderson <ryan@michonline.com> | |
3 | # | |
4 | # GPL v2 (See COPYING) | |
5 | # | |
6 | # This file is licensed under the GPL v2, or a later version | |
7 | # at the discretion of Linus Torvalds. | |
8 | ||
9 | use warnings; | |
10 | use strict; | |
87475f4d | 11 | use Getopt::Long; |
4788d11a | 12 | use POSIX qw(strftime gmtime); |
c65e8987 | 13 | |
# Print the command-line synopsis to STDERR and terminate with exit status 1.
# Takes no arguments and never returns.
sub usage {
    # Strip any leading directory from the invocation path.  The synopsis
    # used to live in a single-quoted string, so the program-name expression
    # was printed verbatim instead of being evaluated.
    (my $prog = $0) =~ s{^.*/}{};

    # The synopsis lists the switches GetOptions actually accepts
    # (the previously advertised -s does not exist).
    print STDERR
        "Usage: $prog [-l] [-r] [-S revs-file] file [ revision ]\n",
        "\t-l, --long\n",
        "\t\t\tShow long rev (Defaults off)\n",
        "\t-r, --rename\n",
        "\t\t\tFollow renames (Defaults on).\n",
        "\t-S, --rev-file revs-file\n",
        "\t\t\tuse revs from revs-file instead of calling git-rev-list\n",
        "\t-h, --help\n",
        "\t\t\tThis message.\n";

    exit(1);
}
c65e8987 | 28 | |
87475f4d RA |
# Command-line state.  Renames are followed unless switched off.
our ($help, $longrev, $rename, $starting_rev, $rev_file) = (0, 0, 1);

my $rc = GetOptions(
    "long|l"       => \$longrev,
    "help|h"       => \$help,
    # Negatable, so --no-rename can actually turn the default off.
    "rename|r!"    => \$rename,
    # "=s" makes -S consume its revs-file argument; without it the option
    # was a bare flag and the revs-file was mistaken for the file to annotate.
    "rev-file|S=s" => \$rev_file,
);

# A file to annotate is mandatory.
if (!$rc or $help or !@ARGV) {
    usage();
}

my $filename = shift @ARGV;

# Optional second positional argument: the revision to annotate at.
if (@ARGV) {
    $starting_rev = shift @ARGV;
}
c65e8987 RA |
43 | |
# Work list of { rev, filename } bounds whose history still has to be walked.
# It starts with the requested revision (HEAD when none was given).
my @stack = (
    {
        'rev'      => defined $starting_rev ? $starting_rev : "HEAD",
        'filename' => $filename,
    },
);

# The lines being annotated, one entry per line without its newline.
our @filelines = ();

if (defined $starting_rev) {
    # Annotating a specific revision: take the content from git.
    @filelines = git_cat_file($starting_rev, $filename);
} else {
    # No revision given: annotate the file as it currently is on disk.
    # A lexical handle replaces the old global bareword F, and the error
    # now names the path that failed.
    open(my $fh, "<", $filename)
        or die "Failed to open $filename: $!";

    while (my $line = <$fh>) {
        chomp $line;
        push @filelines, $line;
    }
    close($fh);
}
87475f4d | 66 | |
c65e8987 RA |
our %revs;      # per-revision state, keyed by revision: 'filename', 'parents', 'lines'
our @revqueue;  # revisions waiting to be processed by handle_rev()
our $head;      # first revision returned by the first git_rev_list() call

my $revsprocessed = 0;

# Walk the history of every (rev, filename) bound.  A revision that comes back
# without parents may be where the file was renamed; in that case the
# pre-rename name is pushed as a new bound and linked in as the parent.
while (my $bound = pop @stack) {
    my @revisions = git_rev_list($bound->{'rev'}, $bound->{'filename'});
    foreach my $revinst (@revisions) {
        my ($rev, @parents) = @$revinst;
        $head ||= $rev;

        if (!defined($rev)) {
            $rev = "";
        }
        $revs{$rev}{'filename'} = $bound->{'filename'};
        if (scalar @parents > 0) {
            $revs{$rev}{'parents'} = \@parents;
            next;
        }

        if (!$rename) {
            next;
        }

        my $newbound = find_parent_renames($rev, $bound->{'filename'});
        if ( exists $newbound->{'filename'} && $newbound->{'filename'} ne $bound->{'filename'}) {
            push @stack, $newbound;
            $revs{$rev}{'parents'} = [$newbound->{'rev'}];
        }
    }
}
push @revqueue, $head;

# Register the loaded lines under the key handle_rev() will start from.
# Processing begins at $head (the id reported by rev-list), so the lines must
# be stored under $head rather than under the name the user typed; otherwise
# $revs{$head}{'lines'} is undefined whenever the two strings differ.
init_claim( defined $starting_rev
    ? (defined $head ? $head : $starting_rev)
    : 'dirty');

unless (defined $starting_rev) {
    # Working-tree mode: diff the on-disk file against HEAD so that locally
    # modified lines are claimed by the pseudo-revision "dirty".
    my $diff = open_pipe("git","diff","-R", "HEAD", "--",$filename)
        or die "Failed to call git diff to check for dirty state: $!";

    _git_diff_parse($diff, $head, "dirty", (
            'author' => gitvar_name("GIT_AUTHOR_IDENT"),
            'author_date' => sprintf("%s +0000",time()),
        )
    );
    close($diff);
}
handle_rev();
112 | ||
113 | ||
# Print one annotated row per entry of @filelines:
# rev, author, formatted date, running index, then the line text.
my $i = 0;
foreach my $entry (@filelines) {
    # Defaults apply to entries that were never wrapped in a record.
    my $output = $entry;
    my ($rev, $committer, $date) = ('unknown', 'unknown', 'unknown');

    if (ref $entry eq 'ARRAY') {
        ($output, $rev, $committer, $date) = @$entry;

        # Abbreviate the revision unless long ids were requested.
        $rev = substr($rev, 0, 8)
            if !$longrev && length($rev) > 8;
    }

    printf("%s\t(%10s\t%10s\t%d)%s\n", $rev, $committer,
        format_date($date), $i++, $output);
}
130 | ||
# Turn every entry of @filelines into an annotation record and register the
# array as the line set of revision $rev.
#
# Record layout: [ line, rev, author, date, flag ].  rev, author and date start
# out empty; the trailing 1 marks the line as belonging to the original file.
sub init_claim {
    my ($rev) = @_;

    # $_ aliases each array element, so the records replace the strings in place.
    $_ = [ $_, '', '', '', 1 ] for @filelines;

    $revs{$rev}{'lines'} = \@filelines;
}
143 | ||
144 | ||
# Drain @revqueue.  Each revision is diffed against all of its parents, which
# are queued in turn; a revision without parents claims every line that is
# still unclaimed.  Revisions are processed at most once.
sub handle_rev {
    my %seen;

    while (my $rev = shift @revqueue) {
        next if $seen{$rev}++;

        my %revinfo = git_commit_info($rev);

        foreach my $parent (@{ $revs{$rev}{'parents'} }) {
            git_diff_parse($parent, $rev, %revinfo);
            push @revqueue, $parent;
        }

        # Only a parentless revision falls through to the final claim.
        next if scalar @{ $revs{$rev}{parents} } != 0;

        # We must be at the initial rev here, so claim everything that is left.
        my $lines = $revs{$rev}{lines};
        my $count = @{$lines};
        foreach my $idx (0 .. $count - 1) {
            if (ref($lines->[$idx]) eq '' || $lines->[$idx][1] eq '') {
                claim_line($idx, $rev, $lines, %revinfo);
            }
        }
    }
}
170 | ||
171 | ||
# Return the history of $file starting at $rev as a list of array refs, each
# holding [ commit, parent... ] in the order the lines were read.
#
# When a revs file was given on the command line ($rev_file), the lines are
# read from that file instead of running git-rev-list.
# Dies if the revs file cannot be opened or git-rev-list cannot be started.
sub git_rev_list {
    my ($rev, $file) = @_;

    my $revlist;
    if ($rev_file) {
        # Three-argument open keeps the mode separate from the path, and a
        # failure is now reported instead of being read as an empty history.
        open($revlist, '<', $rev_file)
            or die "Failed to open $rev_file: $!";
    } else {
        $revlist = open_pipe("git-rev-list","--parents","--remove-empty",$rev,"--",$file)
            or die "Failed to exec git-rev-list: $!";
    }

    my @revs;
    while (my $line = <$revlist>) {
        chomp $line;
        my ($commit, @parents) = split /\s+/, $line;
        push @revs, [ $commit, @parents ];
    }
    close($revlist);

    printf("0 revs found for rev %s (%s)\n", $rev, $file) if (@revs == 0);
    return @revs;
}
194 | ||
# Check whether revision $rev renamed some other path to $file.
#
# Returns a hash ref.  It is empty when no such rename is found; otherwise it
# holds 'filename' (the name before the rename) and 'rev' (whatever
# git_find_parent() returns for that old name).
# Dies if git-diff-tree cannot be started.
sub find_parent_renames {
    my ($rev, $file) = @_;

    my $patch = open_pipe("git-diff-tree", "-M50", "-r","--name-status", "-z","$rev")
        or die "Failed to exec git-diff-tree: $!";

    # Read all NUL-terminated records first.  The separator override is kept
    # inside this block so it is no longer active while git_find_parent()
    # reads newline-terminated output.
    my @records;
    {
        local $/ = "\0";
        while (defined(my $record = <$patch>)) {
            chomp $record;
            push @records, $record;
        }
    }
    close($patch);

    # The first record is not a status entry; discard it.
    shift @records;

    my %bound;
    while (@records) {
        my $change      = shift @records;
        my $oldfilename = shift @records;

        # Only rename entries carry a second path and are of interest.
        next unless $change =~ m/^R/;

        my $newfilename = shift @records;
        next unless defined $newfilename && $file eq $newfilename;

        my $parent = git_find_parent($rev, $oldfilename);
        @bound{'rev','filename'} = ($parent, $oldfilename);
        last;
    }

    return \%bound;
}
226 | ||
227 | ||
# Run git-rev-list for $filename limited to one entry starting at $rev and
# return the second field of its first output line (the first listed parent).
# Returns undef when there is no output or the line has no second field.
# Dies if git-rev-list cannot be started.
sub git_find_parent {
    my ($rev, $filename) = @_;

    my $revparent = open_pipe("git-rev-list","--remove-empty", "--parents","--max-count=1","$rev","--",$filename)
        or die "Failed to open git-rev-list to find a single parent: $!";

    # Read exactly one newline-terminated line, whatever record separator the
    # caller happens to have in effect.
    my $parentline = do {
        local $/ = "\n";
        <$revparent>;
    };
    close($revparent);

    my $parent;
    if (defined $parentline) {
        chomp $parentline;
        (undef, $parent) = split m/\s+/, $parentline;
    }

    return $parent;
}
242 | ||
243 | ||
# Diff revision $rev against $parent, restricted to the file names recorded for
# both revisions, and hand the patch to _git_diff_parse() so the resulting
# commit information is recorded.
sub git_diff_parse {
    my ($parent, $rev, %revinfo) = @_;

    # The file may be known under a different name in each revision.
    my @paths = ($revs{$rev}{'filename'}, $revs{$parent}{'filename'});

    my $diff = open_pipe("git-diff-tree", "-M", "-p", $rev, $parent, "--", @paths)
        or die "Failed to call git-diff for annotation: $!";

    _git_diff_parse($diff, $parent, $rev, %revinfo);

    close($diff);
}
257 | ||
# Parse a unified diff read from handle $diff and derive the line set of
# $parent from the line set of $rev.
#
#   $diff    - readable handle producing the patch text
#   $parent  - key under which the reconstructed lines are stored
#   $rev     - key whose 'lines' entry is the starting point
#   %revinfo - commit details passed on to claim_line()
#
# Lines prefixed with '-' are matched against $rev's lines and claimed for
# $rev.  Lines prefixed with '+' are added to the parent's set as unclaimed
# records.  Context lines and everything outside the hunks are carried over
# unchanged.  Dies when the patch does not line up with $rev's lines.
sub _git_diff_parse {
    my ($diff, $parent, $rev, %revinfo) = @_;

    # $ri indexes $rev's lines, $pi indexes the parent lines being built.
    my ($ri, $pi) = (0,0);
    my $slines = $revs{$rev}{'lines'};
    my @plines;

    my $gotheader = 0;
    my ($remstart);
    my ($hunk_start, $hunk_index);
    while (my $text = <$diff>) {
        chomp $text;

        # The ",count" part is omitted by diff when the count is 1, so it has
        # to be optional or single-line hunks are not recognised.
        if ($text =~ m/^@@ -(\d+)(?:,\d+)? \+\d+(?:,\d+)?/) {
            $remstart = $1;
            # Adjust for 0-based arrays
            $remstart--;
            # Reinit hunk tracking.
            $hunk_start = $remstart;
            $hunk_index = 0;
            $gotheader = 1;

            # Copy the untouched lines that precede this hunk.
            while ($ri < $remstart) {
                $plines[$pi++] = $slines->[$ri++];
            }
            next;
        } elsif (!$gotheader) {
            # Still inside the patch preamble.
            next;
        }

        if ($text =~ m/^\\/) {
            # "\ No newline at end of file" marker: not file content.  Only
            # the leading backslash is checked because the wording may vary.
            next;

        } elsif ($text =~ m/^\+(.*)$/) {
            my $line = $1;
            $plines[$pi++] = [ $line, '', '', '', 0 ];
            next;

        } elsif ($text =~ m/^-(.*)$/) {
            my $line = $1;
            if (get_line($slines, $ri) eq $line) {
                # Found a match, claim
                claim_line($ri, $rev, $slines, %revinfo);
            } else {
                die sprintf("Sync error: %d/%d\n|%s\n|%s\n%s => %s\n",
                    $ri, $hunk_start + $hunk_index,
                    $line,
                    get_line($slines, $ri),
                    $rev, $parent);
            }
            $ri++;

        } else {
            # Context line: must be identical on both sides.
            if (substr($text,1) ne get_line($slines,$ri) ) {
                die sprintf("Line %d (%d) does not match:\n|%s\n|%s\n%s => %s\n",
                    $hunk_start + $hunk_index, $ri,
                    substr($text,1),
                    get_line($slines,$ri),
                    $rev, $parent);
            }
            $plines[$pi++] = $slines->[$ri++];
        }
        $hunk_index++;
    }

    # Everything after the last hunk is unchanged.
    while ($ri < @{$slines}) {
        push @plines, $slines->[$ri++];
    }

    $revs{$parent}{lines} = \@plines;
    return;
}
326 | ||
# Return the text of entry $index in the array referenced by $lines.
# An entry is either a plain string or a record whose first element is the text.
sub get_line {
    my ($lines, $index) = @_;

    my $entry = $lines->[$index];

    # Plain (non-reference) entries are the text itself.
    return $entry if ref($entry) eq '';

    return $entry->[0];
}
332 | ||
# Return the content of $filename at revision $rev as a list of lines with the
# line endings removed.  Returns an empty list when either argument is undefined.
# Dies if the cat-file command cannot be started.
sub git_cat_file {
    my ($rev, $filename) = @_;

    if (!defined $rev || !defined $filename) {
        return ();
    }

    # Resolve the path to a blob id, then dump that blob.
    my $blob = git_ls_tree($rev, $filename);

    my $catfile = open_pipe("git","cat-file", "blob", $blob)
        or die "Failed to git-cat-file blob $blob (rev $rev, file $filename): " . $!;

    my @lines;
    while (my $line = <$catfile>) {
        chomp $line;
        push @lines, $line;
    }
    close($catfile);

    return @lines;
}
351 | ||
87475f4d RA |
# Look up $filename in the tree of revision $rev and return the object id
# listed for it.
# Dies if git ls-tree cannot be started or lists no entry named $filename.
sub git_ls_tree {
    my ($rev, $filename) = @_;

    my $lstree = open_pipe("git","ls-tree",$rev,$filename)
        or die "Failed to call git ls-tree: $!";

    my $found;
    while (my $entry = <$lstree>) {
        # Without the chomp the name keeps its newline and never compares equal.
        chomp $entry;
        my ($mode, $type, $blob, $tfilename) = split(/\s+/, $entry, 4);
        if (defined $tfilename && $tfilename eq $filename) {
            $found = $blob;
            last;
        }
    }
    close($lstree);

    # The old check compared $filename with itself, so it always "succeeded"
    # and the failure below could never be reported.
    return $found if defined $found;
    die "git-ls-tree failed to find blob for $filename";
}
369 | ||
370 | ||
c65e8987 RA |
371 | |
# Attribute entry $floffset of the array referenced by $lines to $rev.
# The record is overwritten with ( text, rev, author, author date ), the last
# two taken from %revinfo.
sub claim_line {
    my ($floffset, $rev, $lines, %revinfo) = @_;

    my $oline   = get_line($lines, $floffset);
    my @claimed = ($oline, $rev, $revinfo{'author'}, $revinfo{'author_date'});

    # Debugging aid:
    #printf("Claiming line %d with rev %s: '%s'\n",
    #       $floffset, $rev, $oline) if 1;
    @{ $lines->[$floffset] } = @claimed;
}
380 | ||
# Read the header of commit $rev and return a hash with the keys author,
# author_email, author_date, committer, committer_email and committer_date
# (each present only when the matching header line was found).
# Dies if git-cat-file cannot be started.
sub git_commit_info {
    my ($rev) = @_;

    my $commit = open_pipe("git-cat-file", "commit", $rev)
        or die "Failed to call git-cat-file: $!";

    my %info;
    while (my $header = <$commit>) {
        chomp $header;

        # The first empty line ends the header section.
        last if $header eq '';

        # "author"/"committer" lines have the form: role name <email> date
        if ($header =~ m/^(author|committer) (.*) <(.*)> (.*)$/) {
            my ($role, $name, $email, $date) = ($1, $2, $3, $4);
            $info{$role}            = $name;
            $info{ $role . '_email' } = $email;
            $info{ $role . '_date' }  = $date;
        }
    }
    close($commit);

    return %info;
}
4788d11a JS |
405 | |
# Format a "<epoch seconds> <+hhmm|-hhmm>" date string as
# "YYYY-MM-DD HH:MM:SS <zone>".
#
# The clock time is shown in the given zone: the offset is applied to the
# timestamp before formatting.  Previously the UTC time was printed next to
# the zone label, which made the two disagree for any non-zero offset.
# Missing or non-numeric parts are treated as epoch 0 and an empty zone.
sub format_date {
    my ($timestamp, $timezone) = split(' ', defined $_[0] ? $_[0] : '');

    $timestamp = 0
        unless defined $timestamp && $timestamp =~ m/^-?\d+$/;
    $timezone = '' unless defined $timezone;

    # Convert the +hhmm / -hhmm zone into seconds.
    my $offset = 0;
    if ($timezone =~ m/^([-+])(\d\d)(\d\d)$/) {
        $offset = ($2 * 60 + $3) * 60;
        $offset = -$offset if $1 eq '-';
    }

    # The zone is appended afterwards rather than spliced into the format
    # string, so it can never be interpreted as a strftime directive.
    return strftime("%Y-%m-%d %H:%M:%S", gmtime($timestamp + $offset))
        . " " . $timezone;
}
411 | ||
87475f4d RA |
# Copied from git-send-email.perl - We need a Git.pm module..
#
# Run "git-var $var" in a child process and return the first line of its
# output without the trailing newline.
# Dies when the fork fails, when the exec fails, or when closing the pipe
# reports an error.
sub gitvar {
    my ($var) = @_;

    my $fh;
    my $pid = open($fh, '-|');
    defined $pid or die "$!";

    if ($pid == 0) {
        # Child: its standard output is the pipe read by the parent.
        exec('git-var', $var) or die "$!";
    }

    # Read everything the child prints; only the first line is used.
    my @output = <$fh>;
    close $fh or die "$!";

    my $val = $output[0];
    chomp($val);
    return $val;
}
426 | ||
# Return the value of git variable $name with its last three
# whitespace-separated fields removed and the rest joined by single spaces.
sub gitvar_name {
    my ($name) = @_;

    my @field = split(/\s+/, gitvar($name));

    # Index of the last field to keep; below zero when there are fewer than
    # four fields, which yields an empty result.
    my $last = @field - 4;

    return join(' ', @field[0 .. $last]);
}
433 | ||
# Start the command given as an argument list and return a handle from which
# its output can be read.  The implementation is picked from the value of $^O.
sub open_pipe {
    return open_pipe_activestate(@_)
        if $^O eq '##INSERT_ACTIVESTATE_STRING_HERE##';

    return open_pipe_normal(@_);
}
441 | ||
# Pipe emulation for the ActiveState branch of open_pipe(): run the command
# through Git::ActiveStatePipe and return a handle tied to it.
#
# Every call gets its own anonymous glob.  The previous version tied the one
# global glob *fh, so opening a second pipe while the first was still in use
# silently redirected the first handle to the second command's output.
sub open_pipe_activestate {
    require Symbol;

    my $fh = Symbol::gensym();
    tie *$fh, "Git::ActiveStatePipe", @_;
    return $fh;
}
446 | ||
# Fork a child that executes the given command list and return a handle
# connected to the child's standard output.
# Dies when the fork fails; the child dies when the exec fails.
sub open_pipe_normal {
    my (@execlist) = @_;

    my $pid = open(my $kid, "-|");
    die "Cannot fork: $!" unless defined $pid;

    if ($pid == 0) {
        # Child process: replace ourselves with the command.
        exec @execlist;
        die "Cannot exec @execlist: $!";
    }

    # Parent process.
    return $kid;
}
f60d4691 RA |
460 | |
# Tied-handle class that emulates a read-only pipe: the command is run to
# completion when the handle is tied and its output is served from memory.
package Git::ActiveStatePipe;
use strict;

# tie *HANDLE, 'Git::ActiveStatePipe', @command
# Runs the command and stores its output lines.
sub TIEHANDLE {
    my ($class, @params) = @_;

    # NOTE(review): the arguments are joined with spaces and handed to qx
    # without any quoting, so an argument containing whitespace or shell
    # metacharacters will not arrive as written.
    my $cmdline = join " ", @params;
    my @data = qx{$cmdline};
    bless { i => 0, data => \@data }, $class;
}

# <HANDLE> / readline.  In scalar context returns the next line, or undef when
# nothing is left.  In list context returns all remaining lines (an empty list
# when nothing is left), as the tied-handle interface requires.
sub READLINE {
    my $self = shift;

    # Both keys are gone once the handle has been closed.
    my $data = $self->{data} || [];
    my $next = $self->{i}    || 0;

    if (wantarray) {
        my @rest = @{$data}[ $next .. $#{$data} ];
        $self->{i} = scalar @{$data};
        return @rest;
    }

    return if $next >= @{$data};

    $self->{i} = $next + 1;
    return $data->[$next];
}

# close(HANDLE).  Drops the buffered output.  Always reports success; the old
# return value was the deleted read position, which is false for a handle
# that was never read.
sub CLOSE {
    my $self = shift;
    delete $self->{data};
    delete $self->{i};
    return 1;
}

# eof(HANDLE).  True when every buffered line has been returned, and also
# after the handle has been closed.
sub EOF {
    my $self = shift;
    my $data = $self->{data} || [];
    return (($self->{i} || 0) >= scalar @{$data});
}