| #!/usr/bin/env perl |
| # |
| # SPDX-License-Identifier: GPL-2.0-only |
| |
| package gerrit_stats; |
| |
| # To install any needed modules install the cpanm app, and use it to install the required modules: |
| # sudo cpan App::cpanminus |
| # sudo /usr/local/bin/cpanm JSON::Util Net::OpenSSH DateTime Devel::Size |
| |
| use strict; |
| use warnings; |
| use English qw( -no_match_vars ); |
| use File::Find; |
| use File::Path; |
| use Getopt::Long; |
| use Getopt::Std; |
| use JSON::Util; |
| use Net::OpenSSH; |
| use Data::Dumper qw(Dumper); |
| use DateTime; |
| use Devel::Size qw(size total_size); |
| |
| my $old_version; |
| my $new_version; |
| my $infodir="$ENV{'HOME'}/.commit_info/" . `git config -l | grep remote.origin.url | sed 's|.*@||' | sed 's|:.*||'`; |
| chomp($infodir); |
| my $URL_WITH_USER; |
| my $SKIP_GERRIT_CHECK; |
| my $print_commit_list = 1; |
| |
| #disable print buffering |
| $OUTPUT_AUTOFLUSH = 1; |
| binmode STDOUT, ":utf8"; |
| |
| Main(); |
| |
| #------------------------------------------------------------------------------- |
| # Main |
| #------------------------------------------------------------------------------- |
| sub Main { |
| check_arguments(); |
| |
| my %submitters = (); |
| my %authors = (); |
| my %owners = (); |
| my %reviewers = (); |
| my %author_added = (); |
| my %author_removed = (); |
| my $total_added = 0; |
| my $total_removed = 0; |
| my $number_of_commits = 0; |
| my $number_of_submitters = 0; |
| my $submit_epoch = ""; |
| my $first_submit_epoch = ""; |
| if (!$URL_WITH_USER) { |
| get_user() |
| } |
| |
| # make sure the versions exist |
| check_versions(); |
| |
| #fetch patches if needed. Get ids of first and last commits |
| my @commits = `git log --pretty=%h "$old_version..$new_version" 2>/dev/null`; |
| get_commits(@commits); |
| my $last_commit_id = $commits[0]; |
| my $first_commit_id = $commits[@commits - 1]; |
| chomp $last_commit_id; |
| chomp $first_commit_id; |
| |
| print "Statistics from commit $first_commit_id to commit $last_commit_id\n"; |
| print "Patch, Date, Owner, Author, Submitter, Inserted lines, Deleted lines, Subject, Reviewers\n"; |
| |
| #loop through all commits |
| for my $commit_id (@commits) { |
| $commit_id =~ s/^\s+|\s+$//g; |
| |
| my $submitter = ""; |
| my %patch_reviewers = (); |
| my $info; |
| my $owner; |
| my $author; |
| my $author_email; |
| my $inserted_lines = 0; |
| my $deleted_lines = 0; |
| my $subject; |
| |
| $number_of_commits++; |
| print "\"$commit_id\", "; |
| |
| #read the data file for the current commit |
| if (-f "$infodir/$commit_id" && -s "$infodir/$commit_id" > 20) { |
| open( my $HANDLE, "<", "$infodir/$commit_id" ) or die "Error: could not open file '$infodir/$commit_id'\n"; |
| $info = <$HANDLE>; |
| close $HANDLE; |
| |
| my $commit_info = JSON::Util->decode($info); |
| |
| #get the easy data |
| $owner = $commit_info->{'owner'}{'name'}; |
| if (! $owner) { |
| $owner = $commit_info->{'owner'}{'username'}; |
| } |
| if (! $owner) { |
| $owner = ""; |
| } |
| $author = $commit_info->{'currentPatchSet'}{'author'}{'name'}; |
| $author_email = $commit_info->{'currentPatchSet'}{'author'}{'email'}; |
| if (! $author) { |
| $author = $commit_info->{'currentPatchSet'}{'author'}{'username'}; |
| } |
| |
| $inserted_lines = $commit_info->{'currentPatchSet'}{'sizeInsertions'}; |
| $deleted_lines = $commit_info->{'currentPatchSet'}{'sizeDeletions'}; |
| $subject = $commit_info->{'subject'}; |
| |
| #get the patch's submitter |
| my $approvals = $commit_info->{'currentPatchSet'}{'approvals'}; |
| for my $approval (@$approvals) { |
| if ($approval->{'type'} eq "SUBM") { |
| $submit_epoch = $approval->{'grantedOn'}; |
| $submitter = $approval->{'by'}{'name'}; |
| } |
| } |
| |
| #get all the reviewers for all patch revisions |
| my $patchsets = $commit_info->{'patchSets'}; |
| for my $patch (@$patchsets) { |
| if (! $author) { |
| $author = $patch->{'author'}{'name'}; |
| } |
| my $approvals = $patch->{'approvals'}; |
| for my $approval (@$approvals) { |
| |
| if ( (! $submitter) && ($approval->{'type'} eq "SUBM")) { |
| $submit_epoch = $approval->{'grantedOn'}; |
| $submitter = $approval->{'by'}{'name'}; |
| } |
| |
| if ($approval->{'type'} eq "Code-Review") { |
| my $patch_reviewer = $approval->{'by'}{'name'}; |
| if ($patch_reviewer) { |
| if (exists $patch_reviewers{$patch_reviewer}) { |
| $patch_reviewers{$patch_reviewer}++; |
| } else { |
| $patch_reviewers{$patch_reviewer} = 1; |
| } |
| } |
| } |
| } |
| } |
| |
| } else { |
| # get the info from git |
| my $logline = `git log --pretty="%ct@@@%s@@@%an@@@%aE@@@%cn" $commit_id^..$commit_id --`; |
| $logline =~ m/^(.*)@@@(.*)@@@(.*)@@@(.*)@@@(.*)\n/; |
| ($submit_epoch, $subject, $author, $author_email, $submitter) = ($1, $2, $3, $4, $5); |
| $owner = $author; |
| $logline = `git log --pretty= --shortstat $commit_id^..$commit_id --`; |
| if ($logline =~ m/\s+(\d+)\s+insertion/) { |
| $inserted_lines = $1; |
| } |
| if ($logline =~ m/\s+(\d+)\s+deletion/) { |
| $deleted_lines = $1 * -1; |
| } |
| my @loglines = `git log $commit_id^..$commit_id -- | grep '\\sReviewed-by:'`; |
| for my $line (@loglines){ |
| if ($line =~ m/.*:\s+(.*)\s</) { |
| my $patch_reviewer = $1; |
| if ($patch_reviewer) { |
| if (exists $patch_reviewers{$patch_reviewer}) { |
| $patch_reviewers{$patch_reviewer}++; |
| } else { |
| $patch_reviewers{$patch_reviewer} = 1; |
| } |
| } |
| } |
| } |
| |
| } |
| |
| # Not entirely certain why this is needed, but for a number of patches have been submitted |
| # the submit time in gerrit is set to April 9, 2015. |
| if ($submit_epoch == 1428586219){ |
| my $logline = `git log --pretty="%ct" $commit_id^..$commit_id --`; |
| $logline =~ m/^(.*)\n/; |
| $submit_epoch = $1; |
| } |
| |
| #add the count and owner to the submitter hash |
| if (exists $submitters{$submitter}) { |
| $submitters{$submitter}++; |
| } else { |
| $submitters{$submitter} = 1; |
| $number_of_submitters++; |
| } |
| |
| #create a readable date |
| my $dt = DateTime->from_epoch(epoch => $submit_epoch); |
| $dt->set_time_zone( 'Europe/Paris' ); |
| my $submit_time = $dt->strftime('%Y/%m/%d %H:%M:%S'); |
| if (!$first_submit_epoch) { |
| $first_submit_epoch = $submit_epoch; |
| } |
| |
| #create the list of reviewers to print |
| my $reviewerlist = ""; |
| foreach my $reviewer (keys %patch_reviewers) { |
| if ($reviewerlist eq "") { |
| $reviewerlist = $reviewer; |
| } else { |
| $reviewerlist .= ", $reviewer"; |
| } |
| |
| if (exists $reviewers{$reviewer}) { |
| $reviewers{$reviewer}++; |
| } else { |
| $reviewers{$reviewer} = 1; |
| } |
| } |
| if (! $reviewerlist) { |
| $reviewerlist = "-" |
| } |
| |
| if ($print_commit_list) { |
| print "$submit_time, $owner, $author, $submitter, $inserted_lines, $deleted_lines, \"$subject\", \"$reviewerlist\"\n"; |
| } else { |
| print "$number_of_commits\n"; |
| } |
| $total_added += $inserted_lines; |
| $total_removed += $deleted_lines; |
| if (exists $owners{$owner}) { |
| $owners{$owner}++; |
| } else { |
| $owners{$owner} = 1; |
| } |
| |
| if (exists $authors{$author}{"num"}) { |
| $authors{$author}{"num"}++; |
| $author_added{$author} += $inserted_lines; |
| $author_removed{$author} += $deleted_lines; |
| $authors{$author}{"earliest_commit"}=$submit_time; |
| } else { |
| $authors{$author}{"num"} = 1; |
| $authors{$author}{"latest_commit"}=$submit_time; |
| $authors{$author}{"earliest_commit"}=$submit_time; |
| $author_added{$author} = $inserted_lines; |
| $author_removed{$author} = $deleted_lines; |
| } |
| if (! exists $authors{$author}{email} && $author_email) { |
| $authors{$author}{email} = "$author_email"; |
| } |
| } |
| my $Days = ($first_submit_epoch - $submit_epoch) / 86400; |
| if (($first_submit_epoch - $submit_epoch) % 86400) { |
| $Days += 1; |
| } |
| |
| print "- Total Commits: $number_of_commits\n"; |
| printf "- Average Commits per day: %.2f\n", $number_of_commits / $Days; |
| print "- Total lines added: $total_added\n"; |
| print "- Total lines removed: $total_removed\n"; |
| print "- Total difference: " . ($total_added + $total_removed) . "\n\n"; |
| |
| print "=== Authors - Number of commits ===\n"; |
| my $number_of_authors = 0; |
| foreach my $author (sort { $authors{$b}{num} <=> $authors{$a}{num} } (keys %authors) ) { |
| if (! exists $authors{$author}{"email"}) { |
| $authors{$author}{"email"} = "-"; |
| } |
| printf "%-25s %5d %-40s (%2.2f%%) {%s / %s}\n",$author, $authors{$author}{"num"}, $authors{$author}{"email"}, $authors{$author}{"num"} / $number_of_commits * 100, $authors{$author}{"latest_commit"}, $authors{$author}{"earliest_commit"}; |
| $number_of_authors++; |
| } |
| print "Total Authors: $number_of_authors\n\n"; |
| |
| print "=== Authors - Lines added ===\n"; |
| foreach my $author (sort { $author_added{$b} <=> $author_added{$a} } (keys %author_added) ) { |
| if ($author_added{$author}) { |
| printf "%-25s %5d (%2.3f%%)\n",$author, $author_added{$author}, $author_added{$author} / $total_added * 100; |
| } |
| } |
| print "\n"; |
| |
| print "=== Authors - Lines removed ===\n"; |
| foreach my $author (sort { $author_removed{$a} <=> $author_removed{$b} } (keys %author_removed) ) { |
| if ($author_removed{$author}) { |
| printf "%-25s %5d (%2.3f%%)\n",$author,$author_removed{$author} * -1, $author_removed{$author} / $total_removed * 100; |
| } |
| } |
| print "\n"; |
| |
| print "=== Reviewers - Number of patches reviewed ===\n"; |
| my $number_of_reviewers = 0; |
| foreach my $reviewer (sort { $reviewers{$b} <=> $reviewers{$a} } (keys %reviewers) ) { |
| printf "%-25s %5d (%2.3f%%)\n",$reviewer, $reviewers{$reviewer}, $reviewers{$reviewer} / $number_of_commits * 100; |
| $number_of_reviewers++; |
| } |
| print "Total Reviewers: $number_of_reviewers\n\n"; |
| |
| print "=== Submitters - Number of patches submitted ===\n"; |
| foreach my $submitter (sort { $submitters{$b} <=> $submitters{$a} } (keys %submitters) ) { |
| printf "%-25s %5d (%2.3f%%)\n",$submitter, $submitters{$submitter}, $submitters{$submitter} / $number_of_commits * 100; |
| } |
| print "Total Submitters: $number_of_submitters\n\n"; |
| |
| print "Commits, Ave, Added, Removed, Diff, Authors, Reviewers, Submitters\n"; |
| printf "$number_of_commits, %.2f, $total_added, $total_removed, " . ($total_added + $total_removed) . ", $number_of_authors, $number_of_reviewers, $number_of_submitters\n", $number_of_commits / $Days; |
| } |
| |
| #------------------------------------------------------------------------------- |
| #------------------------------------------------------------------------------- |
| sub check_versions { |
| `git cat-file -e $old_version^{commit} 2>/dev/null`; |
| if (${^CHILD_ERROR_NATIVE}){ |
| print "Error: Old version ($old_version) does not exist.\n"; |
| exit 1; |
| } |
| |
| `git cat-file -e $new_version^{commit} 2>/dev/null`; |
| if (${^CHILD_ERROR_NATIVE}){ |
| print "Error: New version ($new_version) does not exist.\n"; |
| exit 1; |
| } |
| } |
| |
| #------------------------------------------------------------------------------- |
| #------------------------------------------------------------------------------- |
| sub get_user { |
| my $url=`git config -l | grep remote.origin.url`; |
| |
| if ($url =~ /.*url=ssh:\/\/(\w+@[a-zA-Z][a-zA-Z0-9\.]+:\d+)/) |
| { |
| $URL_WITH_USER = $1; |
| } else { |
| print "Error: Could not get a ssh url with a username from gitconfig.\n"; |
| print " use the -u option to set a url.\n"; |
| exit 1; |
| } |
| } |
| |
| #------------------------------------------------------------------------------- |
| #------------------------------------------------------------------------------- |
| sub get_commits { |
| my @commits = @_; |
| my $submit_time = ""; |
| if (defined $SKIP_GERRIT_CHECK) { |
| return; |
| } |
| my $ssh = Net::OpenSSH->new("$URL_WITH_USER", ); |
| $ssh->error and die "Couldn't establish SSH connection to $URL_WITH_USER:". $ssh->error; |
| |
| print "Using URL: ssh://$URL_WITH_USER\n"; |
| |
| if (! -d $infodir) { |
| mkpath($infodir) |
| } |
| |
| for my $commit_id (@commits) { |
| $commit_id =~ s/^\s+|\s+$//g; |
| $submit_time = ""; |
| my $gerrit_review; |
| |
| # Quit if we've reeached the last coreboot commit supporting these queries |
| if ($commit_id =~ /^7309709/) { |
| last; |
| } |
| |
| if (-f "$infodir/$commit_id") { |
| $gerrit_review = 1; |
| } else { |
| $gerrit_review = `git log $commit_id^..$commit_id | grep '\\sReviewed-on:\\s'`; |
| } |
| |
| if ($gerrit_review && $commit_id && (! -f "$infodir/$commit_id") ) { |
| print "Downloading $commit_id"; |
| my @info = $ssh->capture("gerrit query --format=JSON --comments --files --current-patch-set --all-approvals --submit-records --dependencies commit:$commit_id"); |
| $ssh->error and die "remote ls command failed: " . $ssh->error; |
| |
| my $commit_info = JSON::Util->decode($info[0]); |
| my $rowcount = $commit_info->{'rowCount'}; |
| if (defined $rowcount && ($rowcount eq "0")) { |
| print " - no gerrit commit for that id.\n"; |
| open( my $HANDLE, ">", "$infodir/$commit_id" ) or die "Error: could not open file '$infodir/$commit_id'\n"; |
| print $HANDLE "No gerrit commit"; |
| close $HANDLE; |
| next; |
| } |
| my $approvals = $commit_info->{'currentPatchSet'}{'approvals'}; |
| |
| for my $approval (@$approvals) { |
| if ($approval->{'type'} eq "SUBM") { |
| $submit_time = $approval->{'grantedOn'} |
| } |
| } |
| my $dt=""; |
| if ($submit_time) { |
| $dt = DateTime->from_epoch(epoch => $submit_time); |
| } else { |
| print " - no submit time for that id.\n"; |
| open( my $HANDLE, ">", "$infodir/$commit_id" ) or die "Error: could not open file '$infodir/$commit_id'\n"; |
| print $HANDLE "No submit time"; |
| close $HANDLE; |
| |
| next; |
| } |
| |
| open( my $HANDLE, ">", "$infodir/$commit_id" ) or die "Error: could not open file '$infodir/$commit_id'\n"; |
| print $HANDLE $info[0]; |
| close $HANDLE; |
| |
| $dt->set_time_zone( 'Europe/Paris' ); |
| print " - submit time: " . $dt->strftime('%Y/%m/%d %H:%M:%S') . "\n"; |
| } elsif ($commit_id && (! -f "$infodir/$commit_id")) { |
| print "No gerrit commit for $commit_id\n"; |
| open( my $HANDLE, ">", "$infodir/$commit_id" ) or die "Error: could not open file '$infodir/$commit_id'\n"; |
| print $HANDLE "No gerrit commit"; |
| close $HANDLE; |
| } |
| } |
| print "\n"; |
| } |
| |
| #------------------------------------------------------------------------------- |
| # check_arguments parse the command line arguments |
| #------------------------------------------------------------------------------- |
| sub check_arguments { |
| my $show_usage = 0; |
| GetOptions( |
| 'help|?' => sub { usage() }, |
| 'url|u=s' => \$URL_WITH_USER, |
| 'skip|s' => \$SKIP_GERRIT_CHECK, |
| ); |
| # strip ssh:// from url if passed in. |
| if (defined $URL_WITH_USER) { |
| $URL_WITH_USER =~ s|ssh://||; |
| } |
| if (@ARGV) { |
| ($old_version, $new_version) = @ARGV; |
| } else { |
| usage(); |
| } |
| } |
| |
| #------------------------------------------------------------------------------- |
| # usage - Print the arguments for the user |
| #------------------------------------------------------------------------------- |
| sub usage { |
| print "gerrit_stats <options> [Old version] [New version]\n"; |
| print "Old version should be a tag (4.1), a branch (origin/4.1), or a commit id\n"; |
| print "New version can be 'HEAD' a branch (origin/master) a tag (4.2), or a commit id\n"; |
| print " Options:\n"; |
| print " u | url [url] url with username.\n"; |
| print "Example: \"$0 -u Gaumless\@review.coreboot.org:29418 origin/4.1 4.2\"\n"; |
| exit(0); |
| } |
| |
| 1; |