This script is based on blame-count-lines-by-name-and-commit-list.plx.
It will handle finding lines of text in a blame file for commits that match a given user, and give out a list of commit ids that are not on a commit list.
This commit is contained in:
parent
ff49fe5311
commit
f407f1e8b2
1 changed files with 91 additions and 0 deletions
91
blame-find-commits-by-name-not-on-commit-id-list.plx
Executable file
91
blame-find-commits-by-name-not-on-commit-id-list.plx
Executable file
|
@ -0,0 +1,91 @@
|
|||
#!/usr/bin/perl -w
|
||||
# blame-count-lines-by-name-and-commit-list.plx -*- Perl -*-
|
||||
#
|
||||
# Copyright (C) 2011, 2012 Bradley M. Kuhn <bkuhn@ebb.org>
|
||||
#
|
||||
# This software's license gives you freedom; you can copy, convey,
|
||||
# propogate, redistribute and/or modify this program under the terms of
|
||||
# the GNU General Public License (GPL) as published by the Free
|
||||
# Software Foundation (FSF), either version 3 of the License, or (at your
|
||||
# option) any later version of the GPL published by the FSF.
|
||||
#
|
||||
# This program is distributed in the hope that it will be useful, but
|
||||
# WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||||
# General Public License for more details.
|
||||
#
|
||||
# You should have received a copy of the GNU General Public License
|
||||
# along with this program in a file in the toplevel directory called
|
||||
# "GPLv3". If not, see <http://www.gnu.org/licenses/>.
|
||||
#
|
||||
|
||||
use strict;
|
||||
use warnings;
|
||||
|
||||
my $VERBOSE = 0;
|
||||
|
||||
######################################################################
|
||||
|
||||
|
||||
if (@ARGV != 3) {
|
||||
print "usage: $0 <BLAME_DATA_FILE> ", "<NAME_REGEX> <BOUNDING_COMMIT_ID_LIST_FILE>\n";
|
||||
exit 1;
|
||||
}
|
||||
# Note: $BLAME_DATA_FILE is in the format as output from:
|
||||
# for i in `find -type f -print | egrep -v '^./.git'`; do
|
||||
# echo "FILE: $i" >> ../DATA_FILE; git blame -M -M -M -C -C -C -w -f -n -l $i >> ../DATA_FILE
|
||||
# done
|
||||
|
||||
my($BLAME_DATA_FILE, $NAME_REGEX, $BOUNDING_COMMIT_ID_LIST_FILE) = @ARGV;
|
||||
|
||||
open(BOUNDING_COMMIT_IDS, "<", $BOUNDING_COMMIT_ID_LIST_FILE) or die "unable to open $BOUNDING_COMMIT_ID_LIST_FILE: $!";
|
||||
|
||||
my %boundingCommitIDs;
|
||||
|
||||
while (my $commitLine = <BOUNDING_COMMIT_IDS>) {
|
||||
die "invalid line in $BOUNDING_COMMIT_ID_LIST_FILE: $commitLine"
|
||||
unless $commitLine =~ /^\s*(\S+)\s*$/;
|
||||
$boundingCommitIDs{$1} = $BOUNDING_COMMIT_ID_LIST_FILE;
|
||||
}
|
||||
close BOUNDING_COMMIT_IDS;
|
||||
die "error($?) closing $BOUNDING_COMMIT_ID_LIST_FILE: $!" unless $? == 0;
|
||||
|
||||
open(DATA_FILE, "<", $BLAME_DATA_FILE) or die "unable to open $BLAME_DATA_FILE for reading: $!";
|
||||
|
||||
my %commitsMatchingRegex;
|
||||
my $currentFile;
|
||||
my $overalTotalLines = 0;
|
||||
|
||||
print "LINES FOUND IN $BLAME_DATA_FILE that are on $BOUNDING_COMMIT_ID_LIST_FILE: and match $NAME_REGEX:\n" if $VERBOSE;
|
||||
while (my $dataLine = <DATA_FILE>) {
|
||||
if ($dataLine =~ /^\s*FILE\s*:\s*(.*?)\s*$/) {
|
||||
$currentFile = $1;
|
||||
} else {
|
||||
die "invalid line: $dataLine in blame output" unless ($dataLine =~
|
||||
/^\s*(\S+)\s+\S+\s+\d+\s+\((.+)\s+(\d{4,4}\-\d{2,2}\-\d{2,2}\s+\d{2,2}:\d{2,2}:\d{2,2})\s+([\+\-\d]+)\s+(\d+)\s*\)\s+(.*)$/);
|
||||
my($commitID, $name, $date, $tz, $curLineNumber, $actualCurrentLine) = ($1, $2, $3, $4, $5, $6);
|
||||
next if $currentFile =~ /ChangeLog/i; # Ignore the changelog, as that may just be a dump
|
||||
# from the revision history.
|
||||
if ($name =~ /$NAME_REGEX/i and defined $boundingCommitIDs{$commitID}) {
|
||||
$commitsMatchingRegex{$commitID} = { __totalLines => 0, __VERBOSE_LINE_OUTPUT => "" } unless defined $commitsMatchingRegex{$commitID};
|
||||
$commitsMatchingRegex{$commitID}{$currentFile} = 0 unless defined $commitsMatchingRegex{$commitID}{$currentFile};
|
||||
$commitsMatchingRegex{$commitID}{$currentFile}++;
|
||||
$commitsMatchingRegex{$commitID}{__totalLines}++;
|
||||
$commitsMatchingRegex{$commitID}{__VERBOSE_LINE_OUTPUT} .= $dataLine;
|
||||
print " $dataLine" if $VERBOSE;
|
||||
$overalTotalLines++;
|
||||
}
|
||||
}
|
||||
}
|
||||
close DATA_FILE;
|
||||
|
||||
print "Total patches by author(s) matching $NAME_REGEX in $BLAME_DATA_FILE and found in $BOUNDING_COMMIT_ID_LIST_FILE:\n",
|
||||
" ", scalar(keys %commitsMatchingRegex), "\n";
|
||||
print "Total lines by author(s) matching $NAME_REGEX in $BLAME_DATA_FILE and found in $BOUNDING_COMMIT_ID_LIST_FILE:\n",
|
||||
" ", $overalTotalLines, "\n";
|
||||
|
||||
|
||||
#
|
||||
# Local variables:
|
||||
# compile-command: "perl -c blame-count-lines-by-name-and-commit-list.plx"
|
||||
# End:
|
Loading…
Reference in a new issue