figured out the bash-fu to get all names of biggest files

Project: http://git-wip-us.apache.org/repos/asf/brooklyn-client/repo
Commit: http://git-wip-us.apache.org/repos/asf/brooklyn-client/commit/777ababf
Tree: http://git-wip-us.apache.org/repos/asf/brooklyn-client/tree/777ababf
Diff: http://git-wip-us.apache.org/repos/asf/brooklyn-client/diff/777ababf

Branch: refs/heads/master
Commit: 777ababfd55d123e34cce341b12cc341199414ca
Parents: 873af8c
Author: Alex Heneveld <[email protected]>
Authored: Thu Dec 17 00:45:46 2015 +0000
Committer: Alex Heneveld <[email protected]>
Committed: Thu Dec 17 00:45:46 2015 +0000

----------------------------------------------------------------------
 git-biggest-files.sh | 1 +
 1 file changed, 1 insertion(+)
----------------------------------------------------------------------


http://git-wip-us.apache.org/repos/asf/brooklyn-client/blob/777ababf/git-biggest-files.sh
----------------------------------------------------------------------
diff --git a/git-biggest-files.sh b/git-biggest-files.sh
index 5ffaab5..c881e15 100755
--- a/git-biggest-files.sh
+++ b/git-biggest-files.sh
@@ -8,6 +8,7 @@ if [ ! -z "$1" ] ; then SIZE=$1 ; fi
 
 # however this does not show the former names of the blobs so if the same file is in
 # multiple times this script will show only one instance; apply `git-follow-file` to do that
+# e.g.   git-biggest-files.sh | while read line ; do if [ ! -z "$( echo $line | awk '{print $3}' )" ] ; then echo $( echo $line | awk '{print $2 }' ) $( git-follow-file.sh $( echo $line | awk '{print $3}' )) ; fi ; done
 
 git rev-list --objects --all | sort -k 2 > /tmp/TMP-big-shas.txt
 git gc 2> /tmp/TMP-big-log.txt && git verify-pack -v .git/objects/pack/pack-*.idx | egrep "^\w+ blob\W+[0-9]+ [0-9]+ [0-9]+$" | sort -k 3 -n -r | head -${SIZE} > /tmp/TMP-big-objects.txt

Reply via email to