Figured out the bash-fu to get the names of all the biggest files
Project: http://git-wip-us.apache.org/repos/asf/brooklyn-client/repo
Commit: http://git-wip-us.apache.org/repos/asf/brooklyn-client/commit/777ababf
Tree: http://git-wip-us.apache.org/repos/asf/brooklyn-client/tree/777ababf
Diff: http://git-wip-us.apache.org/repos/asf/brooklyn-client/diff/777ababf

Branch: refs/heads/master
Commit: 777ababfd55d123e34cce341b12cc341199414ca
Parents: 873af8c
Author: Alex Heneveld <[email protected]>
Authored: Thu Dec 17 00:45:46 2015 +0000
Committer: Alex Heneveld <[email protected]>
Committed: Thu Dec 17 00:45:46 2015 +0000

----------------------------------------------------------------------
 git-biggest-files.sh | 1 +
 1 file changed, 1 insertion(+)
----------------------------------------------------------------------

http://git-wip-us.apache.org/repos/asf/brooklyn-client/blob/777ababf/git-biggest-files.sh
----------------------------------------------------------------------
diff --git a/git-biggest-files.sh b/git-biggest-files.sh
index 5ffaab5..c881e15 100755
--- a/git-biggest-files.sh
+++ b/git-biggest-files.sh
@@ -8,6 +8,7 @@ if [ ! -z "$1" ] ; then SIZE=$1 ; fi
 
 # however this does not show the former names of the blobs so if the same file is in
 # multiple times this script will show only one instance; apply `git-follow-file` to do that
+# e.g. git-biggest-files.sh | while read line ; do if [ ! -z "$( echo $line | awk '{print $3}' )" ] ; then echo $( echo $line | awk '{print $2 }' ) $( git-follow-file.sh $( echo $line | awk '{print $3}' )) ; fi ; done
 
 git rev-list --objects --all | sort -k 2 > /tmp/TMP-big-shas.txt
 git gc 2> /tmp/TMP-big-log.txt && git verify-pack -v .git/objects/pack/pack-*.idx | egrep "^\w+ blob\W+[0-9]+ [0-9]+ [0-9]+$" | sort -k 3 -n -r | head -${SIZE} > /tmp/TMP-big-objects.txt
