As part of my talk for KVM Forum, I am collecting some stats on the project since last year. I thought I'd share the scripts in case anyone is interested in how they work.
I think this is just about all of the data I need, but patches are certainly welcome. Of course, you'll have to come to KVM Forum to see the pretty version of these stats (there should be videos too for those that can't make it :-)) And thanks to Alex for poking me to collect these too. --- scripts/aliases.txt | 18 +++++++++ scripts/companies.txt | 20 ++++++++++ scripts/genstats.sh | 96 +++++++++++++++++++++++++++++++++++++++++++++++++ 3 files changed, 134 insertions(+), 0 deletions(-) create mode 100644 scripts/aliases.txt create mode 100644 scripts/companies.txt create mode 100755 scripts/genstats.sh diff --git a/scripts/aliases.txt b/scripts/aliases.txt new file mode 100644 index 0000000..aadea25 --- /dev/null +++ b/scripts/aliases.txt @@ -0,0 +1,18 @@ +andrew.zaborow...@intel.com: bal...@zabor.org +ed...@axis.com: edgar.igles...@gmail.com +edgar.igles...@petalogix.com: edgar.igles...@gmail.com +lcapitul...@gmail.com: lcapitul...@redhat.com +riku.voi...@nokia.com: riku.voi...@linaro.org +riku.voi...@iki.fi: riku.voi...@linaro.org +andreas.faerber: andreas.faer...@web.de +anth...@codemonkey.ws: aligu...@us.ibm.com +atar4q...@googlemail.com: atar4q...@gmail.com +bernhard.k...@gmx.net: bernhard.k...@nsn.com +jan.kis...@web.de: jan.kis...@siemens.com +m...@kevin-wolf.de: kw...@redhat.com +marcandre.lur...@gmail.com: marcandre.lur...@redhat.com +r...@twiddle.net: r...@redhat.com +sripa...@sripathi.in.ibm.com: sripat...@in.ibm.com + + + diff --git a/scripts/companies.txt b/scripts/companies.txt new file mode 100644 index 0000000..436e3b3 --- /dev/null +++ b/scripts/companies.txt @@ -0,0 +1,20 @@ +Red Hat: redhat.com h...@lst.de glommer@mothafucka.localdomain +SuSE: suse.de novell.com +IBM: ibm.com kernel.crashing.org gibson.dropbear.id.au +AMD: amd.com +Citrix: citrix.com +Canonical: canonical.com +Intel: intel.com +VIA: viatech.com.cn +Linaro: linaro +Google: google.com +Code Sourcery: codesourcery.com +Siemens: siemens.com siemens-enterprise.com +Fujitsu: fujitsu.com +Dream Host: dreamhost.com +Nokia: nokia.com +Samsung: samsung.com +NTT: lab.ntt.co.jp +FreeScale: freescale.com +XenSource: xensource.com +VA Linux: valinux.co.jp diff --git a/scripts/genstats.sh b/scripts/genstats.sh new file mode 100755 index 0000000..6d1228f --- /dev/null +++ b/scripts/genstats.sh @@ -0,0 +1,96 @@ +#!/bin/bash + +# Usage: scripts/genstats.sh "today" "1 year ago" + +aliases="scripts/aliases.txt" +companies="scripts/companies.txt" + +function dedup() { + while read addr; do + f=`grep "^$addr: " "$aliases" | cut -f2- -d' '` + if test "$f"; then + echo "$f" + else + echo "$addr" + fi + done +} + +function gen-committers() { + until="$1" + since="$2" + + git log --until="$until" --since="$since" --pretty=format:%ce | \ + sort -u | dedup | sort -u | while read committer; do + addresses=`grep " $committer\$" "$aliases" | cut -f1 -d: | while read a; do echo -n "--committer=$a "; done` + + echo -n "$committer, " + git log --until="$until" --since="$since" \ + --pretty=oneline --committer="$committer" $addresses | wc -l + done +} + +function gen-authors() { + until="$1" + since="$2" + + git log --until="$until" --since="$since" --pretty=format:%ae | \ + sort -u | dedup | sort -u | while read author; do + addresses=`grep " $author\$" "$aliases" | cut -f1 -d: | while read a; do echo -n "--author=$a "; done` + + echo -n "$author, " + git log --until="$until" --since="$since" \ + --pretty=oneline --author="$author" | wc -l + done +} + +function gen-commits() { + until="$1" + since="$2" + + git log --until="$until" --since="$since" --pretty=oneline | wc -l +} + +function gen-companies() { + until="$1" + since="$2" + + cat "$companies" | while read LINE; do + company=`echo $LINE | cut -f1 -d:` + addrs=`echo $LINE | cut -f2- -d:` + + authors=`echo "$addrs" | sed -e 's: : --author=:g'` + echo "$company," \ + `git log --until="$until" --since="$since" --pretty=oneline \ + $authors | wc -l`, \ + `git log --until="$until" --since="$since" --pretty="format:%ae\n" \ + $authors | sort -u | dedup | sort -u | wc -l` + done +} + +function gen-stats() { + until="$1" + since="$2" + + echo 'Total Commits' + echo '-------------' + gen-commits "$until" "$since" + echo + + echo 'Committers' + echo '----------' + gen-committers "$until" "$since" + echo + + echo 'Authors' + echo '-------' + gen-authors "$until" "$since" + echo + + echo 'Companies' + echo '---------' + gen-companies "$util" "$since" +} + +gen-stats "$1" "$2" + -- 1.7.4.1