As part of my talk for KVM Forum, I am collecting some stats on the project
since last year.  I thought I'd share the scripts in case anyone is interested
in how they work.

I think this is just about all of the data I need, but patches are certainly
welcome.

Of course, you'll have to come to KVM Forum to see the pretty version of these
stats (there should be videos too for those that can't make it :-))

And thanks to Alex for poking me to collect these too.
---
 scripts/aliases.txt   |   18 +++++++++
 scripts/companies.txt |   20 ++++++++++
 scripts/genstats.sh   |   96 +++++++++++++++++++++++++++++++++++++++++++++++++
 3 files changed, 134 insertions(+), 0 deletions(-)
 create mode 100644 scripts/aliases.txt
 create mode 100644 scripts/companies.txt
 create mode 100755 scripts/genstats.sh

diff --git a/scripts/aliases.txt b/scripts/aliases.txt
new file mode 100644
index 0000000..aadea25
--- /dev/null
+++ b/scripts/aliases.txt
@@ -0,0 +1,18 @@
+andrew.zaborow...@intel.com: bal...@zabor.org
+ed...@axis.com: edgar.igles...@gmail.com
+edgar.igles...@petalogix.com: edgar.igles...@gmail.com
+lcapitul...@gmail.com: lcapitul...@redhat.com
+riku.voi...@nokia.com: riku.voi...@linaro.org
+riku.voi...@iki.fi: riku.voi...@linaro.org
+andreas.faerber: andreas.faer...@web.de
+anth...@codemonkey.ws: aligu...@us.ibm.com
+atar4q...@googlemail.com: atar4q...@gmail.com
+bernhard.k...@gmx.net: bernhard.k...@nsn.com
+jan.kis...@web.de: jan.kis...@siemens.com
+m...@kevin-wolf.de: kw...@redhat.com
+marcandre.lur...@gmail.com: marcandre.lur...@redhat.com
+r...@twiddle.net: r...@redhat.com
+sripa...@sripathi.in.ibm.com: sripat...@in.ibm.com
+
+
+
diff --git a/scripts/companies.txt b/scripts/companies.txt
new file mode 100644
index 0000000..436e3b3
--- /dev/null
+++ b/scripts/companies.txt
@@ -0,0 +1,20 @@
+Red Hat: redhat.com h...@lst.de glommer@mothafucka.localdomain
+SuSE: suse.de novell.com
+IBM: ibm.com kernel.crashing.org gibson.dropbear.id.au
+AMD: amd.com
+Citrix: citrix.com
+Canonical: canonical.com
+Intel: intel.com
+VIA: viatech.com.cn
+Linaro: linaro
+Google: google.com
+Code Sourcery: codesourcery.com
+Siemens: siemens.com siemens-enterprise.com
+Fujitsu: fujitsu.com
+Dream Host: dreamhost.com
+Nokia: nokia.com
+Samsung: samsung.com
+NTT: lab.ntt.co.jp
+FreeScale: freescale.com
+XenSource: xensource.com
+VA Linux: valinux.co.jp
diff --git a/scripts/genstats.sh b/scripts/genstats.sh
new file mode 100755
index 0000000..6d1228f
--- /dev/null
+++ b/scripts/genstats.sh
@@ -0,0 +1,96 @@
+#!/bin/bash
+
+# Usage: scripts/genstats.sh "today" "1 year ago"
+
+aliases="scripts/aliases.txt"
+companies="scripts/companies.txt"
+
+function dedup() {
+    while read addr; do
+       f=`grep "^$addr: " "$aliases" | cut -f2- -d' '`
+       if test "$f"; then
+           echo "$f"
+       else
+           echo "$addr"
+       fi
+    done
+}
+
+function gen-committers() {
+    until="$1"
+    since="$2"
+
+    git log --until="$until" --since="$since" --pretty=format:%ce | \
+       sort -u | dedup | sort -u | while read committer; do
+       addresses=`grep " $committer\$" "$aliases" | cut -f1 -d: | while read 
a; do echo -n "--committer=$a "; done`
+       
+       echo -n "$committer, "
+       git log --until="$until" --since="$since" \
+           --pretty=oneline --committer="$committer" $addresses | wc -l
+    done
+}
+
+function gen-authors() {
+    until="$1"
+    since="$2"
+
+    git log --until="$until" --since="$since" --pretty=format:%ae | \
+       sort -u | dedup | sort -u | while read author; do
+       addresses=`grep " $author\$" "$aliases" | cut -f1 -d: | while read a; 
do echo -n "--author=$a "; done`
+       
+       echo -n "$author, "
+       git log --until="$until" --since="$since" \
+           --pretty=oneline --author="$author" | wc -l
+    done
+}
+
+function gen-commits() {
+    until="$1"
+    since="$2"
+
+    git log --until="$until" --since="$since" --pretty=oneline | wc -l
+}
+
+function gen-companies() {
+    until="$1"
+    since="$2"
+
+    cat "$companies" | while read LINE; do
+       company=`echo $LINE | cut -f1 -d:`
+       addrs=`echo $LINE | cut -f2- -d:`
+
+       authors=`echo "$addrs" | sed -e 's: : --author=:g'`
+       echo "$company," \
+           `git log --until="$until" --since="$since" --pretty=oneline \
+                $authors | wc -l`, \
+            `git log --until="$until" --since="$since" --pretty="format:%ae\n" 
\
+                $authors | sort -u | dedup | sort -u | wc -l`
+    done
+}
+
+function gen-stats() {
+    until="$1"
+    since="$2"
+
+    echo 'Total Commits'
+    echo '-------------'
+    gen-commits "$until" "$since"
+    echo
+
+    echo 'Committers'
+    echo '----------'
+    gen-committers "$until" "$since"
+    echo
+
+    echo 'Authors'
+    echo '-------'
+    gen-authors "$until" "$since"
+    echo
+
+    echo 'Companies'
+    echo '---------'
+    gen-companies "$util" "$since"
+}
+
+gen-stats "$1" "$2"
+
-- 
1.7.4.1


Reply via email to