# Build the `chunk` executable from chunk.c, optimised (-O3) and with the
# common warnings switched on (-Wall).
# Note: the g++ driver compiles a .c input file as C++.
g++ -Wall -O3 chunk.c -o chunk

# Get the example project: a mirror clone of Moodle, created in ./moodle.git.
# The clone is skipped when ./moodle.git already exists, so the steps can be
# re-run without git failing on "destination path 'moodle.git' already exists".
[ -d moodle.git ] || git clone --mirror git://git.moodle.org/moodle.git

# Extract the individual deltas from the mirror.
# For every commit, git log prints a STARTOFTHECOMMIT marker line followed by
# one ';'-separated header line:
#   commit hash;tree hash;parent hashes;author name;author email;author time;
#   committer name;committer email;committer time;subject
# --numstat appends the added/deleted line counts per file; -M/-C turn on
# rename/copy detection and --diff-filter=ACMR keeps only added, copied,
# modified and renamed paths.
# The stream is filtered through extrgitP.perl (not shown here) and stored
# gzip-compressed in moodle.git.delta.gz.
git --git-dir=moodle.git log \
    --numstat -M -C --diff-filter=ACMR --full-history \
    --pretty='tformat:STARTOFTHECOMMIT%n%H;%T;%P;%an;%ae;%at;%cn;%ce;%ct;%s' \
  | perl extrgitP.perl \
  | gzip > moodle.git.delta.gz

# Keep only the needed ';'-separated columns: field 1 plus fields 4 onward
# (fields 2 and 3 are dropped). The result is written to aa1.
gzip -dc moodle.git.delta.gz | cut -d ';' -f 1,4- > aa1

# Prepare the data for the 2010-2011 period. Per the original note,
# index0.perl reads the commits from aa1; its standard output is saved as
# moodle.2010-2011.considered.
perl index0.perl moodle 2010 2011 \
  > moodle.2010-2011.considered

# Run the program, timing the run. According to the original notes it selects
#   - in ten bins (see the C code)
#   - containing from 10 to 1000 files
#   - for 5e10 iterations
#   - with 10000 restarts
# The standard error of ./chunk is captured in the .out file named after
# these parameters.
time ./chunk moodle.2010-2011 10 1000 5e10 10000 \
  2> moodle.2010-2011.out.10-1000-5e10-10000

# Inspect the quality of the results in
#   moodle.2010-2011.freq
# The solutions are in
#   moodle.2010-2011.res

