@conference {1823, title = {"May the fork be with you": novel metrics to analyze collaboration on GitHub}, booktitle = {Proceedings of the 5th International Workshop on Emerging Trends in Software Metrics - WETSoM 2014}, year = {2014}, note = {"According to FLOSSmole [8] (Free Libre OpenSource Software) statistics, GitHub had 191765 repositories publicly available at May 2012."}, pages = {37 - 43}, publisher = {ACM Press}, organization = {ACM Press}, address = {New York, New York, USA}, abstract = {Multi{\textendash}repository software projects are becoming more and more popular, thanks to web{\textendash}based facilities such as GitHub. Code and process metrics generally assume a single repository must be analyzed, in order to measure the characteristics of a codebase. Thus they are not apt to measure how much relevant information is hosted in multiple repositories contributing to the same codebase. Nor can they feature the characteristics of such a distributed development process. We present a set of novel metrics, based on an original classification of commits, conceived to capture some interesting aspects of a multi{\textendash}repository development process. We also describe an efficient way to build a data structure that allows to compute these metrics on a set of Git repositories. Interesting outcomes, obtained by applying our metrics on a large sample of projects hosted on GitHub, show the usefulness of our contribution.}, keywords = {flossmole, github}, isbn = {9781450328548}, doi = {10.1145/2593868.2593875}, url = {http://marbiaz.github.io/docs/Biazzini14b.pdf}, author = {Marco Biazzini and Benoit Baudry} }