@inproceedings{a862c1cc6cf04abe87722cda33ed36de,
title = "Which Change Sets in Git Repositories Are Related?",
abstract = "Software repositories contain valuable information about the history of software changes. Using data mining, researchers have identified file changes that happened together frequently to present hints for necessary changes to developers. However, not all file change sets are related. This can affect the recommendations about coupled file changes negatively by delivering irrelevant couplings to the developers. The commit time and branching characteristics of Git have not been investigated together in previous heuristics for grouping related change sets. We exploit the mappings between commit messages and issue ids for judging the relatedness of change sets. We propose a heuristic for Git and investigate the influence of two factors, the time between the commits and their branching on the relatedness of change sets using the repositories of five open-source systems using logistic regression. According to our findings, the combination of these two factors influences the relatedness of change sets. Individually measured, only the time significantly influences the relatedness, the branching itself does not. Our results support previous heuristic that also in Git repositories the commit time is important for grouping related change sets.",
keywords = "branch, change sets, commit, data mining, git, repositories",
author = "Jasmin Ramadani and Stefan Wagner",
note = "Publisher Copyright: {\textcopyright} 2016 IEEE.; 2nd IEEE International Conference on Software Quality, Reliability and Security, QRS 2016 ; Conference date: 01-08-2016 Through 03-08-2016",
year = "2016",
month = oct,
day = "12",
doi = "10.1109/QRS.2016.52",
language = "English",
series = "Proceedings - 2016 IEEE International Conference on Software Quality, Reliability and Security, QRS 2016",
publisher = "Institute of Electrical and Electronics Engineers Inc.",
pages = "406--413",
booktitle = "Proceedings - 2016 IEEE International Conference on Software Quality, Reliability and Security, QRS 2016",
}