| // Copyright (C) 2017 The Android Open Source Project |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| package com.googlesource.gerrit.plugins.analytics.common |
| |
| import com.googlesource.gerrit.plugins.analytics.CommitInfo |
| import com.googlesource.gerrit.plugins.analytics.common.ManagedResource.use |
| import org.eclipse.jgit.diff.{DiffFormatter, RawTextComparator} |
| import org.eclipse.jgit.lib.{ObjectId, Repository} |
| import org.eclipse.jgit.revwalk.{RevCommit, RevWalk} |
| import org.eclipse.jgit.treewalk.{CanonicalTreeParser, EmptyTreeIterator} |
| import org.eclipse.jgit.util.io.DisabledOutputStream |
| |
| import scala.collection.JavaConversions._ |
| |
/**
 * Aggregated statistics for a homogeneous group of commits, i.e. either only merge commits
 * or only non-merge commits. Construction fails (via `require`) when the `merge` flag of any
 * included commit disagrees with `isForMergeCommits`.
 *
 * @param addedLines        total number of line additions across the included commits
 * @param deletedLines      total number of line deletions across the included commits
 * @param isForMergeCommits true when the instance aggregates merge commits, false when it aggregates
 *                          non-merge commits; a mixture of the two is rejected
 * @param commits           the commits the statistics refer to
 */
case class CommitsStatistics(
  addedLines: Int,
  deletedLines: Int,
  isForMergeCommits: Boolean,
  commits: List[CommitInfo]
) {
  require(
    !commits.exists(_.merge != isForMergeCommits),
    s"Creating a stats object with isMergeCommit = $isForMergeCommits but containing commits of different type"
  )

  /**
   * Sum of the per-commit file counts; a file touched by several commits is counted once per commit.
   */
  val numFiles: Int = commits.foldLeft(0)((total, commit) => total + commit.files.size)

  /**
   * Number of distinct files touched by the included commits.
   */
  val numDistinctFiles: Int = changedFiles.size

  /** True when no commit is included in these statistics. */
  def isEmpty: Boolean = commits.isEmpty

  /** Union of the files of all the included commits. */
  def changedFiles: Set[String] =
    commits.foldLeft(Set.empty[String])((seen, commit) => seen ++ commit.files)

  /**
   * Combines two statistics of the same kind by summing the line counters and concatenating the commits.
   *
   * Not a proper monoid: merge and non-merge statistics cannot be summed, and defining two separate
   * classes just for that would be overkill.
   *
   * @param that statistics to add; must have the same `isForMergeCommits` value as this instance
   * @return the combined statistics
   */
  def +(that: CommitsStatistics): CommitsStatistics = {
    require(this.isForMergeCommits == that.isForMergeCommits, "Cannot sum a merge commit stats with a non merge commit stats")
    CommitsStatistics(
      addedLines = addedLines + that.addedLines,
      deletedLines = deletedLines + that.deletedLines,
      isForMergeCommits = isForMergeCommits,
      commits = commits ::: that.commits
    )
  }
}
| |
/**
 * Neutral starting values for summing [[CommitsStatistics]] with `+`.
 */
object CommitsStatistics {
  /** Statistics with no commits and zero line counters, flagged as non-merge. */
  val Empty: CommitsStatistics = CommitsStatistics(
    addedLines = 0,
    deletedLines = 0,
    isForMergeCommits = false,
    commits = Nil
  )

  /** Same as [[Empty]] but flagged as merge statistics. */
  val EmptyMerge: CommitsStatistics = Empty.copy(isForMergeCommits = true)
}
| |
/**
 * Computes line and file statistics for commits read from a single repository.
 *
 * @param repo repository the commits are looked up in
 */
class Statistics(repo: Repository) {

  /** Path and line counters of a single diff entry of a commit. */
  private case class FileChange(path: String, added: Int, deleted: Int)

  /**
   * Returns up to two different [[CommitsStatistics]] objects, grouping the stats into non-merge and
   * merge commits. A group that contains no commit is left out, so the result can be empty.
   *
   * @param commits ids of the commits the statistics are calculated for
   * @return the non-empty aggregated statistics: non-merge commits first, merge commits second
   */
  def forCommits(commits: ObjectId*): Iterable[CommitsStatistics] = {
    val (mergeStats, nonMergeStats) = commits.map(forSingleCommit).partition(_.isForMergeCommits)

    List(
      nonMergeStats.foldLeft(CommitsStatistics.Empty)(_ + _),
      mergeStats.foldLeft(CommitsStatistics.EmptyMerge)(_ + _)
    ).filterNot(_.isEmpty)
  }

  /**
   * Calculates the statistics of one commit by diffing its tree against the tree of its first parent,
   * or against an empty tree when the commit has no parent.
   *
   * @param objectId id of the commit to analyse
   * @return statistics containing only the given commit
   */
  protected def forSingleCommit(objectId: ObjectId): CommitsStatistics = {
    import RevisionBrowsingSupport._
    import scala.collection.JavaConverters._

    // I can imagine this kind of statistics is already being available in Gerrit but couldn't understand
    // how to access it: which Injection can be useful for this task?

    // RevWalk, ObjectReader and DiffFormatter all hold resources: close each of them once done.
    use(new RevWalk(repo)) { rw =>
      use(repo.newObjectReader()) { reader =>
        use(new DiffFormatter(DisabledOutputStream.INSTANCE)) { df =>
          val commit = rw.parseCommit(objectId)

          val oldTree =
            if (commit.getParentCount == 0)
              new EmptyTreeIterator // protects against initial commit
            else
              new CanonicalTreeParser(null, reader, rw.parseCommit(commit.getParent(0).getId).getTree)

          val newTree = new CanonicalTreeParser(null, reader, commit.getTree)

          df.setRepository(repo)
          df.setDiffComparator(RawTextComparator.DEFAULT)
          df.setDetectRenames(true)

          // Build the file header only once per entry and take both the path and the edits from it.
          // NOTE(review): for deleted files the "new path" is presumably JGit's /dev/null marker - confirm
          // whether that entry is wanted in the files set.
          val fileChanges = df.scan(oldTree, newTree).asScala.toList.map { diff =>
            val header = df.toFileHeader(diff)
            val edits = header.toEditList.asScala
            FileChange(
              path = header.getNewPath,
              // side B is the new tree: the length of an edit on that side counts as added lines
              added = edits.map(edit => edit.getEndB - edit.getBeginB).sum,
              // side A is the old tree: the length of an edit on that side counts as deleted lines
              deleted = edits.map(edit => edit.getEndA - edit.getBeginA).sum
            )
          }

          val files: Set[String] = fileChanges.map(_.path).toSet

          val commitInfo = CommitInfo(objectId.getName, commit.getAuthorIdent.getWhen.getTime, commit.isMerge, files)

          CommitsStatistics(
            fileChanges.map(_.added).sum,
            fileChanges.map(_.deleted).sum,
            commitInfo.merge,
            List(commitInfo)
          )
        }
      }
    }
  }

}