blob: f8f64e2e4c7ac7b2b842787cbea816b091a87a84 [file] [log] [blame]
// Copyright (C) 2016 The Android Open Source Project
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
package com.google.gerrit.server.mail.receive;
import com.google.gerrit.reviewdb.client.Comment;
import java.util.StringJoiner;
import java.util.regex.Pattern;
public class ParserUtil {
private static final Pattern SIMPLE_EMAIL_PATTERN =
Pattern.compile(
"[_A-Za-z0-9-\\+]+(\\.[_A-Za-z0-9-]+)*@[A-Za-z0-9-]+"
+ "(\\.[A-Za-z0-9]+)*(\\.[A-Za-z]{2,})");
/**
* Trims the quotation that email clients add Example: On Sun, Nov 20, 2016 at 10:33 PM,
* <gerrit@gerritcodereview.com> wrote:
*
* @param comment Comment parsed from an email.
* @return Trimmed comment.
*/
public static String trimQuotation(String comment) {
StringJoiner j = new StringJoiner("\n");
String[] lines = comment.split("\n");
for (int i = 0; i < lines.length - 2; i++) {
j.add(lines[i]);
}
// Check if the last line contains the full quotation pattern (date + email)
String lastLine = lines[lines.length - 1];
if (containsQuotationPattern(lastLine)) {
if (lines.length > 1) {
j.add(lines[lines.length - 2]);
}
return j.toString().trim();
}
// Check if the second last line + the last line contain the full quotation pattern. This is
// necessary, as the quotation line can be split across the last two lines if it gets too long.
if (lines.length > 1) {
String lastLines = lines[lines.length - 2] + lastLine;
if (containsQuotationPattern(lastLines)) {
return j.toString().trim();
}
}
// Add the last two lines
if (lines.length > 1) {
j.add(lines[lines.length - 2]);
}
j.add(lines[lines.length - 1]);
return j.toString().trim();
}
/** Check if string is an inline comment url on a patch set or the base */
public static boolean isCommentUrl(String str, String changeUrl, Comment comment) {
int lineNbr = comment.range == null ? comment.lineNbr : comment.range.startLine;
return str.equals(filePath(changeUrl, comment) + "@" + lineNbr)
|| str.equals(filePath(changeUrl, comment) + "@a" + lineNbr);
}
/** Generate the fully qualified filepath */
public static String filePath(String changeUrl, Comment comment) {
return changeUrl + "/" + comment.key.patchSetId + "/" + comment.key.filename;
}
private static boolean containsQuotationPattern(String s) {
// Identifying the quotation line is hard, as it can be in any language.
// We identify this line by it's characteristics: It usually contains a
// valid email address, some digits for the date in groups of 1-4 in a row
// as well as some characters.
// Count occurrences of digit groups
int numConsecutiveDigits = 0;
int maxConsecutiveDigits = 0;
int numDigitGroups = 0;
for (char c : s.toCharArray()) {
if (c >= '0' && c <= '9') {
numConsecutiveDigits++;
} else if (numConsecutiveDigits > 0) {
maxConsecutiveDigits = Integer.max(maxConsecutiveDigits, numConsecutiveDigits);
numConsecutiveDigits = 0;
numDigitGroups++;
}
}
if (numDigitGroups < 4 || maxConsecutiveDigits > 4) {
return false;
}
// Check if the string contains an email address
return SIMPLE_EMAIL_PATTERN.matcher(s).find();
}
}