mirror of
https://we.phorge.it/source/phorge.git
synced 2025-01-11 15:21:03 +01:00
Include email in Git author/committer lookup
Summary: We currently omit email from Git author/committer lookups, which gives us some bad results when identify commit authors. Include email. Also simplify this block a little bit. Test Plan: Ran "reparse.php --message" on several commits, verified that the author/committer seemed reasonable with var_dump()s. Reviewers: btrahan, vrana, nh Reviewed By: btrahan CC: aran Maniphest Tasks: T1337 Differential Revision: https://secure.phabricator.com/D3039
This commit is contained in:
parent
9a3998806d
commit
8cbd860e31
1 changed files with 32 additions and 12 deletions
|
@ -29,26 +29,46 @@ final class PhabricatorRepositoryGitCommitMessageParserWorker
|
||||||
// we try a little harder, since git *does* tell us what the actual encoding
|
// we try a little harder, since git *does* tell us what the actual encoding
|
||||||
// is correctly (unless it doesn't; encoding is sometimes empty).
|
// is correctly (unless it doesn't; encoding is sometimes empty).
|
||||||
list($info) = $repository->execxLocalCommand(
|
list($info) = $repository->execxLocalCommand(
|
||||||
"log -n 1 --encoding='UTF-8' " .
|
'log -n 1 --encoding=%s --format=%s %s --',
|
||||||
"--pretty=format:%%e%%x00%%cn%%x00%%an%%x00%%s%%n%%n%%b %s",
|
'UTF-8',
|
||||||
|
implode('%x00', array('%e', '%cn', '%ce', '%an', '%ae', '%s%n%n%b')),
|
||||||
$commit->getCommitIdentifier());
|
$commit->getCommitIdentifier());
|
||||||
|
|
||||||
list($encoding, $committer, $author, $message) = explode("\0", $info);
|
$parts = explode("\0", $info);
|
||||||
|
$encoding = array_shift($parts);
|
||||||
|
|
||||||
// See note above - git doesn't always convert the encoding correctly.
|
// See note above - git doesn't always convert the encoding correctly.
|
||||||
if (strlen($encoding) && strtoupper($encoding) != "UTF-8") {
|
$do_convert = false;
|
||||||
|
if (strlen($encoding) && strtoupper($encoding) != 'UTF-8') {
|
||||||
if (function_exists('mb_convert_encoding')) {
|
if (function_exists('mb_convert_encoding')) {
|
||||||
$message = mb_convert_encoding($message, "UTF-8", $encoding);
|
$do_convert = true;
|
||||||
$author = mb_convert_encoding($author, "UTF-8", $encoding);
|
|
||||||
$committer = mb_convert_encoding($committer, "UTF-8", $encoding);
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
// Make completely sure these are valid UTF-8.
|
foreach ($parts as $key => $part) {
|
||||||
$committer = phutil_utf8ize($committer);
|
if ($do_convert) {
|
||||||
$author = phutil_utf8ize($author);
|
$parts[$key] = mb_convert_encoding($part, 'UTF-8', $encoding);
|
||||||
$message = phutil_utf8ize($message);
|
}
|
||||||
$message = trim($message);
|
$parts[$key] = phutil_utf8ize($part);
|
||||||
|
}
|
||||||
|
|
||||||
|
$committer_name = $parts[0];
|
||||||
|
$committer_email = $parts[1];
|
||||||
|
$author_name = $parts[2];
|
||||||
|
$author_email = $parts[3];
|
||||||
|
$message = $parts[4];
|
||||||
|
|
||||||
|
if (strlen($author_email)) {
|
||||||
|
$author = "{$author_name} <{$author_email}>";
|
||||||
|
} else {
|
||||||
|
$author = "{$author_name}";
|
||||||
|
}
|
||||||
|
|
||||||
|
if (strlen($committer_email)) {
|
||||||
|
$committer = "{$committer_name} <{$committer_email}>";
|
||||||
|
} else {
|
||||||
|
$committer = "{$committer_name}";
|
||||||
|
}
|
||||||
|
|
||||||
if ($committer == $author) {
|
if ($committer == $author) {
|
||||||
$committer = null;
|
$committer = null;
|
||||||
|
|
Loading…
Reference in a new issue