mirror of
https://we.phorge.it/source/phorge.git
synced 2024-12-11 16:16:14 +01:00
d44a5fa933
Summary: Ref T10423. This flag can cause `git diff` to take an enormously long time (the problem case was a 5M line, 20K file commit). Instead: - Run without the flag first. - If that shows that the diff is definitely small, try again with the flag. - If that works, return the slower, better output. - If the fast diff affects too many paths or generating the slow diff takes too long, return the faster, slightly worse output. The quality of the output differs in how well Git is able to detect "M" and "C" (moves and copies of files). For example, if you copy `src/` to `srcpro/`, the fast output may not show that you copied files. The slow output will. I think this is rarely useful for large copies anyway: it's interesting if a 1-2 file diff is a copy, but usually obvious/uninteresting if a 500-file diff is a copy. Test Plan: - Ran `bin/repository reparse --change rXnnn` on Git changes. - Saw fast and slow commands execute normally. - Tried on a large diff, saw only the fast command execute. Reviewers: chad Reviewed By: chad Maniphest Tasks: T10423 Differential Revision: https://secure.phabricator.com/D16266
123 lines
3.5 KiB
PHP
123 lines
3.5 KiB
PHP
<?php
|
|
|
|
final class DiffusionInternalGitRawDiffQueryConduitAPIMethod
|
|
extends DiffusionQueryConduitAPIMethod {
|
|
|
|
public function isInternalAPI() {
|
|
return true;
|
|
}
|
|
|
|
public function getAPIMethodName() {
|
|
return 'diffusion.internal.gitrawdiffquery';
|
|
}
|
|
|
|
public function getMethodDescription() {
|
|
return pht('Internal method for getting raw diff information.');
|
|
}
|
|
|
|
protected function defineReturnType() {
|
|
return 'string';
|
|
}
|
|
|
|
protected function defineCustomParamTypes() {
|
|
return array(
|
|
'commit' => 'required string',
|
|
);
|
|
}
|
|
|
|
protected function getResult(ConduitAPIRequest $request) {
|
|
$drequest = $this->getDiffusionRequest();
|
|
$repository = $drequest->getRepository();
|
|
$commit = $request->getValue('commit');
|
|
|
|
if (!$repository->isGit()) {
|
|
throw new Exception(
|
|
pht(
|
|
'This API method can only be called on Git repositories.'));
|
|
}
|
|
|
|
// Check if the commit has parents. We're testing to see whether it is the
|
|
// first commit in history (in which case we must use "git log") or some
|
|
// other commit (in which case we can use "git diff"). We'd rather use
|
|
// "git diff" because it has the right behavior for merge commits, but
|
|
// it requires the commit to have a parent that we can diff against. The
|
|
// first commit doesn't, so "commit^" is not a valid ref.
|
|
list($parents) = $repository->execxLocalCommand(
|
|
'log -n1 --format=%s %s',
|
|
'%P',
|
|
$commit);
|
|
$use_log = !strlen(trim($parents));
|
|
|
|
// First, get a fast raw diff without "--find-copies-harder". This flag
|
|
// produces better results for moves and copies, but is explosively slow
|
|
// for large changes to large repositories. See T10423.
|
|
$raw = $this->getRawDiff($repository, $commit, $use_log, false);
|
|
|
|
// If we got a normal-sized diff (no more than 100 modified files), we'll
|
|
// try using "--find-copies-harder" to improve the output. This improved
|
|
// output is mostly useful for small changes anyway.
|
|
$try_harder = (substr_count($raw, "\n") <= 100);
|
|
if ($try_harder) {
|
|
try {
|
|
$raw = $this->getRawDiff($repository, $commit, $use_log, true);
|
|
} catch (Exception $ex) {
|
|
// Just ignore any exception we hit, we'll use the fast output
|
|
// instead.
|
|
}
|
|
}
|
|
|
|
return $raw;
|
|
}
|
|
|
|
private function getRawDiff(
|
|
PhabricatorRepository $repository,
|
|
$commit,
|
|
$use_log,
|
|
$try_harder) {
|
|
|
|
$flags = array(
|
|
'-n1',
|
|
'-M',
|
|
'-C',
|
|
'-B',
|
|
'--raw',
|
|
'-t',
|
|
'--abbrev=40',
|
|
);
|
|
|
|
if ($try_harder) {
|
|
$flags[] = '--find-copies-harder';
|
|
}
|
|
|
|
if ($use_log) {
|
|
// This is the first commit so we need to use "log". We know it's not a
|
|
// merge commit because it couldn't be merging anything, so this is safe.
|
|
|
|
// NOTE: "--pretty=format: " is to disable diff output, we only want the
|
|
// part we get from "--raw".
|
|
$future = $repository->getLocalCommandFuture(
|
|
'log %Ls --pretty=format: %s',
|
|
$flags,
|
|
$commit);
|
|
} else {
|
|
// Otherwise, we can use "diff", which will give us output for merges.
|
|
// We diff against the first parent, as this is generally the expectation
|
|
// and results in sensible behavior.
|
|
$future = $repository->getLocalCommandFuture(
|
|
'diff %Ls %s^1 %s',
|
|
$flags,
|
|
$commit,
|
|
$commit);
|
|
}
|
|
|
|
// Don't spend more than 30 seconds generating the slower output.
|
|
if ($try_harder) {
|
|
$future->setTimeout(30);
|
|
}
|
|
|
|
list($raw) = $future->resolvex();
|
|
|
|
return $raw;
|
|
}
|
|
|
|
}
|