mirror of
https://we.phorge.it/source/arcanist.git
synced 2024-11-29 10:12:41 +01:00
Add a lint check for clobbering locals with iterators
Summary: See D2049, D2050. Identify reuses of locals as iterator variables. Before raising an error, we require: - Variable is declared before the loop. - Variable is used after the loop, ignoring uses as an iterator variable. I think this identifies all problems with a very low false positive rate (the false positives are suspicious/unconventional code, but not necessarily errors). Also fix an issue identified by the linter. Test Plan: - Verified this identified the bugs in D2049 and D2050. - Ran linter against libphutil/, arcanist/ and phabricator/ (see D2051, this, and next diff). - Ran unit tests. Reviewers: vrana, btrahan Reviewed By: vrana CC: aran, epriestley, jungejason Differential Revision: https://secure.phabricator.com/D2052
This commit is contained in:
parent
ff94d699fe
commit
3ae1bf1a8c
4 changed files with 207 additions and 30 deletions
|
@ -137,7 +137,7 @@ abstract class ArcanistLinterTestCase extends ArcanistPhutilTestCase {
|
||||||
$expect = array();
|
$expect = array();
|
||||||
}
|
}
|
||||||
foreach ($expect as $key => $expected) {
|
foreach ($expect as $key => $expected) {
|
||||||
$expect[$key] = reset(explode(' ', $expected));
|
$expect[$key] = head(explode(' ', $expected));
|
||||||
}
|
}
|
||||||
|
|
||||||
$expect = array_fill_keys($expect, true);
|
$expect = array_fill_keys($expect, true);
|
||||||
|
|
|
@ -55,6 +55,7 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
const LINT_RAGGED_CLASSTREE_EDGE = 29;
|
const LINT_RAGGED_CLASSTREE_EDGE = 29;
|
||||||
const LINT_IMPLICIT_FALLTHROUGH = 30;
|
const LINT_IMPLICIT_FALLTHROUGH = 30;
|
||||||
const LINT_PHP_53_FEATURES = 31;
|
const LINT_PHP_53_FEATURES = 31;
|
||||||
|
const LINT_REUSED_AS_ITERATOR = 32;
|
||||||
|
|
||||||
|
|
||||||
public function getLintNameMap() {
|
public function getLintNameMap() {
|
||||||
|
@ -89,6 +90,7 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
self::LINT_RAGGED_CLASSTREE_EDGE => 'Class Not abstract Or final',
|
self::LINT_RAGGED_CLASSTREE_EDGE => 'Class Not abstract Or final',
|
||||||
self::LINT_IMPLICIT_FALLTHROUGH => 'Implicit Fallthrough',
|
self::LINT_IMPLICIT_FALLTHROUGH => 'Implicit Fallthrough',
|
||||||
self::LINT_PHP_53_FEATURES => 'Use Of PHP 5.3 Features',
|
self::LINT_PHP_53_FEATURES => 'Use Of PHP 5.3 Features',
|
||||||
|
self::LINT_REUSED_AS_ITERATOR => 'Variable Reused As Iterator',
|
||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -677,25 +679,6 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
$vars[] = $var;
|
$vars[] = $var;
|
||||||
}
|
}
|
||||||
|
|
||||||
$foreaches = $body->selectDescendantsOfType('n_FOREACH_EXPRESSION');
|
|
||||||
foreach ($foreaches as $foreach_expr) {
|
|
||||||
$key_var = $foreach_expr->getChildByIndex(1);
|
|
||||||
if ($key_var->getTypeName() == 'n_VARIABLE') {
|
|
||||||
$vars[] = $key_var;
|
|
||||||
}
|
|
||||||
|
|
||||||
$value_var = $foreach_expr->getChildByIndex(2);
|
|
||||||
if ($value_var->getTypeName() == 'n_VARIABLE') {
|
|
||||||
$vars[] = $value_var;
|
|
||||||
} else {
|
|
||||||
// The root-level token may be a reference, as in:
|
|
||||||
// foreach ($a as $b => &$c) { ... }
|
|
||||||
// Reach into the n_VARIABLE_REFERENCE node to grab the n_VARIABLE
|
|
||||||
// node.
|
|
||||||
$vars[] = $value_var->getChildOfType(0, 'n_VARIABLE');
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
$binary = $body->selectDescendantsOfType('n_BINARY_EXPRESSION');
|
$binary = $body->selectDescendantsOfType('n_BINARY_EXPRESSION');
|
||||||
foreach ($binary as $expr) {
|
foreach ($binary as $expr) {
|
||||||
if ($expr->getChildByIndex(1)->getConcreteString() != '=') {
|
if ($expr->getChildByIndex(1)->getConcreteString() != '=') {
|
||||||
|
@ -744,10 +727,10 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
'Avoid extract(). It is confusing and hinders static analysis.');
|
'Avoid extract(). It is confusing and hinders static analysis.');
|
||||||
}
|
}
|
||||||
|
|
||||||
// Now we have every declaration. Build two maps, one which just keeps
|
// Now we have every declaration except foreach(), handled below. Build
|
||||||
// track of which tokens are part of declarations ($declaration_tokens)
|
// two maps, one which just keeps track of which tokens are part of
|
||||||
// and one which has the first offset where a variable is declared
|
// declarations ($declaration_tokens) and one which has the first offset
|
||||||
// ($declarations).
|
// where a variable is declared ($declarations).
|
||||||
|
|
||||||
foreach ($vars as $var) {
|
foreach ($vars as $var) {
|
||||||
$concrete = $this->getConcreteVariableString($var);
|
$concrete = $this->getConcreteVariableString($var);
|
||||||
|
@ -768,13 +751,26 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
$exclude_tokens[$var->getID()] = true;
|
$exclude_tokens[$var->getID()] = true;
|
||||||
}
|
}
|
||||||
|
|
||||||
// Issue a warning for every variable token, unless it appears in a
|
|
||||||
// declaration, we know about a prior declaration, we have explicitly
|
// Find all the variables in scope, and figure out where they are used.
|
||||||
// exlcuded it, or scope has been made unknowable before it appears.
|
// We want to find foreach() iterators which are both declared before and
|
||||||
|
// used after the foreach() loop.
|
||||||
|
|
||||||
|
$uses = array();
|
||||||
|
|
||||||
$all_vars = $body->selectDescendantsOfType('n_VARIABLE');
|
$all_vars = $body->selectDescendantsOfType('n_VARIABLE');
|
||||||
$issued_warnings = array();
|
$all = array();
|
||||||
|
|
||||||
|
// NOTE: $all_vars is not a real array so we can't unset() it.
|
||||||
foreach ($all_vars as $var) {
|
foreach ($all_vars as $var) {
|
||||||
|
|
||||||
|
// Be strict since it's easier; we don't let you reuse an iterator you
|
||||||
|
// declared before a loop after the loop, even if you're just assigning
|
||||||
|
// to it.
|
||||||
|
|
||||||
|
$concrete = $var->getConcreteString();
|
||||||
|
$uses[$concrete][$var->getID()] = $var->getOffset();
|
||||||
|
|
||||||
if (isset($declaration_tokens[$var->getID()])) {
|
if (isset($declaration_tokens[$var->getID()])) {
|
||||||
// We know this is part of a declaration, so it's fine.
|
// We know this is part of a declaration, so it's fine.
|
||||||
continue;
|
continue;
|
||||||
|
@ -783,6 +779,109 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
|
||||||
// We know this is part of isset() or similar, so it's fine.
|
// We know this is part of isset() or similar, so it's fine.
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
$all[$var->getID()] = $var;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
// Do foreach() last, we want to handle implicit redeclaration of a
|
||||||
|
// variable already in scope since this probably means we're ovewriting a
|
||||||
|
// local.
|
||||||
|
|
||||||
|
// NOTE: Processing foreach expressions in order allows programs which
|
||||||
|
// reuse iterator variables in other foreach() loops -- this is fine. We
|
||||||
|
// have a separate warning to prevent nested loops from reusing the same
|
||||||
|
// iterators.
|
||||||
|
|
||||||
|
$foreaches = $body->selectDescendantsOfType('n_FOREACH');
|
||||||
|
$all_foreach_vars = array();
|
||||||
|
foreach ($foreaches as $foreach) {
|
||||||
|
$foreach_expr = $foreach->getChildOfType(0, 'n_FOREACH_EXPRESSION');
|
||||||
|
|
||||||
|
$foreach_vars = array();
|
||||||
|
|
||||||
|
// Determine the end of the foreach() loop.
|
||||||
|
$foreach_tokens = $foreach->getTokens();
|
||||||
|
$last_token = end($foreach_tokens);
|
||||||
|
$foreach_end = $last_token->getOffset();
|
||||||
|
|
||||||
|
$key_var = $foreach_expr->getChildByIndex(1);
|
||||||
|
if ($key_var->getTypeName() == 'n_VARIABLE') {
|
||||||
|
$foreach_vars[] = $key_var;
|
||||||
|
}
|
||||||
|
|
||||||
|
$value_var = $foreach_expr->getChildByIndex(2);
|
||||||
|
if ($value_var->getTypeName() == 'n_VARIABLE') {
|
||||||
|
$foreach_vars[] = $value_var;
|
||||||
|
} else {
|
||||||
|
// The root-level token may be a reference, as in:
|
||||||
|
// foreach ($a as $b => &$c) { ... }
|
||||||
|
// Reach into the n_VARIABLE_REFERENCE node to grab the n_VARIABLE
|
||||||
|
// node.
|
||||||
|
$foreach_vars[] = $value_var->getChildOfType(0, 'n_VARIABLE');
|
||||||
|
}
|
||||||
|
|
||||||
|
// Remove all uses of the iterators inside of the foreach() loop from
|
||||||
|
// the $uses map.
|
||||||
|
|
||||||
|
foreach ($foreach_vars as $var) {
|
||||||
|
$concrete = $this->getConcreteVariableString($var);
|
||||||
|
$offset = $var->getOffset();
|
||||||
|
|
||||||
|
foreach ($uses[$concrete] as $id => $use_offset) {
|
||||||
|
if (($use_offset >= $offset) && ($use_offset < $foreach_end)) {
|
||||||
|
unset($uses[$concrete][$id]);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
$all_foreach_vars[] = $var;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
foreach ($all_foreach_vars as $var) {
|
||||||
|
$concrete = $this->getConcreteVariableString($var);
|
||||||
|
$offset = $var->getOffset();
|
||||||
|
|
||||||
|
// If a variable was declared before a foreach() and is used after
|
||||||
|
// it, raise a message.
|
||||||
|
|
||||||
|
if (isset($declarations[$concrete])) {
|
||||||
|
if ($declarations[$concrete] < $offset) {
|
||||||
|
if (!empty($uses[$concrete]) &&
|
||||||
|
max($uses[$concrete]) > $offset) {
|
||||||
|
$this->raiseLintAtNode(
|
||||||
|
$var,
|
||||||
|
self::LINT_REUSED_AS_ITERATOR,
|
||||||
|
'This iterator variable is a previously declared local '.
|
||||||
|
'variable. To avoid overwriting locals, do not reuse them '.
|
||||||
|
'as iterator variables.');
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// This is a declration, exclude it from the "declare variables prior
|
||||||
|
// to use" check below.
|
||||||
|
unset($all[$var->getID()]);
|
||||||
|
|
||||||
|
$vars[] = $var;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Now rebuild declarations to include foreach().
|
||||||
|
|
||||||
|
foreach ($vars as $var) {
|
||||||
|
$concrete = $this->getConcreteVariableString($var);
|
||||||
|
$declarations[$concrete] = min(
|
||||||
|
idx($declarations, $concrete, PHP_INT_MAX),
|
||||||
|
$var->getOffset());
|
||||||
|
$declaration_tokens[$var->getID()] = true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Issue a warning for every variable token, unless it appears in a
|
||||||
|
// declaration, we know about a prior declaration, we have explicitly
|
||||||
|
// exlcuded it, or scope has been made unknowable before it appears.
|
||||||
|
|
||||||
|
$issued_warnings = array();
|
||||||
|
foreach ($all as $id => $var) {
|
||||||
if ($var->getOffset() >= $scope_destroyed_at) {
|
if ($var->getOffset() >= $scope_destroyed_at) {
|
||||||
// This appears after an extract() or $$var so we have no idea
|
// This appears after an extract() or $$var so we have no idea
|
||||||
// whether it's legitimate or not. We raised a harshly-worded warning
|
// whether it's legitimate or not. We raised a harshly-worded warning
|
||||||
|
|
78
src/lint/linter/xhpast/__tests__/data/reused-local.lint-test
Normal file
78
src/lint/linter/xhpast/__tests__/data/reused-local.lint-test
Normal file
|
@ -0,0 +1,78 @@
|
||||||
|
<?php
|
||||||
|
|
||||||
|
function f($stuff, $thing) {
|
||||||
|
foreach ($stuff as $ii) {
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
// OK: Only reused for iteration.
|
||||||
|
|
||||||
|
foreach ($stuff as $ii) {
|
||||||
|
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
function g($stuff, $thing) {
|
||||||
|
foreach ($stuff as $thing) {
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
// OK: Not reused later.
|
||||||
|
}
|
||||||
|
|
||||||
|
function h($stuff, $thing) {
|
||||||
|
|
||||||
|
// OK: Used afterwards but not before.
|
||||||
|
|
||||||
|
foreach ($stuff as $key => $val) {
|
||||||
|
|
||||||
|
}
|
||||||
|
|
||||||
|
$key = 1;
|
||||||
|
$thing = 1;
|
||||||
|
$thing = $key;
|
||||||
|
$key = $thing;
|
||||||
|
}
|
||||||
|
|
||||||
|
function i($stuff, $thing) {
|
||||||
|
foreach ($stuff as $thing) {
|
||||||
|
$thing++;
|
||||||
|
}
|
||||||
|
|
||||||
|
// OK: Used afterwards but inside loop.
|
||||||
|
|
||||||
|
foreach ($stuff as $thing) {
|
||||||
|
$thing++;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
function j($stuff, $thing) {
|
||||||
|
|
||||||
|
foreach ($stuff as $thing) {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
// ERROR: Clobbers $thing; probably not what the author intended.
|
||||||
|
|
||||||
|
f($thing);
|
||||||
|
}
|
||||||
|
|
||||||
|
function k($stuff, $thing) {
|
||||||
|
foreach ($stuff as $thing) {
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
|
||||||
|
// ERROR: Clobbers $thing. Test case to cover some errors of implementation
|
||||||
|
// where subsequent legitimate foreach()es threw a wrench in the gears.
|
||||||
|
|
||||||
|
f($thing);
|
||||||
|
|
||||||
|
$other = array();
|
||||||
|
foreach ($other as $item) {
|
||||||
|
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
~~~~~~~~~~
|
||||||
|
error:51:22
|
||||||
|
error:61:22
|
|
@ -161,8 +161,8 @@ EOTEXT
|
||||||
}
|
}
|
||||||
if (count($groups) > 1) {
|
if (count($groups) > 1) {
|
||||||
$message = array();
|
$message = array();
|
||||||
foreach ($groups as $config => $group) {
|
foreach ($groups as $project => $group) {
|
||||||
$message[] = "Files underneath '{$config}':\n\n";
|
$message[] = "Files underneath '{$project}':\n\n";
|
||||||
$message[] = " ".implode("\n ", $group)."\n\n";
|
$message[] = " ".implode("\n ", $group)."\n\n";
|
||||||
}
|
}
|
||||||
$message = implode('', $message);
|
$message = implode('', $message);
|
||||||
|
|
Loading…
Reference in a new issue