1
0
Fork 0
mirror of https://we.phorge.it/source/arcanist.git synced 2024-11-25 16:22:42 +01:00

Add a lint check for clobbering locals with iterators

Summary:
See D2049, D2050. Identify reuses of locals as iterator variables. Before raising an error, we require:

  - Variable is declared before the loop.
  - Variable is used after the loop, ignoring uses as an iterator variable.

I think this identifies all problems with a very low false positive rate (the false positives are suspicious/unconventional code, but not necessarily errors).

Also fix an issue identified by the linter.

Test Plan:
  - Verified this identified the bugs in D2049 and D2050.
  - Ran linter against libphutil/, arcanist/ and phabricator/ (see D2051, this, and next diff).
  - Ran unit tests.

Reviewers: vrana, btrahan

Reviewed By: vrana

CC: aran, epriestley, jungejason

Differential Revision: https://secure.phabricator.com/D2052
This commit is contained in:
epriestley 2012-03-29 13:21:18 -07:00
parent ff94d699fe
commit 3ae1bf1a8c
4 changed files with 207 additions and 30 deletions

View file

@ -137,7 +137,7 @@ abstract class ArcanistLinterTestCase extends ArcanistPhutilTestCase {
$expect = array(); $expect = array();
} }
foreach ($expect as $key => $expected) { foreach ($expect as $key => $expected) {
$expect[$key] = reset(explode(' ', $expected)); $expect[$key] = head(explode(' ', $expected));
} }
$expect = array_fill_keys($expect, true); $expect = array_fill_keys($expect, true);

View file

@ -55,6 +55,7 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
const LINT_RAGGED_CLASSTREE_EDGE = 29; const LINT_RAGGED_CLASSTREE_EDGE = 29;
const LINT_IMPLICIT_FALLTHROUGH = 30; const LINT_IMPLICIT_FALLTHROUGH = 30;
const LINT_PHP_53_FEATURES = 31; const LINT_PHP_53_FEATURES = 31;
const LINT_REUSED_AS_ITERATOR = 32;
public function getLintNameMap() { public function getLintNameMap() {
@ -89,6 +90,7 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
self::LINT_RAGGED_CLASSTREE_EDGE => 'Class Not abstract Or final', self::LINT_RAGGED_CLASSTREE_EDGE => 'Class Not abstract Or final',
self::LINT_IMPLICIT_FALLTHROUGH => 'Implicit Fallthrough', self::LINT_IMPLICIT_FALLTHROUGH => 'Implicit Fallthrough',
self::LINT_PHP_53_FEATURES => 'Use Of PHP 5.3 Features', self::LINT_PHP_53_FEATURES => 'Use Of PHP 5.3 Features',
self::LINT_REUSED_AS_ITERATOR => 'Variable Reused As Iterator',
); );
} }
@ -677,25 +679,6 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
$vars[] = $var; $vars[] = $var;
} }
$foreaches = $body->selectDescendantsOfType('n_FOREACH_EXPRESSION');
foreach ($foreaches as $foreach_expr) {
$key_var = $foreach_expr->getChildByIndex(1);
if ($key_var->getTypeName() == 'n_VARIABLE') {
$vars[] = $key_var;
}
$value_var = $foreach_expr->getChildByIndex(2);
if ($value_var->getTypeName() == 'n_VARIABLE') {
$vars[] = $value_var;
} else {
// The root-level token may be a reference, as in:
// foreach ($a as $b => &$c) { ... }
// Reach into the n_VARIABLE_REFERENCE node to grab the n_VARIABLE
// node.
$vars[] = $value_var->getChildOfType(0, 'n_VARIABLE');
}
}
$binary = $body->selectDescendantsOfType('n_BINARY_EXPRESSION'); $binary = $body->selectDescendantsOfType('n_BINARY_EXPRESSION');
foreach ($binary as $expr) { foreach ($binary as $expr) {
if ($expr->getChildByIndex(1)->getConcreteString() != '=') { if ($expr->getChildByIndex(1)->getConcreteString() != '=') {
@ -744,10 +727,10 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
'Avoid extract(). It is confusing and hinders static analysis.'); 'Avoid extract(). It is confusing and hinders static analysis.');
} }
// Now we have every declaration. Build two maps, one which just keeps // Now we have every declaration except foreach(), handled below. Build
// track of which tokens are part of declarations ($declaration_tokens) // two maps, one which just keeps track of which tokens are part of
// and one which has the first offset where a variable is declared // declarations ($declaration_tokens) and one which has the first offset
// ($declarations). // where a variable is declared ($declarations).
foreach ($vars as $var) { foreach ($vars as $var) {
$concrete = $this->getConcreteVariableString($var); $concrete = $this->getConcreteVariableString($var);
@ -768,13 +751,26 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
$exclude_tokens[$var->getID()] = true; $exclude_tokens[$var->getID()] = true;
} }
// Issue a warning for every variable token, unless it appears in a
// declaration, we know about a prior declaration, we have explicitly // Find all the variables in scope, and figure out where they are used.
// exlcuded it, or scope has been made unknowable before it appears. // We want to find foreach() iterators which are both declared before and
// used after the foreach() loop.
$uses = array();
$all_vars = $body->selectDescendantsOfType('n_VARIABLE'); $all_vars = $body->selectDescendantsOfType('n_VARIABLE');
$issued_warnings = array(); $all = array();
// NOTE: $all_vars is not a real array so we can't unset() it.
foreach ($all_vars as $var) { foreach ($all_vars as $var) {
// Be strict since it's easier; we don't let you reuse an iterator you
// declared before a loop after the loop, even if you're just assigning
// to it.
$concrete = $var->getConcreteString();
$uses[$concrete][$var->getID()] = $var->getOffset();
if (isset($declaration_tokens[$var->getID()])) { if (isset($declaration_tokens[$var->getID()])) {
// We know this is part of a declaration, so it's fine. // We know this is part of a declaration, so it's fine.
continue; continue;
@ -783,6 +779,109 @@ final class ArcanistXHPASTLinter extends ArcanistLinter {
// We know this is part of isset() or similar, so it's fine. // We know this is part of isset() or similar, so it's fine.
continue; continue;
} }
$all[$var->getID()] = $var;
}
// Do foreach() last, we want to handle implicit redeclaration of a
// variable already in scope since this probably means we're ovewriting a
// local.
// NOTE: Processing foreach expressions in order allows programs which
// reuse iterator variables in other foreach() loops -- this is fine. We
// have a separate warning to prevent nested loops from reusing the same
// iterators.
$foreaches = $body->selectDescendantsOfType('n_FOREACH');
$all_foreach_vars = array();
foreach ($foreaches as $foreach) {
$foreach_expr = $foreach->getChildOfType(0, 'n_FOREACH_EXPRESSION');
$foreach_vars = array();
// Determine the end of the foreach() loop.
$foreach_tokens = $foreach->getTokens();
$last_token = end($foreach_tokens);
$foreach_end = $last_token->getOffset();
$key_var = $foreach_expr->getChildByIndex(1);
if ($key_var->getTypeName() == 'n_VARIABLE') {
$foreach_vars[] = $key_var;
}
$value_var = $foreach_expr->getChildByIndex(2);
if ($value_var->getTypeName() == 'n_VARIABLE') {
$foreach_vars[] = $value_var;
} else {
// The root-level token may be a reference, as in:
// foreach ($a as $b => &$c) { ... }
// Reach into the n_VARIABLE_REFERENCE node to grab the n_VARIABLE
// node.
$foreach_vars[] = $value_var->getChildOfType(0, 'n_VARIABLE');
}
// Remove all uses of the iterators inside of the foreach() loop from
// the $uses map.
foreach ($foreach_vars as $var) {
$concrete = $this->getConcreteVariableString($var);
$offset = $var->getOffset();
foreach ($uses[$concrete] as $id => $use_offset) {
if (($use_offset >= $offset) && ($use_offset < $foreach_end)) {
unset($uses[$concrete][$id]);
}
}
$all_foreach_vars[] = $var;
}
}
foreach ($all_foreach_vars as $var) {
$concrete = $this->getConcreteVariableString($var);
$offset = $var->getOffset();
// If a variable was declared before a foreach() and is used after
// it, raise a message.
if (isset($declarations[$concrete])) {
if ($declarations[$concrete] < $offset) {
if (!empty($uses[$concrete]) &&
max($uses[$concrete]) > $offset) {
$this->raiseLintAtNode(
$var,
self::LINT_REUSED_AS_ITERATOR,
'This iterator variable is a previously declared local '.
'variable. To avoid overwriting locals, do not reuse them '.
'as iterator variables.');
}
}
}
// This is a declration, exclude it from the "declare variables prior
// to use" check below.
unset($all[$var->getID()]);
$vars[] = $var;
}
// Now rebuild declarations to include foreach().
foreach ($vars as $var) {
$concrete = $this->getConcreteVariableString($var);
$declarations[$concrete] = min(
idx($declarations, $concrete, PHP_INT_MAX),
$var->getOffset());
$declaration_tokens[$var->getID()] = true;
}
// Issue a warning for every variable token, unless it appears in a
// declaration, we know about a prior declaration, we have explicitly
// exlcuded it, or scope has been made unknowable before it appears.
$issued_warnings = array();
foreach ($all as $id => $var) {
if ($var->getOffset() >= $scope_destroyed_at) { if ($var->getOffset() >= $scope_destroyed_at) {
// This appears after an extract() or $$var so we have no idea // This appears after an extract() or $$var so we have no idea
// whether it's legitimate or not. We raised a harshly-worded warning // whether it's legitimate or not. We raised a harshly-worded warning

View file

@ -0,0 +1,78 @@
<?php
function f($stuff, $thing) {
foreach ($stuff as $ii) {
}
// OK: Only reused for iteration.
foreach ($stuff as $ii) {
}
}
function g($stuff, $thing) {
foreach ($stuff as $thing) {
}
// OK: Not reused later.
}
function h($stuff, $thing) {
// OK: Used afterwards but not before.
foreach ($stuff as $key => $val) {
}
$key = 1;
$thing = 1;
$thing = $key;
$key = $thing;
}
function i($stuff, $thing) {
foreach ($stuff as $thing) {
$thing++;
}
// OK: Used afterwards but inside loop.
foreach ($stuff as $thing) {
$thing++;
}
}
function j($stuff, $thing) {
foreach ($stuff as $thing) {
break;
}
// ERROR: Clobbers $thing; probably not what the author intended.
f($thing);
}
function k($stuff, $thing) {
foreach ($stuff as $thing) {
break;
}
// ERROR: Clobbers $thing. Test case to cover some errors of implementation
// where subsequent legitimate foreach()es threw a wrench in the gears.
f($thing);
$other = array();
foreach ($other as $item) {
}
}
~~~~~~~~~~
error:51:22
error:61:22

View file

@ -161,8 +161,8 @@ EOTEXT
} }
if (count($groups) > 1) { if (count($groups) > 1) {
$message = array(); $message = array();
foreach ($groups as $config => $group) { foreach ($groups as $project => $group) {
$message[] = "Files underneath '{$config}':\n\n"; $message[] = "Files underneath '{$project}':\n\n";
$message[] = " ".implode("\n ", $group)."\n\n"; $message[] = " ".implode("\n ", $group)."\n\n";
} }
$message = implode('', $message); $message = implode('', $message);