2012-12-30 15:37:49 +01:00
|
|
|
<?php
|
|
|
|
|
2015-06-15 10:02:26 +02:00
|
|
|
abstract class PhabricatorSetupCheck extends Phobject {
|
2012-12-30 15:37:49 +01:00
|
|
|
|
|
|
|
private $issues;
|
|
|
|
|
|
|
|
abstract protected function executeChecks();
|
|
|
|
|
2015-02-10 21:53:00 +01:00
|
|
|
const GROUP_OTHER = 'other';
|
|
|
|
const GROUP_MYSQL = 'mysql';
|
|
|
|
const GROUP_PHP = 'php';
|
|
|
|
const GROUP_IMPORTANT = 'important';
|
|
|
|
|
2013-01-23 00:16:26 +01:00
|
|
|
public function getExecutionOrder() {
|
2016-09-06 20:03:17 +02:00
|
|
|
if ($this->isPreflightCheck()) {
|
|
|
|
return 0;
|
|
|
|
} else {
|
|
|
|
return 1000;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/**
|
|
|
|
* Should this check execute before we load configuration?
|
|
|
|
*
|
|
|
|
* The majority of checks (particularly, those checks which examine
|
|
|
|
* configuration) should run in the normal setup phase, after configuration
|
|
|
|
* loads. However, a small set of critical checks (mostly, tests for PHP
|
|
|
|
* setup and extensions) need to run before we can load configuration.
|
|
|
|
*
|
|
|
|
* @return bool True to execute before configuration is loaded.
|
|
|
|
*/
|
|
|
|
public function isPreflightCheck() {
|
|
|
|
return false;
|
2013-01-23 00:16:26 +01:00
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
final protected function newIssue($key) {
|
|
|
|
$issue = id(new PhabricatorSetupIssue())
|
|
|
|
->setIssueKey($key);
|
|
|
|
$this->issues[$key] = $issue;
|
2015-02-11 01:53:38 +01:00
|
|
|
|
|
|
|
if ($this->getDefaultGroup()) {
|
|
|
|
$issue->setGroup($this->getDefaultGroup());
|
|
|
|
}
|
2012-12-30 15:37:49 +01:00
|
|
|
|
|
|
|
return $issue;
|
|
|
|
}
|
|
|
|
|
|
|
|
final public function getIssues() {
|
|
|
|
return $this->issues;
|
|
|
|
}
|
|
|
|
|
2015-04-08 20:31:01 +02:00
|
|
|
protected function addIssue(PhabricatorSetupIssue $issue) {
|
|
|
|
$this->issues[$issue->getIssueKey()] = $issue;
|
|
|
|
return $this;
|
|
|
|
}
|
|
|
|
|
2015-02-11 01:53:38 +01:00
|
|
|
public function getDefaultGroup() {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
final public function runSetupChecks() {
|
|
|
|
$this->issues = array();
|
|
|
|
$this->executeChecks();
|
|
|
|
}
|
|
|
|
|
2015-02-11 22:00:59 +01:00
|
|
|
final public static function getOpenSetupIssueKeys() {
|
2012-12-30 15:37:49 +01:00
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
2015-02-11 22:00:59 +01:00
|
|
|
return $cache->getKey('phabricator.setup.issue-keys');
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
|
When we "discover" new fatal setup issues, stop serving traffic
Summary:
Ref T10759. We may "discover" the presence of a fatal setup error later, after starting Phabricator.
This can happen in a few ways, but most are unlikely. The one I'm immediately concerned about is:
- Phabricator starts up during a disaster with some databases unreachable.
- We start with warnings (unreachable databases are generally not fatal, since it's OK for some subset of hosts to be down in replicated/partitioned setups).
- The unreachable databases later recover and become accessible again.
- When we run checks against them, we discover that they are misconfigured.
Currently, "fatal" setup issues are not truly fatal if we're "in flight" -- we've survived setup checks at least once in the past. This is bad in the scenario above.
Especially with partitioning, it could lead to mangled data in a disaster scenario where operations staff makes a small configuration mistake while trying to get things running again.
Instead, if we "discover" a fatal error while already "in flight", reset the whole setup process as though the webserver had just restarted. Don't serve requests again until we can make it through setup without hitting fatals.
Test Plan:
- Started Phabricator with multiple masters, one of which was down and broken.
- Got a warning about the bad master.
- Revived the master.
- Before: Phabricator detects the fatal, but keeps serving requests.
- After: Phabricator detects the fatal, resets the webserver, and stops serving requests until the fatal is resolved.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10759
Differential Revision: https://secure.phabricator.com/D16903
2016-11-21 15:09:10 +01:00
|
|
|
final public static function resetSetupState() {
|
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
|
|
|
$cache->deleteKey('phabricator.setup.issue-keys');
|
|
|
|
|
|
|
|
$server_cache = PhabricatorCaches::getServerStateCache();
|
|
|
|
$server_cache->deleteKey('phabricator.in-flight');
|
|
|
|
|
|
|
|
$use_scope = AphrontWriteGuard::isGuardActive();
|
|
|
|
if ($use_scope) {
|
|
|
|
$unguarded = AphrontWriteGuard::beginScopedUnguardedWrites();
|
|
|
|
} else {
|
|
|
|
AphrontWriteGuard::allowDangerousUnguardedWrites(true);
|
|
|
|
}
|
|
|
|
|
|
|
|
$caught = null;
|
|
|
|
try {
|
|
|
|
$db_cache = new PhabricatorKeyValueDatabaseCache();
|
|
|
|
$db_cache->deleteKey('phabricator.setup.issue-keys');
|
|
|
|
} catch (Exception $ex) {
|
|
|
|
$caught = $ex;
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($use_scope) {
|
|
|
|
unset($unguarded);
|
|
|
|
} else {
|
|
|
|
AphrontWriteGuard::allowDangerousUnguardedWrites(false);
|
|
|
|
}
|
|
|
|
|
|
|
|
if ($caught) {
|
|
|
|
throw $caught;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
When multiple web hosts are in service, don't require setup warnings to be dismissed on each one
Summary:
Fixes T10876. Currently, we can end up with a setup warning banner sticking on each web device, since the state is stored in local cache.
Instead:
- When we actually run the setup checks, save the current state in the database.
- Before we show a cached banner, make sure the database still says the checks are a problem.
This could lead to some inconsistencies if setup checks legitimately pass on some hosts but not on others. For example, if you have `git` installed on one machine but not on another, we may raise a setup warning ("No Git Binary!") about it on one host only.
For now, assume users have their operational environments in some sort of reasonable shape and can install the same stuff everywhere. In the future, we could split the issues into "global" and "per-host" issues if we run into problems with this.
Test Plan:
This is somewhat tricky to test locally since you really need multiple webservers to test it properly, but I:
- Created some setup issues, saw banner.
- Ignored/cleared them, saw banner go away.
- Verified database cache writes were occurring properly.
Then I sort of faked it like this:
- Created a setup issue.
- Manually set the database cache value to `[]` ("no issues").
- Reloaded page.
- No more banner.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10876
Differential Revision: https://secure.phabricator.com/D15802
2016-04-26 16:33:07 +02:00
|
|
|
final public static function setOpenSetupIssueKeys(
|
|
|
|
array $keys,
|
|
|
|
$update_database) {
|
2012-12-30 15:37:49 +01:00
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
2015-02-11 22:00:59 +01:00
|
|
|
$cache->setKey('phabricator.setup.issue-keys', $keys);
|
When multiple web hosts are in service, don't require setup warnings to be dismissed on each one
Summary:
Fixes T10876. Currently, we can end up with a setup warning banner sticking on each web device, since the state is stored in local cache.
Instead:
- When we actually run the setup checks, save the current state in the database.
- Before we show a cached banner, make sure the database still says the checks are a problem.
This could lead to some inconsistencies if setup checks legitimately pass on some hosts but not on others. For example, if you have `git` installed on one machine but not on another, we may raise a setup warning ("No Git Binary!") about it on one host only.
For now, assume users have their operational environments in some sort of reasonable shape and can install the same stuff everywhere. In the future, we could split the issues into "global" and "per-host" issues if we run into problems with this.
Test Plan:
This is somewhat tricky to test locally since you really need multiple webservers to test it properly, but I:
- Created some setup issues, saw banner.
- Ignored/cleared them, saw banner go away.
- Verified database cache writes were occurring properly.
Then I sort of faked it like this:
- Created a setup issue.
- Manually set the database cache value to `[]` ("no issues").
- Reloaded page.
- No more banner.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10876
Differential Revision: https://secure.phabricator.com/D15802
2016-04-26 16:33:07 +02:00
|
|
|
|
2016-09-12 16:31:53 +02:00
|
|
|
$server_cache = PhabricatorCaches::getServerStateCache();
|
|
|
|
$server_cache->setKey('phabricator.in-flight', 1);
|
|
|
|
|
When multiple web hosts are in service, don't require setup warnings to be dismissed on each one
Summary:
Fixes T10876. Currently, we can end up with a setup warning banner sticking on each web device, since the state is stored in local cache.
Instead:
- When we actually run the setup checks, save the current state in the database.
- Before we show a cached banner, make sure the database still says the checks are a problem.
This could lead to some inconsistencies if setup checks legitimately pass on some hosts but not on others. For example, if you have `git` installed on one machine but not on another, we may raise a setup warning ("No Git Binary!") about it on one host only.
For now, assume users have their operational environments in some sort of reasonable shape and can install the same stuff everywhere. In the future, we could split the issues into "global" and "per-host" issues if we run into problems with this.
Test Plan:
This is somewhat tricky to test locally since you really need multiple webservers to test it properly, but I:
- Created some setup issues, saw banner.
- Ignored/cleared them, saw banner go away.
- Verified database cache writes were occurring properly.
Then I sort of faked it like this:
- Created a setup issue.
- Manually set the database cache value to `[]` ("no issues").
- Reloaded page.
- No more banner.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10876
Differential Revision: https://secure.phabricator.com/D15802
2016-04-26 16:33:07 +02:00
|
|
|
if ($update_database) {
|
|
|
|
$db_cache = new PhabricatorKeyValueDatabaseCache();
|
|
|
|
try {
|
|
|
|
$json = phutil_json_encode($keys);
|
|
|
|
$db_cache->setKey('phabricator.setup.issue-keys', $json);
|
|
|
|
} catch (Exception $ex) {
|
|
|
|
// Ignore any write failures, since they likely just indicate that we
|
|
|
|
// have a database-related setup issue that needs to be resolved.
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
final public static function getOpenSetupIssueKeysFromDatabase() {
|
|
|
|
$db_cache = new PhabricatorKeyValueDatabaseCache();
|
|
|
|
try {
|
|
|
|
$value = $db_cache->getKey('phabricator.setup.issue-keys');
|
|
|
|
if (!strlen($value)) {
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
return phutil_json_decode($value);
|
|
|
|
} catch (Exception $ex) {
|
|
|
|
return null;
|
|
|
|
}
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
|
2015-02-11 22:00:59 +01:00
|
|
|
final public static function getUnignoredIssueKeys(array $all_issues) {
|
2013-02-22 18:21:01 +01:00
|
|
|
assert_instances_of($all_issues, 'PhabricatorSetupIssue');
|
2015-02-11 22:00:59 +01:00
|
|
|
$keys = array();
|
2013-02-22 18:21:01 +01:00
|
|
|
foreach ($all_issues as $issue) {
|
|
|
|
if (!$issue->getIsIgnored()) {
|
2015-02-11 22:00:59 +01:00
|
|
|
$keys[] = $issue->getIssueKey();
|
2013-02-22 18:21:01 +01:00
|
|
|
}
|
|
|
|
}
|
2015-02-11 22:00:59 +01:00
|
|
|
return $keys;
|
2013-02-22 18:21:01 +01:00
|
|
|
}
|
|
|
|
|
2013-01-18 01:25:38 +01:00
|
|
|
final public static function getConfigNeedsRepair() {
|
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
|
|
|
return $cache->getKey('phabricator.setup.needs-repair');
|
|
|
|
}
|
|
|
|
|
|
|
|
final public static function setConfigNeedsRepair($needs_repair) {
|
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
|
|
|
$cache->setKey('phabricator.setup.needs-repair', $needs_repair);
|
|
|
|
}
|
|
|
|
|
|
|
|
final public static function deleteSetupCheckCache() {
|
|
|
|
$cache = PhabricatorCaches::getSetupCache();
|
|
|
|
$cache->deleteKeys(
|
|
|
|
array(
|
|
|
|
'phabricator.setup.needs-repair',
|
2015-02-11 22:00:59 +01:00
|
|
|
'phabricator.setup.issue-keys',
|
2013-01-18 01:25:38 +01:00
|
|
|
));
|
|
|
|
}
|
|
|
|
|
2016-09-06 21:25:37 +02:00
|
|
|
final public static function willPreflightRequest() {
|
|
|
|
$checks = self::loadAllChecks();
|
|
|
|
|
|
|
|
foreach ($checks as $check) {
|
|
|
|
if (!$check->isPreflightCheck()) {
|
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
|
|
|
$check->runSetupChecks();
|
|
|
|
|
|
|
|
foreach ($check->getIssues() as $key => $issue) {
|
|
|
|
return self::newIssueResponse($issue);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return null;
|
|
|
|
}
|
|
|
|
|
2016-09-06 21:52:03 +02:00
|
|
|
public static function newIssueResponse(PhabricatorSetupIssue $issue) {
|
2016-09-06 21:25:37 +02:00
|
|
|
$view = id(new PhabricatorSetupIssueView())
|
|
|
|
->setIssue($issue);
|
|
|
|
|
|
|
|
return id(new PhabricatorConfigResponse())
|
|
|
|
->setView($view);
|
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
final public static function willProcessRequest() {
|
2015-02-11 22:00:59 +01:00
|
|
|
$issue_keys = self::getOpenSetupIssueKeys();
|
|
|
|
if ($issue_keys === null) {
|
When we "discover" new fatal setup issues, stop serving traffic
Summary:
Ref T10759. We may "discover" the presence of a fatal setup error later, after starting Phabricator.
This can happen in a few ways, but most are unlikely. The one I'm immediately concerned about is:
- Phabricator starts up during a disaster with some databases unreachable.
- We start with warnings (unreachable databases are generally not fatal, since it's OK for some subset of hosts to be down in replicated/partitioned setups).
- The unreachable databases later recover and become accessible again.
- When we run checks against them, we discover that they are misconfigured.
Currently, "fatal" setup issues are not truly fatal if we're "in flight" -- we've survived setup checks at least once in the past. This is bad in the scenario above.
Especially with partitioning, it could lead to mangled data in a disaster scenario where operations staff makes a small configuration mistake while trying to get things running again.
Instead, if we "discover" a fatal error while already "in flight", reset the whole setup process as though the webserver had just restarted. Don't serve requests again until we can make it through setup without hitting fatals.
Test Plan:
- Started Phabricator with multiple masters, one of which was down and broken.
- Got a warning about the bad master.
- Revived the master.
- Before: Phabricator detects the fatal, but keeps serving requests.
- After: Phabricator detects the fatal, resets the webserver, and stops serving requests until the fatal is resolved.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10759
Differential Revision: https://secure.phabricator.com/D16903
2016-11-21 15:09:10 +01:00
|
|
|
$engine = new PhabricatorSetupEngine();
|
|
|
|
$response = $engine->execute();
|
|
|
|
if ($response) {
|
|
|
|
return $response;
|
2013-01-23 00:16:26 +01:00
|
|
|
}
|
When multiple web hosts are in service, don't require setup warnings to be dismissed on each one
Summary:
Fixes T10876. Currently, we can end up with a setup warning banner sticking on each web device, since the state is stored in local cache.
Instead:
- When we actually run the setup checks, save the current state in the database.
- Before we show a cached banner, make sure the database still says the checks are a problem.
This could lead to some inconsistencies if setup checks legitimately pass on some hosts but not on others. For example, if you have `git` installed on one machine but not on another, we may raise a setup warning ("No Git Binary!") about it on one host only.
For now, assume users have their operational environments in some sort of reasonable shape and can install the same stuff everywhere. In the future, we could split the issues into "global" and "per-host" issues if we run into problems with this.
Test Plan:
This is somewhat tricky to test locally since you really need multiple webservers to test it properly, but I:
- Created some setup issues, saw banner.
- Ignored/cleared them, saw banner go away.
- Verified database cache writes were occurring properly.
Then I sort of faked it like this:
- Created a setup issue.
- Manually set the database cache value to `[]` ("no issues").
- Reloaded page.
- No more banner.
Reviewers: chad
Reviewed By: chad
Maniphest Tasks: T10876
Differential Revision: https://secure.phabricator.com/D15802
2016-04-26 16:33:07 +02:00
|
|
|
} else if ($issue_keys) {
|
|
|
|
// If Phabricator is configured in a cluster with multiple web devices,
|
|
|
|
// we can end up with setup issues cached on every device. This can cause
|
|
|
|
// a warning banner to show on every device so that each one needs to
|
|
|
|
// be dismissed individually, which is pretty annoying. See T10876.
|
|
|
|
|
|
|
|
// To avoid this, check if the issues we found have already been cleared
|
|
|
|
// in the database. If they have, we'll just wipe out our own cache and
|
|
|
|
// move on.
|
|
|
|
$issue_keys = self::getOpenSetupIssueKeysFromDatabase();
|
|
|
|
if ($issue_keys !== null) {
|
|
|
|
self::setOpenSetupIssueKeys($issue_keys, $update_database = false);
|
|
|
|
}
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
|
2013-01-18 01:25:38 +01:00
|
|
|
// Try to repair configuration unless we have a clean bill of health on it.
|
|
|
|
// We need to keep doing this on every page load until all the problems
|
|
|
|
// are fixed, which is why it's separate from setup checks (which run
|
|
|
|
// once per restart).
|
|
|
|
$needs_repair = self::getConfigNeedsRepair();
|
|
|
|
if ($needs_repair !== false) {
|
|
|
|
$needs_repair = self::repairConfig();
|
|
|
|
self::setConfigNeedsRepair($needs_repair);
|
|
|
|
}
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
|
2016-09-06 22:48:22 +02:00
|
|
|
/**
|
|
|
|
* Test if we've survived through setup on at least one normal request
|
|
|
|
* without fataling.
|
|
|
|
*
|
|
|
|
* If we've made it through setup without hitting any fatals, we switch
|
|
|
|
* to render a more friendly error page when encountering issues like
|
|
|
|
* database connection failures. This gives users a smoother experience in
|
|
|
|
* the face of intermittent failures.
|
|
|
|
*
|
|
|
|
* @return bool True if we've made it through setup since the last restart.
|
|
|
|
*/
|
|
|
|
final public static function isInFlight() {
|
2016-09-12 16:31:53 +02:00
|
|
|
$cache = PhabricatorCaches::getServerStateCache();
|
|
|
|
return (bool)$cache->getKey('phabricator.in-flight');
|
2016-09-06 22:48:22 +02:00
|
|
|
}
|
|
|
|
|
2015-06-15 10:07:06 +02:00
|
|
|
final public static function loadAllChecks() {
|
2015-07-07 14:34:30 +02:00
|
|
|
return id(new PhutilClassMapQuery())
|
2015-05-13 22:50:28 +02:00
|
|
|
->setAncestorClass(__CLASS__)
|
2015-07-07 14:34:30 +02:00
|
|
|
->setSortMethod('getExecutionOrder')
|
|
|
|
->execute();
|
2015-06-15 10:07:06 +02:00
|
|
|
}
|
|
|
|
|
2016-09-06 21:25:37 +02:00
|
|
|
final public static function runNormalChecks() {
|
2015-06-15 10:07:06 +02:00
|
|
|
$checks = self::loadAllChecks();
|
2013-01-23 00:16:26 +01:00
|
|
|
|
2016-09-06 21:25:37 +02:00
|
|
|
foreach ($checks as $key => $check) {
|
|
|
|
if ($check->isPreflightCheck()) {
|
|
|
|
unset($checks[$key]);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
$issues = array();
|
|
|
|
foreach ($checks as $check) {
|
|
|
|
$check->runSetupChecks();
|
|
|
|
foreach ($check->getIssues() as $key => $issue) {
|
|
|
|
if (isset($issues[$key])) {
|
|
|
|
throw new Exception(
|
2015-05-22 09:27:56 +02:00
|
|
|
pht(
|
|
|
|
"Two setup checks raised an issue with key '%s'!",
|
|
|
|
$key));
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
$issues[$key] = $issue;
|
2013-01-23 00:16:26 +01:00
|
|
|
if ($issue->getIsFatal()) {
|
|
|
|
break 2;
|
|
|
|
}
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2015-05-22 09:27:56 +02:00
|
|
|
$ignore_issues = PhabricatorEnv::getEnvConfig('config.ignore-issues');
|
|
|
|
foreach ($ignore_issues as $ignorable => $derp) {
|
2013-02-22 18:21:01 +01:00
|
|
|
if (isset($issues[$ignorable])) {
|
|
|
|
$issues[$ignorable]->setIsIgnored(true);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
return $issues;
|
|
|
|
}
|
|
|
|
|
2013-01-18 01:25:38 +01:00
|
|
|
final public static function repairConfig() {
|
|
|
|
$needs_repair = false;
|
|
|
|
|
|
|
|
$options = PhabricatorApplicationConfigOptions::loadAllOptions();
|
|
|
|
foreach ($options as $option) {
|
|
|
|
try {
|
|
|
|
$option->getGroup()->validateOption(
|
|
|
|
$option,
|
|
|
|
PhabricatorEnv::getEnvConfig($option->getKey()));
|
|
|
|
} catch (PhabricatorConfigValidationException $ex) {
|
|
|
|
PhabricatorEnv::repairConfig($option->getKey(), $option->getDefault());
|
|
|
|
$needs_repair = true;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
return $needs_repair;
|
|
|
|
}
|
|
|
|
|
2012-12-30 15:37:49 +01:00
|
|
|
}
|