2017-08-18 22:57:27 +02:00
|
|
|
<?php declare(strict_types=1);
|
2014-04-20 00:08:59 +02:00
|
|
|
|
|
|
|
namespace PhpParser;
|
|
|
|
|
|
|
|
/*
|
|
|
|
* This parser is based on a skeleton written by Moriyoshi Koizumi, which in
|
|
|
|
* turn is based on work by Masato Bito.
|
|
|
|
*/
|
2022-08-28 18:48:26 +02:00
|
|
|
|
2024-09-01 12:35:12 +02:00
|
|
|
use PhpParser\Node\Arg;
|
2022-08-28 18:48:26 +02:00
|
|
|
use PhpParser\Node\Expr;
|
|
|
|
use PhpParser\Node\Expr\Array_;
|
2019-01-03 08:59:45 +01:00
|
|
|
use PhpParser\Node\Expr\Cast\Double;
|
2022-09-11 15:22:23 +02:00
|
|
|
use PhpParser\Node\Identifier;
|
2022-09-17 17:12:55 +02:00
|
|
|
use PhpParser\Node\InterpolatedStringPart;
|
2015-06-13 20:16:09 +02:00
|
|
|
use PhpParser\Node\Name;
|
2016-10-09 00:59:44 +02:00
|
|
|
use PhpParser\Node\Param;
|
2024-07-14 21:29:58 +02:00
|
|
|
use PhpParser\Node\PropertyHook;
|
2022-09-03 15:13:42 +02:00
|
|
|
use PhpParser\Node\Scalar\InterpolatedString;
|
2022-09-03 11:58:59 +02:00
|
|
|
use PhpParser\Node\Scalar\Int_;
|
2016-12-07 20:22:53 +01:00
|
|
|
use PhpParser\Node\Scalar\String_;
|
2022-09-17 17:12:55 +02:00
|
|
|
use PhpParser\Node\Stmt;
|
2016-10-09 00:59:44 +02:00
|
|
|
use PhpParser\Node\Stmt\Class_;
|
|
|
|
use PhpParser\Node\Stmt\ClassConst;
|
|
|
|
use PhpParser\Node\Stmt\ClassMethod;
|
2022-09-11 16:57:53 +02:00
|
|
|
use PhpParser\Node\Stmt\Else_;
|
|
|
|
use PhpParser\Node\Stmt\ElseIf_;
|
2021-04-25 21:11:36 +02:00
|
|
|
use PhpParser\Node\Stmt\Enum_;
|
2016-10-09 00:59:44 +02:00
|
|
|
use PhpParser\Node\Stmt\Interface_;
|
|
|
|
use PhpParser\Node\Stmt\Namespace_;
|
2022-09-11 16:57:53 +02:00
|
|
|
use PhpParser\Node\Stmt\Nop;
|
2016-10-09 00:59:44 +02:00
|
|
|
use PhpParser\Node\Stmt\Property;
|
|
|
|
use PhpParser\Node\Stmt\TryCatch;
|
2022-09-03 18:59:48 +02:00
|
|
|
use PhpParser\Node\UseItem;
|
2022-06-06 16:32:48 +02:00
|
|
|
use PhpParser\NodeVisitor\CommentAnnotatingVisitor;
|
2015-06-13 20:16:09 +02:00
|
|
|
|
2022-08-28 22:57:06 +02:00
|
|
|
abstract class ParserAbstract implements Parser {
|
2022-07-04 17:11:08 +02:00
|
|
|
private const SYMBOL_NONE = -1;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2022-06-06 16:45:02 +02:00
|
|
|
/** @var Lexer Lexer that is used when parsing */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected Lexer $lexer;
|
2022-07-23 16:35:21 +02:00
|
|
|
/** @var PhpVersion PHP version to target on a best-effort basis */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected PhpVersion $phpVersion;
|
2022-06-06 16:45:02 +02:00
|
|
|
|
2014-04-20 13:16:54 +02:00
|
|
|
/*
|
|
|
|
* The following members will be filled with generated parsing data:
|
|
|
|
*/
|
|
|
|
|
|
|
|
/** @var int Size of $tokenToSymbol map */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $tokenToSymbolMapSize;
|
2014-04-20 13:16:54 +02:00
|
|
|
/** @var int Size of $action table */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $actionTableSize;
|
2014-04-20 13:16:54 +02:00
|
|
|
/** @var int Size of $goto table */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $gotoTableSize;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
|
|
|
/** @var int Symbol number signifying an invalid token */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $invalidSymbol;
|
2015-02-02 23:25:34 +01:00
|
|
|
/** @var int Symbol number of error recovery token */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $errorSymbol;
|
2014-04-20 13:16:54 +02:00
|
|
|
/** @var int Action number signifying default action */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $defaultAction;
|
2014-04-20 13:16:54 +02:00
|
|
|
/** @var int Rule number signifying that an unexpected token was encountered */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $unexpectedTokenRule;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $YY2TBLSTATE;
|
2017-11-12 15:58:24 +01:00
|
|
|
/** @var int Number of non-leaf states */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $numNonLeafStates;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2022-06-19 18:05:52 +02:00
|
|
|
/** @var int[] Map of PHP token IDs to internal symbols */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $phpTokenToSymbol;
|
2023-07-29 15:10:11 +02:00
|
|
|
/** @var array<int, bool> Map of PHP token IDs to drop */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $dropTokens;
|
2022-06-19 18:12:20 +02:00
|
|
|
/** @var int[] Map of external symbols (static::T_*) to internal symbols */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $tokenToSymbol;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var string[] Map of symbols to their names */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $symbolToName;
|
2022-09-17 17:12:55 +02:00
|
|
|
/** @var array<int, string> Names of the production rules (only necessary for debugging) */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $productions;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Map of states to a displacement into the $action table. The corresponding action for this
|
2014-04-20 13:16:54 +02:00
|
|
|
* state/symbol pair is $action[$actionBase[$state] + $symbol]. If $actionBase[$state] is 0, the
|
2021-04-25 13:15:40 +03:00
|
|
|
* action is defaulted, i.e. $actionDefault[$state] should be used instead. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $actionBase;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Table of actions. Indexed according to $actionBase comment. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $action;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Table indexed analogously to $action. If $actionCheck[$actionBase[$state] + $symbol] != $symbol
|
2014-04-20 13:16:54 +02:00
|
|
|
* then the action is defaulted, i.e. $actionDefault[$state] should be used instead. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $actionCheck;
|
2017-02-05 11:53:48 +01:00
|
|
|
/** @var int[] Map of states to their default action */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $actionDefault;
|
2017-02-05 11:53:48 +01:00
|
|
|
/** @var array<int, callable|null> Semantic action callbacks, indexed by rule number (null if the rule has no custom action) */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $reduceCallbacks;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Map of non-terminals to a displacement into the $goto table. The corresponding goto state for this
|
2014-04-20 13:16:54 +02:00
|
|
|
* non-terminal/state pair is $goto[$gotoBase[$nonTerminal] + $state] (unless defaulted) */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $gotoBase;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Table of states to goto after reduction. Indexed according to $gotoBase comment. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $goto;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Table indexed analogously to $goto. If $gotoCheck[$gotoBase[$nonTerminal] + $state] != $nonTerminal
|
2014-04-20 13:16:54 +02:00
|
|
|
* then the goto state is defaulted, i.e. $gotoDefault[$nonTerminal] should be used. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $gotoCheck;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Map of non-terminals to the default state to goto after their reduction */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $gotoDefault;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Map of rules to the non-terminal on their left-hand side, i.e. the non-terminal to use for
|
2014-04-20 13:16:54 +02:00
|
|
|
* determining the state to goto after reduction. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $ruleToNonTerminal;
|
2017-01-26 00:16:54 +01:00
|
|
|
/** @var int[] Map of rules to the length of their right-hand side, which is the number of elements that have to
|
2014-04-20 13:16:54 +02:00
|
|
|
* be popped from the stack(s) on reduction. */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $ruleToLength;
|
2014-04-20 13:16:54 +02:00
|
|
|
|
|
|
|
/*
|
|
|
|
* The following members are part of the parser state:
|
|
|
|
*/
|
|
|
|
|
|
|
|
/** @var mixed Temporary value containing the result of last semantic action (reduction) */
|
|
|
|
protected $semValue;
|
2022-09-17 17:12:55 +02:00
|
|
|
/** @var mixed[] Semantic value stack (contains values of tokens and semantic action results) */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $semStack;
|
2023-07-29 15:10:11 +02:00
|
|
|
/** @var int[] Token start position stack */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $tokenStartStack;
|
2023-07-29 15:10:11 +02:00
|
|
|
/** @var int[] Token end position stack */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $tokenEndStack;
|
2014-04-20 00:08:59 +02:00
|
|
|
|
2016-10-09 13:15:24 +02:00
|
|
|
/** @var ErrorHandler Error handler */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected ErrorHandler $errorHandler;
|
2016-07-25 17:18:52 +02:00
|
|
|
/** @var int Error state, used to avoid error floods */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $errorState;
|
2015-02-02 23:25:34 +01:00
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/** @var \SplObjectStorage<Array_, null>|null Array nodes created during parsing, for postprocessing of empty elements. */
|
2023-08-17 21:35:48 +02:00
|
|
|
protected ?\SplObjectStorage $createdArrays;
|
2022-09-01 21:23:14 +02:00
|
|
|
|
2023-07-29 15:10:11 +02:00
|
|
|
/** @var Token[] Tokens for the current parse */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected array $tokens;
|
2023-07-29 15:10:11 +02:00
|
|
|
/** @var int Current position in token array */
|
2023-08-16 21:18:30 +02:00
|
|
|
protected int $tokenPos;
|
2023-07-29 15:10:11 +02:00
|
|
|
|
2017-02-05 11:53:48 +01:00
|
|
|
/**
|
|
|
|
* Initialize $reduceCallbacks map.
|
|
|
|
*/
|
2022-09-11 17:51:59 +02:00
|
|
|
abstract protected function initReduceCallbacks(): void;
|
2017-02-05 11:53:48 +01:00
|
|
|
|
2014-04-20 00:08:59 +02:00
|
|
|
/**
 * Creates a parser instance.
 *
 * @param Lexer $lexer Lexer used to tokenize the code passed to parse()
 * @param PhpVersion|null $phpVersion PHP version to target; when null, the result of
 *                                    PhpVersion::getNewestSupported() is used. This option is
 *                                    best-effort: Even if specified, parsing will generally assume
 *                                    the latest supported version and only adjust behavior in minor
 *                                    ways, for example by omitting errors in older versions and
 *                                    interpreting type hints as a name or identifier depending on
 *                                    version.
 */
public function __construct(Lexer $lexer, ?PhpVersion $phpVersion = null) {
    if ($phpVersion === null) {
        $phpVersion = PhpVersion::getNewestSupported();
    }

    $this->lexer = $lexer;
    $this->phpVersion = $phpVersion;

    // Populate the generated tables that depend on the concrete parser subclass.
    $this->initReduceCallbacks();
    $this->phpTokenToSymbol = $this->createTokenMap();

    // Token IDs that doParse() skips over while fetching the next lookahead token.
    $droppedTokenIds = [\T_WHITESPACE, \T_OPEN_TAG, \T_COMMENT, \T_DOC_COMMENT, \T_BAD_CHARACTER];
    $this->dropTokens = array_fill_keys($droppedTokenIds, true);
}
|
2015-02-02 23:25:34 +01:00
|
|
|
|
2014-04-20 00:08:59 +02:00
|
|
|
/**
 * Parses PHP code into a node tree.
 *
 * If a non-throwing error handler is used, the parser will continue parsing after an error
 * occurred and attempt to build a partial AST.
 *
 * @param string $code The source code to parse
 * @param ErrorHandler|null $errorHandler Error handler to use for lexer/parser errors, defaults
 *                                        to ErrorHandler\Throwing.
 *
 * @return Node\Stmt[]|null Array of statements (or null if a non-throwing error handler is used
 *                          and the parser was unable to recover from an error).
 */
public function parse(string $code, ?ErrorHandler $errorHandler = null): ?array {
    $this->errorHandler = $errorHandler ?? new ErrorHandler\Throwing();
    $this->createdArrays = new \SplObjectStorage();

    try {
        $this->tokens = $this->lexer->tokenize($code, $this->errorHandler);
        $result = $this->doParse();

        // Report errors for any empty elements used inside arrays. This is delayed until after the
        // main parse, because we don't know a priori whether a given array expression will be used
        // in a destructuring context or not.
        foreach ($this->createdArrays as $node) {
            foreach ($node->items as $item) {
                if ($item->value instanceof Expr\Error) {
                    $this->errorHandler->handleError(new Error(
                        'Cannot use empty array elements in arrays',
                        $item->getAttributes()
                    ));
                }
            }
        }
    } finally {
        // Clear out some of the interior state, so we don't hold onto unnecessary memory between
        // uses of the parser. Done in a finally block so the cleanup also happens when the error
        // handler (or the lexer) throws, which is the default behavior on a syntax error.
        $this->tokenStartStack = [];
        $this->tokenEndStack = [];
        $this->semStack = [];
        $this->semValue = null;
        $this->createdArrays = null;
    }

    // $this->tokens is intentionally kept: it is needed here and is exposed through getTokens().
    if ($result !== null) {
        $traverser = new NodeTraverser(new CommentAnnotatingVisitor($this->tokens));
        $traverser->traverse($result);
    }

    return $result;
}
|
|
|
|
|
2023-08-13 16:03:26 +02:00
|
|
|
/**
 * Returns the token array that the most recent parse() call stored on the parser.
 *
 * @return Token[]
 */
public function getTokens(): array {
    return $this->tokens;
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Runs the table-driven parse loop over $this->tokens.
 *
 * Resets the per-parse state (stacks, token position, error state) and then repeatedly looks up
 * the action for the current state/lookahead pair, performing a shift, a reduction, an accept or
 * error recovery.
 *
 * @return Stmt[]|null The semantic value at the time the accept action is reached, or null if a
 *                     semantic action raised an Error or error recovery was not possible
 */
protected function doParse(): ?array {
    // No lookahead token has been read yet.
    $symbol = self::SYMBOL_NONE;
    $tokenValue = null;
    $this->tokenPos = -1;

    // Stacks of start and end token positions.
    $this->tokenStartStack = [];
    $this->tokenEndStack = [0];

    // Begin in the initial state; $stateStack records the states below the current one.
    $state = 0;
    $stateStack = [$state];

    // Semantic value stack (values of tokens and results of semantic actions).
    $this->semStack = [];

    // Index of the top element in all of the stacks.
    $stackPos = 0;

    $this->errorState = 0;

    while (true) {
        //$this->traceNewState($state, $symbol);

        if ($this->actionBase[$state] === 0) {
            // No table entry for this state: the default action applies regardless of lookahead.
            $rule = $this->actionDefault[$state];
        } else {
            if ($symbol === self::SYMBOL_NONE) {
                // Fetch the next token, skipping everything listed in $dropTokens.
                do {
                    $token = $this->tokens[++$this->tokenPos];
                    $tokenId = $token->id;
                } while (isset($this->dropTokens[$tokenId]));

                // Translate the lexer token id into the internal symbol number.
                $tokenValue = $token->text;
                if (!isset($this->phpTokenToSymbol[$tokenId])) {
                    throw new \RangeException(sprintf(
                        'The lexer returned an invalid token (id=%d, value=%s)',
                        $tokenId, $tokenValue
                    ));
                }
                $symbol = $this->phpTokenToSymbol[$tokenId];

                //$this->traceRead($symbol);
            }

            // Look the action up at the primary displacement first and, for states below
            // YY2TBLSTATE, at the secondary displacement. $idx and $action are assigned inside
            // the condition, so the evaluation order must stay exactly as written.
            $idx = $this->actionBase[$state] + $symbol;
            if ((($idx >= 0 && $idx < $this->actionTableSize && $this->actionCheck[$idx] === $symbol)
                 || ($state < $this->YY2TBLSTATE
                     && ($idx = $this->actionBase[$state + $this->numNonLeafStates] + $symbol) >= 0
                     && $idx < $this->actionTableSize && $this->actionCheck[$idx] === $symbol))
                && ($action = $this->action[$idx]) !== $this->defaultAction) {
                /*
                 * >= numNonLeafStates: shift and reduce
                 * > 0: shift
                 * = 0: accept
                 * < 0: reduce
                 * = -YYUNEXPECTED: error
                 */
                if ($action > 0) {
                    /* shift */
                    //$this->traceShift($symbol);

                    ++$stackPos;
                    $state = $action;
                    $stateStack[$stackPos] = $state;
                    $this->semStack[$stackPos] = $tokenValue;
                    $this->tokenStartStack[$stackPos] = $this->tokenPos;
                    $this->tokenEndStack[$stackPos] = $this->tokenPos;
                    $symbol = self::SYMBOL_NONE;

                    // Each successful shift counts the error state down towards zero.
                    if ($this->errorState !== 0) {
                        --$this->errorState;
                    }

                    if ($action < $this->numNonLeafStates) {
                        continue;
                    }

                    /* $action >= numNonLeafStates means shift-and-reduce */
                    $rule = $action - $this->numNonLeafStates;
                } else {
                    $rule = -$action;
                }
            } else {
                $rule = $this->actionDefault[$state];
            }
        }

        while (true) {
            if ($rule === 0) {
                /* accept */
                //$this->traceAccept();
                return $this->semValue;
            }

            if ($rule !== $this->unexpectedTokenRule) {
                /* reduce */
                //$this->traceReduce($rule);

                $ruleLength = $this->ruleToLength[$rule];
                try {
                    $callback = $this->reduceCallbacks[$rule];
                    if ($callback !== null) {
                        $callback($this, $stackPos);
                    } elseif ($ruleLength > 0) {
                        // Without a callback, the value of the first right-hand side element is used.
                        $this->semValue = $this->semStack[$stackPos - $ruleLength + 1];
                    }
                } catch (Error $e) {
                    if ($e->getStartLine() === -1) {
                        $e->setStartLine($this->tokens[$this->tokenPos]->line);
                    }

                    $this->emitError($e);
                    // Can't recover from this type of error
                    return null;
                }

                /* Goto - shift nonterminal */
                $endPos = $this->tokenEndStack[$stackPos];
                $stackPos -= $ruleLength;
                $nonTerminal = $this->ruleToNonTerminal[$rule];
                $gotoIdx = $this->gotoBase[$nonTerminal] + $stateStack[$stackPos];
                $state = ($gotoIdx >= 0 && $gotoIdx < $this->gotoTableSize
                          && $this->gotoCheck[$gotoIdx] === $nonTerminal)
                    ? $this->goto[$gotoIdx]
                    : $this->gotoDefault[$nonTerminal];

                ++$stackPos;
                $stateStack[$stackPos] = $state;
                $this->semStack[$stackPos] = $this->semValue;
                $this->tokenEndStack[$stackPos] = $endPos;
                if ($ruleLength === 0) {
                    // Empty productions use the start attributes of the lookahead token.
                    $this->tokenStartStack[$stackPos] = $this->tokenPos;
                }
            } else {
                /* error */
                switch ($this->errorState) {
                    case 0:
                        // Only report when not already recovering, to avoid error floods.
                        $this->emitError(new Error(
                            $this->getErrorMessage($symbol, $state),
                            $this->getAttributesForToken($this->tokenPos)
                        ));
                        // Break missing intentionally
                        // no break
                    case 1:
                    case 2:
                        $this->errorState = 3;

                        // Pop until error-expecting state uncovered
                        while (!(
                            (($idx = $this->actionBase[$state] + $this->errorSymbol) >= 0
                                && $idx < $this->actionTableSize && $this->actionCheck[$idx] === $this->errorSymbol)
                            || ($state < $this->YY2TBLSTATE
                                && ($idx = $this->actionBase[$state + $this->numNonLeafStates] + $this->errorSymbol) >= 0
                                && $idx < $this->actionTableSize && $this->actionCheck[$idx] === $this->errorSymbol)
                        ) || ($action = $this->action[$idx]) === $this->defaultAction) { // Not totally sure about this
                            if ($stackPos <= 0) {
                                // Could not recover from error
                                return null;
                            }
                            $state = $stateStack[--$stackPos];
                            //$this->tracePop($state);
                        }

                        //$this->traceShift($this->errorSymbol);
                        ++$stackPos;
                        $state = $action;
                        $stateStack[$stackPos] = $state;

                        // We treat the error symbol as being empty, so we reset the end attributes
                        // to the end attributes of the last non-error symbol
                        $this->tokenStartStack[$stackPos] = $this->tokenPos;
                        $this->tokenEndStack[$stackPos] = $this->tokenEndStack[$stackPos - 1];
                        break;

                    case 3:
                        if ($symbol === 0) {
                            // Reached EOF without recovering from error
                            return null;
                        }

                        // Discard the offending lookahead and go back to the outer loop to read
                        // the next token.
                        //$this->traceDiscard($symbol);
                        $symbol = self::SYMBOL_NONE;
                        break 2;
                }
            }

            if ($state < $this->numNonLeafStates) {
                break;
            }

            /* >= numNonLeafStates means shift-and-reduce */
            $rule = $state - $this->numNonLeafStates;
        }
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Passes an error to the error handler set for the current parse.
 *
 * @param Error $error Error to hand over
 */
protected function emitError(Error $error): void {
    $this->errorHandler->handleError($error);
}
|
|
|
|
|
2017-01-24 00:38:55 -07:00
|
|
|
/**
 * Builds the syntax error message for an unexpected symbol.
 *
 * The names of the expected tokens are appended when getExpectedTokens() returns a non-empty list.
 *
 * @param int $symbol Unexpected symbol
 * @param int $state State at time of error
 *
 * @return string Formatted error message
 */
protected function getErrorMessage(int $symbol, int $state): string {
    $expected = $this->getExpectedTokens($state);

    $message = 'Syntax error, unexpected ' . $this->symbolToName[$symbol];
    if ($expected) {
        $message .= ', expecting ' . implode(' or ', $expected);
    }

    return $message;
}
|
|
|
|
|
2017-01-24 00:38:55 -07:00
|
|
|
/**
 * Collects the names of the symbols that have a usable action in the given state.
 *
 * @param int $state State
 *
 * @return string[] Names of the expected tokens. An empty array is returned as soon as a fifth
 *                  candidate is found (too many to list).
 */
protected function getExpectedTokens(int $state): array {
    $names = [];
    $primaryBase = $this->actionBase[$state];

    foreach ($this->symbolToName as $symbol => $name) {
        // Try the primary displacement first.
        $idx = $primaryBase + $symbol;
        $found = $idx >= 0 && $idx < $this->actionTableSize && $this->actionCheck[$idx] === $symbol;

        if (!$found) {
            // Only states below YY2TBLSTATE have a secondary displacement to fall back on.
            if ($state >= $this->YY2TBLSTATE) {
                continue;
            }

            $idx = $this->actionBase[$state + $this->numNonLeafStates] + $symbol;
            if ($idx < 0 || $idx >= $this->actionTableSize || $this->actionCheck[$idx] !== $symbol) {
                continue;
            }
        }

        // Skip entries that signal an error or the default action, as well as the error symbol.
        $action = $this->action[$idx];
        if ($action === $this->unexpectedTokenRule
            || $action === $this->defaultAction
            || $symbol === $this->errorSymbol
        ) {
            continue;
        }

        if (count($names) === 4) {
            /* Too many expected tokens */
            return [];
        }

        $names[] = $name;
    }

    return $names;
}
|
|
|
|
|
2023-07-29 15:10:11 +02:00
|
|
|
/**
 * Get attributes for a node with the given start and end token positions.
 *
 * The end line and end file position are derived from the token that follows the end token
 * (its line, and its position minus one), so a token must exist at $tokenEndPos + 1.
 *
 * @param int $tokenStartPos Token position the node starts at
 * @param int $tokenEndPos Token position the node ends at
 * @return array<string, mixed> Attributes
 */
protected function getAttributes(int $tokenStartPos, int $tokenEndPos): array {
    $first = $this->tokens[$tokenStartPos];
    $following = $this->tokens[$tokenEndPos + 1];

    $attributes = [];
    $attributes['startLine'] = $first->line;
    $attributes['startTokenPos'] = $tokenStartPos;
    $attributes['startFilePos'] = $first->pos;
    $attributes['endLine'] = $following->line;
    $attributes['endTokenPos'] = $tokenEndPos;
    $attributes['endFilePos'] = $following->pos - 1;

    return $attributes;
}
|
|
|
|
|
2023-08-13 12:45:21 +02:00
|
|
|
/**
 * Get attributes for a single token at the given token position.
 *
 * Every token except the last one in the token array is delegated to getAttributes(). The last
 * token (the sentinel) has no successor, so its own line and position are used for both the
 * start and the end attributes.
 *
 * @param int $tokenPos Position of the token in the token array
 * @return array<string, mixed> Attributes
 */
protected function getAttributesForToken(int $tokenPos): array {
    $sentinelPos = \count($this->tokens) - 1;
    if ($tokenPos < $sentinelPos) {
        return $this->getAttributes($tokenPos, $tokenPos);
    }

    // Get attributes for the sentinel token.
    $sentinel = $this->tokens[$tokenPos];
    $line = $sentinel->line;
    $filePos = $sentinel->pos;

    return [
        'startLine' => $line,
        'startTokenPos' => $tokenPos,
        'startFilePos' => $filePos,
        'endLine' => $line,
        'endTokenPos' => $tokenPos,
        'endFilePos' => $filePos,
    ];
}
|
|
|
|
|
2014-04-21 12:30:55 +02:00
|
|
|
/*
|
|
|
|
* Tracing functions used for debugging the parser.
|
|
|
|
*/
|
|
|
|
|
2015-05-01 20:17:39 +02:00
|
|
|
/*
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceNewState($state, $symbol): void {
|
2014-04-20 00:08:59 +02:00
|
|
|
echo '% State ' . $state
|
2014-04-20 13:16:54 +02:00
|
|
|
. ', Lookahead ' . ($symbol == self::SYMBOL_NONE ? '--none--' : $this->symbolToName[$symbol]) . "\n";
|
2014-04-20 00:08:59 +02:00
|
|
|
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceRead($symbol): void {
|
2014-04-20 13:16:54 +02:00
|
|
|
echo '% Reading ' . $this->symbolToName[$symbol] . "\n";
|
2014-04-20 00:08:59 +02:00
|
|
|
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceShift($symbol): void {
|
2014-04-20 13:16:54 +02:00
|
|
|
echo '% Shift ' . $this->symbolToName[$symbol] . "\n";
|
2014-04-20 00:08:59 +02:00
|
|
|
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceAccept(): void {
|
2014-04-20 00:08:59 +02:00
|
|
|
echo "% Accepted.\n";
|
|
|
|
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceReduce($n): void {
|
2014-04-20 13:16:54 +02:00
|
|
|
echo '% Reduce by (' . $n . ') ' . $this->productions[$n] . "\n";
|
2014-04-20 00:08:59 +02:00
|
|
|
}
|
2014-04-21 12:30:55 +02:00
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function tracePop($state): void {
|
2015-02-02 23:25:34 +01:00
|
|
|
echo '% Recovering, uncovered state ' . $state . "\n";
|
|
|
|
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
protected function traceDiscard($symbol): void {
|
2015-02-02 23:25:34 +01:00
|
|
|
echo '% Discard ' . $this->symbolToName[$symbol] . "\n";
|
|
|
|
}
|
2015-05-01 20:17:39 +02:00
|
|
|
*/
|
2015-02-02 23:25:34 +01:00
|
|
|
|
2014-04-21 12:30:55 +02:00
|
|
|
/*
|
|
|
|
* Helper functions invoked by semantic actions
|
|
|
|
*/
|
|
|
|
|
2014-04-21 14:49:35 +02:00
|
|
|
/**
 * Moves statements of semicolon-style namespaces into $ns->stmts and checks various error conditions.
 *
 * - Not namespaced: the statements are returned unchanged.
 * - Brace style: the statements are returned unchanged; at most one error is emitted if a statement
 *   other than HaltCompiler or Nop follows the first namespace at the top level.
 * - Semicolon style: statements following a namespace declaration are appended to that
 *   namespace's stmts; HaltCompiler statements always stay at the top level.
 *
 * @param Node\Stmt[] $stmts
 * @return Node\Stmt[]
 */
protected function handleNamespaces(array $stmts): array {
    $style = $this->getNamespacingStyle($stmts);
    if ($style === null) {
        // not namespaced, nothing to do
        return $stmts;
    }

    if ($style === 'brace') {
        // For braced namespaces we only have to check that there are no invalid statements
        // between the namespaces
        $seenNamespace = false;
        $reported = false;
        foreach ($stmts as $stmt) {
            if ($stmt instanceof Namespace_) {
                $seenNamespace = true;
                continue;
            }
            if ($stmt instanceof Stmt\HaltCompiler || $stmt instanceof Nop) {
                continue;
            }
            if ($seenNamespace && !$reported) {
                $this->emitError(new Error(
                    'No code may exist outside of namespace {}',
                    $stmt->getAttributes()
                ));
                $reported = true; // Avoid one error for every statement
            }
        }

        return $stmts;
    }

    // For semicolon namespaces we have to move the statements after a namespace declaration
    // into ->stmts. $targetStmts is a reference to whichever array currently collects statements.
    $resultStmts = [];
    $targetStmts = &$resultStmts;
    $lastNs = null;
    foreach ($stmts as $stmt) {
        if ($stmt instanceof Stmt\HaltCompiler) {
            // __halt_compiler() is not moved into the namespace
            $resultStmts[] = $stmt;
            continue;
        }

        if (!$stmt instanceof Namespace_) {
            $targetStmts[] = $stmt;
            continue;
        }

        // A new namespace starts: finish the previous one before switching targets.
        if ($lastNs !== null) {
            $this->fixupNamespaceAttributes($lastNs);
        }

        $resultStmts[] = $stmt;
        if ($stmt->stmts === null) {
            $stmt->stmts = [];
            $targetStmts = &$stmt->stmts;
        } else {
            // This handles the invalid case of mixed style namespaces
            $targetStmts = &$resultStmts;
        }
        $lastNs = $stmt;
    }

    if ($lastNs !== null) {
        $this->fixupNamespaceAttributes($lastNs);
    }

    return $resultStmts;
}
|
2014-04-21 12:30:55 +02:00
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Extends the end attributes of a namespace node to those of its last statement.
 *
 * Statements were moved into the namespace node, so its end has to cover them. Only the
 * builtin end attributes are copied; this is the best we can do with the knowledge we have.
 */
private function fixupNamespaceAttributes(Node\Stmt\Namespace_ $stmt): void {
    if (!$stmt->stmts) {
        return;
    }

    $tail = $stmt->stmts[\count($stmt->stmts) - 1];
    foreach (['endLine', 'endFilePos', 'endTokenPos'] as $key) {
        if (!$tail->hasAttribute($key)) {
            continue;
        }
        $stmt->setAttribute($key, $tail->getAttribute($key));
    }
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Returns the node's attributes with the end attributes adjusted to only cover the
 * "namespace" keyword, not the whole namespace.
 *
 * @return array<string, mixed>
 */
private function getNamespaceErrorAttributes(Namespace_ $node): array {
    $attrs = $node->getAttributes();

    // Line and token position of the keyword end equal those of its start.
    foreach (['Line', 'TokenPos'] as $suffix) {
        if (isset($attrs['start' . $suffix])) {
            $attrs['end' . $suffix] = $attrs['start' . $suffix];
        }
    }

    // The file position of the end is that of the keyword's last character.
    if (isset($attrs['startFilePos'])) {
        $attrs['endFilePos'] = $attrs['startFilePos'] + \strlen('namespace') - 1;
    }

    return $attrs;
}
|
|
|
|
|
2017-01-24 00:38:55 -07:00
|
|
|
/**
 * Determine namespacing style (semicolon or brace)
 *
 * Emits an error if a disallowed statement precedes the first namespace declaration, or if
 * declarations of both styles are mixed.
 *
 * @param Node[] $stmts Top-level statements.
 *
 * @return null|string One of "semicolon", "brace" or null (no namespaces)
 */
private function getNamespacingStyle(array $stmts): ?string {
    $detected = null;
    $sawForbiddenStmt = false;
    foreach ($stmts as $index => $stmt) {
        if (!$stmt instanceof Node\Stmt\Namespace_) {
            // declare(), __halt_compiler() and nops can be used before a namespace declaration,
            // and there may be a hashbang line at the very start of the file.
            $allowed = $stmt instanceof Node\Stmt\Declare_
                || $stmt instanceof Node\Stmt\HaltCompiler
                || $stmt instanceof Node\Stmt\Nop
                || ($index === 0
                    && $stmt instanceof Node\Stmt\InlineHTML
                    && preg_match('/\A#!.*\r?\n\z/', $stmt->value));
            if (!$allowed) {
                // Everything else is forbidden before namespace declarations.
                $sawForbiddenStmt = true;
            }
            continue;
        }

        $thisStyle = $stmt->stmts === null ? 'semicolon' : 'brace';
        if ($detected !== null) {
            if ($detected === $thisStyle) {
                continue;
            }
            $this->emitError(new Error(
                'Cannot mix bracketed namespace declarations with unbracketed namespace declarations',
                $this->getNamespaceErrorAttributes($stmt)
            ));
            // Treat like semicolon style for namespace normalization.
            return 'semicolon';
        }

        // First namespace declaration: it fixes the style for the file.
        $detected = $thisStyle;
        if ($sawForbiddenStmt) {
            $this->emitError(new Error(
                'Namespace declaration statement has to be the very first statement in the script',
                $this->getNamespaceErrorAttributes($stmt)
            ));
        }
    }
    return $detected;
}
|
2015-06-13 20:16:09 +02:00
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Converts an unqualified name into an Identifier holding its lowercased form when the
 * configured PHP version reports that lowercased name as a builtin type; any other name is
 * returned unchanged.
 *
 * @return Name|Identifier
 */
protected function handleBuiltinTypes(Name $name) {
    if ($name->isUnqualified()) {
        $lowered = $name->toLowerString();
        if ($this->phpVersion->supportsBuiltinType($lowered)) {
            return new Node\Identifier($lowered, $name->getAttributes());
        }
    }

    return $name;
}
|
2016-10-09 00:59:44 +02:00
|
|
|
|
2017-01-24 00:38:55 -07:00
|
|
|
/**
 * Get combined start and end attributes at a stack location
 *
 * @param int $stackPos Stack location
 *
 * @return array<string, mixed> Combined start and end attributes
 */
protected function getAttributesAt(int $stackPos): array {
    $startTokenPos = $this->tokenStartStack[$stackPos];
    $endTokenPos = $this->tokenEndStack[$stackPos];

    return $this->getAttributes($startTokenPos, $endTokenPos);
}
|
|
|
|
|
2022-08-28 22:57:06 +02:00
|
|
|
/**
 * Determines the Double cast kind from the text of the cast.
 *
 * The lowercased text is searched for "float" first, then "real"; if neither occurs the kind
 * is KIND_DOUBLE.
 */
protected function getFloatCastKind(string $cast): int {
    $lowered = strtolower($cast);

    // Order matters: "float" is checked before "real".
    $kindsByKeyword = [
        'float' => Double::KIND_FLOAT,
        'real' => Double::KIND_REAL,
    ];
    foreach ($kindsByKeyword as $keyword => $kind) {
        if (strpos($lowered, $keyword) !== false) {
            return $kind;
        }
    }

    return Double::KIND_DOUBLE;
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Creates an Int_ node from a number string. If Int_::fromString() throws an Error, the error
 * is emitted and a node with the dummy value 0 is returned instead.
 *
 * @param array<string, mixed> $attributes
 */
protected function parseLNumber(string $str, array $attributes, bool $allowInvalidOctal = false): Int_ {
    try {
        $node = Int_::fromString($str, $attributes, $allowInvalidOctal);
    } catch (Error $parseError) {
        $this->emitError($parseError);
        // Use dummy value
        $node = new Int_(0, $attributes);
    }

    return $node;
}
|
|
|
|
|
2017-01-24 00:38:55 -07:00
|
|
|
/**
 * Parse a T_NUM_STRING token into either an integer or string node.
 *
 * An integer node is produced only if the string is "0" or an optionally negated decimal
 * without leading zero, and its numeric value is an int. Everything else stays a string node.
 *
 * @param string $str Number string
 * @param array<string, mixed> $attributes Attributes
 *
 * @return Int_|String_ Integer or string node.
 */
protected function parseNumString(string $str, array $attributes) {
    if (preg_match('/^(?:0|-?[1-9][0-9]*)$/', $str)) {
        $value = +$str;
        if (\is_int($value)) {
            return new Int_($value, $attributes);
        }
    }

    return new String_($str, $attributes);
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Removes up to $indentLen leading space/tab characters from the lines of $string.
 *
 * A line start is the position after a "\n" and, if $newlineAtStart is set, also the start of
 * the string. Errors are emitted (with $attributes) if the removed prefix contains the
 * indentation character other than $indentChar, or if the prefix is shorter than $indentLen
 * and the line is not immediately ended (by "\r"/"\n", or by the end of the string if
 * $newlineAtEnd is set).
 *
 * @param array<string, mixed> $attributes
 */
protected function stripIndentation(
    string $string, int $indentLen, string $indentChar,
    bool $newlineAtStart, bool $newlineAtEnd, array $attributes
): string {
    if ($indentLen === 0) {
        return $string;
    }

    $lineStart = '(?<=\n)';
    if ($newlineAtStart) {
        $lineStart = '(?:(?<=\n)|\A)';
    }
    $lineEnd = '(?=[\r\n])';
    if ($newlineAtEnd) {
        $lineEnd = '(?:(?=[\r\n])|\z)';
    }
    // Group 1 captures the leading whitespace, group 2 only participates for blank lines.
    $pattern = '/' . $lineStart . '([ \t]*)(' . $lineEnd . ')?/';

    $stripLine = function ($matches) use ($indentLen, $indentChar, $attributes) {
        $consumed = substr($matches[1], 0, $indentLen);
        $otherChar = $indentChar === " " ? "\t" : " ";
        if (strpos($consumed, $otherChar) !== false) {
            $this->emitError(new Error(
                'Invalid indentation - tabs and spaces cannot be mixed', $attributes
            ));
        } elseif (!isset($matches[2]) && strlen($consumed) < $indentLen) {
            $this->emitError(new Error(
                'Invalid body indentation level ' .
                '(expecting an indentation level of at least ' . $indentLen . ')',
                $attributes
            ));
        }
        return substr($matches[0], strlen($consumed));
    };

    return preg_replace_callback($pattern, $stripLine, $string);
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Creates the node for a heredoc/nowdoc string.
 *
 * The "kind", "docLabel" and "docIndentation" attributes are added, the indentation of the
 * closing token is stripped from the contents and the trailing newline is removed. String
 * contents produce a String_ node; a list of parts produces an InterpolatedString node from
 * which string parts that end up empty are dropped.
 *
 * @param string|(Expr|InterpolatedStringPart)[] $contents
 * @param array<string, mixed> $attributes
 * @param array<string, mixed> $endTokenAttributes
 */
protected function parseDocString(
    string $startToken, $contents, string $endToken,
    array $attributes, array $endTokenAttributes, bool $parseUnicodeEscape
): Expr {
    // A single quote in the opening token selects the nowdoc kind.
    $kind = String_::KIND_NOWDOC;
    if (strpos($startToken, "'") === false) {
        $kind = String_::KIND_HEREDOC;
    }

    $labelRegex = '/\A[bB]?<<<[ \t]*[\'"]?([a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*)[\'"]?(?:\r\n|\n|\r)\z/';
    $matched = preg_match($labelRegex, $startToken, $startMatch);
    assert($matched === 1);
    $label = $startMatch[1];

    $matched = preg_match('/\A[ \t]*/', $endToken, $endMatch);
    assert($matched === 1);
    $indentation = $endMatch[0];

    $attributes['kind'] = $kind;
    $attributes['docLabel'] = $label;
    $attributes['docIndentation'] = $indentation;

    $usesSpaces = strpos($indentation, " ") !== false;
    $usesTabs = strpos($indentation, "\t") !== false;
    if ($usesSpaces && $usesTabs) {
        $this->emitError(new Error(
            'Invalid indentation - tabs and spaces cannot be mixed',
            $endTokenAttributes
        ));

        // Proceed processing as if this doc string is not indented
        $indentation = '';
    }

    $indentLen = \strlen($indentation);
    $indentChar = $usesSpaces ? " " : "\t";

    if (\is_string($contents)) {
        if ($contents === '') {
            $attributes['rawValue'] = $contents;
            return new String_('', $attributes);
        }

        $contents = $this->stripIndentation(
            $contents, $indentLen, $indentChar, true, true, $attributes
        );
        $contents = preg_replace('~(\r\n|\n|\r)\z~', '', $contents);
        $attributes['rawValue'] = $contents;

        // Escape sequences are only interpreted for the heredoc kind.
        if ($kind === String_::KIND_HEREDOC) {
            $contents = String_::parseEscapeSequences($contents, null, $parseUnicodeEscape);
        }

        return new String_($contents, $attributes);
    }

    assert(count($contents) > 0);
    $first = $contents[0];
    if (!$first instanceof Node\InterpolatedStringPart) {
        // If there is no leading encapsed string part, pretend there is an empty one
        $this->stripIndentation(
            '', $indentLen, $indentChar, true, false, $first->getAttributes()
        );
    }

    $lastIndex = \count($contents) - 1;
    $parts = [];
    foreach ($contents as $index => $part) {
        if (!$part instanceof Node\InterpolatedStringPart) {
            $parts[] = $part;
            continue;
        }

        $atEnd = $index === $lastIndex;
        $part->value = $this->stripIndentation(
            $part->value, $indentLen, $indentChar,
            $index === 0, $atEnd, $part->getAttributes()
        );
        if ($atEnd) {
            $part->value = preg_replace('~(\r\n|\n|\r)\z~', '', $part->value);
        }
        // The raw value is recorded before escape sequences are interpreted.
        $part->setAttribute('rawValue', $part->value);
        $part->value = String_::parseEscapeSequences($part->value, null, $parseUnicodeEscape);
        if ($part->value !== '') {
            $parts[] = $part;
        }
    }

    return new InterpolatedString($parts, $attributes);
}
|
|
|
|
|
2023-07-29 15:10:11 +02:00
|
|
|
/**
 * Creates a Comment (or Comment\Doc for T_DOC_COMMENT) from a comment token.
 *
 * Both classes receive the same constructor arguments: the token text, line and position
 * with $tokenPos, followed by the token's end line, its end position minus one and $tokenPos.
 *
 * @param Token $token Token with id T_COMMENT or T_DOC_COMMENT
 * @param int $tokenPos Position of the token, used as start and end token position
 */
protected function createCommentFromToken(Token $token, int $tokenPos): Comment {
    assert($token->id === \T_COMMENT || $token->id === \T_DOC_COMMENT);

    // Built once so the two comment classes cannot drift apart in their arguments.
    $args = [
        $token->text, $token->line, $token->pos, $tokenPos,
        $token->getEndLine(), $token->getEndPos() - 1, $tokenPos,
    ];

    return \T_DOC_COMMENT === $token->id
        ? new Comment\Doc(...$args)
        : new Comment(...$args);
}
|
|
|
|
|
2023-08-13 12:45:21 +02:00
|
|
|
/**
 * Get last comment before the given token position, if any
 *
 * Walks backwards from the token preceding $tokenPos and stops at the first token whose id
 * is not in $this->dropTokens.
 */
protected function getCommentBeforeToken(int $tokenPos): ?Comment {
    for ($pos = $tokenPos - 1; $pos >= 0; --$pos) {
        $candidate = $this->tokens[$pos];
        if (!isset($this->dropTokens[$candidate->id])) {
            return null;
        }

        $isComment = $candidate->id === \T_COMMENT || $candidate->id === \T_DOC_COMMENT;
        if ($isComment) {
            return $this->createCommentFromToken($candidate, $pos);
        }
    }

    return null;
}
|
|
|
|
|
2019-05-11 20:01:25 +02:00
|
|
|
/**
 * Create a zero-length nop to capture preceding comments, if any.
 *
 * The nop is placed directly after the comment found before $tokenPos: its start positions
 * are one past the comment's end positions, while its end positions equal them.
 */
protected function maybeCreateZeroLengthNop(int $tokenPos): ?Nop {
    $comment = $this->getCommentBeforeToken($tokenPos);
    if (null === $comment) {
        return null;
    }

    $line = $comment->getEndLine();
    $filePos = $comment->getEndFilePos();
    $endTokenPos = $comment->getEndTokenPos();

    return new Nop([
        'startLine' => $line,
        'endLine' => $line,
        'startFilePos' => $filePos + 1,
        'endFilePos' => $filePos,
        'startTokenPos' => $endTokenPos + 1,
        'endTokenPos' => $endTokenPos,
    ]);
}
|
2020-02-09 17:10:33 +01:00
|
|
|
|
2023-07-29 15:10:11 +02:00
|
|
|
/**
 * Creates a nop spanning the given token range, but only if a comment precedes
 * $tokenStartPos; otherwise null is returned.
 */
protected function maybeCreateNop(int $tokenStartPos, int $tokenEndPos): ?Nop {
    $hasComment = $this->getCommentBeforeToken($tokenStartPos) !== null;

    return $hasComment
        ? new Nop($this->getAttributes($tokenStartPos, $tokenEndPos))
        : null;
}
|
|
|
|
|
|
|
|
/**
 * Handles __halt_compiler(): moves the token position to the second-to-last token so that no
 * further tokens are returned, and yields the text after __halt_compiler.
 *
 * @return string Text of the following token if it is T_INLINE_HTML, otherwise ''
 */
protected function handleHaltCompiler(): string {
    $following = $this->tokens[$this->tokenPos + 1];

    // Prevent the lexer from returning any further tokens.
    $this->tokenPos = \count($this->tokens) - 2;

    if ($following->id === \T_INLINE_HTML) {
        return $following->text;
    }
    return '';
}
|
|
|
|
|
|
|
|
/**
 * Checks whether the inline HTML token at the given stack position is preceded by a newline.
 *
 * For the very first token this is always true. Otherwise the preceding token (asserted to
 * be T_CLOSE_TAG) is inspected for a "\n" or "\r" character.
 *
 * @param int $stackPos Stack location of the T_INLINE_HTML token
 */
protected function inlineHtmlHasLeadingNewline(int $stackPos): bool {
    $tokenPos = $this->tokenStartStack[$stackPos];
    $token = $this->tokens[$tokenPos];
    assert($token->id === \T_INLINE_HTML);

    if ($tokenPos === 0 || $tokenPos < 0) {
        return true;
    }

    $prevToken = $this->tokens[$tokenPos - 1];
    assert($prevToken->id === \T_CLOSE_TAG);

    // Single scan for either newline character.
    return false !== strpbrk($prevToken->text, "\n\r");
}
|
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Returns the attributes for an empty element; these are the attributes of the token at
 * $tokenPos.
 *
 * @return array<string, mixed>
 */
protected function createEmptyElemAttributes(int $tokenPos): array {
    $attributes = $this->getAttributesForToken($tokenPos);

    return $attributes;
}
|
|
|
|
|
|
|
|
/**
 * Converts an Array_ node into a List_ node of kind KIND_ARRAY.
 *
 * The array is detached from $this->createdArrays. Items whose value is an Error placeholder
 * become null, and items whose value is itself an Array_ are converted recursively.
 */
protected function fixupArrayDestructuring(Array_ $node): Expr\List_ {
    $this->createdArrays->detach($node);

    $convertItem = function (Node\ArrayItem $item) {
        $value = $item->value;
        if ($value instanceof Expr\Error) {
            // We used Error as a placeholder for empty elements, which are legal for destructuring.
            return null;
        }
        if (!$value instanceof Array_) {
            return $item;
        }
        return new Node\ArrayItem(
            $this->fixupArrayDestructuring($value),
            $item->key, $item->byRef, $item->getAttributes());
    };

    $items = array_map($convertItem, $node->items);
    $attributes = ['kind' => Expr\List_::KIND_ARRAY] + $node->getAttributes();

    return new Expr\List_($items, $attributes);
}
|
|
|
|
|
2022-09-01 21:23:14 +02:00
|
|
|
/**
 * Replaces list items whose value is an Error placeholder with null.
 */
protected function postprocessList(Expr\List_ $node): void {
    foreach ($node->items as $index => $element) {
        if (!$element->value instanceof Expr\Error) {
            continue;
        }
        // We used Error as a placeholder for empty elements, which are legal for destructuring.
        $node->items[$index] = null;
    }
}
|
|
|
|
|
2022-09-11 16:57:53 +02:00
|
|
|
/**
 * Makes sure a trailing nop statement carrying comments is part of the node, by copying the
 * nop's end attributes (where set) onto the node.
 *
 * @param ElseIf_|Else_ $node
 */
protected function fixupAlternativeElse($node): void {
    $count = \count($node->stmts);
    if ($count === 0) {
        return;
    }

    $tail = $node->stmts[$count - 1];
    if (!$tail instanceof Nop) {
        return;
    }

    $nopAttrs = $tail->getAttributes();
    foreach (['endLine', 'endFilePos', 'endTokenPos'] as $key) {
        if (isset($nopAttrs[$key])) {
            $node->setAttribute($key, $nopAttrs[$key]);
        }
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Runs Modifiers::verifyClassModifier() on the two modifier values. A thrown Error is given
 * the attributes of the stack position $modifierPos and emitted.
 */
protected function checkClassModifier(int $a, int $b, int $modifierPos): void {
    try {
        Modifiers::verifyClassModifier($a, $b);
    } catch (Error $violation) {
        $location = $this->getAttributesAt($modifierPos);
        $violation->setAttributes($location);
        $this->emitError($violation);
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Runs Modifiers::verifyModifier() on the two modifier values. A thrown Error is given the
 * attributes of the stack position $modifierPos and emitted.
 */
protected function checkModifier(int $a, int $b, int $modifierPos): void {
    // The error is caught and re-attributed here because verifyModifier() is also used elsewhere.
    try {
        Modifiers::verifyModifier($a, $b);
    } catch (Error $violation) {
        $location = $this->getAttributesAt($modifierPos);
        $violation->setAttributes($location);
        $this->emitError($violation);
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error, located at the default value, if a variadic parameter has a default value.
 */
protected function checkParam(Param $node): void {
    if (!$node->variadic || $node->default === null) {
        return;
    }

    $this->emitError(new Error(
        'Variadic parameter cannot have a default value',
        $node->default->getAttributes()
    ));
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error if a try statement has neither catch clauses nor a finally clause.
 */
protected function checkTryCatch(TryCatch $node): void {
    if ($node->catches || $node->finally !== null) {
        return;
    }

    $this->emitError(new Error(
        'Cannot use try without catch or finally', $node->getAttributes()
    ));
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error for every namespace declaration found directly inside the statements of
 * the given namespace. Nothing is checked if the namespace has no statement list.
 */
protected function checkNamespace(Namespace_ $node): void {
    foreach ($node->stmts ?? [] as $child) {
        if (!$child instanceof Namespace_) {
            continue;
        }
        $this->emitError(new Error(
            'Namespace declarations cannot be nested', $child->getAttributes()
        ));
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error, located at stack position $namePos, if the given name is a special class
 * name. A null name is accepted without any check.
 */
private function checkClassName(?Identifier $name, int $namePos): void {
    if ($name === null || !$name->isSpecialClassName()) {
        return;
    }

    $message = sprintf('Cannot use \'%s\' as class name as it is reserved', $name);
    $this->emitError(new Error($message, $this->getAttributesAt($namePos)));
}
|
2016-10-09 00:59:44 +02:00
|
|
|
|
2022-09-17 17:12:55 +02:00
|
|
|
/**
 * Emits an error for every interface name that is a special class name.
 *
 * @param Name[] $interfaces
 */
private function checkImplementedInterfaces(array $interfaces): void {
    foreach ($interfaces as $interface) {
        if (!$interface->isSpecialClassName()) {
            continue;
        }

        $message = sprintf('Cannot use \'%s\' as interface name as it is reserved', $interface);
        $this->emitError(new Error($message, $interface->getAttributes()));
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Checks a class declaration for reserved names: first the class name (located at stack
 * position $namePos), then the extended class, then the implemented interfaces.
 */
protected function checkClass(Class_ $node, int $namePos): void {
    $this->checkClassName($node->name, $namePos);

    $parent = $node->extends;
    if ($parent && $parent->isSpecialClassName()) {
        $message = sprintf('Cannot use \'%s\' as class name as it is reserved', $parent);
        $this->emitError(new Error($message, $parent->getAttributes()));
    }

    $this->checkImplementedInterfaces($node->implements);
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Checks an interface declaration for reserved names: first the interface name (located at
 * stack position $namePos), then the extended interfaces.
 */
protected function checkInterface(Interface_ $node, int $namePos): void {
    $declaredName = $node->name;
    $this->checkClassName($declaredName, $namePos);

    $parents = $node->extends;
    $this->checkImplementedInterfaces($parents);
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Checks an enum declaration for reserved names: first the enum name (located at stack
 * position $namePos), then the implemented interfaces.
 */
protected function checkEnum(Enum_ $node, int $namePos): void {
    $declaredName = $node->name;
    $this->checkClassName($declaredName, $namePos);

    $interfaces = $node->implements;
    $this->checkImplementedInterfaces($interfaces);
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Checks the modifiers of a class method: __construct, __destruct and __clone cannot be
 * static, and no method can be readonly. Errors are located at stack position $modifierPos.
 */
protected function checkClassMethod(ClassMethod $node, int $modifierPos): void {
    if ($node->flags & Modifiers::STATIC) {
        // Error message format per method (lowercased name) that cannot be static.
        $nonStaticMethods = [
            '__construct' => 'Constructor %s() cannot be static',
            '__destruct' => 'Destructor %s() cannot be static',
            '__clone' => 'Clone method %s() cannot be static',
        ];
        $format = $nonStaticMethods[$node->name->toLowerString()] ?? null;
        if ($format !== null) {
            $this->emitError(new Error(
                sprintf($format, $node->name),
                $this->getAttributesAt($modifierPos)));
        }
    }

    if ($node->flags & Modifiers::READONLY) {
        $message = sprintf('Method %s() cannot be readonly', $node->name);
        $this->emitError(new Error($message, $this->getAttributesAt($modifierPos)));
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error, located at stack position $modifierPos, for each of the static, abstract
 * and readonly modifiers that is set on a class constant.
 */
protected function checkClassConst(ClassConst $node, int $modifierPos): void {
    $forbidden = [Modifiers::STATIC, Modifiers::ABSTRACT, Modifiers::READONLY];
    foreach ($forbidden as $flag) {
        if (!($node->flags & $flag)) {
            continue;
        }

        $message = "Cannot use '" . Modifiers::toString($flag) . "' as constant modifier";
        $this->emitError(new Error($message, $this->getAttributesAt($modifierPos)));
    }
}
|
|
|
|
|
2022-09-11 17:51:59 +02:00
|
|
|
/**
 * Emits an error, located at stack position $namePos, if the alias of a use item is a
 * special class name.
 */
protected function checkUseUse(UseItem $node, int $namePos): void {
    $alias = $node->alias;
    if (!$alias || !$alias->isSpecialClassName()) {
        return;
    }

    $message = sprintf(
        'Cannot use %s as %s because \'%2$s\' is a special class name',
        $node->name, $alias
    );
    $this->emitError(new Error($message, $this->getAttributesAt($namePos)));
}
|
2022-06-19 18:05:52 +02:00
|
|
|
|
2024-12-11 11:34:55 +01:00
|
|
|
/**
 * Emits an error, located at stack position $hookPos, if the property statement declares
 * more than one property.
 */
protected function checkPropertyHooksForMultiProperty(Property $property, int $hookPos): void {
    if (\count($property->props) <= 1) {
        return;
    }

    $this->emitError(new Error(
        'Cannot use hooks when declaring multiple properties',
        $this->getAttributesAt($hookPos)
    ));
}
|
|
|
|
|
2024-07-14 21:29:58 +02:00
|
|
|
/**
 * Emits an error, located at stack position $hookPos, if the hook list is empty.
 *
 * @param PropertyHook[] $hooks
 */
protected function checkEmptyPropertyHookList(array $hooks, int $hookPos): void {
    if ($hooks) {
        return;
    }

    $this->emitError(new Error(
        'Property hook list cannot be empty',
        $this->getAttributesAt($hookPos)
    ));
}
|
|
|
|
|
|
|
|
/**
 * Checks a property hook: its name (compared in lowercase) has to be "get" or "set", and a
 * get hook must not have a parameter list.
 *
 * @param PropertyHook $hook Hook to check
 * @param int|null $paramListPos Stack position of the parameter list, or null if there is none
 */
protected function checkPropertyHook(PropertyHook $hook, ?int $paramListPos): void {
    $kind = $hook->name->toLowerString();

    if ($kind === 'get') {
        if ($paramListPos !== null) {
            $this->emitError(new Error(
                'get hook must not have a parameter list', $this->getAttributesAt($paramListPos)));
        }
        return;
    }

    if ($kind !== 'set') {
        $this->emitError(new Error(
            'Unknown hook "' . $hook->name . '", expected "get" or "set"',
            $hook->name->getAttributes()));
    }
}
|
|
|
|
|
|
|
|
/**
 * Checks a modifier applied to a property hook.
 *
 * The combination is first verified like any other modifier pair (errors are located at
 * stack position $modifierPos). Additionally, an error is emitted if $b is any modifier
 * other than final.
 *
 * @param int $a Modifier value passed as first argument to the modifier verification
 * @param int $b Modifier value passed as second argument; must be Modifiers::FINAL
 * @param int $modifierPos Stack position used to locate errors
 */
protected function checkPropertyHookModifiers(int $a, int $b, int $modifierPos): void {
    // Same verification and error attribution as for regular modifiers.
    $this->checkModifier($a, $b, $modifierPos);

    if ($b !== Modifiers::FINAL) {
        $this->emitError(new Error(
            'Cannot use the ' . Modifiers::toString($b) . ' modifier on a property hook',
            $this->getAttributesAt($modifierPos)));
    }
}
|
|
|
|
|
2024-09-01 12:35:12 +02:00
|
|
|
/**
 * Whether the argument list is empty, or consists of exactly one Arg that is unnamed, not
 * by-reference and not unpacked.
 *
 * @param array<Node\Arg|Node\VariadicPlaceholder> $args
 */
private function isSimpleExit(array $args): bool {
    $count = \count($args);
    if ($count > 1) {
        return false;
    }
    if ($count === 0) {
        return true;
    }

    $only = $args[0];
    if (!$only instanceof Arg) {
        return false;
    }
    return $only->name === null
        && $only->byRef === false
        && $only->unpack === false;
}
|
|
|
|
|
|
|
|
/**
 * Creates the expression for an exit/die call.
 *
 * Simple argument lists (see isSimpleExit()) produce an Exit_ node whose "kind" attribute is
 * KIND_EXIT if the lowercased name is "exit" and KIND_DIE otherwise. Any other argument list
 * produces a FuncCall with the given name.
 *
 * @param array<Node\Arg|Node\VariadicPlaceholder> $args
 * @param array<string, mixed> $attrs
 */
protected function createExitExpr(string $name, int $namePos, array $args, array $attrs): Expr {
    if (!$this->isSimpleExit($args)) {
        $callee = new Name($name, $this->getAttributesAt($namePos));
        return new Expr\FuncCall($callee, $args, $attrs);
    }

    // Create Exit node for backwards compatibility.
    $attrs['kind'] = strtolower($name) === 'exit' ? Expr\Exit_::KIND_EXIT : Expr\Exit_::KIND_DIE;
    $status = \count($args) === 1 ? $args[0]->value : null;

    return new Expr\Exit_($status, $attrs);
}
|
|
|
|
|
2022-06-19 18:05:52 +02:00
|
|
|
/**
 * Creates the token map.
 *
 * The token map maps the PHP internal token identifiers
 * to the identifiers used by the Parser. Additionally it
 * maps T_OPEN_TAG_WITH_ECHO to T_ECHO and T_CLOSE_TAG to ';'.
 *
 * @return array<int, int> The token map
 */
protected function createTokenMap(): array {
    // Single-char tokens use an identity mapping.
    $externalMap = range(0, 255);

    // Symbols whose name starts with "T" are mapped from the global constant of that name
    // to the parser class constant of that name.
    foreach ($this->symbolToName as $symbolName) {
        if ($symbolName[0] !== 'T') {
            continue;
        }
        $externalMap[\constant($symbolName)] = constant(static::class . '::' . $symbolName);
    }

    // T_OPEN_TAG_WITH_ECHO with dropped T_OPEN_TAG results in T_ECHO
    $externalMap[\T_OPEN_TAG_WITH_ECHO] = static::T_ECHO;
    // T_CLOSE_TAG is equivalent to ';'
    $externalMap[\T_CLOSE_TAG] = ord(';');

    // We have created a map from PHP token IDs to external symbol IDs.
    // Now map them to the internal symbol ID, leaving out invalid symbols.
    $internalMap = [];
    foreach ($externalMap as $phpToken => $externalSymbol) {
        $internalSymbol = $this->tokenToSymbol[$externalSymbol];
        if ($internalSymbol !== $this->invalidSymbol) {
            $internalMap[$phpToken] = $internalSymbol;
        }
    }

    return $internalMap;
}
|
2014-04-20 00:08:59 +02:00
|
|
|
}
|