2017-08-18 22:57:27 +02:00
|
|
|
<?php declare(strict_types=1);
|
2011-12-18 13:04:27 +01:00
|
|
|
|
2014-02-06 14:44:16 +01:00
|
|
|
namespace PhpParser\Lexer;
|
|
|
|
|
2018-04-28 22:14:16 +02:00
|
|
|
use PhpParser\Error;
|
|
|
|
use PhpParser\ErrorHandler;
|
2019-05-09 14:17:28 +02:00
|
|
|
use PhpParser\Lexer;
|
|
|
|
use PhpParser\Lexer\TokenEmulator\CoaleseEqualTokenEmulator;
|
|
|
|
use PhpParser\Lexer\TokenEmulator\FnTokenEmulator;
|
2020-07-15 21:40:05 +02:00
|
|
|
use PhpParser\Lexer\TokenEmulator\MatchTokenEmulator;
|
2020-08-02 10:30:44 +02:00
|
|
|
use PhpParser\Lexer\TokenEmulator\NullsafeTokenEmulator;
|
2019-06-30 12:13:28 +02:00
|
|
|
use PhpParser\Lexer\TokenEmulator\NumericLiteralSeparatorEmulator;
|
2019-05-09 14:17:28 +02:00
|
|
|
use PhpParser\Lexer\TokenEmulator\TokenEmulatorInterface;
|
2019-06-23 14:50:14 +02:00
|
|
|
use PhpParser\Parser\Tokens;
|
2018-04-28 22:14:16 +02:00
|
|
|
|
2019-05-09 14:17:28 +02:00
|
|
|
/**
 * Lexer that emulates tokens of newer PHP versions on older runtimes (and, for
 * emulators that support it, reverses them when targeting an older version).
 *
 * Emulation happens in two stages:
 *  1. Flexible heredoc/nowdoc syntax is rewritten in the source code before it is
 *     handed to the parent lexer; the rewrites are recorded as "patches" and undone
 *     on the resulting tokens and errors afterwards.
 *  2. The registered token emulators post-process the token array.
 */
class Emulative extends Lexer
{
    const PHP_7_3 = '7.3dev';
    const PHP_7_4 = '7.4dev';
    const PHP_8_0 = '8.0dev';

    /**
     * Matches a heredoc/nowdoc from its opening "<<<" up to and including its closing
     * label. The named group "indentation" captures horizontal whitespace in front of
     * the closing label, "separator" captures an optional ";" plus line break (or a
     * bare line break) right after it.
     *
     * The nowdoc body and closing marker are deliberately kept at column 0 so that this
     * file also parses on PHP versions without flexible heredoc/nowdoc support.
     */
    const FLEXIBLE_DOC_STRING_REGEX = <<<'REGEX'
/<<<[ \t]*(['"]?)([a-zA-Z_\x80-\xff][a-zA-Z0-9_\x80-\xff]*)\1\r?\n
(?:.*\r?\n)*?
(?<indentation>\h*)\2(?![a-zA-Z0-9_\x80-\xff])(?<separator>(?:;?[\r\n])?)/x
REGEX;

    /**
     * @var mixed[] Patches used to reverse changes introduced in the code.
     *              Each patch is a [position, type, text] triple where the position is
     *              an offset into the preprocessed code and the type is either 'add'
     *              (text was stripped and has to be re-inserted) or 'remove' (text was
     *              inserted and has to be stripped again).
     */
    private $patches = [];

    /** @var TokenEmulatorInterface[] */
    private $tokenEmulators = [];

    /** @var string PHP version whose token set should be produced */
    private $targetPhpVersion;

    /**
     * @param mixed[] $options Lexer options. In addition to the usual options,
     *                         accepts a 'phpVersion' string that specifies the
     *                         version to emulate. Defaults to newest supported.
     */
    public function __construct(array $options = [])
    {
        $this->targetPhpVersion = $options['phpVersion'] ?? Emulative::PHP_8_0;
        // 'phpVersion' is consumed here and not passed on to the parent lexer.
        unset($options['phpVersion']);

        parent::__construct($options);

        $this->tokenEmulators[] = new FnTokenEmulator();
        $this->tokenEmulators[] = new MatchTokenEmulator();
        $this->tokenEmulators[] = new CoaleseEqualTokenEmulator();
        $this->tokenEmulators[] = new NumericLiteralSeparatorEmulator();
        $this->tokenEmulators[] = new NullsafeTokenEmulator();
    }

    /**
     * Lexes the given code, applying heredoc/nowdoc preprocessing and token emulation
     * where required.
     *
     * @param string            $code         The source code to lex
     * @param ErrorHandler|null $errorHandler Receives lexing errors. When omitted, a
     *                                        throwing handler is used for errors that
     *                                        are collected on the emulation path.
     */
    public function startLexing(string $code, ErrorHandler $errorHandler = null)
    {
        $this->patches = [];

        if ($this->isEmulationNeeded($code) === false) {
            // Nothing to emulate, yay
            parent::startLexing($code, $errorHandler);
            return;
        }

        // Errors are collected first and re-reported further down once their positions
        // have been fixed up. Without a fallback, re-reporting would dereference null
        // when the caller did not supply a handler.
        if ($errorHandler === null) {
            $errorHandler = new ErrorHandler\Throwing();
        }

        $collector = new ErrorHandler\Collecting();

        // 1. emulation of heredoc and nowdoc new syntax
        $preparedCode = $this->processHeredocNowdoc($code);
        parent::startLexing($preparedCode, $collector);
        $this->fixupTokens();

        $errors = $collector->getErrors();
        if (!empty($errors)) {
            $this->fixupErrors($errors);
            foreach ($errors as $error) {
                $errorHandler->handleError($error);
            }
        }

        // 2. token-level emulation. Emulators always receive the original,
        // un-preprocessed code.
        foreach ($this->tokenEmulators as $tokenEmulator) {
            $emulatorPhpVersion = $tokenEmulator->getPhpVersion();
            if (version_compare(\PHP_VERSION, $emulatorPhpVersion, '<')
                && version_compare($this->targetPhpVersion, $emulatorPhpVersion, '>=')
                && $tokenEmulator->isEmulationNeeded($code)) {
                // Runtime is older than the emulator's version, target is not: emulate.
                $this->tokens = $tokenEmulator->emulate($code, $this->tokens);
            } elseif (version_compare(\PHP_VERSION, $emulatorPhpVersion, '>=')
                && version_compare($this->targetPhpVersion, $emulatorPhpVersion, '<')
                && $tokenEmulator->isEmulationNeeded($code)) {
                // Runtime is at least the emulator's version, target is older: reverse.
                $this->tokens = $tokenEmulator->reverseEmulate($code, $this->tokens);
            }
        }
    }

    /**
     * Whether the code may contain heredoc/nowdoc syntax that the running PHP version
     * cannot lex natively.
     */
    private function isHeredocNowdocEmulationNeeded(string $code): bool
    {
        // skip version where this works without emulation
        if (version_compare(\PHP_VERSION, self::PHP_7_3, '>=')) {
            return false;
        }

        return strpos($code, '<<<') !== false;
    }

    /**
     * Rewrites flexible heredoc/nowdoc strings into the classic form: indentation in
     * front of the closing label is stripped and a newline is inserted after the label
     * when no separator follows it. Every modification is recorded in $this->patches.
     *
     * @param string $code Original source code
     *
     * @return string Code with the rewrites applied (unchanged if none were necessary)
     */
    private function processHeredocNowdoc(string $code): string
    {
        if ($this->isHeredocNowdocEmulationNeeded($code) === false) {
            return $code;
        }

        if (!preg_match_all(self::FLEXIBLE_DOC_STRING_REGEX, $code, $matches, PREG_SET_ORDER|PREG_OFFSET_CAPTURE)) {
            // No heredoc/nowdoc found
            return $code;
        }

        // Keep track of how much we need to adjust string offsets due to the modifications we
        // already made
        $posDelta = 0;
        foreach ($matches as $match) {
            $indentation = $match['indentation'][0];
            $indentationStart = $match['indentation'][1];

            $separator = $match['separator'][0];
            $separatorStart = $match['separator'][1];

            if ($indentation === '' && $separator !== '') {
                // Ordinary heredoc/nowdoc
                continue;
            }

            if ($indentation !== '') {
                // Remove indentation
                $indentationLen = strlen($indentation);
                $code = substr_replace($code, '', $indentationStart + $posDelta, $indentationLen);
                $this->patches[] = [$indentationStart + $posDelta, 'add', $indentation];
                $posDelta -= $indentationLen;
            }

            if ($separator === '') {
                // Insert newline as separator
                $code = substr_replace($code, "\n", $separatorStart + $posDelta, 0);
                $this->patches[] = [$separatorStart + $posDelta, 'remove', "\n"];
                $posDelta += 1;
            }
        }

        return $code;
    }

    /**
     * Whether any registered token emulator, or the heredoc/nowdoc preprocessing,
     * reports that the code needs emulation.
     */
    private function isEmulationNeeded(string $code): bool
    {
        foreach ($this->tokenEmulators as $emulativeToken) {
            if ($emulativeToken->isEmulationNeeded($code)) {
                return true;
            }
        }

        return $this->isHeredocNowdocEmulationNeeded($code);
    }

    /**
     * Reverts the recorded patches on the lexed tokens, so that token contents match
     * the original (un-preprocessed) code again.
     */
    private function fixupTokens()
    {
        if (\count($this->patches) === 0) {
            return;
        }

        // Load first patch
        $patchIdx = 0;

        list($patchPos, $patchType, $patchText) = $this->patches[$patchIdx];

        // We use a manual loop over the tokens, because we modify the array on the fly
        $pos = 0;
        for ($i = 0, $c = \count($this->tokens); $i < $c; $i++) {
            $token = $this->tokens[$i];
            if (\is_string($token)) {
                // We assume that patches don't apply to string tokens
                $pos += \strlen($token);
                continue;
            }

            // $len is the token length in the preprocessed code; $posDelta tracks how
            // far earlier patches have already shifted offsets inside this token.
            $len = \strlen($token[1]);
            $posDelta = 0;
            while ($patchPos >= $pos && $patchPos < $pos + $len) {
                $patchTextLen = \strlen($patchText);
                if ($patchType === 'remove') {
                    if ($patchPos === $pos && $patchTextLen === $len) {
                        // Remove token entirely
                        array_splice($this->tokens, $i, 1, []);
                        $i--;
                        $c--;
                    } else {
                        // Remove from token string
                        $this->tokens[$i][1] = substr_replace(
                            $token[1], '', $patchPos - $pos + $posDelta, $patchTextLen
                        );
                        $posDelta -= $patchTextLen;
                    }
                } elseif ($patchType === 'add') {
                    // Insert into the token string
                    $this->tokens[$i][1] = substr_replace(
                        $token[1], $patchText, $patchPos - $pos + $posDelta, 0
                    );
                    $posDelta += $patchTextLen;
                } else {
                    assert(false);
                }

                // Fetch the next patch
                $patchIdx++;
                if ($patchIdx >= \count($this->patches)) {
                    // No more patches, we're done
                    return;
                }

                list($patchPos, $patchType, $patchText) = $this->patches[$patchIdx];

                // Multiple patches may apply to the same token. Reload the current one to check
                // If the new patch applies
                $token = $this->tokens[$i];
            }

            $pos += $len;
        }

        // A patch did not apply
        assert(false);
    }

    /**
     * Fixup line and position information in errors.
     *
     * For every error, the patches located before the error's start position are
     * accumulated into a byte and line delta, which is then applied to the error's
     * start/end file positions and lines.
     *
     * @param Error[] $errors
     */
    private function fixupErrors(array $errors)
    {
        foreach ($errors as $error) {
            $attrs = $error->getAttributes();

            $posDelta = 0;
            $lineDelta = 0;
            foreach ($this->patches as $patch) {
                list($patchPos, $patchType, $patchText) = $patch;
                if ($patchPos >= $attrs['startFilePos']) {
                    // No longer relevant
                    break;
                }

                if ($patchType === 'add') {
                    $posDelta += strlen($patchText);
                    $lineDelta += substr_count($patchText, "\n");
                } else {
                    $posDelta -= strlen($patchText);
                    $lineDelta -= substr_count($patchText, "\n");
                }
            }

            $attrs['startFilePos'] += $posDelta;
            $attrs['endFilePos'] += $posDelta;
            $attrs['startLine'] += $lineDelta;
            $attrs['endLine'] += $lineDelta;
            $error->setAttributes($attrs);
        }
    }
}
|