php-parser/test/PhpParser/LexerTest.php

298 lines
11 KiB
PHP
Raw Normal View History

<?php declare(strict_types=1);
2011-07-13 12:24:10 +02:00
namespace PhpParser;
use PhpParser\Parser\Tokens;
class LexerTest extends \PHPUnit\Framework\TestCase
2011-07-13 12:24:10 +02:00
{
/* To allow overwriting in parent class */
2017-08-13 14:35:03 +02:00
protected function getLexer(array $options = []) {
return new Lexer($options);
}
2011-07-13 12:24:10 +02:00
/**
* @dataProvider provideTestError
*/
public function testError($code, $messages) {
if (defined('HHVM_VERSION')) {
$this->markTestSkipped('HHVM does not throw warnings from token_get_all()');
}
$errorHandler = new ErrorHandler\Collecting();
$lexer = $this->getLexer(['usedAttributes' => [
'comments', 'startLine', 'endLine', 'startFilePos', 'endFilePos'
]]);
$lexer->startLexing($code, $errorHandler);
$errors = $errorHandler->getErrors();
2011-07-13 12:24:10 +02:00
2017-12-12 12:02:49 +01:00
$this->assertCount(count($messages), $errors);
for ($i = 0; $i < count($messages); $i++) {
$this->assertSame($messages[$i], $errors[$i]->getMessageWithColumnInfo($code));
2011-07-13 12:24:10 +02:00
}
}
public function provideTestError() {
2017-08-13 14:35:03 +02:00
return [
["<?php /*", ["Unterminated comment from 1:7 to 1:9"]],
["<?php /*\n", ["Unterminated comment from 1:7 to 2:1"]],
2017-08-13 14:35:03 +02:00
["<?php \1", ["Unexpected character \"\1\" (ASCII 1) from 1:7 to 1:7"]],
["<?php \0", ["Unexpected null byte from 1:7 to 1:7"]],
// Error with potentially emulated token
2017-08-13 14:35:03 +02:00
["<?php ?? \0", ["Unexpected null byte from 1:10 to 1:10"]],
["<?php\n\0\1 foo /* bar", [
"Unexpected null byte from 2:1 to 2:1",
"Unexpected character \"\1\" (ASCII 1) from 2:2 to 2:2",
"Unterminated comment from 2:8 to 2:14"
2017-08-13 14:35:03 +02:00
]],
];
2011-07-13 12:24:10 +02:00
}
/**
* @dataProvider provideTestLex
*/
public function testLex($code, $options, $tokens) {
$lexer = $this->getLexer($options);
$lexer->startLexing($code);
while ($id = $lexer->getNextToken($value, $startAttributes, $endAttributes)) {
2011-07-13 12:24:10 +02:00
$token = array_shift($tokens);
2014-09-30 20:38:09 +02:00
$this->assertSame($token[0], $id);
$this->assertSame($token[1], $value);
$this->assertEquals($token[2], $startAttributes);
$this->assertEquals($token[3], $endAttributes);
2011-07-13 12:24:10 +02:00
}
}
public function provideTestLex() {
2017-08-13 14:35:03 +02:00
return [
// tests conversion of closing PHP tag and drop of whitespace and opening tags
2017-08-13 14:35:03 +02:00
[
'<?php tokens ?>plaintext',
2017-08-13 14:35:03 +02:00
[],
[
[
Tokens::T_STRING, 'tokens',
2017-08-13 14:35:03 +02:00
['startLine' => 1], ['endLine' => 1]
],
[
ord(';'), '?>',
2017-08-13 14:35:03 +02:00
['startLine' => 1], ['endLine' => 1]
],
[
Tokens::T_INLINE_HTML, 'plaintext',
2017-08-13 14:35:03 +02:00
['startLine' => 1, 'hasLeadingNewline' => false],
['endLine' => 1]
],
]
],
2011-07-13 13:27:14 +02:00
// tests line numbers
2017-08-13 14:35:03 +02:00
[
2011-07-13 13:27:14 +02:00
'<?php' . "\n" . '$ token /** doc' . "\n" . 'comment */ $',
2017-08-13 14:35:03 +02:00
[],
[
[
ord('$'), '$',
2017-08-13 14:35:03 +02:00
['startLine' => 2], ['endLine' => 2]
],
[
Tokens::T_STRING, 'token',
2017-08-13 14:35:03 +02:00
['startLine' => 2], ['endLine' => 2]
],
[
ord('$'), '$',
2017-08-13 14:35:03 +02:00
[
'startLine' => 3,
2017-08-13 14:35:03 +02:00
'comments' => [
new Comment\Doc('/** doc' . "\n" . 'comment */',
2, 14, 5,
3, 31, 5),
2017-08-13 14:35:03 +02:00
]
],
['endLine' => 3]
],
]
],
// tests comment extraction
2017-08-13 14:35:03 +02:00
[
'<?php /* comment */ // comment' . "\n" . '/** docComment 1 *//** docComment 2 */ token',
2017-08-13 14:35:03 +02:00
[],
[
[
Tokens::T_STRING, 'token',
2017-08-13 14:35:03 +02:00
[
'startLine' => 2,
2017-08-13 14:35:03 +02:00
'comments' => [
new Comment('/* comment */',
1, 6, 1, 1, 18, 1),
new Comment('// comment',
1, 20, 3, 1, 29, 3),
new Comment\Doc('/** docComment 1 */',
2, 31, 5, 2, 49, 5),
new Comment\Doc('/** docComment 2 */',
2, 50, 6, 2, 68, 6),
2017-08-13 14:35:03 +02:00
],
],
['endLine' => 2]
],
]
],
// tests differing start and end line
2017-08-13 14:35:03 +02:00
[
'<?php "foo' . "\n" . 'bar"',
2017-08-13 14:35:03 +02:00
[],
[
[
Tokens::T_CONSTANT_ENCAPSED_STRING, '"foo' . "\n" . 'bar"',
2017-08-13 14:35:03 +02:00
['startLine' => 1], ['endLine' => 2]
],
]
],
// tests exact file offsets
2017-08-13 14:35:03 +02:00
[
'<?php "a";' . "\n" . '// foo' . "\n" . '"b";',
2017-08-13 14:35:03 +02:00
['usedAttributes' => ['startFilePos', 'endFilePos']],
[
[
Tokens::T_CONSTANT_ENCAPSED_STRING, '"a"',
2017-08-13 14:35:03 +02:00
['startFilePos' => 6], ['endFilePos' => 8]
],
[
ord(';'), ';',
2017-08-13 14:35:03 +02:00
['startFilePos' => 9], ['endFilePos' => 9]
],
[
Tokens::T_CONSTANT_ENCAPSED_STRING, '"b"',
2017-08-13 14:35:03 +02:00
['startFilePos' => 18], ['endFilePos' => 20]
],
[
ord(';'), ';',
2017-08-13 14:35:03 +02:00
['startFilePos' => 21], ['endFilePos' => 21]
],
]
],
// tests token offsets
2017-08-13 14:35:03 +02:00
[
'<?php "a";' . "\n" . '// foo' . "\n" . '"b";',
2017-08-13 14:35:03 +02:00
['usedAttributes' => ['startTokenPos', 'endTokenPos']],
[
[
Tokens::T_CONSTANT_ENCAPSED_STRING, '"a"',
2017-08-13 14:35:03 +02:00
['startTokenPos' => 1], ['endTokenPos' => 1]
],
[
ord(';'), ';',
2017-08-13 14:35:03 +02:00
['startTokenPos' => 2], ['endTokenPos' => 2]
],
[
Tokens::T_CONSTANT_ENCAPSED_STRING, '"b"',
['startTokenPos' => 6], ['endTokenPos' => 6]
2017-08-13 14:35:03 +02:00
],
[
ord(';'), ';',
['startTokenPos' => 7], ['endTokenPos' => 7]
2017-08-13 14:35:03 +02:00
],
]
],
// tests all attributes being disabled
2017-08-13 14:35:03 +02:00
[
'<?php /* foo */ $bar;',
2017-08-13 14:35:03 +02:00
['usedAttributes' => []],
[
[
Tokens::T_VARIABLE, '$bar',
2017-08-13 14:35:03 +02:00
[], []
],
[
ord(';'), ';',
2017-08-13 14:35:03 +02:00
[], []
]
]
],
// tests no tokens
2017-08-13 14:35:03 +02:00
[
'',
2017-08-13 14:35:03 +02:00
[],
[]
],
// tests PHP 8 T_NAME_* emulation
[
'<?php Foo\Bar \Foo\Bar namespace\Foo\Bar Foo\Bar\\',
['usedAttributes' => []],
[
[Tokens::T_NAME_QUALIFIED, 'Foo\Bar', [], []],
[Tokens::T_NAME_FULLY_QUALIFIED, '\Foo\Bar', [], []],
[Tokens::T_NAME_RELATIVE, 'namespace\Foo\Bar', [], []],
[Tokens::T_NAME_QUALIFIED, 'Foo\Bar', [], []],
[Tokens::T_NS_SEPARATOR, '\\', [], []],
2020-08-09 21:11:49 +02:00
]
],
// tests PHP 8 T_NAME_* emulation with reserved keywords
[
'<?php fn\use \fn\use namespace\fn\use fn\use\\',
['usedAttributes' => []],
[
[Tokens::T_NAME_QUALIFIED, 'fn\use', [], []],
[Tokens::T_NAME_FULLY_QUALIFIED, '\fn\use', [], []],
[Tokens::T_NAME_RELATIVE, 'namespace\fn\use', [], []],
[Tokens::T_NAME_QUALIFIED, 'fn\use', [], []],
[Tokens::T_NS_SEPARATOR, '\\', [], []],
]
],
2017-08-13 14:35:03 +02:00
];
2011-07-13 12:24:10 +02:00
}
/**
* @dataProvider provideTestHaltCompiler
*/
public function testHandleHaltCompiler($code, $remaining) {
$lexer = $this->getLexer();
$lexer->startLexing($code);
2011-07-13 12:24:10 +02:00
while (Tokens::T_HALT_COMPILER !== $lexer->getNextToken());
2011-07-13 12:24:10 +02:00
$this->assertSame($remaining, $lexer->handleHaltCompiler());
$this->assertSame(0, $lexer->getNextToken());
2011-07-13 12:24:10 +02:00
}
public function provideTestHaltCompiler() {
2017-08-13 14:35:03 +02:00
return [
['<?php ... __halt_compiler();Remaining Text', 'Remaining Text'],
['<?php ... __halt_compiler ( ) ;Remaining Text', 'Remaining Text'],
['<?php ... __halt_compiler() ?>Remaining Text', 'Remaining Text'],
2011-07-13 12:24:10 +02:00
//array('<?php ... __halt_compiler();' . "\0", "\0"),
//array('<?php ... __halt_compiler /* */ ( ) ;Remaining Text', 'Remaining Text'),
2017-08-13 14:35:03 +02:00
];
2011-07-13 12:24:10 +02:00
}
2015-06-20 12:09:03 +02:00
public function testHandleHaltCompilerError() {
$this->expectException(Error::class);
$this->expectExceptionMessage('__HALT_COMPILER must be followed by "();"');
2015-06-20 12:09:03 +02:00
$lexer = $this->getLexer();
$lexer->startLexing('<?php ... __halt_compiler invalid ();');
2015-06-20 12:34:20 +02:00
while (Tokens::T_HALT_COMPILER !== $lexer->getNextToken());
2015-06-20 12:09:03 +02:00
$lexer->handleHaltCompiler();
}
public function testGetTokens() {
$code = '<?php "a";' . "\n" . '// foo' . "\n" . '// bar' . "\n\n" . '"b";';
2017-08-13 14:35:03 +02:00
$expectedTokens = [
[T_OPEN_TAG, '<?php ', 1],
[T_CONSTANT_ENCAPSED_STRING, '"a"', 1],
';',
2017-08-13 14:35:03 +02:00
[T_WHITESPACE, "\n", 1],
[T_COMMENT, '// foo', 2],
[T_WHITESPACE, "\n", 2],
[T_COMMENT, '// bar', 3],
[T_WHITESPACE, "\n\n", 3],
[T_CONSTANT_ENCAPSED_STRING, '"b"', 5],
';',
2017-08-13 14:35:03 +02:00
];
$lexer = $this->getLexer();
$lexer->startLexing($code);
$this->assertSame($expectedTokens, $lexer->getTokens());
}
}