1, T_COMMENT => 1, T_OPEN_TAG => 1 ); /** * Creates a Lexer. * * @param string $code * * @throws PHPParser_Error on lexing errors (unterminated comment or unexpected character) */ public function __construct($code) { self::initTokenMap(); // Reset the error message in error_get_last() // Still hoping for a better solution to be found. @$errorGetLastResetUndefinedVariable; $this->code = $code; $this->tokens = @token_get_all($code); $this->pos = -1; $this->line = 1; $error = error_get_last(); if (preg_match( '~^Unterminated comment starting line ([0-9]+)$~', $error['message'], $matches ) ) { throw new PHPParser_Error('Unterminated comment', $matches[1]); } if (preg_match( '~^Unexpected character in input: \'(.)\' \(ASCII=([0-9]+)\)~s', $error['message'], $matches ) ) { throw new PHPParser_Error(sprintf( 'Unexpected character "%s" (ASCII %d)', $matches[1], $matches[2] )); } // PHP cuts error message after null byte, so need special case if (preg_match('~^Unexpected character in input: \'$~', $error['message'])) { throw new PHPParser_Error('Unexpected null byte'); } } /** * Returns the next token id. * * @param mixed $value Variable to store token content in * @param mixed $line Variable to store line in * @param mixed $docComment Variable to store doc comment in * * @return int Token id */ public function lex(&$value = null, &$line = null, &$docComment = null) { $docComment = null; while (isset($this->tokens[++$this->pos])) { $token = $this->tokens[$this->pos]; if (is_string($token)) { $value = $token; $line = $this->line; return ord($token); } else { $this->line += substr_count($token[1], "\n"); if (T_DOC_COMMENT === $token[0]) { $docComment = $token[1]; } elseif (!isset(self::$dropTokens[$token[0]])) { $value = $token[1]; $line = $token[2]; return self::$tokenMap[$token[0]]; } } } return 0; } /** * Handles __halt_compiler() by returning the text after it. * * @return string Remaining text */ public function handleHaltCompiler() { // get the length of the text before the T_HALT_COMPILER token $textBefore = ''; for ($i = 0; $i <= $this->pos; ++$i) { if (is_string($this->tokens[$i])) { $textBefore .= $this->tokens[$i]; } else { $textBefore .= $this->tokens[$i][1]; } } // text after T_HALT_COMPILER, still including (); $textAfter = substr($this->code, strlen($textBefore)); // ensure that it is followed by (); // this simplifies the situation, by not allowing any comments // in between of the tokens. if (!preg_match('~\s*\(\s*\)\s*;~', $textAfter, $matches)) { throw new PHPParser_Error('__halt_compiler must be followed by "();"'); } // prevent the lexer from returning any further tokens $this->pos = count($this->tokens); // return with (); removed return substr($textAfter, strlen($matches[0])); } /** * Initializes the token map. * * The token map maps the PHP internal token identifiers * to the identifiers used by the Parser. Additionally it * maps T_OPEN_TAG_WITH_ECHO to T_ECHO and T_CLOSE_TAG to ';'. */ protected static function initTokenMap() { if (!self::$tokenMap) { self::$tokenMap = array(); // 256 is the minimum possible token number, as everything below // it is an ASCII value for ($i = 256; $i < 1000; ++$i) { // T_DOUBLE_COLON is equivalent to T_PAAMAYIM_NEKUDOTAYIM if (T_DOUBLE_COLON === $i) { self::$tokenMap[$i] = PHPParser_Parser::T_PAAMAYIM_NEKUDOTAYIM; // T_OPEN_TAG_WITH_ECHO with dropped T_OPEN_TAG results in T_ECHO } elseif(T_OPEN_TAG_WITH_ECHO === $i) { self::$tokenMap[$i] = PHPParser_Parser::T_ECHO; // T_CLOSE_TAG is equivalent to ';' } elseif(T_CLOSE_TAG === $i) { self::$tokenMap[$i] = ord(';'); // and the others can be mapped directly } elseif ('UNKNOWN' !== ($name = token_name($i)) && defined($name = 'PHPParser_Parser::' . $name) ) { self::$tokenMap[$i] = constant($name); } } } } }