php-parser/lib/PHPParser/Lexer/Emulative.php

<?php

/**
 * Lexer which emulates newer PHP syntax when running on an older PHP version.
 *
 * ATTENTION: This code is WRITE-ONLY. Do not try to read it.
 *
 * The emulation works in three steps:
 *  1. preprocessCode() replaces syntax the running PHP version may not be able
 *     to tokenize by ~__EMU__{NAME}__{DATA}__~ placeholder sequences.
 *  2. The parent lexer tokenizes the preprocessed code.
 *  3. postprocessTokens() turns the placeholders back into real tokens, or
 *     into their original text if they ended up inside a multichar token.
 *
 * Independently of that, getNextToken() maps T_STRING tokens which are
 * keywords in newer PHP versions onto the respective parser tokens.
 */
class PHPParser_Lexer_Emulative extends PHPParser_Lexer
{
    /**
     * Map from lowercased keyword to PHPParser_Parser token id, containing only
     * the keywords introduced in PHP versions newer than the running one.
     *
     * @var array
     */
    protected $newKeywords;

    /**
     * Whether the previously returned token was an object operator (->).
     *
     * @var bool
     */
    protected $inObjectAccess;

    /**
     * Collects the keywords which have to be emulated on the running PHP version.
     */
    public function __construct() {
        parent::__construct();

        // ordered from newest to oldest version; the loop below relies on this
        $newKeywordsPerVersion = array(
            '5.5.0-dev' => array(
                'finally'       => PHPParser_Parser::T_FINALLY,
                'yield'         => PHPParser_Parser::T_YIELD,
            ),
            '5.4.0-dev' => array(
                'callable'      => PHPParser_Parser::T_CALLABLE,
                'insteadof'     => PHPParser_Parser::T_INSTEADOF,
                'trait'         => PHPParser_Parser::T_TRAIT,
                '__trait__'     => PHPParser_Parser::T_TRAIT_C,
            ),
            '5.3.0-dev' => array(
                '__dir__'       => PHPParser_Parser::T_DIR,
                'goto'          => PHPParser_Parser::T_GOTO,
                'namespace'     => PHPParser_Parser::T_NAMESPACE,
                '__namespace__' => PHPParser_Parser::T_NS_C,
            ),
        );

        $this->newKeywords = array();
        foreach ($newKeywordsPerVersion as $version => $newKeywords) {
            // stop at the first version the running PHP already satisfies:
            // its keywords (and those of all older versions) are lexed natively
            if (version_compare(PHP_VERSION, $version, '>=')) {
                break;
            }

            $this->newKeywords += $newKeywords;
        }
    }

    /**
     * Starts lexing the given code, emulating newer syntax if necessary.
     *
     * @param string $code The source code to lex
     */
    public function startLexing($code) {
        $this->inObjectAccess = false;

        // on PHP 5.4 don't do anything
        if (version_compare(PHP_VERSION, '5.4.0RC1', '>=')) {
            parent::startLexing($code);
        } else {
            $code = $this->preprocessCode($code);
            parent::startLexing($code);
            $this->postprocessTokens();
        }
    }

    /**
     * Replaces new features in the code by ~__EMU__{NAME}__{DATA}__~ sequences.
     * ~LABEL~ is never valid PHP code, that's why we can (to some degree) safely
     * use it here.
     * Later when postprocessing the tokens these sequences will either be replaced
     * by real tokens or replaced with their original content (e.g. if they occurred
     * inside a string, i.e. a place where they don't have a special meaning).
     *
     * The preg_* functions return null on a PCRE error. In that case the
     * respective replacement step is skipped and the code is left as it was,
     * instead of continuing with null (which would lex as empty code).
     *
     * @param string $code Original source code
     *
     * @return string Source code with placeholder sequences
     */
    protected function preprocessCode($code) {
        // binary notation (0b010101101001...); the prefix may be written 0b or 0B
        $replaced = preg_replace('(\b0b[01]+\b)i', '~__EMU__BINARY__$0__~', $code);
        if (null !== $replaced) {
            $code = $replaced;
        }

        if (version_compare(PHP_VERSION, '5.3.0', '<')) {
            // namespace separator (backslash not followed by some special characters,
            // which are not valid after a NS separator, but would cause problems with
            // escape sequence parsing if one would replace the backslash there)
            $replaced = preg_replace('(\\\\(?!["\'`${\\\\]))', '~__EMU__NS__~', $code);
            if (null !== $replaced) {
                $code = $replaced;
            }

            // nowdoc (<<<'ABC'\ncontent\nABC;)
            $replaced = preg_replace_callback(
                '((*BSR_ANYCRLF)        # set \R to (?>\r\n|\r|\n)
                  (b?<<<[\t ]*\'([a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*)\'\R) # opening token
                  ((?:(?!\2;?\R).*\R)*) # content
                  (\2)                  # closing token
                  (?=;?\R)              # must be followed by newline (with optional semicolon)
                 )x',
                array($this, 'encodeNowdocCallback'),
                $code
            );
            if (null !== $replaced) {
                $code = $replaced;
            }
        }

        return $code;
    }

    /**
     * Callback encoding a matched nowdoc as a placeholder sequence.
     *
     * As nowdocs can have arbitrary content but LABELs can only contain a certain
     * range of characters, the nowdoc content is encoded as hex and separated by
     * 'x' tokens. So the result of the encoding will look like this:
     * ~__EMU__NOWDOC__{HEX(START_TOKEN)}x{HEX(CONTENT)}x{HEX(END_TOKEN)}__~
     *
     * @param array $matches Match of the nowdoc pattern in preprocessCode():
     *                       [1] opening token, [3] content, [4] closing label
     *
     * @return string Placeholder sequence
     */
    public function encodeNowdocCallback(array $matches) {
        return '~__EMU__NOWDOC__'
                . bin2hex($matches[1]) . 'x' . bin2hex($matches[3]) . 'x' . bin2hex($matches[4])
                . '__~';
    }

    /**
     * Replaces the ~__EMU__...~ sequences with real tokens or their original
     * value.
     */
    protected function postprocessTokens() {
        // we need to manually iterate and manage a count because we'll change
        // the tokens array on the way
        for ($i = 0, $c = count($this->tokens); $i < $c; ++$i) {
            // first check that the following tokens are of the form ~LABEL~,
            // then match the __EMU__... sequence.
            if ('~' === $this->tokens[$i]
                && isset($this->tokens[$i + 2])
                && '~' === $this->tokens[$i + 2]
                && T_STRING === $this->tokens[$i + 1][0]
                && preg_match('(^__EMU__([A-Z]++)__(?:([A-Za-z0-9]++)__)?$)', $this->tokens[$i + 1][1], $matches)
            ) {
                if ('BINARY' === $matches[1]) {
                    // the binary number can either be an integer or a double, so return a LNUMBER
                    // or DNUMBER respectively
                    $replace = array(
                        array(is_int(bindec($matches[2])) ? T_LNUMBER : T_DNUMBER, $matches[2], $this->tokens[$i + 1][2])
                    );
                } elseif ('NS' === $matches[1]) {
                    // a \ single char token is returned here and replaced by a
                    // PHPParser_Parser::T_NS_SEPARATOR token in ->getNextToken(). This hacks around
                    // T_NS_SEPARATOR not being available on the PHP versions which need this
                    // emulation (the NS placeholder is only generated on PHP < 5.3)
                    $replace = array('\\');
                } elseif ('NOWDOC' === $matches[1]) {
                    // decode the encoded nowdoc payload; pack('H*', ...) is the inverse of
                    // bin2hex() (i.e. what hex2bin() does on newer PHP versions)
                    list($start, $content, $end) = explode('x', $matches[2]);
                    list($start, $content, $end) = array(pack('H*', $start), pack('H*', $content), pack('H*', $end));

                    $replace = array();
                    $replace[] = array(T_START_HEREDOC, $start, $this->tokens[$i + 1][2]);
                    if ('' !== $content) {
                        $replace[] = array(T_ENCAPSED_AND_WHITESPACE, $content, -1);
                    }
                    $replace[] = array(T_END_HEREDOC, $end, -1);
                } else {
                    // just ignore all other __EMU__ sequences
                    continue;
                }

                // swap the three tokens (~, LABEL, ~) for the replacement and
                // adjust the token count by the difference in length
                array_splice($this->tokens, $i, 3, $replace);
                $c -= 3 - count($replace);
            // for multichar tokens (e.g. strings) replace any ~__EMU__...~ sequences
            // in their content with the original character sequence. The strpos() call
            // is only a cheap pre-check; it has to compare against false, as a sequence
            // may occur at any offset (including after a literal "__EMU__" prefix)
            } elseif (is_array($this->tokens[$i])
                      && false !== strpos($this->tokens[$i][1], '~__EMU__')
            ) {
                $this->tokens[$i][1] = preg_replace_callback(
                    '(~__EMU__([A-Z]++)__(?:([A-Za-z0-9]++)__)?~)',
                    array($this, 'restoreContentCallback'),
                    $this->tokens[$i][1]
                );
            }
        }
    }

    /**
     * This method is a callback for restoring EMU sequences in
     * multichar tokens (like strings) to their original value.
     *
     * @param array $matches Match of the placeholder pattern:
     *                       [0] whole sequence, [1] name, [2] data (if any)
     *
     * @return string Original text; unknown sequences are returned unchanged
     */
    public function restoreContentCallback(array $matches) {
        if ('BINARY' === $matches[1]) {
            return $matches[2];
        } elseif ('NS' === $matches[1]) {
            return '\\';
        } elseif ('NOWDOC' === $matches[1]) {
            list($start, $content, $end) = explode('x', $matches[2]);
            return pack('H*', $start) . pack('H*', $content) . pack('H*', $end);
        } else {
            return $matches[0];
        }
    }

    /**
     * Fetches the next token from the parent lexer and applies the keyword and
     * namespace separator emulation to it.
     *
     * @param mixed $value           Receives the value of the token
     * @param mixed $startAttributes Receives the start attributes of the token
     * @param mixed $endAttributes   Receives the end attributes of the token
     *
     * @return int Token id
     */
    public function getNextToken(&$value = null, &$startAttributes = null, &$endAttributes = null) {
        $token = parent::getNextToken($value, $startAttributes, $endAttributes);

        // replace new keywords by their respective tokens. This is not done
        // if we currently are in an object access (e.g. in $obj->namespace
        // "namespace" stays a T_STRING token and isn't converted to T_NAMESPACE)
        if (PHPParser_Parser::T_STRING === $token && !$this->inObjectAccess) {
            $keyword = strtolower($value);
            if (isset($this->newKeywords[$keyword])) {
                return $this->newKeywords[$keyword];
            }
        // backslashes are replaced by T_NS_SEPARATOR tokens
        } elseif (92 === $token) { // ord('\\')
            return PHPParser_Parser::T_NS_SEPARATOR;
        // keep track of whether we currently are in an object access (after ->)
        } elseif (PHPParser_Parser::T_OBJECT_OPERATOR === $token) {
            $this->inObjectAccess = true;
        } else {
            $this->inObjectAccess = false;
        }

        return $token;
    }
}
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`<?php`

			`/**`
			`* ATTENTION: This code is WRITE-ONLY. Do not try to read it.`
			`*/`
			`class PHPParser_Lexer_Emulative extends PHPParser_Lexer`
			`{`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`protected $newKeywords;`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`protected $inObjectAccess;`

Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`public function __construct() {`
			`parent::__construct();`

Add support for finally clauses (PHP 5.5) This adds a new finallyStmts subnode to the TryCatch node. If there is no finally clause it will be null. 2012-09-07 18:06:11 +02:00			`$newKeywordsPerVersion = array(`
			`'5.5.0-dev' => array(`
			`'finally' => PHPParser_Parser::T_FINALLY,`
Add support for yield expressions (PHP 5.5) This adds a new Yield expression type, with subnodes key and value. 2012-09-07 19:24:44 +02:00			`'yield' => PHPParser_Parser::T_YIELD,`
Add support for finally clauses (PHP 5.5) This adds a new finallyStmts subnode to the TryCatch node. If there is no finally clause it will be null. 2012-09-07 18:06:11 +02:00			`),`
			`'5.4.0-dev' => array(`
			`'callable' => PHPParser_Parser::T_CALLABLE,`
			`'insteadof' => PHPParser_Parser::T_INSTEADOF,`
			`'trait' => PHPParser_Parser::T_TRAIT,`
			`'__trait__' => PHPParser_Parser::T_TRAIT_C,`
			`),`
			`'5.3.0-dev' => array(`
			`'__dir__' => PHPParser_Parser::T_DIR,`
			`'goto' => PHPParser_Parser::T_GOTO,`
			`'namespace' => PHPParser_Parser::T_NAMESPACE,`
			`'__namespace__' => PHPParser_Parser::T_NS_C,`
			`),`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`);`

Add support for finally clauses (PHP 5.5) This adds a new finallyStmts subnode to the TryCatch node. If there is no finally clause it will be null. 2012-09-07 18:06:11 +02:00			`$this->newKeywords = array();`
			`foreach ($newKeywordsPerVersion as $version => $newKeywords) {`
			`if (version_compare(PHP_VERSION, $version, '>=')) {`
			`break;`
			`}`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00
Add support for finally clauses (PHP 5.5) This adds a new finallyStmts subnode to the TryCatch node. If there is no finally clause it will be null. 2012-09-07 18:06:11 +02:00			`$this->newKeywords += $newKeywords;`
			`}`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`}`

			`public function startLexing($code) {`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`$this->inObjectAccess = false;`

Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// on PHP 5.4 don't do anything`
			`if (version_compare(PHP_VERSION, '5.4.0RC1', '>=')) {`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`parent::startLexing($code);`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`} else {`
			`$code = $this->preprocessCode($code);`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`parent::startLexing($code);`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`$this->postprocessTokens();`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`}`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`}`

			`/*`
			`* Replaces new features in the code by ~__EMU__{NAME}__{DATA}__~ sequences.`
			`* ~LABEL~ is never valid PHP code, that's why we can (to some degree) safely`
			`* use it here.`
			`* Later when preprocessing the tokens these sequences will either be replaced`
			`* by real tokens or replaced with their original content (e.g. if they occured`
			`* inside a string, i.e. a place where they don't have a special meaning).`
			`*/`
			`protected function preprocessCode($code) {`
			`// binary notation (0b010101101001...)`
			`$code = preg_replace('(\b0b[01]+\b)', '~__EMU__BINARY__$0__~', $code);`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00
			`if (version_compare(PHP_VERSION, '5.3.0', '<')) {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// namespace separator (backslash not followed by some special characters,`
			`// which are not valid after a NS separator, but would cause problems with`
			`// escape sequence parsing if one would replace the backslash there)`
Don't replace \ followed by { with NS_SEPARATOR 2012-02-21 19:28:40 +01:00			$code = preg_replace('(\\\\(?!["\'`${\\\\]))', '~__EMU__NS__~', $code);
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// nowdoc (<<<'ABC'\ncontent\nABC;)`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`$code = preg_replace_callback(`
Fix NOWDOC emulation Strings where the NOWDOC label appeared at the beginning of a line, but not followed by a newline were not correctly recognized. 2012-01-15 14:37:53 +01:00			`'((*BSR_ANYCRLF) # set \R to (?>\r\n|\r|\n)`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`(b?<<<[\t ]*\'([a-zA-Z_\x7f-\xff][a-zA-Z0-9_\x7f-\xff]*)\'\R) # opening token`
Fix NOWDOC emulation Strings where the NOWDOC label appeared at the beginning of a line, but not followed by a newline were not correctly recognized. 2012-01-15 14:37:53 +01:00			`((?:(?!\2;?\R).*\R)*) # content`
			`(\2) # closing token`
			`(?=;?\R) # must be followed by newline (with optional semicolon)`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`)x',`
			`array($this, 'encodeNowdocCallback'),`
			`$code`
			`);`
			`}`

Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`return $code;`
			`}`

			`/*`
			`* As nowdocs can have arbitrary content but LABELs can only contain a certain`
			`* range of characters, the nowdoc content is encoded as hex and separated by`
			`* 'x' tokens. So the result of the encoding will look like this:`
			`* ~__EMU__NOWDOC__{HEX(START_TOKEN)}x{HEX(CONTENT)}x{HEX(END_TOKEN)}~`
			`*/`
			`public function encodeNowdocCallback(array $matches) {`
			`return '~__EMU__NOWDOC__'`
			`. bin2hex($matches[1]) . 'x' . bin2hex($matches[3]) . 'x' . bin2hex($matches[4])`
			`. '__~';`
			`}`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`/*`
			`* Replaces the ~__EMU__...~ sequences with real tokens or their original`
			`* value.`
			`*/`
			`protected function postprocessTokens() {`
			`// we need to manually iterate and manage a count because we'll change`
			`// the tokens array on the way`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`for ($i = 0, $c = count($this->tokens); $i < $c; ++$i) {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// first check that the following tokens are form ~LABEL~,`
			`// then match the __EMU__... sequence.`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`if ('~' === $this->tokens[$i]`
			`&& isset($this->tokens[$i + 2])`
			`&& '~' === $this->tokens[$i + 2]`
			`&& T_STRING === $this->tokens[$i + 1][0]`
			`&& preg_match('(^__EMU__([A-Z]++)__(?:([A-Za-z0-9]++)__)?$)', $this->tokens[$i + 1][1], $matches)`
			`) {`
			`if ('BINARY' === $matches[1]) {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// the binary number can either be an integer or a double, so return a LNUMBER`
			`// or DNUMBER respectively`
Fix emulation of binary floats All binary literals were lexed as integers, even if they were floats 2012-01-15 15:19:07 +01:00			`$replace = array(`
			`array(is_int(bindec($matches[2])) ? T_LNUMBER : T_DNUMBER, $matches[2], $this->tokens[$i + 1][2])`
			`);`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`} elseif ('NS' === $matches[1]) {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// a \ single char token is returned here and replaced by a`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`// PHPParser_Parser::T_NS_SEPARATOR token in ->getNextToken(). This hacks around`
			`// the limitations arising from T_NS_SEPARATOR not being defined on 5.3`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`$replace = array('\\');`
			`} elseif ('NOWDOC' === $matches[1]) {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// decode the encoded nowdoc payload; pack('H*' is bin2hex( for 5.3`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`list($start, $content, $end) = explode('x', $matches[2]);`
			`list($start, $content, $end) = array(pack('H*', $start), pack('H*', $content), pack('H*', $end));`

			`$replace = array();`
			`$replace[] = array(T_START_HEREDOC, $start, $this->tokens[$i + 1][2]);`
			`if ('' !== $content) {`
			`$replace[] = array(T_ENCAPSED_AND_WHITESPACE, $content, -1);`
			`}`
			`$replace[] = array(T_END_HEREDOC, $end, -1);`
			`} else {`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// just ignore all other __EMU__ sequences`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`continue;`
			`}`

			`array_splice($this->tokens, $i, 3, $replace);`
			`$c -= 3 - count($replace);`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// for multichar tokens (e.g. strings) replace any ~__EMU__...~ sequences`
			`// in their content with the original character sequence`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`} elseif (is_array($this->tokens[$i])`
			`&& 0 !== strpos($this->tokens[$i][1], '__EMU__')`
			`) {`
			`$this->tokens[$i][1] = preg_replace_callback(`
			`'(~__EMU__([A-Z]++)__(?:([A-Za-z0-9]++)__)?~)',`
			`array($this, 'restoreContentCallback'),`
			`$this->tokens[$i][1]`
			`);`
			`}`
			`}`
			`}`

Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`/*`
			`* This method is a callback for restoring EMU sequences in`
			`* multichar tokens (like strings) to their original value.`
			`*/`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`public function restoreContentCallback(array $matches) {`
			`if ('BINARY' === $matches[1]) {`
			`return $matches[2];`
			`} elseif ('NS' === $matches[1]) {`
			`return '\\';`
			`} elseif ('NOWDOC' === $matches[1]) {`
			`list($start, $content, $end) = explode('x', $matches[2]);`
			`return pack('H*', $start) . pack('H*', $content) . pack('H*', $end);`
			`} else {`
			`return $matches[0];`
			`}`
			`}`

Generalize the attribute generation for nodes Now two arrays are fetched from the lexer: $startAttributes and $endAttributes. When constructing the attributes for a node, the $startAttributes from the first token of the node and the $endAttributes of the last token of the node are merged. Now the end line is saved in the endLine attribute. 2012-05-05 17:34:27 +02:00			`public function getNextToken(&$value = null, &$startAttributes = null, &$endAttributes = null) {`
			`$token = parent::getNextToken($value, $startAttributes, $endAttributes);`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// replace new keywords by their respective tokens. This is not done`
			`// if we currently are in an object access (e.g. in $obj->namespace`
			`// "namespace" stays a T_STRING tokens and isn't converted to T_NAMESPACE)`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`if (PHPParser_Parser::T_STRING === $token && !$this->inObjectAccess) {`
Use inject-once approach for lexer Now the lexer is injected only once when creating the parser. Instead of $parser = new PHPParser_Parser; $parser->parse(new PHPParser_Lexer($code)); $parser->parse(new PHPParser_Lexer($code2)); you write: $parser = new PHPParser_Parser(new PHPParser_Lexer); $parser->parse($code); $parser->parse($code2); 2012-04-25 20:04:46 +02:00			`if (isset($this->newKeywords[strtolower($value)])) {`
			`return $this->newKeywords[strtolower($value)];`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`}`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// backslashes are replaced by T_NS_SEPARATOR tokens`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`} elseif (92 === $token) { // ord('\\')`
			`return PHPParser_Parser::T_NS_SEPARATOR;`
Minor refactor and comments for emlative lexer The emulative lexer is a single dirty hack so it needs a few more comments :) 2012-02-21 17:56:07 +01:00			`// keep track of whether we currently are in an object access (after ->)`
Add initial version of an emulative lexer The emulative lexer allows lexing of PHP 5.4 on PHP 5.3 and PHP 5.2. 2011-12-18 13:04:27 +01:00			`} elseif (PHPParser_Parser::T_OBJECT_OPERATOR === $token) {`
			`$this->inObjectAccess = true;`
			`} else {`
			`$this->inObjectAccess = false;`
			`}`

			`return $token;`
			`}`
			`}`