123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208 |
- <?php
- namespace Doctrine\Common\Annotations;
- use function array_merge;
- use function count;
- use function explode;
- use function strtolower;
- use function token_get_all;
- use const PHP_VERSION_ID;
- use const T_AS;
- use const T_COMMENT;
- use const T_DOC_COMMENT;
- use const T_NAME_FULLY_QUALIFIED;
- use const T_NAME_QUALIFIED;
- use const T_NAMESPACE;
- use const T_NS_SEPARATOR;
- use const T_STRING;
- use const T_USE;
- use const T_WHITESPACE;
- /**
- * Parses a file for namespaces/use/class declarations.
- */
- class TokenParser
- {
- /**
- * The token list.
- *
- * @phpstan-var list<mixed[]>
- */
- private $tokens;
- /**
- * The number of tokens.
- *
- * @var int
- */
- private $numTokens;
- /**
- * The current array pointer.
- *
- * @var int
- */
- private $pointer = 0;
- /**
- * @param string $contents
- */
- public function __construct($contents)
- {
- $this->tokens = token_get_all($contents);
- // The PHP parser sets internal compiler globals for certain things. Annoyingly, the last docblock comment it
- // saw gets stored in doc_comment. When it comes to compile the next thing to be include()d this stored
- // doc_comment becomes owned by the first thing the compiler sees in the file that it considers might have a
- // docblock. If the first thing in the file is a class without a doc block this would cause calls to
- // getDocBlock() on said class to return our long lost doc_comment. Argh.
- // To workaround, cause the parser to parse an empty docblock. Sure getDocBlock() will return this, but at least
- // it's harmless to us.
- token_get_all("<?php\n/**\n *\n */");
- $this->numTokens = count($this->tokens);
- }
- /**
- * Gets the next non whitespace and non comment token.
- *
- * @param bool $docCommentIsComment If TRUE then a doc comment is considered a comment and skipped.
- * If FALSE then only whitespace and normal comments are skipped.
- *
- * @return mixed[]|string|null The token if exists, null otherwise.
- */
- public function next($docCommentIsComment = true)
- {
- for ($i = $this->pointer; $i < $this->numTokens; $i++) {
- $this->pointer++;
- if (
- $this->tokens[$i][0] === T_WHITESPACE ||
- $this->tokens[$i][0] === T_COMMENT ||
- ($docCommentIsComment && $this->tokens[$i][0] === T_DOC_COMMENT)
- ) {
- continue;
- }
- return $this->tokens[$i];
- }
- return null;
- }
- /**
- * Parses a single use statement.
- *
- * @return array<string, string> A list with all found class names for a use statement.
- */
- public function parseUseStatement()
- {
- $groupRoot = '';
- $class = '';
- $alias = '';
- $statements = [];
- $explicitAlias = false;
- while (($token = $this->next())) {
- if (! $explicitAlias && $token[0] === T_STRING) {
- $class .= $token[1];
- $alias = $token[1];
- } elseif ($explicitAlias && $token[0] === T_STRING) {
- $alias = $token[1];
- } elseif (
- PHP_VERSION_ID >= 80000 &&
- ($token[0] === T_NAME_QUALIFIED || $token[0] === T_NAME_FULLY_QUALIFIED)
- ) {
- $class .= $token[1];
- $classSplit = explode('\\', $token[1]);
- $alias = $classSplit[count($classSplit) - 1];
- } elseif ($token[0] === T_NS_SEPARATOR) {
- $class .= '\\';
- $alias = '';
- } elseif ($token[0] === T_AS) {
- $explicitAlias = true;
- $alias = '';
- } elseif ($token === ',') {
- $statements[strtolower($alias)] = $groupRoot . $class;
- $class = '';
- $alias = '';
- $explicitAlias = false;
- } elseif ($token === ';') {
- $statements[strtolower($alias)] = $groupRoot . $class;
- break;
- } elseif ($token === '{') {
- $groupRoot = $class;
- $class = '';
- } elseif ($token === '}') {
- continue;
- } else {
- break;
- }
- }
- return $statements;
- }
- /**
- * Gets all use statements.
- *
- * @param string $namespaceName The namespace name of the reflected class.
- *
- * @return array<string, string> A list with all found use statements.
- */
- public function parseUseStatements($namespaceName)
- {
- $statements = [];
- while (($token = $this->next())) {
- if ($token[0] === T_USE) {
- $statements = array_merge($statements, $this->parseUseStatement());
- continue;
- }
- if ($token[0] !== T_NAMESPACE || $this->parseNamespace() !== $namespaceName) {
- continue;
- }
- // Get fresh array for new namespace. This is to prevent the parser to collect the use statements
- // for a previous namespace with the same name. This is the case if a namespace is defined twice
- // or if a namespace with the same name is commented out.
- $statements = [];
- }
- return $statements;
- }
- /**
- * Gets the namespace.
- *
- * @return string The found namespace.
- */
- public function parseNamespace()
- {
- $name = '';
- while (
- ($token = $this->next()) && ($token[0] === T_STRING || $token[0] === T_NS_SEPARATOR || (
- PHP_VERSION_ID >= 80000 &&
- ($token[0] === T_NAME_QUALIFIED || $token[0] === T_NAME_FULLY_QUALIFIED)
- ))
- ) {
- $name .= $token[1];
- }
- return $name;
- }
- /**
- * Gets the class name.
- *
- * @return string The found class name.
- */
- public function parseClass()
- {
- // Namespaces and class names are tokenized the same: T_STRINGs
- // separated by T_NS_SEPARATOR so we can use one function to provide
- // both.
- return $this->parseNamespace();
- }
- }
|