209 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			PHP
		
	
	
			
		
		
	
	
			209 lines
		
	
	
		
			6.2 KiB
		
	
	
	
		
			PHP
		
	
	
| <?php
 | |
| 
 | |
| namespace Doctrine\Common\Annotations;
 | |
| 
 | |
| use function array_merge;
 | |
| use function count;
 | |
| use function explode;
 | |
| use function strtolower;
 | |
| use function token_get_all;
 | |
| 
 | |
| use const PHP_VERSION_ID;
 | |
| use const T_AS;
 | |
| use const T_COMMENT;
 | |
| use const T_DOC_COMMENT;
 | |
| use const T_NAME_FULLY_QUALIFIED;
 | |
| use const T_NAME_QUALIFIED;
 | |
| use const T_NAMESPACE;
 | |
| use const T_NS_SEPARATOR;
 | |
| use const T_STRING;
 | |
| use const T_USE;
 | |
| use const T_WHITESPACE;
 | |
| 
 | |
/**
 * Parses a file for namespaces/use/class declarations.
 *
 * The parser tokenizes the given source once with token_get_all() and then
 * walks the resulting token list with an internal pointer. Every parse*()
 * method consumes tokens starting at the current pointer position.
 */
class TokenParser
{
    /**
     * The token list as returned by token_get_all(): each entry is either a
     * token array (id, text, line) or a plain one-character string.
     *
     * @phpstan-var list<mixed[]|string>
     */
    private $tokens;

    /**
     * The number of tokens.
     *
     * @var int
     */
    private $numTokens;

    /**
     * The current array pointer.
     *
     * @var int
     */
    private $pointer = 0;

    /**
     * @param string $contents The PHP source code to tokenize.
     */
    public function __construct($contents)
    {
        $this->tokens = token_get_all($contents);

        // The PHP parser sets internal compiler globals for certain things. Annoyingly, the last docblock comment it
        // saw gets stored in doc_comment. When it comes to compile the next thing to be include()d this stored
        // doc_comment becomes owned by the first thing the compiler sees in the file that it considers might have a
        // docblock. If the first thing in the file is a class without a doc block this would cause calls to
        // getDocBlock() on said class to return our long lost doc_comment. Argh.
        // To work around this, cause the parser to parse an empty docblock. Sure getDocBlock() will return this, but
        // at least it's harmless to us.
        token_get_all("<?php\n/**\n *\n */");

        $this->numTokens = count($this->tokens);
    }

    /**
     * Gets the next non whitespace and non comment token.
     *
     * The internal pointer is advanced past every skipped token and past the
     * returned token.
     *
     * @param bool $docCommentIsComment If TRUE then a doc comment is considered a comment and skipped.
     * If FALSE then only whitespace and normal comments are skipped.
     *
     * @return mixed[]|string|null The token if exists, null otherwise.
     */
    public function next($docCommentIsComment = true)
    {
        for ($i = $this->pointer; $i < $this->numTokens; $i++) {
            $this->pointer++;

            // For single-character string tokens, [0] yields that character, which never equals a token id.
            if (
                $this->tokens[$i][0] === T_WHITESPACE ||
                $this->tokens[$i][0] === T_COMMENT ||
                ($docCommentIsComment && $this->tokens[$i][0] === T_DOC_COMMENT)
            ) {
                continue;
            }

            return $this->tokens[$i];
        }

        return null;
    }

    /**
     * Parses a single use statement.
     *
     * Consumes tokens from the current pointer position, i.e. the caller is
     * expected to have consumed the T_USE token already. Simple, aliased,
     * comma-separated and grouped (`use Foo\{Bar, Baz};`) forms are handled,
     * including a trailing comma inside a group. Parsing stops after the
     * terminating `;` or at the first token that is not handled below.
     *
     * @return array<string, string> A list with all found class names for a use statement,
     *                               keyed by the lower-cased alias.
     */
    public function parseUseStatement()
    {
        $groupRoot     = '';
        $class         = '';
        $alias         = '';
        $statements    = [];
        $explicitAlias = false;
        while (($token = $this->next())) {
            if (! $explicitAlias && $token[0] === T_STRING) {
                // Part of the class name; the last part seen so far is the implicit alias.
                $class .= $token[1];
                $alias  = $token[1];
            } elseif ($explicitAlias && $token[0] === T_STRING) {
                // The identifier following "as".
                $alias = $token[1];
            } elseif (
                PHP_VERSION_ID >= 80000 &&
                ($token[0] === T_NAME_QUALIFIED || $token[0] === T_NAME_FULLY_QUALIFIED)
            ) {
                // PHP 8 emits a namespaced name as one token; the implicit alias is its last segment.
                $class .= $token[1];

                $classSplit = explode('\\', $token[1]);
                $alias      = $classSplit[count($classSplit) - 1];
            } elseif ($token[0] === T_NS_SEPARATOR) {
                $class .= '\\';
                $alias  = '';
            } elseif ($token[0] === T_AS) {
                $explicitAlias = true;
                $alias         = '';
            } elseif ($token === ',') {
                // Only record when an import is actually pending.
                if ($alias !== '') {
                    $statements[strtolower($alias)] = $groupRoot . $class;
                }

                $class         = '';
                $alias         = '';
                $explicitAlias = false;
            } elseif ($token === ';') {
                // After a trailing comma in a group use ("use Foo\{Bar, Baz,};") nothing is pending;
                // recording here would add a bogus '' => groupRoot entry.
                if ($alias !== '') {
                    $statements[strtolower($alias)] = $groupRoot . $class;
                }

                break;
            } elseif ($token === '{') {
                // Start of a group: everything collected so far is the common prefix.
                $groupRoot = $class;
                $class     = '';
            } elseif ($token === '}') {
                continue;
            } else {
                // Any other token ends parsing of this statement.
                break;
            }
        }

        return $statements;
    }

    /**
     * Gets all use statements.
     *
     * Scans the remaining tokens. Each T_USE token is handed to
     * parseUseStatement() and its result merged into the collected list.
     * Whenever a namespace declaration whose name equals $namespaceName is
     * found, the list collected so far is discarded.
     *
     * @param string $namespaceName The namespace name of the reflected class.
     *
     * @return array<string, string> A list with all found use statements.
     */
    public function parseUseStatements($namespaceName)
    {
        $statements = [];
        while (($token = $this->next())) {
            if ($token[0] === T_USE) {
                $statements = array_merge($statements, $this->parseUseStatement());
                continue;
            }

            if ($token[0] !== T_NAMESPACE || $this->parseNamespace() !== $namespaceName) {
                continue;
            }

            // Get fresh array for new namespace. This is to prevent the parser to collect the use statements
            // for a previous namespace with the same name. This is the case if a namespace is defined twice
            // or if a namespace with the same name is commented out.
            $statements = [];
        }

        return $statements;
    }

    /**
     * Gets the namespace.
     *
     * Concatenates consecutive name tokens (T_STRING / T_NS_SEPARATOR, or the
     * combined qualified-name tokens on PHP 8+) starting at the current
     * pointer position. The first token that is not part of the name is
     * consumed as well.
     *
     * @return string The found namespace.
     */
    public function parseNamespace()
    {
        $name = '';
        while (
            ($token = $this->next()) && ($token[0] === T_STRING || $token[0] === T_NS_SEPARATOR || (
            PHP_VERSION_ID >= 80000 &&
            ($token[0] === T_NAME_QUALIFIED || $token[0] === T_NAME_FULLY_QUALIFIED)
            ))
        ) {
            $name .= $token[1];
        }

        return $name;
    }

    /**
     * Gets the class name.
     *
     * @return string The found class name.
     */
    public function parseClass()
    {
        // Namespaces and class names are tokenized the same: T_STRINGs
        // separated by T_NS_SEPARATOR so we can use one function to provide
        // both.
        return $this->parseNamespace();
    }
}
 |