#!/usr/bin/env php directives. use PhpParser\Lexer\Emulative; use PhpParser\Node\Stmt\Class_; use PhpParser\Node\Stmt\Namespace_; use PhpParser\NodeTraverser; use PhpParser\NodeVisitor\NameResolver; use PhpParser\ParserFactory; set_error_handler(function ($num, $str, $file, $line, $context = null): void { throw new ErrorException($str, 0, $num, $file, $line); }); foreach ([__DIR__ . '/../../../autoload.php', __DIR__ . '/../vendor/autoload.php'] as $file) { if (file_exists($file)) { require $file; break; } } $lexer = new Emulative(); $parser = (new ParserFactory)->create( ParserFactory::PREFER_PHP7, $lexer, ); $traverser = new NodeTraverser(); $traverser->addVisitor(new NameResolver); function extractClassesFromStatements(array $statements): array { $classes = []; foreach ($statements as $statement) { if ($statement instanceof Class_) { $classes[strtolower($statement->namespacedName->toString())] = true; } if ($statement instanceof Namespace_) { $classes += extractClassesFromStatements($statement->stmts); } } return $classes; } $stubbedClasses = []; foreach (new RecursiveDirectoryIterator( __DIR__ . '/../stubs', FilesystemIterator::CURRENT_AS_PATHNAME|FilesystemIterator::SKIP_DOTS, ) as $file) { if (is_dir($file)) { continue; } $contents = file_get_contents($file); $stmts = $parser->parse($contents); $stmts = $traverser->traverse($stmts); $stubbedClasses += extractClassesFromStatements($stmts); } unset($file, $contents, $stmts); $docDir = realpath(__DIR__ . '/../build/doc-en'); if (false === $docDir) { echo 'PHP doc not found!' . PHP_EOL; echo 'Please execute: git clone git@github.com:php/doc-en.git ' . dirname(__DIR__) . '/build/doc-en'; } $files = new RegexIterator( new RecursiveIteratorIterator( new RecursiveDirectoryIterator( $docDir, FilesystemIterator::CURRENT_AS_PATHNAME|FilesystemIterator::SKIP_DOTS, ), RecursiveIteratorIterator::LEAVES_ONLY, ), '/.*.xml$/', ); $classes = require_once dirname(__DIR__) . '/dictionaries/ManualPropertyMap.php'; libxml_use_internal_errors(true); foreach ($files as $file) { $contents = file_get_contents($file); // FIXME: find a way to ignore custom entities, for now we strip them. $contents = preg_replace('#&[a-zA-Z\d.\-_]+;#', '', $contents); $contents = preg_replace('#%[a-zA-Z\d.\-_]+;#', '', $contents); $contents = preg_replace('#]+>#', '', $contents); try { $simple = new SimpleXMLElement($contents); } catch (Throwable $exception) { // FIXME: we ignore files with XML errors at the moment because the input XML is not always sober. // Examples are rpminfo/entities.functions.xml, wkhtmltox/wkhtmltox/bits/web.xml, // wkhtmltox/wkhtmltox/bits/load.xml echo sprintf( "%1\$s: Ignoring %2\$s: %3\$s\n%4\$s", $file, get_class($exception), $exception->getMessage(), implode("\n", array_map(fn(LibXMLError $error): string => $error->message, libxml_get_errors())), ); libxml_clear_errors(); continue; } $namespaces = $simple->getNamespaces(); $simple->registerXPathNamespace('docbook', 'http://docbook.org/ns/docbook'); foreach ($simple->xpath('//docbook:classsynopsis') as $classSynopsis) { $classSynopsis->registerXPathNamespace('docbook', 'http://docbook.org/ns/docbook'); $class = strtolower((string) $classSynopsis->xpath('./docbook:ooclass/docbook:classname')[0]); if (isset($stubbedClasses[$class])) { continue; } foreach ($classSynopsis->xpath('//docbook:fieldsynopsis') as $item) { assert($item instanceof SimpleXMLElement); $property = strtolower((string) $item->varname); if (isset($classes[$class][$property])) { continue; } $type = $item->type[0]; if (null === $type) { continue; } assert($type instanceof SimpleXMLElement); $typeClass = $type->attributes(/*'http://docbook.org/ns/docbook'*/)->class; if (null === $typeClass) { $type = (string) $type; } elseif ('union' === (string) $typeClass) { $types = []; foreach ($type as $subType) { $types[] = (string) $subType; } $type = implode('|', $types); } switch ($type) { case '': // Some properties are not properly defined - we ignore them then. continue 2; // case 'integer': // $type = 'int'; default: } $modifier = (string) $item->modifier; // We do not want to handle constants... I guess?! if ('const' === $modifier) { continue; } $classes[$class][$property] = $type; } } } function serializeArray(array $array, string $prefix): string { uksort($array, fn(string $first, string $second): int => strtolower($first) <=> strtolower($second)); $result = "[\n"; $localPrefix = $prefix . ' '; foreach ($array as $key => $value) { $result .= $localPrefix . var_export((string) $key, true) . ' => ' . (is_array($value) ? serializeArray($value, $localPrefix) : var_export($value, true)) . ",\n"; } $result .= $prefix . ']'; return $result; } $serialized = serializeArray($classes, ''); file_put_contents( dirname(__DIR__) . '/dictionaries/PropertyMap.php', <<