123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\Translation\Extractor;
- use Symfony\Component\Finder\Finder;
- use Symfony\Component\Translation\MessageCatalogue;
- /**
- * PhpExtractor extracts translation messages from a PHP template.
- *
- * @author Michel Salib <michelsalib@hotmail.com>
- */
- class PhpExtractor extends AbstractFileExtractor implements ExtractorInterface
- {
- public const MESSAGE_TOKEN = 300;
- public const METHOD_ARGUMENTS_TOKEN = 1000;
- public const DOMAIN_TOKEN = 1001;
- /**
- * Prefix for new found message.
- *
- * @var string
- */
- private $prefix = '';
- /**
- * The sequence that captures translation messages.
- *
- * @var array
- */
- protected $sequences = [
- [
- '->',
- 'trans',
- '(',
- self::MESSAGE_TOKEN,
- ',',
- self::METHOD_ARGUMENTS_TOKEN,
- ',',
- self::DOMAIN_TOKEN,
- ],
- [
- '->',
- 'trans',
- '(',
- self::MESSAGE_TOKEN,
- ],
- [
- 'new',
- 'TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ',',
- self::METHOD_ARGUMENTS_TOKEN,
- ',',
- self::DOMAIN_TOKEN,
- ],
- [
- 'new',
- 'TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ],
- [
- 'new',
- '\\',
- 'Symfony',
- '\\',
- 'Component',
- '\\',
- 'Translation',
- '\\',
- 'TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ',',
- self::METHOD_ARGUMENTS_TOKEN,
- ',',
- self::DOMAIN_TOKEN,
- ],
- [
- 'new',
- '\Symfony\Component\Translation\TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ',',
- self::METHOD_ARGUMENTS_TOKEN,
- ',',
- self::DOMAIN_TOKEN,
- ],
- [
- 'new',
- '\\',
- 'Symfony',
- '\\',
- 'Component',
- '\\',
- 'Translation',
- '\\',
- 'TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ],
- [
- 'new',
- '\Symfony\Component\Translation\TranslatableMessage',
- '(',
- self::MESSAGE_TOKEN,
- ],
- [
- 't',
- '(',
- self::MESSAGE_TOKEN,
- ',',
- self::METHOD_ARGUMENTS_TOKEN,
- ',',
- self::DOMAIN_TOKEN,
- ],
- [
- 't',
- '(',
- self::MESSAGE_TOKEN,
- ],
- ];
- /**
- * {@inheritdoc}
- */
- public function extract($resource, MessageCatalogue $catalog)
- {
- $files = $this->extractFiles($resource);
- foreach ($files as $file) {
- $this->parseTokens(token_get_all(file_get_contents($file)), $catalog, $file);
- gc_mem_caches();
- }
- }
- /**
- * {@inheritdoc}
- */
- public function setPrefix(string $prefix)
- {
- $this->prefix = $prefix;
- }
- /**
- * Normalizes a token.
- *
- * @param mixed $token
- *
- * @return string|null
- */
- protected function normalizeToken($token)
- {
- if (isset($token[1]) && 'b"' !== $token) {
- return $token[1];
- }
- return $token;
- }
- /**
- * Seeks to a non-whitespace token.
- */
- private function seekToNextRelevantToken(\Iterator $tokenIterator)
- {
- for (; $tokenIterator->valid(); $tokenIterator->next()) {
- $t = $tokenIterator->current();
- if (\T_WHITESPACE !== $t[0]) {
- break;
- }
- }
- }
- private function skipMethodArgument(\Iterator $tokenIterator)
- {
- $openBraces = 0;
- for (; $tokenIterator->valid(); $tokenIterator->next()) {
- $t = $tokenIterator->current();
- if ('[' === $t[0] || '(' === $t[0]) {
- ++$openBraces;
- }
- if (']' === $t[0] || ')' === $t[0]) {
- --$openBraces;
- }
- if ((0 === $openBraces && ',' === $t[0]) || (-1 === $openBraces && ')' === $t[0])) {
- break;
- }
- }
- }
- /**
- * Extracts the message from the iterator while the tokens
- * match allowed message tokens.
- */
- private function getValue(\Iterator $tokenIterator)
- {
- $message = '';
- $docToken = '';
- $docPart = '';
- for (; $tokenIterator->valid(); $tokenIterator->next()) {
- $t = $tokenIterator->current();
- if ('.' === $t) {
- // Concatenate with next token
- continue;
- }
- if (!isset($t[1])) {
- break;
- }
- switch ($t[0]) {
- case \T_START_HEREDOC:
- $docToken = $t[1];
- break;
- case \T_ENCAPSED_AND_WHITESPACE:
- case \T_CONSTANT_ENCAPSED_STRING:
- if ('' === $docToken) {
- $message .= PhpStringTokenParser::parse($t[1]);
- } else {
- $docPart = $t[1];
- }
- break;
- case \T_END_HEREDOC:
- if ($indentation = strspn($t[1], ' ')) {
- $docPartWithLineBreaks = $docPart;
- $docPart = '';
- foreach (preg_split('~(\r\n|\n|\r)~', $docPartWithLineBreaks, -1, \PREG_SPLIT_DELIM_CAPTURE) as $str) {
- if (\in_array($str, ["\r\n", "\n", "\r"], true)) {
- $docPart .= $str;
- } else {
- $docPart .= substr($str, $indentation);
- }
- }
- }
- $message .= PhpStringTokenParser::parseDocString($docToken, $docPart);
- $docToken = '';
- $docPart = '';
- break;
- case \T_WHITESPACE:
- break;
- default:
- break 2;
- }
- }
- return $message;
- }
- /**
- * Extracts trans message from PHP tokens.
- */
- protected function parseTokens(array $tokens, MessageCatalogue $catalog, string $filename)
- {
- $tokenIterator = new \ArrayIterator($tokens);
- for ($key = 0; $key < $tokenIterator->count(); ++$key) {
- foreach ($this->sequences as $sequence) {
- $message = '';
- $domain = 'messages';
- $tokenIterator->seek($key);
- foreach ($sequence as $sequenceKey => $item) {
- $this->seekToNextRelevantToken($tokenIterator);
- if ($this->normalizeToken($tokenIterator->current()) === $item) {
- $tokenIterator->next();
- continue;
- } elseif (self::MESSAGE_TOKEN === $item) {
- $message = $this->getValue($tokenIterator);
- if (\count($sequence) === ($sequenceKey + 1)) {
- break;
- }
- } elseif (self::METHOD_ARGUMENTS_TOKEN === $item) {
- $this->skipMethodArgument($tokenIterator);
- } elseif (self::DOMAIN_TOKEN === $item) {
- $domainToken = $this->getValue($tokenIterator);
- if ('' !== $domainToken) {
- $domain = $domainToken;
- }
- break;
- } else {
- break;
- }
- }
- if ($message) {
- $catalog->set($message, $this->prefix.$message, $domain);
- $metadata = $catalog->getMetadata($message, $domain) ?? [];
- $normalizedFilename = preg_replace('{[\\\\/]+}', '/', $filename);
- $metadata['sources'][] = $normalizedFilename.':'.$tokens[$key][2];
- $catalog->setMetadata($message, $metadata, $domain);
- break;
- }
- }
- }
- }
- /**
- * @return bool
- *
- * @throws \InvalidArgumentException
- */
- protected function canBeExtracted(string $file)
- {
- return $this->isFile($file) && 'php' === pathinfo($file, \PATHINFO_EXTENSION);
- }
- /**
- * {@inheritdoc}
- */
- protected function extractFromDirectory($directory)
- {
- $finder = new Finder();
- return $finder->files()->name('*.php')->in($directory);
- }
- }
|