PhpExtractor.php 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333
  1. <?php
  2. /*
  3. * This file is part of the Symfony package.
  4. *
  5. * (c) Fabien Potencier <fabien@symfony.com>
  6. *
  7. * For the full copyright and license information, please view the LICENSE
  8. * file that was distributed with this source code.
  9. */
  10. namespace Symfony\Component\Translation\Extractor;
  11. trigger_deprecation('symfony/translation', '6.2', '"%s" is deprecated, use "%s" instead.', PhpExtractor::class, PhpAstExtractor::class);
  12. use Symfony\Component\Finder\Finder;
  13. use Symfony\Component\Translation\MessageCatalogue;
  14. /**
  15. * PhpExtractor extracts translation messages from a PHP template.
  16. *
  17. * @author Michel Salib <michelsalib@hotmail.com>
  18. *
  19. * @deprecated since Symfony 6.2, use the PhpAstExtractor instead
  20. */
  21. class PhpExtractor extends AbstractFileExtractor implements ExtractorInterface
  22. {
  23. public const MESSAGE_TOKEN = 300;
  24. public const METHOD_ARGUMENTS_TOKEN = 1000;
  25. public const DOMAIN_TOKEN = 1001;
  26. /**
  27. * Prefix for new found message.
  28. */
  29. private string $prefix = '';
  30. /**
  31. * The sequence that captures translation messages.
  32. */
  33. protected $sequences = [
  34. [
  35. '->',
  36. 'trans',
  37. '(',
  38. self::MESSAGE_TOKEN,
  39. ',',
  40. self::METHOD_ARGUMENTS_TOKEN,
  41. ',',
  42. self::DOMAIN_TOKEN,
  43. ],
  44. [
  45. '->',
  46. 'trans',
  47. '(',
  48. self::MESSAGE_TOKEN,
  49. ],
  50. [
  51. 'new',
  52. 'TranslatableMessage',
  53. '(',
  54. self::MESSAGE_TOKEN,
  55. ',',
  56. self::METHOD_ARGUMENTS_TOKEN,
  57. ',',
  58. self::DOMAIN_TOKEN,
  59. ],
  60. [
  61. 'new',
  62. 'TranslatableMessage',
  63. '(',
  64. self::MESSAGE_TOKEN,
  65. ],
  66. [
  67. 'new',
  68. '\\',
  69. 'Symfony',
  70. '\\',
  71. 'Component',
  72. '\\',
  73. 'Translation',
  74. '\\',
  75. 'TranslatableMessage',
  76. '(',
  77. self::MESSAGE_TOKEN,
  78. ',',
  79. self::METHOD_ARGUMENTS_TOKEN,
  80. ',',
  81. self::DOMAIN_TOKEN,
  82. ],
  83. [
  84. 'new',
  85. '\Symfony\Component\Translation\TranslatableMessage',
  86. '(',
  87. self::MESSAGE_TOKEN,
  88. ',',
  89. self::METHOD_ARGUMENTS_TOKEN,
  90. ',',
  91. self::DOMAIN_TOKEN,
  92. ],
  93. [
  94. 'new',
  95. '\\',
  96. 'Symfony',
  97. '\\',
  98. 'Component',
  99. '\\',
  100. 'Translation',
  101. '\\',
  102. 'TranslatableMessage',
  103. '(',
  104. self::MESSAGE_TOKEN,
  105. ],
  106. [
  107. 'new',
  108. '\Symfony\Component\Translation\TranslatableMessage',
  109. '(',
  110. self::MESSAGE_TOKEN,
  111. ],
  112. [
  113. 't',
  114. '(',
  115. self::MESSAGE_TOKEN,
  116. ',',
  117. self::METHOD_ARGUMENTS_TOKEN,
  118. ',',
  119. self::DOMAIN_TOKEN,
  120. ],
  121. [
  122. 't',
  123. '(',
  124. self::MESSAGE_TOKEN,
  125. ],
  126. ];
  127. /**
  128. * @return void
  129. */
  130. public function extract(string|iterable $resource, MessageCatalogue $catalog)
  131. {
  132. $files = $this->extractFiles($resource);
  133. foreach ($files as $file) {
  134. $this->parseTokens(token_get_all(file_get_contents($file)), $catalog, $file);
  135. gc_mem_caches();
  136. }
  137. }
  138. /**
  139. * @return void
  140. */
  141. public function setPrefix(string $prefix)
  142. {
  143. $this->prefix = $prefix;
  144. }
  145. /**
  146. * Normalizes a token.
  147. */
  148. protected function normalizeToken(mixed $token): ?string
  149. {
  150. if (isset($token[1]) && 'b"' !== $token) {
  151. return $token[1];
  152. }
  153. return $token;
  154. }
  155. /**
  156. * Seeks to a non-whitespace token.
  157. */
  158. private function seekToNextRelevantToken(\Iterator $tokenIterator): void
  159. {
  160. for (; $tokenIterator->valid(); $tokenIterator->next()) {
  161. $t = $tokenIterator->current();
  162. if (\T_WHITESPACE !== $t[0]) {
  163. break;
  164. }
  165. }
  166. }
  167. private function skipMethodArgument(\Iterator $tokenIterator): void
  168. {
  169. $openBraces = 0;
  170. for (; $tokenIterator->valid(); $tokenIterator->next()) {
  171. $t = $tokenIterator->current();
  172. if ('[' === $t[0] || '(' === $t[0]) {
  173. ++$openBraces;
  174. }
  175. if (']' === $t[0] || ')' === $t[0]) {
  176. --$openBraces;
  177. }
  178. if ((0 === $openBraces && ',' === $t[0]) || (-1 === $openBraces && ')' === $t[0])) {
  179. break;
  180. }
  181. }
  182. }
  183. /**
  184. * Extracts the message from the iterator while the tokens
  185. * match allowed message tokens.
  186. */
  187. private function getValue(\Iterator $tokenIterator): string
  188. {
  189. $message = '';
  190. $docToken = '';
  191. $docPart = '';
  192. for (; $tokenIterator->valid(); $tokenIterator->next()) {
  193. $t = $tokenIterator->current();
  194. if ('.' === $t) {
  195. // Concatenate with next token
  196. continue;
  197. }
  198. if (!isset($t[1])) {
  199. break;
  200. }
  201. switch ($t[0]) {
  202. case \T_START_HEREDOC:
  203. $docToken = $t[1];
  204. break;
  205. case \T_ENCAPSED_AND_WHITESPACE:
  206. case \T_CONSTANT_ENCAPSED_STRING:
  207. if ('' === $docToken) {
  208. $message .= PhpStringTokenParser::parse($t[1]);
  209. } else {
  210. $docPart = $t[1];
  211. }
  212. break;
  213. case \T_END_HEREDOC:
  214. if ($indentation = strspn($t[1], ' ')) {
  215. $docPartWithLineBreaks = $docPart;
  216. $docPart = '';
  217. foreach (preg_split('~(\r\n|\n|\r)~', $docPartWithLineBreaks, -1, \PREG_SPLIT_DELIM_CAPTURE) as $str) {
  218. if (\in_array($str, ["\r\n", "\n", "\r"], true)) {
  219. $docPart .= $str;
  220. } else {
  221. $docPart .= substr($str, $indentation);
  222. }
  223. }
  224. }
  225. $message .= PhpStringTokenParser::parseDocString($docToken, $docPart);
  226. $docToken = '';
  227. $docPart = '';
  228. break;
  229. case \T_WHITESPACE:
  230. break;
  231. default:
  232. break 2;
  233. }
  234. }
  235. return $message;
  236. }
  237. /**
  238. * Extracts trans message from PHP tokens.
  239. *
  240. * @return void
  241. */
  242. protected function parseTokens(array $tokens, MessageCatalogue $catalog, string $filename)
  243. {
  244. $tokenIterator = new \ArrayIterator($tokens);
  245. for ($key = 0; $key < $tokenIterator->count(); ++$key) {
  246. foreach ($this->sequences as $sequence) {
  247. $message = '';
  248. $domain = 'messages';
  249. $tokenIterator->seek($key);
  250. foreach ($sequence as $sequenceKey => $item) {
  251. $this->seekToNextRelevantToken($tokenIterator);
  252. if ($this->normalizeToken($tokenIterator->current()) === $item) {
  253. $tokenIterator->next();
  254. continue;
  255. } elseif (self::MESSAGE_TOKEN === $item) {
  256. $message = $this->getValue($tokenIterator);
  257. if (\count($sequence) === ($sequenceKey + 1)) {
  258. break;
  259. }
  260. } elseif (self::METHOD_ARGUMENTS_TOKEN === $item) {
  261. $this->skipMethodArgument($tokenIterator);
  262. } elseif (self::DOMAIN_TOKEN === $item) {
  263. $domainToken = $this->getValue($tokenIterator);
  264. if ('' !== $domainToken) {
  265. $domain = $domainToken;
  266. }
  267. break;
  268. } else {
  269. break;
  270. }
  271. }
  272. if ($message) {
  273. $catalog->set($message, $this->prefix.$message, $domain);
  274. $metadata = $catalog->getMetadata($message, $domain) ?? [];
  275. $normalizedFilename = preg_replace('{[\\\\/]+}', '/', $filename);
  276. $metadata['sources'][] = $normalizedFilename.':'.$tokens[$key][2];
  277. $catalog->setMetadata($message, $metadata, $domain);
  278. break;
  279. }
  280. }
  281. }
  282. }
  283. /**
  284. * @throws \InvalidArgumentException
  285. */
  286. protected function canBeExtracted(string $file): bool
  287. {
  288. return $this->isFile($file) && 'php' === pathinfo($file, \PATHINFO_EXTENSION);
  289. }
  290. protected function extractFromDirectory(string|array $directory): iterable
  291. {
  292. if (!class_exists(Finder::class)) {
  293. throw new \LogicException(sprintf('You cannot use "%s" as the "symfony/finder" package is not installed. Try running "composer require symfony/finder".', static::class));
  294. }
  295. $finder = new Finder();
  296. return $finder->files()->name('*.php')->in($directory);
  297. }
  298. }