123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108 |
- <?php
- /*
- * This file is part of the Symfony package.
- *
- * (c) Fabien Potencier <fabien@symfony.com>
- *
- * For the full copyright and license information, please view the LICENSE
- * file that was distributed with this source code.
- */
- namespace Symfony\Component\Yaml;
- use Symfony\Component\Yaml\Exception\ParseException;
/**
 * Unescaper encapsulates unescaping rules for single and double-quoted
 * YAML strings.
 *
 * @author Matthew Lewinski <matthew@lewinski.org>
 *
 * @internal
 */
class Unescaper
{
    /**
     * Regex fragment that matches an escaped character in a double quoted string.
     *
     * It matches a backslash followed by either a complete hexadecimal escape
     * (xHH, uHHHH or UHHHHHHHH) or, failing that, any single character matched
     * by ".". A hexadecimal introducer without enough digits is therefore
     * matched as a bare two-character sequence such as "\x".
     */
    public const REGEX_ESCAPED_CHARACTER = '\\\\(x[0-9a-fA-F]{2}|u[0-9a-fA-F]{4}|U[0-9a-fA-F]{8}|.)';

    /**
     * Unescapes a single quoted string.
     *
     * The only escape in a single quoted string is a doubled single quote,
     * which is collapsed into one single quote.
     *
     * @param string $value A single quoted string
     */
    public function unescapeSingleQuotedString(string $value): string
    {
        return str_replace('\'\'', '\'', $value);
    }

    /**
     * Unescapes a double quoted string.
     *
     * Every sequence matched by REGEX_ESCAPED_CHARACTER is replaced by the
     * character it denotes.
     *
     * @param string $value A double quoted string
     *
     * @throws ParseException When an escape sequence is unknown or malformed,
     *                        or when the PCRE engine fails on the input
     */
    public function unescapeDoubleQuotedString(string $value): string
    {
        $callback = fn (array $match): string => $this->unescapeCharacter($match[0]);

        $unescaped = preg_replace_callback('/'.self::REGEX_ESCAPED_CHARACTER.'/u', $callback, $value);

        // preg_replace_callback() yields null on failure (e.g. malformed UTF-8
        // with the "u" modifier); report it as a parse error instead of
        // letting the null violate the declared return type.
        if (null === $unescaped) {
            throw new ParseException(sprintf('Unable to unescape the double quoted string: %s.', preg_last_error_msg()));
        }

        return $unescaped;
    }

    /**
     * Unescapes a character that was found in a double-quoted string.
     *
     * @param string $value An escaped character, including the leading backslash
     *
     * @throws ParseException When the escape character is unknown or a
     *                        hexadecimal escape lacks its digits
     */
    private function unescapeCharacter(string $value): string
    {
        return match ($value[1]) {
            '0' => "\x0",
            'a' => "\x7",
            'b' => "\x8",
            't' => "\t",
            "\t" => "\t",
            'n' => "\n",
            'v' => "\xB",
            'f' => "\xC",
            'r' => "\r",
            'e' => "\x1B",
            ' ' => ' ',
            '"' => '"',
            '/' => '/',
            '\\' => '\\',
            // U+0085 NEXT LINE
            'N' => "\xC2\x85",
            // U+00A0 NO-BREAK SPACE
            '_' => "\xC2\xA0",
            // U+2028 LINE SEPARATOR
            'L' => "\xE2\x80\xA8",
            // U+2029 PARAGRAPH SEPARATOR
            'P' => "\xE2\x80\xA9",
            'x' => self::unescapeHexSequence($value, 2),
            'u' => self::unescapeHexSequence($value, 4),
            'U' => self::unescapeHexSequence($value, 8),
            default => throw new ParseException(sprintf('Found unknown escape character "%s".', $value)),
        };
    }

    /**
     * Decodes a "\x", "\u" or "\U" escape into the UTF-8 character it denotes.
     *
     * @param string $value  The escape sequence, including the backslash and the introducer
     * @param int    $digits The exact number of hexadecimal digits the introducer requires
     *
     * @throws ParseException When the sequence does not carry exactly $digits hexadecimal digits
     */
    private static function unescapeHexSequence(string $value, int $digits): string
    {
        $hex = substr($value, 2);

        // When the introducer is not followed by enough hexadecimal digits the
        // regex only captures the introducer itself, leaving $hex empty;
        // hexdec('') is 0, which would silently decode to a NUL byte.
        if (\strlen($hex) !== $digits || !ctype_xdigit($hex)) {
            throw new ParseException(sprintf('Found invalid hexadecimal escape sequence "%s".', $value));
        }

        return self::utf8chr(hexdec($hex));
    }

    /**
     * Get the UTF-8 character for the given code point.
     *
     * The code point is first reduced modulo 0x200000, so larger values wrap
     * around instead of being rejected. No check is made for surrogates or for
     * values above U+10FFFF.
     */
    private static function utf8chr(int $c): string
    {
        $c %= 0x200000;

        // 1 byte: 0xxxxxxx
        if ($c < 0x80) {
            return \chr($c);
        }

        // 2 bytes: 110xxxxx 10xxxxxx
        if ($c < 0x800) {
            return \chr(0xC0 | ($c >> 6))
                .\chr(0x80 | ($c & 0x3F));
        }

        // 3 bytes: 1110xxxx 10xxxxxx 10xxxxxx
        if ($c < 0x10000) {
            return \chr(0xE0 | ($c >> 12))
                .\chr(0x80 | (($c >> 6) & 0x3F))
                .\chr(0x80 | ($c & 0x3F));
        }

        // 4 bytes: 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
        return \chr(0xF0 | ($c >> 18))
            .\chr(0x80 | (($c >> 12) & 0x3F))
            .\chr(0x80 | (($c >> 6) & 0x3F))
            .\chr(0x80 | ($c & 0x3F));
    }
}
|