123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161 |
- <?php declare(strict_types=1);
- namespace PhpParser\Node\Scalar;
- use PhpParser\Error;
- use PhpParser\Node\Scalar;
/**
 * Scalar node holding the decoded value of a string literal.
 *
 * Besides the node itself, this class provides the static helpers that turn
 * a raw string token (quotes and optional b/B prefix included) into the
 * value it denotes, resolving escape sequences along the way.
 */
class String_ extends Scalar {
    /* For use in "kind" attribute */
    public const KIND_SINGLE_QUOTED = 1;
    public const KIND_DOUBLE_QUOTED = 2;
    public const KIND_HEREDOC = 3;
    public const KIND_NOWDOC = 4;

    /** @var string String value */
    public string $value;

    /** @var array<string, string> Escaped character to its decoded value */
    protected static array $replacements = [
        '\\' => '\\',
        '$'  =>  '$',
        'n'  => "\n",
        'r'  => "\r",
        't'  => "\t",
        'f'  => "\f",
        'v'  => "\v",
        'e'  => "\x1B",
    ];

    /**
     * Constructs a string scalar node.
     *
     * @param string $value Value of the string
     * @param array<string, mixed> $attributes Additional attributes
     */
    public function __construct(string $value, array $attributes = []) {
        // $attributes is not declared in this class; presumably inherited from the node base class.
        $this->attributes = $attributes;
        $this->value = $value;
    }

    /**
     * Returns the names of the properties that make up this node's sub nodes.
     *
     * @return string[] Always ['value']
     */
    public function getSubNodeNames(): array {
        return ['value'];
    }

    /**
     * Creates a node from a raw single- or double-quoted string token.
     *
     * The "kind" attribute is set from the quote style (an optional b/B prefix
     * is skipped when detecting it) and the untouched token is stored in the
     * "rawValue" attribute. Both overwrite same-named entries in $attributes.
     *
     * @param string $str String token, including quotes and optional b/B prefix
     * @param array<string, mixed> $attributes Additional attributes
     * @param bool $parseUnicodeEscape Whether to parse PHP 7 \u escapes
     */
    public static function fromString(string $str, array $attributes = [], bool $parseUnicodeEscape = true): self {
        $isSingleQuoted = $str[0] === "'"
            || ($str[1] === "'" && ($str[0] === 'b' || $str[0] === 'B'));

        $attributes['kind'] = $isSingleQuoted
            ? self::KIND_SINGLE_QUOTED
            : self::KIND_DOUBLE_QUOTED;
        $attributes['rawValue'] = $str;

        return new self(self::parse($str, $parseUnicodeEscape), $attributes);
    }

    /**
     * @internal
     *
     * Parses a string token.
     *
     * Single-quoted tokens only have \\ and \' unescaped; anything else is
     * treated as double-quoted and run through parseEscapeSequences().
     *
     * @param string $str String token content
     * @param bool $parseUnicodeEscape Whether to parse PHP 7 \u escapes
     *
     * @return string The parsed string
     */
    public static function parse(string $str, bool $parseUnicodeEscape = true): string {
        // Length of the optional binary-string prefix (b or B) in front of the opening quote.
        $bLength = ('b' === $str[0] || 'B' === $str[0]) ? 1 : 0;

        // Strip the prefix, the opening quote and the closing quote.
        $contents = substr($str, $bLength + 1, -1);

        if ('\'' === $str[$bLength]) {
            return str_replace(
                ['\\\\', '\\\''],
                ['\\', '\''],
                $contents
            );
        }

        return self::parseEscapeSequences($contents, '"', $parseUnicodeEscape);
    }

    /**
     * @internal
     *
     * Parses escape sequences in strings (all string types apart from single quoted).
     *
     * @param string $str String without quotes
     * @param null|string $quote Quote type; when given, its backslash-escaped form is unescaped first
     * @param bool $parseUnicodeEscape Whether to parse PHP 7 \u escapes
     *
     * @return string String with escape sequences parsed
     *
     * @throws Error If a \u{...} escape denotes a code point above U+10FFFF
     */
    public static function parseEscapeSequences(string $str, ?string $quote, bool $parseUnicodeEscape = true): string {
        if (null !== $quote) {
            $str = str_replace('\\' . $quote, $quote, $str);
        }

        $extra = '';
        if ($parseUnicodeEscape) {
            $extra = '|u\{([0-9a-fA-F]+)\}';
        }

        return preg_replace_callback(
            '~\\\\([\\\\$nrtfve]|[xX][0-9a-fA-F]{1,2}|[0-7]{1,3}' . $extra . ')~',
            static function (array $matches): string {
                // Everything after the backslash.
                $str = $matches[1];

                if (isset(self::$replacements[$str])) {
                    return self::$replacements[$str];
                }
                if ('x' === $str[0] || 'X' === $str[0]) {
                    return chr(hexdec(substr($str, 1)));
                }
                if ('u' === $str[0]) {
                    $dec = hexdec($matches[2]);
                    // If it overflowed to float, treat as INT_MAX, it will throw an error anyway.
                    return self::codePointToUtf8(\is_int($dec) ? $dec : \PHP_INT_MAX);
                }

                // Octal escape. Up to three digits can encode values as large as 0777 (511);
                // PHP lets these overflow to a single byte ("\400" === "\000"), so mask
                // explicitly instead of handing chr() an out-of-range integer.
                return chr(octdec($str) & 255);
            },
            $str
        );
    }

    /**
     * Converts a Unicode code point to its UTF-8 encoded representation.
     *
     * @param int $num Code point
     *
     * @return string UTF-8 representation of code point
     *
     * @throws Error If the code point is larger than U+10FFFF
     */
    private static function codePointToUtf8(int $num): string {
        if ($num <= 0x7F) {
            return chr($num);
        }
        if ($num <= 0x7FF) {
            return chr(($num >> 6) + 0xC0) . chr(($num & 0x3F) + 0x80);
        }
        if ($num <= 0xFFFF) {
            return chr(($num >> 12) + 0xE0) . chr((($num >> 6) & 0x3F) + 0x80) . chr(($num & 0x3F) + 0x80);
        }
        // U+10FFFF is the last valid Unicode code point; PHP itself rejects anything
        // larger in a \u{...} escape, and encoding it would yield invalid UTF-8.
        if ($num <= 0x10FFFF) {
            return chr(($num >> 18) + 0xF0) . chr((($num >> 12) & 0x3F) + 0x80)
                 . chr((($num >> 6) & 0x3F) + 0x80) . chr(($num & 0x3F) + 0x80);
        }
        throw new Error('Invalid UTF-8 codepoint escape sequence: Codepoint too large');
    }

    /**
     * Returns the type identifier of this node.
     *
     * @return string Always 'Scalar_String'
     */
    public function getType(): string {
        return 'Scalar_String';
    }
}
|