From 9b89858c26ba0c0c46e9a0eafb46ce9c2df9b321 Mon Sep 17 00:00:00 2001 From: David Grudl Date: Mon, 1 Nov 2021 23:15:10 +0100 Subject: [PATCH] added Strings::ord() --- src/Utils/Strings.php | 18 ++++++++++++++ tests/Utils/Strings.ord().phpt | 44 ++++++++++++++++++++++++++++++++++ 2 files changed, 62 insertions(+) create mode 100644 tests/Utils/Strings.ord().phpt diff --git a/src/Utils/Strings.php b/src/Utils/Strings.php index b3419f084..4c98ed5d4 100644 --- a/src/Utils/Strings.php +++ b/src/Utils/Strings.php @@ -62,6 +62,24 @@ public static function chr(int $code): string } + /** + * Returns a code point of specific character in UTF-8 (number in range 0x0000..D7FF or 0xE000..10FFFF). + */ + public static function ord(string $c): int + { + if (!extension_loaded('iconv')) { + throw new Nette\NotSupportedException(__METHOD__ . '() requires ICONV extension that is not loaded.'); + } + + $tmp = iconv('UTF-8', 'UTF-32BE//IGNORE', $c); + if (!$tmp) { + throw new Nette\InvalidArgumentException('Invalid UTF-8 character "' . ($c === '' ? '' : '\x' . strtoupper(bin2hex($c))) . '".'); + } + + return unpack('N', $tmp)[1]; + } + + /** * Starts the $haystack string with the prefix $needle? */ diff --git a/tests/Utils/Strings.ord().phpt b/tests/Utils/Strings.ord().phpt new file mode 100644 index 000000000..9d5e763e5 --- /dev/null +++ b/tests/Utils/Strings.ord().phpt @@ -0,0 +1,44 @@ + Strings::ord("\u{D800}"), + Nette\InvalidArgumentException::class, + 'Invalid UTF-8 character "\xEDA080".', +); + +Assert::exception( + fn() => Strings::ord(''), + Nette\InvalidArgumentException::class, + 'Invalid UTF-8 character "".', +); + +Assert::exception( + fn() => Strings::ord("\xFF"), + Nette\InvalidArgumentException::class, + 'Invalid UTF-8 character "\xFF".', +);