2004-02-09 01:57:02 -05:00
|
|
|
|
<?php
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2009-12-08 14:59:34 -05:00
|
|
|
|
* Main WordPress Formatting API.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Handles many functions for formatting output.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @package WordPress
|
2013-02-01 13:07:08 -05:00
|
|
|
|
*/
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2019-10-25 20:58:04 -04:00
|
|
|
|
* Replaces common plain text characters with formatted entities.
|
|
|
|
|
*
|
|
|
|
|
* Returns given text with transformations of quotes into smart quotes, apostrophes,
|
|
|
|
|
* dashes, ellipses, the trademark symbol, and the multiplication symbol.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* As an example,
|
2014-11-24 00:30:25 -05:00
|
|
|
|
*
|
|
|
|
|
* 'cause today's effort makes it worth tomorrow's "holiday" ...
|
|
|
|
|
*
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* Becomes:
|
2014-11-24 00:30:25 -05:00
|
|
|
|
*
|
|
|
|
|
* ’cause today’s effort makes it worth tomorrow’s “holiday” …
|
|
|
|
|
*
|
2019-10-25 20:58:04 -04:00
|
|
|
|
* Code within certain HTML blocks are skipped.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* Do not use this function before the {@see 'init'} action hook; everything will break.
|
2015-06-15 20:57:24 -04:00
|
|
|
|
*
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @since 0.71
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2019-10-25 20:58:04 -04:00
|
|
|
|
* @global array $wp_cockneyreplace Array of formatted entities for certain common phrases.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global array $shortcode_tags
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-10-25 20:58:04 -04:00
|
|
|
|
* @param string $text The text to be formatted.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param bool $reset Set to true for unit testing. Translated patterns will reset.
|
2019-10-25 20:58:04 -04:00
|
|
|
|
* @return string The string replaced with HTML entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function wptexturize( $text, $reset = false ) {
|
2014-11-20 09:28:23 -05:00
|
|
|
|
global $wp_cockneyreplace, $shortcode_tags;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
static $static_characters = null,
|
|
|
|
|
$static_replacements = null,
|
|
|
|
|
$dynamic_characters = null,
|
|
|
|
|
$dynamic_replacements = null,
|
|
|
|
|
$default_no_texturize_tags = null,
|
2015-05-29 11:43:29 -04:00
|
|
|
|
$default_no_texturize_shortcodes = null,
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$run_texturize = true,
|
|
|
|
|
$apos = null,
|
|
|
|
|
$prime = null,
|
|
|
|
|
$double_prime = null,
|
|
|
|
|
$opening_quote = null,
|
|
|
|
|
$closing_quote = null,
|
|
|
|
|
$opening_single_quote = null,
|
|
|
|
|
$closing_single_quote = null,
|
|
|
|
|
$open_q_flag = '<!--oq-->',
|
|
|
|
|
$open_sq_flag = '<!--osq-->',
|
|
|
|
|
$apos_flag = '<!--apos-->';
|
2014-06-09 21:46:14 -04:00
|
|
|
|
|
2014-06-17 13:57:14 -04:00
|
|
|
|
// If there's nothing to do, just stop.
|
|
|
|
|
if ( empty( $text ) || false === $run_texturize ) {
|
2014-06-09 21:46:14 -04:00
|
|
|
|
return $text;
|
|
|
|
|
}
|
2010-01-15 17:11:12 -05:00
|
|
|
|
|
2014-06-17 13:57:14 -04:00
|
|
|
|
// Set up static variables. Run once only.
|
|
|
|
|
if ( $reset || ! isset( $static_characters ) ) {
|
2014-06-10 02:29:14 -04:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters whether to skip running wptexturize().
|
2014-06-10 02:29:14 -04:00
|
|
|
|
*
|
2020-06-26 14:49:09 -04:00
|
|
|
|
* Returning false from the filter will effectively short-circuit wptexturize()
|
|
|
|
|
* and return the original text passed to the function instead.
|
2014-06-10 02:29:14 -04:00
|
|
|
|
*
|
2014-07-13 21:02:15 -04:00
|
|
|
|
* The filter runs only once, the first time wptexturize() is called.
|
2014-06-10 02:29:14 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.0.0
|
|
|
|
|
*
|
2014-07-13 21:02:15 -04:00
|
|
|
|
* @see wptexturize()
|
|
|
|
|
*
|
|
|
|
|
* @param bool $run_texturize Whether to short-circuit wptexturize().
|
2014-06-10 02:29:14 -04:00
|
|
|
|
*/
|
2014-06-09 21:46:14 -04:00
|
|
|
|
$run_texturize = apply_filters( 'run_wptexturize', $run_texturize );
|
|
|
|
|
if ( false === $run_texturize ) {
|
|
|
|
|
return $text;
|
|
|
|
|
}
|
|
|
|
|
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Opening curly double quote. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$opening_quote = _x( '“', 'opening curly double quote' );
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Closing curly double quote. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$closing_quote = _x( '”', 'closing curly double quote' );
|
|
|
|
|
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Apostrophe, for example in 'cause or can't. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$apos = _x( '’', 'apostrophe' );
|
|
|
|
|
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Prime, for example in 9' (nine feet). */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$prime = _x( '′', 'prime' );
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Double prime, for example in 9" (nine inches). */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$double_prime = _x( '″', 'double prime' );
|
|
|
|
|
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Opening curly single quote. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$opening_single_quote = _x( '‘', 'opening curly single quote' );
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Closing curly single quote. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$closing_single_quote = _x( '’', 'closing curly single quote' );
|
|
|
|
|
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: En dash. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$en_dash = _x( '–', 'en dash' );
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Em dash. */
|
2012-01-31 09:06:32 -05:00
|
|
|
|
$em_dash = _x( '—', 'em dash' );
|
2009-09-14 10:03:32 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$default_no_texturize_tags = array( 'pre', 'code', 'kbd', 'style', 'script', 'tt' );
|
|
|
|
|
$default_no_texturize_shortcodes = array( 'code' );
|
2009-09-14 10:03:32 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If a plugin has provided an autocorrect array, use it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( isset( $wp_cockneyreplace ) ) {
|
|
|
|
|
$cockney = array_keys( $wp_cockneyreplace );
|
2015-01-20 13:44:26 -05:00
|
|
|
|
$cockneyreplace = array_values( $wp_cockneyreplace );
|
2009-10-21 17:57:27 -04:00
|
|
|
|
} else {
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/*
|
|
|
|
|
* translators: This is a comma-separated list of words that defy the syntax of quotations in normal use,
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* for example... 'We do not have enough words yet'... is a typical quoted phrase. But when we write
|
2015-06-15 20:46:24 -04:00
|
|
|
|
* lines of code 'til we have enough of 'em, then we need to insert apostrophes instead of quotes.
|
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$cockney = explode(
|
2018-08-16 21:51:36 -04:00
|
|
|
|
',',
|
|
|
|
|
_x(
|
2017-11-30 18:11:00 -05:00
|
|
|
|
"'tain't,'twere,'twas,'tis,'twill,'til,'bout,'nuff,'round,'cause,'em",
|
|
|
|
|
'Comma-separated list of words to texturize in your language'
|
|
|
|
|
)
|
|
|
|
|
);
|
2015-06-15 20:46:24 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$cockneyreplace = explode(
|
2018-08-16 21:51:36 -04:00
|
|
|
|
',',
|
|
|
|
|
_x(
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'’tain’t,’twere,’twas,’tis,’twill,’til,’bout,’nuff,’round,’cause,’em',
|
|
|
|
|
'Comma-separated list of replacement words in your language'
|
|
|
|
|
)
|
|
|
|
|
);
|
2012-01-31 09:06:32 -05:00
|
|
|
|
}
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$static_characters = array_merge( array( '...', '``', '\'\'', ' (tm)' ), $cockney );
|
2014-06-10 10:22:15 -04:00
|
|
|
|
$static_replacements = array_merge( array( '…', $opening_quote, $closing_quote, ' ™' ), $cockneyreplace );
|
2012-01-31 09:06:32 -05:00
|
|
|
|
|
2014-03-29 03:16:16 -04:00
|
|
|
|
// Pattern-based replacements of characters.
|
2014-07-03 21:15:15 -04:00
|
|
|
|
// Sort the remaining patterns into several arrays for performance tuning.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic_characters = array(
|
|
|
|
|
'apos' => array(),
|
|
|
|
|
'quote' => array(),
|
|
|
|
|
'dash' => array(),
|
|
|
|
|
);
|
|
|
|
|
$dynamic_replacements = array(
|
|
|
|
|
'apos' => array(),
|
|
|
|
|
'quote' => array(),
|
|
|
|
|
'dash' => array(),
|
|
|
|
|
);
|
|
|
|
|
$dynamic = array();
|
|
|
|
|
$spaces = wp_spaces_regexp();
|
2014-03-29 03:16:16 -04:00
|
|
|
|
|
2014-06-17 16:14:15 -04:00
|
|
|
|
// '99' and '99" are ambiguous among other patterns; assume it's an abbreviated year at the end of a quotation.
|
|
|
|
|
if ( "'" !== $apos || "'" !== $closing_single_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/\'(\d\d)\'(?=\Z|[.,:;!?)}\-\]]|>|' . $spaces . ')/' ] = $apos_flag . '$1' . $closing_single_quote;
|
2014-06-17 13:41:15 -04:00
|
|
|
|
}
|
2014-06-17 16:14:15 -04:00
|
|
|
|
if ( "'" !== $apos || '"' !== $closing_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/\'(\d\d)"(?=\Z|[.,:;!?)}\-\]]|>|' . $spaces . ')/' ] = $apos_flag . '$1' . $closing_quote;
|
2014-06-17 16:14:15 -04:00
|
|
|
|
}
|
|
|
|
|
|
2014-06-17 16:19:14 -04:00
|
|
|
|
// '99 '99s '99's (apostrophe) But never '9 or '99% or '999 or '99.0.
|
2014-06-17 13:41:15 -04:00
|
|
|
|
if ( "'" !== $apos ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic['/\'(?=\d\d(?:\Z|(?![%\d]|[.,]\d)))/'] = $apos_flag;
|
2014-06-17 13:41:15 -04:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Quoted numbers like '0.42'.
|
2014-06-09 22:43:14 -04:00
|
|
|
|
if ( "'" !== $opening_single_quote && "'" !== $closing_single_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/(?<=\A|' . $spaces . ')\'(\d[.,\d]*)\'/' ] = $open_sq_flag . '$1' . $closing_single_quote;
|
2014-06-09 22:43:14 -04:00
|
|
|
|
}
|
|
|
|
|
|
2014-06-10 10:22:15 -04:00
|
|
|
|
// Single quote at start, or preceded by (, {, <, [, ", -, or spaces.
|
2014-03-29 05:00:15 -04:00
|
|
|
|
if ( "'" !== $opening_single_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/(?<=\A|[([{"\-]|<|' . $spaces . ')\'/' ] = $open_sq_flag;
|
2014-03-29 05:00:15 -04:00
|
|
|
|
}
|
2014-03-29 03:16:16 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Apostrophe in a word. No spaces, double apostrophes, or other punctuation.
|
2014-06-17 16:14:15 -04:00
|
|
|
|
if ( "'" !== $apos ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/(?<!' . $spaces . ')\'(?!\Z|[.,:;!?"\'(){}[\]\-]|&[lg]t;|' . $spaces . ')/' ] = $apos_flag;
|
2014-07-03 21:15:15 -04:00
|
|
|
|
}
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic_characters['apos'] = array_keys( $dynamic );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
$dynamic_replacements['apos'] = array_values( $dynamic );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic = array();
|
2014-09-04 11:23:16 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Quoted numbers like "42".
|
2014-07-03 21:15:15 -04:00
|
|
|
|
if ( '"' !== $opening_quote && '"' !== $closing_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/(?<=\A|' . $spaces . ')"(\d[.,\d]*)"/' ] = $open_q_flag . '$1' . $closing_quote;
|
2014-07-03 21:15:15 -04:00
|
|
|
|
}
|
|
|
|
|
|
2014-06-10 10:22:15 -04:00
|
|
|
|
// Double quote at start, or preceded by (, {, <, [, -, or spaces, and not followed by spaces.
|
2014-03-29 05:00:15 -04:00
|
|
|
|
if ( '"' !== $opening_quote ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$dynamic[ '/(?<=\A|[([{\-]|<|' . $spaces . ')"(?!' . $spaces . ')/' ] = $open_q_flag;
|
2014-03-29 05:00:15 -04:00
|
|
|
|
}
|
2014-09-04 11:23:16 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic_characters['quote'] = array_keys( $dynamic );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
$dynamic_replacements['quote'] = array_values( $dynamic );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic = array();
|
2014-09-04 11:23:16 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Dashes and spaces.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic['/---/'] = $em_dash;
|
2015-01-15 22:54:24 -05:00
|
|
|
|
$dynamic[ '/(?<=^|' . $spaces . ')--(?=$|' . $spaces . ')/' ] = $em_dash;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic['/(?<!xn)--/'] = $en_dash;
|
|
|
|
|
$dynamic[ '/(?<=^|' . $spaces . ')-(?=$|' . $spaces . ')/' ] = $en_dash;
|
2014-06-09 22:09:15 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dynamic_characters['dash'] = array_keys( $dynamic );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
$dynamic_replacements['dash'] = array_values( $dynamic );
|
2006-11-21 17:00:10 -05:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Must do this every time in case plugins use these filters in a context sensitive manner.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the list of HTML elements not to texturize.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string[] $default_no_texturize_tags An array of HTML element names.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2014-06-25 13:49:14 -04:00
|
|
|
|
$no_texturize_tags = apply_filters( 'no_texturize_tags', $default_no_texturize_tags );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the list of shortcodes not to texturize.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string[] $default_no_texturize_shortcodes An array of shortcode names.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2014-06-25 13:49:14 -04:00
|
|
|
|
$no_texturize_shortcodes = apply_filters( 'no_texturize_shortcodes', $default_no_texturize_shortcodes );
|
2009-04-20 14:18:39 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$no_texturize_tags_stack = array();
|
2009-10-21 17:57:27 -04:00
|
|
|
|
$no_texturize_shortcodes_stack = array();
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2014-06-10 10:34:13 -04:00
|
|
|
|
// Look for shortcodes and HTML elements.
|
|
|
|
|
|
2015-12-25 23:46:28 -05:00
|
|
|
|
preg_match_all( '@\[/?([^<>&/\[\]\x00-\x20=]++)@', $text, $matches );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tagnames = array_intersect( array_keys( $shortcode_tags ), $matches[1] );
|
2015-10-01 14:05:25 -04:00
|
|
|
|
$found_shortcodes = ! empty( $tagnames );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$shortcode_regex = $found_shortcodes ? _get_wptexturize_shortcode_regex( $tagnames ) : '';
|
|
|
|
|
$regex = _get_wptexturize_split_regex( $shortcode_regex );
|
2014-06-10 10:34:13 -04:00
|
|
|
|
|
|
|
|
|
$textarr = preg_split( $regex, $text, -1, PREG_SPLIT_DELIM_CAPTURE | PREG_SPLIT_NO_EMPTY );
|
2011-04-13 13:11:35 -04:00
|
|
|
|
|
|
|
|
|
foreach ( $textarr as &$curl ) {
|
2014-08-12 23:56:17 -04:00
|
|
|
|
// Only call _wptexturize_pushpop_element if $curl is a delimiter.
|
2011-04-13 13:11:35 -04:00
|
|
|
|
$first = $curl[0];
|
2015-10-01 14:05:25 -04:00
|
|
|
|
if ( '<' === $first ) {
|
|
|
|
|
if ( '<!--' === substr( $curl, 0, 4 ) ) {
|
2015-10-02 00:26:25 -04:00
|
|
|
|
// This is an HTML comment delimiter.
|
2015-10-01 14:05:25 -04:00
|
|
|
|
continue;
|
|
|
|
|
} else {
|
|
|
|
|
// This is an HTML element delimiter.
|
2015-12-20 21:43:26 -05:00
|
|
|
|
|
|
|
|
|
// Replace each & with & unless it already looks like an entity.
|
|
|
|
|
$curl = preg_replace( '/&(?!#(?:\d+|x[a-f0-9]+);|[a-z1-4]{1,8};)/i', '&', $curl );
|
|
|
|
|
|
2015-10-01 14:05:25 -04:00
|
|
|
|
_wptexturize_pushpop_element( $curl, $no_texturize_tags_stack, $no_texturize_tags );
|
|
|
|
|
}
|
2014-07-06 04:50:18 -04:00
|
|
|
|
} elseif ( '' === trim( $curl ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// This is a newline between delimiters. Performance improves when we check this.
|
2014-07-06 04:50:18 -04:00
|
|
|
|
continue;
|
|
|
|
|
|
2015-10-01 14:05:25 -04:00
|
|
|
|
} elseif ( '[' === $first && $found_shortcodes && 1 === preg_match( '/^' . $shortcode_regex . '$/', $curl ) ) {
|
2014-08-12 23:56:17 -04:00
|
|
|
|
// This is a shortcode delimiter.
|
2014-06-10 10:34:13 -04:00
|
|
|
|
|
2014-09-17 11:14:17 -04:00
|
|
|
|
if ( '[[' !== substr( $curl, 0, 2 ) && ']]' !== substr( $curl, -2 ) ) {
|
|
|
|
|
// Looks like a normal shortcode.
|
|
|
|
|
_wptexturize_pushpop_element( $curl, $no_texturize_shortcodes_stack, $no_texturize_shortcodes );
|
|
|
|
|
} else {
|
|
|
|
|
// Looks like an escaped shortcode.
|
|
|
|
|
continue;
|
|
|
|
|
}
|
2014-06-25 13:49:14 -04:00
|
|
|
|
} elseif ( empty( $no_texturize_shortcodes_stack ) && empty( $no_texturize_tags_stack ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// This is neither a delimiter, nor is this content inside of no_texturize pairs. Do texturize.
|
2014-03-29 03:16:16 -04:00
|
|
|
|
|
2014-06-25 13:49:14 -04:00
|
|
|
|
$curl = str_replace( $static_characters, $static_replacements, $curl );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
|
|
|
|
|
if ( false !== strpos( $curl, "'" ) ) {
|
|
|
|
|
$curl = preg_replace( $dynamic_characters['apos'], $dynamic_replacements['apos'], $curl );
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$curl = wptexturize_primes( $curl, "'", $prime, $open_sq_flag, $closing_single_quote );
|
|
|
|
|
$curl = str_replace( $apos_flag, $apos, $curl );
|
|
|
|
|
$curl = str_replace( $open_sq_flag, $opening_single_quote, $curl );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
}
|
|
|
|
|
if ( false !== strpos( $curl, '"' ) ) {
|
|
|
|
|
$curl = preg_replace( $dynamic_characters['quote'], $dynamic_replacements['quote'], $curl );
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$curl = wptexturize_primes( $curl, '"', $double_prime, $open_q_flag, $closing_quote );
|
|
|
|
|
$curl = str_replace( $open_q_flag, $opening_quote, $curl );
|
2014-07-03 21:15:15 -04:00
|
|
|
|
}
|
|
|
|
|
if ( false !== strpos( $curl, '-' ) ) {
|
|
|
|
|
$curl = preg_replace( $dynamic_characters['dash'], $dynamic_replacements['dash'], $curl );
|
|
|
|
|
}
|
2014-03-29 03:16:16 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// 9x9 (times), but never 0x9999.
|
2014-12-06 16:24:23 -05:00
|
|
|
|
if ( 1 === preg_match( '/(?<=\d)x\d/', $curl ) ) {
|
2014-03-29 03:16:16 -04:00
|
|
|
|
// Searching for a digit is 10 times more expensive than for the x, so we avoid doing this one!
|
2014-12-06 16:24:23 -05:00
|
|
|
|
$curl = preg_replace( '/\b(\d(?(?<=0)[\d\.,]+|[\d\.,]*))x(\d[\d\.,]*)\b/', '$1×$2', $curl );
|
2014-03-29 03:16:16 -04:00
|
|
|
|
}
|
2015-11-19 18:31:26 -05:00
|
|
|
|
|
|
|
|
|
// Replace each & with & unless it already looks like an entity.
|
|
|
|
|
$curl = preg_replace( '/&(?!#(?:\d+|x[a-f0-9]+);|[a-z1-4]{1,8};)/i', '&', $curl );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
2014-06-25 13:49:14 -04:00
|
|
|
|
|
2015-11-19 18:31:26 -05:00
|
|
|
|
return implode( '', $textarr );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2015-06-19 16:06:25 -04:00
|
|
|
|
/**
|
|
|
|
|
* Implements a logic tree to determine whether or not "7'." represents seven feet,
|
|
|
|
|
* then converts the special char into either a prime char or a closing quote char.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.3.0
|
|
|
|
|
*
|
2015-07-13 17:30:24 -04:00
|
|
|
|
* @param string $haystack The plain text to be searched.
|
|
|
|
|
* @param string $needle The character to search for such as ' or ".
|
|
|
|
|
* @param string $prime The prime char to use for replacement.
|
|
|
|
|
* @param string $open_quote The opening quote char. Opening quote replacement must be
|
|
|
|
|
* accomplished already.
|
2015-06-19 16:06:25 -04:00
|
|
|
|
* @param string $close_quote The closing quote char to use for replacement.
|
|
|
|
|
* @return string The $haystack value after primes and quotes replacements.
|
|
|
|
|
*/
|
|
|
|
|
function wptexturize_primes( $haystack, $needle, $prime, $open_quote, $close_quote ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$spaces = wp_spaces_regexp();
|
|
|
|
|
$flag = '<!--wp-prime-or-quote-->';
|
|
|
|
|
$quote_pattern = "/$needle(?=\\Z|[.,:;!?)}\\-\\]]|>|" . $spaces . ')/';
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$prime_pattern = "/(?<=\\d)$needle/";
|
|
|
|
|
$flag_after_digit = "/(?<=\\d)$flag/";
|
|
|
|
|
$flag_no_digit = "/(?<!\\d)$flag/";
|
|
|
|
|
|
|
|
|
|
$sentences = explode( $open_quote, $haystack );
|
|
|
|
|
|
2015-08-25 16:28:22 -04:00
|
|
|
|
foreach ( $sentences as $key => &$sentence ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
if ( false === strpos( $sentence, $needle ) ) {
|
|
|
|
|
continue;
|
|
|
|
|
} elseif ( 0 !== $key && 0 === substr_count( $sentence, $close_quote ) ) {
|
|
|
|
|
$sentence = preg_replace( $quote_pattern, $flag, $sentence, -1, $count );
|
|
|
|
|
if ( $count > 1 ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// This sentence appears to have multiple closing quotes. Attempt Vulcan logic.
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$sentence = preg_replace( $flag_no_digit, $close_quote, $sentence, -1, $count2 );
|
|
|
|
|
if ( 0 === $count2 ) {
|
|
|
|
|
// Try looking for a quote followed by a period.
|
|
|
|
|
$count2 = substr_count( $sentence, "$flag." );
|
|
|
|
|
if ( $count2 > 0 ) {
|
|
|
|
|
// Assume the rightmost quote-period match is the end of quotation.
|
|
|
|
|
$pos = strrpos( $sentence, "$flag." );
|
|
|
|
|
} else {
|
|
|
|
|
// When all else fails, make the rightmost candidate a closing quote.
|
|
|
|
|
// This is most likely to be problematic in the context of bug #18549.
|
|
|
|
|
$pos = strrpos( $sentence, $flag );
|
|
|
|
|
}
|
|
|
|
|
$sentence = substr_replace( $sentence, $close_quote, $pos, strlen( $flag ) );
|
|
|
|
|
}
|
|
|
|
|
// Use conventional replacement on any remaining primes and quotes.
|
|
|
|
|
$sentence = preg_replace( $prime_pattern, $prime, $sentence );
|
|
|
|
|
$sentence = preg_replace( $flag_after_digit, $prime, $sentence );
|
|
|
|
|
$sentence = str_replace( $flag, $close_quote, $sentence );
|
|
|
|
|
} elseif ( 1 == $count ) {
|
|
|
|
|
// Found only one closing quote candidate, so give it priority over primes.
|
|
|
|
|
$sentence = str_replace( $flag, $close_quote, $sentence );
|
|
|
|
|
$sentence = preg_replace( $prime_pattern, $prime, $sentence );
|
|
|
|
|
} else {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// No closing quotes found. Just run primes pattern.
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$sentence = preg_replace( $prime_pattern, $prime, $sentence );
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
$sentence = preg_replace( $prime_pattern, $prime, $sentence );
|
|
|
|
|
$sentence = preg_replace( $quote_pattern, $close_quote, $sentence );
|
|
|
|
|
}
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '"' === $needle && false !== strpos( $sentence, '"' ) ) {
|
2015-06-19 16:06:25 -04:00
|
|
|
|
$sentence = str_replace( '"', $close_quote, $sentence );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return implode( $open_quote, $sentences );
|
|
|
|
|
}
|
|
|
|
|
|
2009-10-21 17:57:27 -04:00
|
|
|
|
/**
|
|
|
|
|
* Search for disabled element tags. Push element to stack on tag open and pop
|
2014-06-25 13:49:14 -04:00
|
|
|
|
* on tag close.
|
|
|
|
|
*
|
|
|
|
|
* Assumes first char of $text is tag opening and last char is tag closing.
|
|
|
|
|
* Assumes second char of $text is optionally '/' to indicate closing as in </html>.
|
2009-10-21 17:57:27 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* @access private
|
2009-10-21 17:57:27 -04:00
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $text Text to check. Must be a tag like `<html>` or `[shortcode]`.
|
|
|
|
|
* @param string[] $stack Array of open tag elements.
|
|
|
|
|
* @param string[] $disabled_elements Array of tag names to match against. Spaces are not allowed in tag names.
|
2009-10-21 17:57:27 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function _wptexturize_pushpop_element( $text, &$stack, $disabled_elements ) {
|
2014-06-25 13:49:14 -04:00
|
|
|
|
// Is it an opening tag or closing tag?
|
2016-02-18 15:31:27 -05:00
|
|
|
|
if ( isset( $text[1] ) && '/' !== $text[1] ) {
|
2014-06-25 13:49:14 -04:00
|
|
|
|
$opening_tag = true;
|
|
|
|
|
$name_offset = 1;
|
2020-05-23 07:38:08 -04:00
|
|
|
|
} elseif ( 0 === count( $stack ) ) {
|
2014-06-25 13:49:14 -04:00
|
|
|
|
// Stack is empty. Just stop.
|
|
|
|
|
return;
|
|
|
|
|
} else {
|
|
|
|
|
$opening_tag = false;
|
|
|
|
|
$name_offset = 2;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Parse out the tag name.
|
|
|
|
|
$space = strpos( $text, ' ' );
|
2014-09-17 11:14:17 -04:00
|
|
|
|
if ( false === $space ) {
|
2014-06-25 13:49:14 -04:00
|
|
|
|
$space = -1;
|
|
|
|
|
} else {
|
|
|
|
|
$space -= $name_offset;
|
|
|
|
|
}
|
|
|
|
|
$tag = substr( $text, $name_offset, $space );
|
|
|
|
|
|
|
|
|
|
// Handle disabled tags.
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( in_array( $tag, $disabled_elements, true ) ) {
|
2014-06-25 13:49:14 -04:00
|
|
|
|
if ( $opening_tag ) {
|
2009-10-21 17:57:27 -04:00
|
|
|
|
/*
|
|
|
|
|
* This disables texturize until we find a closing tag of our type
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* (e.g. <pre>) even if there was invalid nesting before that.
|
2010-01-15 17:11:12 -05:00
|
|
|
|
*
|
2009-10-21 17:57:27 -04:00
|
|
|
|
* Example: in the case <pre>sadsadasd</code>"baba"</pre>
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* "baba" won't be texturized.
|
2009-10-21 17:57:27 -04:00
|
|
|
|
*/
|
|
|
|
|
|
2014-06-25 13:49:14 -04:00
|
|
|
|
array_push( $stack, $tag );
|
|
|
|
|
} elseif ( end( $stack ) == $tag ) {
|
|
|
|
|
array_pop( $stack );
|
2009-05-15 17:37:18 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-06-26 05:30:11 -04:00
|
|
|
|
* Replaces double line breaks with paragraph elements.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* A group of regex replaces used to identify text formatted with newlines and
|
2020-06-26 05:30:11 -04:00
|
|
|
|
* replace double line breaks with HTML paragraph tags. The remaining line breaks
|
2015-03-20 15:47:27 -04:00
|
|
|
|
* after conversion become <<br />> tags, unless $br is set to '0' or 'false'.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
|
|
|
|
* @param string $pee The text which has to be formatted.
|
2020-06-26 05:30:11 -04:00
|
|
|
|
* @param bool $br Optional. If set, this will convert all remaining line breaks
|
2020-06-26 05:20:11 -04:00
|
|
|
|
* after paragraphing. Line breaks within `<script>`, `<style>`,
|
|
|
|
|
* and `<svg>` tags are not affected. Default true.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string Text which has been converted into correct paragraph tags.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function wpautop( $pee, $br = true ) {
|
2012-03-28 11:43:31 -04:00
|
|
|
|
$pre_tags = array();
|
2009-12-01 02:46:36 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( trim( $pee ) === '' ) {
|
2009-04-22 03:37:24 -04:00
|
|
|
|
return '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Just to make things a little easier, pad the end.
|
|
|
|
|
$pee = $pee . "\n";
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
/*
|
|
|
|
|
* Pre tags shouldn't be touched by autop.
|
|
|
|
|
* Replace pre tags with placeholders and bring them back after autop.
|
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( strpos( $pee, '<pre' ) !== false ) {
|
2012-03-28 11:43:31 -04:00
|
|
|
|
$pee_parts = explode( '</pre>', $pee );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$last_pee = array_pop( $pee_parts );
|
|
|
|
|
$pee = '';
|
|
|
|
|
$i = 0;
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
|
|
|
|
foreach ( $pee_parts as $pee_part ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$start = strpos( $pee_part, '<pre' );
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Malformed HTML?
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( false === $start ) {
|
2012-03-28 11:43:31 -04:00
|
|
|
|
$pee .= $pee_part;
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$name = "<pre wp-pre-tag-$i></pre>";
|
|
|
|
|
$pre_tags[ $name ] = substr( $pee_part, $start ) . '</pre>';
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
|
|
|
|
$pee .= substr( $pee_part, 0, $start ) . $name;
|
|
|
|
|
$i++;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$pee .= $last_pee;
|
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Change multiple <br>'s into two line breaks, which will turn into paragraphs.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '|<br\s*/?>\s*<br\s*/?>|', "\n\n", $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
2019-07-02 07:22:56 -04:00
|
|
|
|
$allblocks = '(?:table|thead|tfoot|caption|col|colgroup|tbody|tr|td|th|div|dl|dd|dt|ul|ol|li|pre|form|map|area|blockquote|address|math|style|p|h[1-6]|hr|fieldset|legend|section|article|aside|hgroup|header|footer|nav|figure|figcaption|details|menu|summary)';
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
2016-09-13 00:01:30 -04:00
|
|
|
|
// Add a double line break above block-level opening tags.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!(<' . $allblocks . '[\s/>])!', "\n\n$1", $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
|
|
|
|
// Add a double line break below block-level closing tags.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!(</' . $allblocks . '>)!', "$1\n\n", $pee );
|
2014-02-04 19:46:12 -05:00
|
|
|
|
|
2019-06-28 03:16:56 -04:00
|
|
|
|
// Add a double line break after hr tags, which are self closing.
|
|
|
|
|
$pee = preg_replace( '!(<hr\s*?/?>)!', "$1\n\n", $pee );
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Standardize newline characters to "\n".
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = str_replace( array( "\r\n", "\r" ), "\n", $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
2015-07-28 19:03:24 -04:00
|
|
|
|
// Find newlines in all elements and add placeholders.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = wp_replace_in_html_tags( $pee, array( "\n" => ' <!-- wpnl --> ' ) );
|
2015-07-22 01:15:25 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Collapse line breaks before and after <option> elements so they don't get autop'd.
|
2014-07-28 15:44:18 -04:00
|
|
|
|
if ( strpos( $pee, '<option' ) !== false ) {
|
2014-07-28 15:55:16 -04:00
|
|
|
|
$pee = preg_replace( '|\s*<option|', '<option', $pee );
|
|
|
|
|
$pee = preg_replace( '|</option>\s*|', '</option>', $pee );
|
2014-07-28 15:44:18 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
/*
|
|
|
|
|
* Collapse line breaks inside <object> elements, before <param> and <embed> elements
|
|
|
|
|
* so they don't get autop'd.
|
|
|
|
|
*/
|
2014-02-04 19:46:12 -05:00
|
|
|
|
if ( strpos( $pee, '</object>' ) !== false ) {
|
|
|
|
|
$pee = preg_replace( '|(<object[^>]*>)\s*|', '$1', $pee );
|
|
|
|
|
$pee = preg_replace( '|\s*</object>|', '</object>', $pee );
|
|
|
|
|
$pee = preg_replace( '%\s*(</?(?:param|embed)[^>]*>)\s*%', '$1', $pee );
|
|
|
|
|
}
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
/*
|
|
|
|
|
* Collapse line breaks inside <audio> and <video> elements,
|
|
|
|
|
* before and after <source> and <track> elements.
|
|
|
|
|
*/
|
2014-02-04 19:46:12 -05:00
|
|
|
|
if ( strpos( $pee, '<source' ) !== false || strpos( $pee, '<track' ) !== false ) {
|
|
|
|
|
$pee = preg_replace( '%([<\[](?:audio|video)[^>\]]*[>\]])\s*%', '$1', $pee );
|
|
|
|
|
$pee = preg_replace( '%\s*([<\[]/(?:audio|video)[>\]])%', '$1', $pee );
|
|
|
|
|
$pee = preg_replace( '%\s*(<(?:source|track)[^>]*>)\s*%', '$1', $pee );
|
2008-01-17 10:44:05 -05:00
|
|
|
|
}
|
2014-02-04 19:46:12 -05:00
|
|
|
|
|
2017-01-15 20:06:40 -05:00
|
|
|
|
// Collapse line breaks before and after <figcaption> elements.
|
|
|
|
|
if ( strpos( $pee, '<figcaption' ) !== false ) {
|
|
|
|
|
$pee = preg_replace( '|\s*(<figcaption[^>]*>)|', '$1', $pee );
|
|
|
|
|
$pee = preg_replace( '|</figcaption>\s*|', '</figcaption>', $pee );
|
|
|
|
|
}
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Remove more than two contiguous line breaks.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( "/\n\n+/", "\n\n", $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
|
|
|
|
// Split up the contents into an array of strings, separated by double line breaks.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pees = preg_split( '/\n\s*\n/', $pee, -1, PREG_SPLIT_NO_EMPTY );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
|
|
|
|
// Reset $pee prior to rebuilding.
|
2008-10-20 15:25:02 -04:00
|
|
|
|
$pee = '';
|
2014-02-04 19:46:12 -05:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Rebuild the content as a string, wrapping every bit with a <p>.
|
2014-02-04 19:46:12 -05:00
|
|
|
|
foreach ( $pees as $tinkle ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee .= '<p>' . trim( $tinkle, "\n" ) . "</p>\n";
|
2014-02-04 19:46:12 -05:00
|
|
|
|
}
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Under certain strange conditions it could create a P of entirely whitespace.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '|<p>\s*</p>|', '', $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
Clean up stray `<p>` tags added by `wpautop()` inside block level tags.
`autop()` can sometimes get confused and not clean up stray `<p>` or `</p>` tags inside block level elements, which produces sub-optimal HTML. While browsers can generally handle it, there's no need to make things harder for them if we don't have to.
Props pento, ayubi, pbearne, jond, azaozz, 1994rstefan, dionysous, MikeHansenMe, jorbin, miqrogroove, niallkennedy.
Fixes #27350.
Built from https://develop.svn.wordpress.org/trunk@45585
git-svn-id: http://core.svn.wordpress.org/trunk@45396 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2019-07-01 21:31:56 -04:00
|
|
|
|
// Add a closing <p> inside <div>, <address>, or <form> tag if missing.
|
|
|
|
|
$pee = preg_replace( '!<p>([^<]+)</(div|address|form)>!', '<p>$1</p></$2>', $pee );
|
|
|
|
|
|
2019-07-02 07:22:56 -04:00
|
|
|
|
// If an opening or closing block element tag is wrapped in a <p>, unwrap it.
|
|
|
|
|
$pee = preg_replace( '!<p>\s*(</?' . $allblocks . '[^>]*>)\s*</p>!', '$1', $pee );
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// In some cases <li> may get wrapped in <p>, fix them.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '|<p>(<li.+?)</p>|', '$1', $pee );
|
2015-05-25 02:25:25 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// If a <blockquote> is wrapped with a <p>, move it inside the <blockquote>.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '|<p><blockquote([^>]*)>|i', '<blockquote$1><p>', $pee );
|
|
|
|
|
$pee = str_replace( '</blockquote></p>', '</p></blockquote>', $pee );
|
2015-05-25 02:25:25 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// If an opening or closing block element tag is preceded by an opening <p> tag, remove it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!<p>\s*(</?' . $allblocks . '[^>]*>)!', '$1', $pee );
|
2015-05-25 02:25:25 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// If an opening or closing block element tag is followed by a closing <p> tag, remove it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!(</?' . $allblocks . '[^>]*>)\s*</p>!', '$1', $pee );
|
2014-02-04 19:46:12 -05:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Optionally insert line breaks.
|
2012-03-28 11:43:31 -04:00
|
|
|
|
if ( $br ) {
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Replace newlines that shouldn't be touched with a placeholder.
|
2019-06-30 23:19:58 -04:00
|
|
|
|
$pee = preg_replace_callback( '/<(script|style|svg).*?<\/\\1>/s', '_autop_newline_preservation_helper', $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
2015-08-17 13:36:24 -04:00
|
|
|
|
// Normalize <br>
|
|
|
|
|
$pee = str_replace( array( '<br>', '<br/>' ), '<br />', $pee );
|
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Replace any new line characters that aren't preceded by a <br /> with a <br />.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '|(?<!<br />)\s*\n|', "<br />\n", $pee );
|
2015-03-20 15:47:27 -04:00
|
|
|
|
|
|
|
|
|
// Replace newline placeholders with newlines.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = str_replace( '<WPPreserveNewline />', "\n", $pee );
|
2006-07-04 19:16:04 -04:00
|
|
|
|
}
|
2014-02-04 19:46:12 -05:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// If a <br /> tag is after an opening or closing block tag, remove it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!(</?' . $allblocks . '[^>]*>)\s*<br />!', '$1', $pee );
|
2015-05-25 02:25:25 -04:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// If a <br /> tag is before a subset of opening or closing block tags, remove it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$pee = preg_replace( '!<br />(\s*</?(?:p|li|div|dl|dd|dt|th|pre|td|ul|ol)[^>]*>)!', '$1', $pee );
|
2006-11-30 18:32:45 -05:00
|
|
|
|
$pee = preg_replace( "|\n</p>$|", '</p>', $pee );
|
2009-12-01 02:46:36 -05:00
|
|
|
|
|
2015-03-20 15:47:27 -04:00
|
|
|
|
// Replace placeholder <pre> tags with their original content.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! empty( $pre_tags ) ) {
|
|
|
|
|
$pee = str_replace( array_keys( $pre_tags ), array_values( $pre_tags ), $pee );
|
|
|
|
|
}
|
2012-03-28 11:43:31 -04:00
|
|
|
|
|
2015-07-28 19:03:24 -04:00
|
|
|
|
// Restore newlines in all elements.
|
2015-09-08 18:55:24 -04:00
|
|
|
|
if ( false !== strpos( $pee, '<!-- wpnl -->' ) ) {
|
|
|
|
|
$pee = str_replace( array( ' <!-- wpnl --> ', '<!-- wpnl -->' ), "\n", $pee );
|
|
|
|
|
}
|
2015-07-28 19:03:24 -04:00
|
|
|
|
|
2009-12-01 02:46:36 -05:00
|
|
|
|
return $pee;
|
|
|
|
|
}
|
|
|
|
|
|
2015-07-28 19:03:24 -04:00
|
|
|
|
/**
|
|
|
|
|
* Separate HTML elements and comments from the text.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.2.4
|
|
|
|
|
*
|
|
|
|
|
* @param string $input The text which has to be formatted.
|
2019-11-05 16:23:02 -05:00
|
|
|
|
* @return string[] Array of the formatted text.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
*/
|
|
|
|
|
function wp_html_split( $input ) {
|
2015-10-02 00:26:25 -04:00
|
|
|
|
return preg_split( get_html_split_regex(), $input, -1, PREG_SPLIT_DELIM_CAPTURE );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Retrieve the regular expression for an HTML element.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
|
|
|
|
* @return string The regular expression
|
|
|
|
|
*/
|
|
|
|
|
function get_html_split_regex() {
|
2015-07-28 19:03:24 -04:00
|
|
|
|
static $regex;
|
|
|
|
|
|
|
|
|
|
if ( ! isset( $regex ) ) {
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:disable Squiz.Strings.ConcatenationSpacing.PaddingFound -- don't remove regex indentation
|
2015-07-28 19:03:24 -04:00
|
|
|
|
$comments =
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'!' // Start of comment, after the <.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
. '(?:' // Unroll the loop: Consume everything until --> is found.
|
|
|
|
|
. '-(?!->)' // Dash not followed by end of comment.
|
|
|
|
|
. '[^\-]*+' // Consume non-dashes.
|
|
|
|
|
. ')*+' // Loop possessively.
|
|
|
|
|
. '(?:-->)?'; // End of comment. If not found, match all input.
|
|
|
|
|
|
|
|
|
|
$cdata =
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'!\[CDATA\[' // Start of comment, after the <.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
. '[^\]]*+' // Consume non-].
|
|
|
|
|
. '(?:' // Unroll the loop: Consume everything until ]]> is found.
|
|
|
|
|
. '](?!]>)' // One ] not followed by end of comment.
|
|
|
|
|
. '[^\]]*+' // Consume non-].
|
|
|
|
|
. ')*+' // Loop possessively.
|
|
|
|
|
. '(?:]]>)?'; // End of comment. If not found, match all input.
|
|
|
|
|
|
2015-10-20 02:08:25 -04:00
|
|
|
|
$escaped =
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'(?=' // Is the element escaped?
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '!--'
|
|
|
|
|
. '|'
|
|
|
|
|
. '!\[CDATA\['
|
|
|
|
|
. ')'
|
|
|
|
|
. '(?(?=!-)' // If yes, which type?
|
|
|
|
|
. $comments
|
|
|
|
|
. '|'
|
|
|
|
|
. $cdata
|
|
|
|
|
. ')';
|
|
|
|
|
|
2015-07-28 19:03:24 -04:00
|
|
|
|
$regex =
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'/(' // Capture the entire match.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
. '<' // Find start of element.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '(?' // Conditional expression follows.
|
|
|
|
|
. $escaped // Find end of escaped element.
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '|' // ...else...
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '[^>]*>?' // Find end of normal element.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
. ')'
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. ')/';
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:enable
|
2015-10-02 00:26:25 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $regex;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Retrieve the combined regular expression for HTML and shortcodes.
|
|
|
|
|
*
|
|
|
|
|
* @access private
|
|
|
|
|
* @ignore
|
|
|
|
|
* @internal This function will be removed in 4.5.0 per Shortcode API Roadmap.
|
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* @param string $shortcode_regex The result from _get_wptexturize_shortcode_regex(). Optional.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
* @return string The regular expression
|
|
|
|
|
*/
|
|
|
|
|
function _get_wptexturize_split_regex( $shortcode_regex = '' ) {
|
|
|
|
|
static $html_regex;
|
|
|
|
|
|
|
|
|
|
if ( ! isset( $html_regex ) ) {
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:disable Squiz.Strings.ConcatenationSpacing.PaddingFound -- don't remove regex indentation
|
2015-10-02 00:26:25 -04:00
|
|
|
|
$comment_regex =
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'!' // Start of comment, after the <.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '(?:' // Unroll the loop: Consume everything until --> is found.
|
|
|
|
|
. '-(?!->)' // Dash not followed by end of comment.
|
|
|
|
|
. '[^\-]*+' // Consume non-dashes.
|
|
|
|
|
. ')*+' // Loop possessively.
|
|
|
|
|
. '(?:-->)?'; // End of comment. If not found, match all input.
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$html_regex = // Needs replaced with wp_html_split() per Shortcode API Roadmap.
|
2017-11-27 23:24:57 -05:00
|
|
|
|
'<' // Find start of element.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '(?(?=!--)' // Is this a comment?
|
|
|
|
|
. $comment_regex // Find end of comment.
|
|
|
|
|
. '|'
|
|
|
|
|
. '[^>]*>?' // Find end of element. If not found, match all input.
|
|
|
|
|
. ')';
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:enable
|
2015-07-28 19:03:24 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-10-02 00:26:25 -04:00
|
|
|
|
if ( empty( $shortcode_regex ) ) {
|
|
|
|
|
$regex = '/(' . $html_regex . ')/';
|
|
|
|
|
} else {
|
|
|
|
|
$regex = '/(' . $html_regex . '|' . $shortcode_regex . ')/';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $regex;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Retrieve the regular expression for shortcodes.
|
|
|
|
|
*
|
|
|
|
|
* @access private
|
|
|
|
|
* @ignore
|
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string[] $tagnames Array of shortcodes to find.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
* @return string The regular expression
|
|
|
|
|
*/
|
|
|
|
|
function _get_wptexturize_shortcode_regex( $tagnames ) {
|
2020-10-18 13:27:06 -04:00
|
|
|
|
$tagregexp = implode( '|', array_map( 'preg_quote', $tagnames ) );
|
2015-10-02 00:26:25 -04:00
|
|
|
|
$tagregexp = "(?:$tagregexp)(?=[\\s\\]\\/])"; // Excerpt of get_shortcode_regex().
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:disable Squiz.Strings.ConcatenationSpacing.PaddingFound -- don't remove regex indentation
|
2015-10-02 00:26:25 -04:00
|
|
|
|
$regex =
|
2020-01-28 19:45:18 -05:00
|
|
|
|
'\[' // Find start of shortcode.
|
|
|
|
|
. '[\/\[]?' // Shortcodes may begin with [/ or [[.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. $tagregexp // Only match registered shortcodes, because performance.
|
|
|
|
|
. '(?:'
|
|
|
|
|
. '[^\[\]<>]+' // Shortcodes do not contain other shortcodes. Quantifier critical.
|
|
|
|
|
. '|'
|
|
|
|
|
. '<[^\[\]>]*>' // HTML elements permitted. Prevents matching ] before >.
|
|
|
|
|
. ')*+' // Possessive critical.
|
|
|
|
|
. '\]' // Find end of shortcode.
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\]?'; // Shortcodes may end with ]].
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:enable
|
2015-10-02 00:26:25 -04:00
|
|
|
|
|
|
|
|
|
return $regex;
|
2015-07-28 19:03:24 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-07-22 01:15:25 -04:00
|
|
|
|
/**
|
|
|
|
|
* Replace characters or phrases within HTML elements only.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.2.3
|
|
|
|
|
*
|
2020-07-23 17:11:05 -04:00
|
|
|
|
* @param string $haystack The text which has to be formatted.
|
|
|
|
|
* @param array $replace_pairs In the form array('from' => 'to', ...).
|
2015-07-22 01:15:25 -04:00
|
|
|
|
* @return string The formatted text.
|
|
|
|
|
*/
|
|
|
|
|
function wp_replace_in_html_tags( $haystack, $replace_pairs ) {
|
|
|
|
|
// Find all elements.
|
2015-07-28 19:03:24 -04:00
|
|
|
|
$textarr = wp_html_split( $haystack );
|
2015-07-22 01:15:25 -04:00
|
|
|
|
$changed = false;
|
|
|
|
|
|
|
|
|
|
// Optimize when searching for one item.
|
|
|
|
|
if ( 1 === count( $replace_pairs ) ) {
|
|
|
|
|
// Extract $needle and $replace.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
foreach ( $replace_pairs as $needle => $replace ) {
|
|
|
|
|
}
|
2015-07-22 01:15:25 -04:00
|
|
|
|
|
2015-09-16 01:54:26 -04:00
|
|
|
|
// Loop through delimiters (elements) only.
|
2015-07-24 13:27:24 -04:00
|
|
|
|
for ( $i = 1, $c = count( $textarr ); $i < $c; $i += 2 ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( false !== strpos( $textarr[ $i ], $needle ) ) {
|
|
|
|
|
$textarr[ $i ] = str_replace( $needle, $replace, $textarr[ $i ] );
|
|
|
|
|
$changed = true;
|
2015-07-22 01:15:25 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
} else {
|
|
|
|
|
// Extract all $needles.
|
|
|
|
|
$needles = array_keys( $replace_pairs );
|
|
|
|
|
|
2015-09-16 01:54:26 -04:00
|
|
|
|
// Loop through delimiters (elements) only.
|
2015-07-24 13:27:24 -04:00
|
|
|
|
for ( $i = 1, $c = count( $textarr ); $i < $c; $i += 2 ) {
|
2015-07-22 01:15:25 -04:00
|
|
|
|
foreach ( $needles as $needle ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( false !== strpos( $textarr[ $i ], $needle ) ) {
|
|
|
|
|
$textarr[ $i ] = strtr( $textarr[ $i ], $replace_pairs );
|
|
|
|
|
$changed = true;
|
2015-07-22 01:15:25 -04:00
|
|
|
|
// After one strtr() break out of the foreach loop and look at next element.
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( $changed ) {
|
|
|
|
|
$haystack = implode( $textarr );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $haystack;
|
|
|
|
|
}
|
|
|
|
|
|
2010-10-28 03:38:00 -04:00
|
|
|
|
/**
|
|
|
|
|
* Newline preservation help function for wpautop
|
2010-11-17 13:47:34 -05:00
|
|
|
|
*
|
2010-10-28 03:38:00 -04:00
|
|
|
|
* @since 3.1.0
|
|
|
|
|
* @access private
|
2013-02-01 13:07:08 -05:00
|
|
|
|
*
|
2010-10-28 03:38:00 -04:00
|
|
|
|
* @param array $matches preg_replace_callback matches array
|
2012-07-09 01:03:53 -04:00
|
|
|
|
* @return string
|
2010-10-28 03:38:00 -04:00
|
|
|
|
*/
|
2010-11-11 17:50:36 -05:00
|
|
|
|
function _autop_newline_preservation_helper( $matches ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return str_replace( "\n", '<WPPreserveNewline />', $matches[0] );
|
2010-10-28 03:38:00 -04:00
|
|
|
|
}
|
|
|
|
|
|
2009-12-01 02:46:36 -05:00
|
|
|
|
/**
|
|
|
|
|
* Don't auto-p wrap shortcodes that stand alone
|
|
|
|
|
*
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* Ensures that shortcodes are not wrapped in `<p>...</p>`.
|
2009-12-01 02:46:36 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global array $shortcode_tags
|
|
|
|
|
*
|
2009-12-01 02:46:36 -05:00
|
|
|
|
* @param string $pee The content.
|
|
|
|
|
* @return string The filtered content.
|
|
|
|
|
*/
|
2011-10-12 12:50:30 -04:00
|
|
|
|
function shortcode_unautop( $pee ) {
|
2009-12-01 02:46:36 -05:00
|
|
|
|
global $shortcode_tags;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( empty( $shortcode_tags ) || ! is_array( $shortcode_tags ) ) {
|
2011-10-12 12:50:30 -04:00
|
|
|
|
return $pee;
|
2009-12-01 02:46:36 -05:00
|
|
|
|
}
|
2007-02-20 00:41:39 -05:00
|
|
|
|
|
2020-10-18 13:27:06 -04:00
|
|
|
|
$tagregexp = implode( '|', array_map( 'preg_quote', array_keys( $shortcode_tags ) ) );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$spaces = wp_spaces_regexp();
|
2011-10-12 12:50:30 -04:00
|
|
|
|
|
2019-07-05 01:21:56 -04:00
|
|
|
|
// phpcs:disable Squiz.Strings.ConcatenationSpacing.PaddingFound,WordPress.WhiteSpace.PrecisionAlignment.Found -- don't remove regex indentation
|
2011-10-12 12:50:30 -04:00
|
|
|
|
$pattern =
|
2017-11-26 18:57:55 -05:00
|
|
|
|
'/'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '<p>' // Opening paragraph.
|
|
|
|
|
. '(?:' . $spaces . ')*+' // Optional leading whitespace.
|
|
|
|
|
. '(' // 1: The shortcode.
|
|
|
|
|
. '\\[' // Opening bracket.
|
|
|
|
|
. "($tagregexp)" // 2: Shortcode name.
|
|
|
|
|
. '(?![\\w-])' // Not followed by word character or hyphen.
|
|
|
|
|
// Unroll the loop: Inside the opening shortcode tag.
|
|
|
|
|
. '[^\\]\\/]*' // Not a closing bracket or forward slash.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. '(?:'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\\/(?!\\])' // A forward slash not followed by a closing bracket.
|
|
|
|
|
. '[^\\]\\/]*' // Not a closing bracket or forward slash.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. ')*?'
|
|
|
|
|
. '(?:'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\\/\\]' // Self closing tag and closing bracket.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. '|'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\\]' // Closing bracket.
|
|
|
|
|
. '(?:' // Unroll the loop: Optionally, anything between the opening and closing shortcode tags.
|
|
|
|
|
. '[^\\[]*+' // Not an opening bracket.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. '(?:'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\\[(?!\\/\\2\\])' // An opening bracket not followed by the closing shortcode tag.
|
|
|
|
|
. '[^\\[]*+' // Not an opening bracket.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. ')*+'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '\\[\\/\\2\\]' // Closing shortcode tag.
|
2011-10-12 12:50:30 -04:00
|
|
|
|
. ')?'
|
|
|
|
|
. ')'
|
|
|
|
|
. ')'
|
2020-01-28 19:45:18 -05:00
|
|
|
|
. '(?:' . $spaces . ')*+' // Optional trailing whitespace.
|
|
|
|
|
. '<\\/p>' // Closing paragraph.
|
2015-10-02 00:26:25 -04:00
|
|
|
|
. '/';
|
2017-11-27 23:24:57 -05:00
|
|
|
|
// phpcs:enable
|
2011-10-12 12:50:30 -04:00
|
|
|
|
|
|
|
|
|
return preg_replace( $pattern, '$1', $pee );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
|
|
|
|
* Checks to see if a string is utf8 encoded.
|
|
|
|
|
*
|
2009-05-24 19:47:49 -04:00
|
|
|
|
* NOTE: This function checks for 5-Byte sequences, UTF8
|
2009-05-20 17:13:14 -04:00
|
|
|
|
* has Bytes Sequences with a maximum length of 4.
|
2008-08-31 16:58:19 -04:00
|
|
|
|
*
|
2009-05-20 17:13:14 -04:00
|
|
|
|
* @author bmorel at ssi dot fr (modified)
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @since 1.2.1
|
|
|
|
|
*
|
2009-05-20 17:13:14 -04:00
|
|
|
|
* @param string $str The string to be checked
|
|
|
|
|
* @return bool True if $str fits a UTF-8 model, false otherwise.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function seems_utf8( $str ) {
|
2014-06-23 18:21:15 -04:00
|
|
|
|
mbstring_binary_safe_encoding();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$length = strlen( $str );
|
2014-06-23 18:21:15 -04:00
|
|
|
|
reset_mbstring_encoding();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
for ( $i = 0; $i < $length; $i++ ) {
|
|
|
|
|
$c = ord( $str[ $i ] );
|
|
|
|
|
if ( $c < 0x80 ) {
|
|
|
|
|
$n = 0; // 0bbbbbbb
|
|
|
|
|
} elseif ( ( $c & 0xE0 ) == 0xC0 ) {
|
|
|
|
|
$n = 1; // 110bbbbb
|
|
|
|
|
} elseif ( ( $c & 0xF0 ) == 0xE0 ) {
|
|
|
|
|
$n = 2; // 1110bbbb
|
|
|
|
|
} elseif ( ( $c & 0xF8 ) == 0xF0 ) {
|
|
|
|
|
$n = 3; // 11110bbb
|
|
|
|
|
} elseif ( ( $c & 0xFC ) == 0xF8 ) {
|
|
|
|
|
$n = 4; // 111110bb
|
|
|
|
|
} elseif ( ( $c & 0xFE ) == 0xFC ) {
|
|
|
|
|
$n = 5; // 1111110b
|
|
|
|
|
} else {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
return false; // Does not match any model.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
|
|
|
|
for ( $j = 0; $j < $n; $j++ ) { // n bytes matching 10bbbbbb follow ?
|
|
|
|
|
if ( ( ++$i == $length ) || ( ( ord( $str[ $i ] ) & 0xC0 ) != 0x80 ) ) {
|
2009-05-20 17:13:14 -04:00
|
|
|
|
return false;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2004-05-22 10:34:09 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
return true;
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Converts a number of special characters into their HTML entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2009-01-04 18:37:47 -05:00
|
|
|
|
* Specifically deals with: &, <, >, ", and '.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2009-01-04 17:25:50 -05:00
|
|
|
|
* $quote_style can be set to ENT_COMPAT to encode " to
|
|
|
|
|
* ", or ENT_QUOTES to do both. Default is ENT_NOQUOTES where no quotes are encoded.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.2
|
2020-06-19 18:28:13 -04:00
|
|
|
|
* @since 5.5.0 `$quote_style` also accepts `ENT_XML1`.
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* @access private
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-07-01 21:45:58 -04:00
|
|
|
|
* @param string $string The text which is to be encoded.
|
|
|
|
|
* @param int|string $quote_style Optional. Converts double quotes if set to ENT_COMPAT,
|
|
|
|
|
* both single and double if set to ENT_QUOTES or none if set to ENT_NOQUOTES.
|
Sitemaps: Add XML sitemaps functionality to WordPress.
While web crawlers are able to discover pages from links within the site and from other sites, XML sitemaps supplement this approach by allowing crawlers to quickly and comprehensively identify all URLs included in the sitemap and learn other signals about those URLs using the associated metadata.
See https://make.wordpress.org/core/2020/06/10/merge-announcement-extensible-core-sitemaps/ for more details.
This feature exposes the sitemap index via `/wp-sitemap.xml` and exposes a variety of new filters and hooks for developers to modify the behavior. Users can disable sitemaps completely by turning off search engine visibility in WordPress admin.
This change also introduces a new `esc_xml()` function to escape strings for output in XML, as well as XML support to `wp_kses_normalize_entities()`.
Props Adrian McShane, afragen, adamsilverstein, casiepa, flixos90, garrett-eclipse, joemcgill, kburgoine, kraftbj, milana_cap, pacifika, pbiron, pfefferle, Ruxandra Gradina, swissspidy, szepeviktor, tangrufus, tweetythierry.
Fixes #50117.
See #3670. See #19998.
Built from https://develop.svn.wordpress.org/trunk@48072
git-svn-id: http://core.svn.wordpress.org/trunk@47839 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-06-17 11:24:07 -04:00
|
|
|
|
* Converts single and double quotes, as well as converting HTML
|
|
|
|
|
* named entities (that are not also XML named entities) to their
|
|
|
|
|
* code points if set to ENT_XML1. Also compatible with old values;
|
|
|
|
|
* converting single quotes if set to 'single',
|
2019-07-01 21:45:58 -04:00
|
|
|
|
* double if set to 'double' or both if otherwise set.
|
|
|
|
|
* Default is ENT_NOQUOTES.
|
2020-06-26 05:30:11 -04:00
|
|
|
|
* @param false|string $charset Optional. The character encoding of the string. Default false.
|
2020-06-28 10:02:06 -04:00
|
|
|
|
* @param bool $double_encode Optional. Whether to encode existing HTML entities. Default false.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The encoded text with HTML entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2009-05-18 11:11:07 -04:00
|
|
|
|
function _wp_specialchars( $string, $quote_style = ENT_NOQUOTES, $charset = false, $double_encode = false ) {
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$string = (string) $string;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( 0 === strlen( $string ) ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
return '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-04 17:25:50 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Don't bother if there are no specialchars - saves some processing.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '/[&<>"\']/', $string ) ) {
|
2009-01-13 10:18:37 -05:00
|
|
|
|
return $string;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-13 10:18:37 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Account for the previous behaviour of the function when the $quote_style is not an accepted value.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( empty( $quote_style ) ) {
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$quote_style = ENT_NOQUOTES;
|
Sitemaps: Add XML sitemaps functionality to WordPress.
While web crawlers are able to discover pages from links within the site and from other sites, XML sitemaps supplement this approach by allowing crawlers to quickly and comprehensively identify all URLs included in the sitemap and learn other signals about those URLs using the associated metadata.
See https://make.wordpress.org/core/2020/06/10/merge-announcement-extensible-core-sitemaps/ for more details.
This feature exposes the sitemap index via `/wp-sitemap.xml` and exposes a variety of new filters and hooks for developers to modify the behavior. Users can disable sitemaps completely by turning off search engine visibility in WordPress admin.
This change also introduces a new `esc_xml()` function to escape strings for output in XML, as well as XML support to `wp_kses_normalize_entities()`.
Props Adrian McShane, afragen, adamsilverstein, casiepa, flixos90, garrett-eclipse, joemcgill, kburgoine, kraftbj, milana_cap, pacifika, pbiron, pfefferle, Ruxandra Gradina, swissspidy, szepeviktor, tangrufus, tweetythierry.
Fixes #50117.
See #3670. See #19998.
Built from https://develop.svn.wordpress.org/trunk@48072
git-svn-id: http://core.svn.wordpress.org/trunk@47839 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-06-17 11:24:07 -04:00
|
|
|
|
} elseif ( ENT_XML1 === $quote_style ) {
|
|
|
|
|
$quote_style = ENT_QUOTES | ENT_XML1;
|
|
|
|
|
} elseif ( ! in_array( $quote_style, array( ENT_NOQUOTES, ENT_COMPAT, ENT_QUOTES, 'single', 'double' ), true ) ) {
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$quote_style = ENT_QUOTES;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-18 23:40:12 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Store the site charset as a static to avoid multiple calls to wp_load_alloptions().
|
2011-07-29 16:43:45 -04:00
|
|
|
|
if ( ! $charset ) {
|
2015-05-29 11:43:29 -04:00
|
|
|
|
static $_charset = null;
|
2011-07-29 16:43:45 -04:00
|
|
|
|
if ( ! isset( $_charset ) ) {
|
2009-01-13 10:18:37 -05:00
|
|
|
|
$alloptions = wp_load_alloptions();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$_charset = isset( $alloptions['blog_charset'] ) ? $alloptions['blog_charset'] : '';
|
2009-01-13 10:18:37 -05:00
|
|
|
|
}
|
|
|
|
|
$charset = $_charset;
|
2009-01-04 17:25:50 -05:00
|
|
|
|
}
|
2011-07-29 16:43:45 -04:00
|
|
|
|
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( in_array( $charset, array( 'utf8', 'utf-8', 'UTF8' ), true ) ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
$charset = 'UTF-8';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-04 17:25:50 -05:00
|
|
|
|
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$_quote_style = $quote_style;
|
|
|
|
|
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( 'double' === $quote_style ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$quote_style = ENT_COMPAT;
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$_quote_style = ENT_COMPAT;
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( 'single' === $quote_style ) {
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$quote_style = ENT_NOQUOTES;
|
2009-01-04 17:25:50 -05:00
|
|
|
|
}
|
2009-05-24 19:47:49 -04:00
|
|
|
|
|
2015-07-14 13:56:26 -04:00
|
|
|
|
if ( ! $double_encode ) {
|
|
|
|
|
// Guarantee every &entity; is valid, convert &garbage; into &garbage;
|
|
|
|
|
// This is required for PHP < 5.4.0 because ENT_HTML401 flag is unavailable.
|
Sitemaps: Add XML sitemaps functionality to WordPress.
While web crawlers are able to discover pages from links within the site and from other sites, XML sitemaps supplement this approach by allowing crawlers to quickly and comprehensively identify all URLs included in the sitemap and learn other signals about those URLs using the associated metadata.
See https://make.wordpress.org/core/2020/06/10/merge-announcement-extensible-core-sitemaps/ for more details.
This feature exposes the sitemap index via `/wp-sitemap.xml` and exposes a variety of new filters and hooks for developers to modify the behavior. Users can disable sitemaps completely by turning off search engine visibility in WordPress admin.
This change also introduces a new `esc_xml()` function to escape strings for output in XML, as well as XML support to `wp_kses_normalize_entities()`.
Props Adrian McShane, afragen, adamsilverstein, casiepa, flixos90, garrett-eclipse, joemcgill, kburgoine, kraftbj, milana_cap, pacifika, pbiron, pfefferle, Ruxandra Gradina, swissspidy, szepeviktor, tangrufus, tweetythierry.
Fixes #50117.
See #3670. See #19998.
Built from https://develop.svn.wordpress.org/trunk@48072
git-svn-id: http://core.svn.wordpress.org/trunk@47839 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-06-17 11:24:07 -04:00
|
|
|
|
$string = wp_kses_normalize_entities( $string, ( $quote_style & ENT_XML1 ) ? 'xml' : 'html' );
|
2015-07-09 16:56:24 -04:00
|
|
|
|
}
|
2009-01-04 17:25:50 -05:00
|
|
|
|
|
2019-07-09 01:45:58 -04:00
|
|
|
|
$string = htmlspecialchars( $string, $quote_style, $charset, $double_encode );
|
2015-07-14 13:56:26 -04:00
|
|
|
|
|
2016-05-13 14:41:31 -04:00
|
|
|
|
// Back-compat.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( 'single' === $_quote_style ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
$string = str_replace( "'", ''', $string );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-04 17:25:50 -05:00
|
|
|
|
|
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2009-01-04 18:37:47 -05:00
|
|
|
|
* Converts a number of HTML entities into their special characters.
|
2009-01-04 17:25:50 -05:00
|
|
|
|
*
|
2009-01-04 18:37:47 -05:00
|
|
|
|
* Specifically deals with: &, <, >, ", and '.
|
|
|
|
|
*
|
|
|
|
|
* $quote_style can be set to ENT_COMPAT to decode " entities,
|
|
|
|
|
* or ENT_QUOTES to do both " and '. Default is ENT_NOQUOTES where no quotes are decoded.
|
2009-01-04 17:25:50 -05:00
|
|
|
|
*
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* @since 2.8.0
|
2009-01-04 17:25:50 -05:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $string The text which is to be decoded.
|
|
|
|
|
* @param string|int $quote_style Optional. Converts double quotes if set to ENT_COMPAT,
|
|
|
|
|
* both single and double if set to ENT_QUOTES or
|
|
|
|
|
* none if set to ENT_NOQUOTES.
|
|
|
|
|
* Also compatible with old _wp_specialchars() values;
|
|
|
|
|
* converting single quotes if set to 'single',
|
|
|
|
|
* double if set to 'double' or both if otherwise set.
|
|
|
|
|
* Default is ENT_NOQUOTES.
|
2009-01-04 18:37:47 -05:00
|
|
|
|
* @return string The decoded text without HTML entities.
|
2009-01-04 17:25:50 -05:00
|
|
|
|
*/
|
2009-05-06 00:56:32 -04:00
|
|
|
|
function wp_specialchars_decode( $string, $quote_style = ENT_NOQUOTES ) {
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$string = (string) $string;
|
|
|
|
|
|
2009-01-04 17:25:50 -05:00
|
|
|
|
if ( 0 === strlen( $string ) ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Don't bother if there are no entities - saves a lot of processing.
|
2009-01-13 10:18:37 -05:00
|
|
|
|
if ( strpos( $string, '&' ) === false ) {
|
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Match the previous behaviour of _wp_specialchars() when the $quote_style is not an accepted value.
|
2009-01-18 23:40:12 -05:00
|
|
|
|
if ( empty( $quote_style ) ) {
|
|
|
|
|
$quote_style = ENT_NOQUOTES;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
} elseif ( ! in_array( $quote_style, array( 0, 2, 3, 'single', 'double' ), true ) ) {
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$quote_style = ENT_QUOTES;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// More complete than get_html_translation_table( HTML_SPECIALCHARS ).
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$single = array(
|
|
|
|
|
''' => '\'',
|
|
|
|
|
''' => '\'',
|
|
|
|
|
);
|
|
|
|
|
$single_preg = array(
|
|
|
|
|
'/�*39;/' => ''',
|
|
|
|
|
'/�*27;/i' => ''',
|
|
|
|
|
);
|
|
|
|
|
$double = array(
|
|
|
|
|
'"' => '"',
|
|
|
|
|
'"' => '"',
|
|
|
|
|
'"' => '"',
|
|
|
|
|
);
|
|
|
|
|
$double_preg = array(
|
|
|
|
|
'/�*34;/' => '"',
|
|
|
|
|
'/�*22;/i' => '"',
|
|
|
|
|
);
|
|
|
|
|
$others = array(
|
|
|
|
|
'<' => '<',
|
|
|
|
|
'<' => '<',
|
|
|
|
|
'>' => '>',
|
|
|
|
|
'>' => '>',
|
|
|
|
|
'&' => '&',
|
|
|
|
|
'&' => '&',
|
|
|
|
|
'&' => '&',
|
|
|
|
|
);
|
|
|
|
|
$others_preg = array(
|
|
|
|
|
'/�*60;/' => '<',
|
|
|
|
|
'/�*62;/' => '>',
|
|
|
|
|
'/�*38;/' => '&',
|
|
|
|
|
'/�*26;/i' => '&',
|
|
|
|
|
);
|
2009-01-04 17:25:50 -05:00
|
|
|
|
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( ENT_QUOTES === $quote_style ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$translation = array_merge( $single, $double, $others );
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$translation_preg = array_merge( $single_preg, $double_preg, $others_preg );
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( ENT_COMPAT === $quote_style || 'double' === $quote_style ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$translation = array_merge( $double, $others );
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$translation_preg = array_merge( $double_preg, $others_preg );
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( 'single' === $quote_style ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$translation = array_merge( $single, $others );
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$translation_preg = array_merge( $single_preg, $others_preg );
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( ENT_NOQUOTES === $quote_style ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$translation = $others;
|
2009-01-18 23:40:12 -05:00
|
|
|
|
$translation_preg = $others_preg;
|
2009-01-04 17:25:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Remove zero padding on numeric entities.
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$string = preg_replace( array_keys( $translation_preg ), array_values( $translation_preg ), $string );
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Replace characters according to translation table.
|
2009-01-04 18:37:47 -05:00
|
|
|
|
return strtr( $string, $translation );
|
2009-01-04 17:25:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Checks for invalid UTF8 in a string.
|
|
|
|
|
*
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* @since 2.8.0
|
2009-01-04 17:25:50 -05:00
|
|
|
|
*
|
2020-07-23 17:11:05 -04:00
|
|
|
|
* @param string $string The text which is to be checked.
|
|
|
|
|
* @param bool $strip Optional. Whether to attempt to strip out invalid UTF8. Default false.
|
2009-01-04 17:25:50 -05:00
|
|
|
|
* @return string The checked text.
|
|
|
|
|
*/
|
2009-05-06 00:56:32 -04:00
|
|
|
|
function wp_check_invalid_utf8( $string, $strip = false ) {
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$string = (string) $string;
|
|
|
|
|
|
2009-01-04 17:25:50 -05:00
|
|
|
|
if ( 0 === strlen( $string ) ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Store the site charset as a static to avoid multiple calls to get_option().
|
2015-05-29 11:43:29 -04:00
|
|
|
|
static $is_utf8 = null;
|
|
|
|
|
if ( ! isset( $is_utf8 ) ) {
|
2020-04-04 23:02:11 -04:00
|
|
|
|
$is_utf8 = in_array( get_option( 'blog_charset' ), array( 'utf8', 'utf-8', 'UTF8', 'UTF-8' ), true );
|
2009-01-13 10:18:37 -05:00
|
|
|
|
}
|
2015-05-29 11:43:29 -04:00
|
|
|
|
if ( ! $is_utf8 ) {
|
2009-01-13 10:18:37 -05:00
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Check for support for utf8 in the installed PCRE library once and store the result in a static.
|
2015-05-29 11:43:29 -04:00
|
|
|
|
static $utf8_pcre = null;
|
|
|
|
|
if ( ! isset( $utf8_pcre ) ) {
|
2019-07-09 01:45:58 -04:00
|
|
|
|
// phpcs:ignore WordPress.PHP.NoSilencedErrors.Discouraged
|
2009-01-13 10:18:37 -05:00
|
|
|
|
$utf8_pcre = @preg_match( '/^./u', 'a' );
|
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// We can't demand utf8 in the PCRE installation, so just return the string in those cases.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! $utf8_pcre ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// phpcs:ignore WordPress.PHP.NoSilencedErrors.Discouraged -- preg_match fails when it encounters invalid UTF8 in $string.
|
2009-01-13 10:18:37 -05:00
|
|
|
|
if ( 1 === @preg_match( '/^./us', $string ) ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Attempt to strip the bad chars if requested (not recommended).
|
2009-01-04 17:25:50 -05:00
|
|
|
|
if ( $strip && function_exists( 'iconv' ) ) {
|
|
|
|
|
return iconv( 'utf-8', 'utf-8', $string );
|
2004-12-12 15:41:19 -05:00
|
|
|
|
}
|
2009-01-13 10:18:37 -05:00
|
|
|
|
|
|
|
|
|
return '';
|
2004-12-12 15:41:19 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Encode the Unicode values to be used in the URI.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
|
|
|
|
*
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @param string $utf8_string
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param int $length Max length of the string
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @return string String with Unicode encoded for URI.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2006-11-30 15:26:42 -05:00
|
|
|
|
function utf8_uri_encode( $utf8_string, $length = 0 ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$unicode = '';
|
|
|
|
|
$values = array();
|
|
|
|
|
$num_octets = 1;
|
2007-11-05 12:13:43 -05:00
|
|
|
|
$unicode_length = 0;
|
2006-11-19 02:56:05 -05:00
|
|
|
|
|
2014-06-23 18:21:15 -04:00
|
|
|
|
mbstring_binary_safe_encoding();
|
|
|
|
|
$string_length = strlen( $utf8_string );
|
|
|
|
|
reset_mbstring_encoding();
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
for ( $i = 0; $i < $string_length; $i++ ) {
|
2006-11-19 02:56:05 -05:00
|
|
|
|
|
|
|
|
|
$value = ord( $utf8_string[ $i ] );
|
|
|
|
|
|
|
|
|
|
if ( $value < 128 ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $length && ( $unicode_length >= $length ) ) {
|
2007-09-03 19:32:58 -04:00
|
|
|
|
break;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
|
|
|
|
$unicode .= chr( $value );
|
2007-11-05 12:13:43 -05:00
|
|
|
|
$unicode_length++;
|
2006-11-19 02:56:05 -05:00
|
|
|
|
} else {
|
2015-03-11 18:55:28 -04:00
|
|
|
|
if ( count( $values ) == 0 ) {
|
|
|
|
|
if ( $value < 224 ) {
|
|
|
|
|
$num_octets = 2;
|
|
|
|
|
} elseif ( $value < 240 ) {
|
|
|
|
|
$num_octets = 3;
|
|
|
|
|
} else {
|
|
|
|
|
$num_octets = 4;
|
|
|
|
|
}
|
|
|
|
|
}
|
2006-11-19 02:56:05 -05:00
|
|
|
|
|
|
|
|
|
$values[] = $value;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $length && ( $unicode_length + ( $num_octets * 3 ) ) > $length ) {
|
2006-11-30 15:26:42 -05:00
|
|
|
|
break;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2006-11-19 02:56:05 -05:00
|
|
|
|
if ( count( $values ) == $num_octets ) {
|
2015-03-11 18:55:28 -04:00
|
|
|
|
for ( $j = 0; $j < $num_octets; $j++ ) {
|
|
|
|
|
$unicode .= '%' . dechex( $values[ $j ] );
|
2006-11-30 15:26:42 -05:00
|
|
|
|
}
|
|
|
|
|
|
2015-03-11 18:55:28 -04:00
|
|
|
|
$unicode_length += $num_octets * 3;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$values = array();
|
2006-11-30 15:26:42 -05:00
|
|
|
|
$num_octets = 1;
|
2006-11-19 02:56:05 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
}
|
2004-09-10 04:36:54 -04:00
|
|
|
|
|
2006-11-19 02:56:05 -05:00
|
|
|
|
return $unicode;
|
2004-09-10 04:36:54 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Converts all accent characters to ASCII characters.
|
|
|
|
|
*
|
|
|
|
|
* If there are no accent characters, then the string given is just returned.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-06-09 15:14:30 -04:00
|
|
|
|
* **Accent characters converted:**
|
|
|
|
|
*
|
|
|
|
|
* Currency signs:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | ------------------- |
|
|
|
|
|
* | U+00A3 | £ | (empty) | British Pound sign |
|
|
|
|
|
* | U+20AC | € | E | Euro sign |
|
|
|
|
|
*
|
|
|
|
|
* Decompositions for Latin-1 Supplement:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | ------- | ----- | ----------- | -------------------------------------- |
|
|
|
|
|
* | U+00AA | ª | a | Feminine ordinal indicator |
|
|
|
|
|
* | U+00BA | º | o | Masculine ordinal indicator |
|
|
|
|
|
* | U+00C0 | À | A | Latin capital letter A with grave |
|
|
|
|
|
* | U+00C1 | Á | A | Latin capital letter A with acute |
|
|
|
|
|
* | U+00C2 | Â | A | Latin capital letter A with circumflex |
|
|
|
|
|
* | U+00C3 | Ã | A | Latin capital letter A with tilde |
|
|
|
|
|
* | U+00C4 | Ä | A | Latin capital letter A with diaeresis |
|
|
|
|
|
* | U+00C5 | Å | A | Latin capital letter A with ring above |
|
|
|
|
|
* | U+00C6 | Æ | AE | Latin capital letter AE |
|
|
|
|
|
* | U+00C7 | Ç | C | Latin capital letter C with cedilla |
|
|
|
|
|
* | U+00C8 | È | E | Latin capital letter E with grave |
|
|
|
|
|
* | U+00C9 | É | E | Latin capital letter E with acute |
|
|
|
|
|
* | U+00CA | Ê | E | Latin capital letter E with circumflex |
|
|
|
|
|
* | U+00CB | Ë | E | Latin capital letter E with diaeresis |
|
|
|
|
|
* | U+00CC | Ì | I | Latin capital letter I with grave |
|
|
|
|
|
* | U+00CD | Í | I | Latin capital letter I with acute |
|
|
|
|
|
* | U+00CE | Î | I | Latin capital letter I with circumflex |
|
|
|
|
|
* | U+00CF | Ï | I | Latin capital letter I with diaeresis |
|
|
|
|
|
* | U+00D0 | Ð | D | Latin capital letter Eth |
|
|
|
|
|
* | U+00D1 | Ñ | N | Latin capital letter N with tilde |
|
|
|
|
|
* | U+00D2 | Ò | O | Latin capital letter O with grave |
|
|
|
|
|
* | U+00D3 | Ó | O | Latin capital letter O with acute |
|
|
|
|
|
* | U+00D4 | Ô | O | Latin capital letter O with circumflex |
|
|
|
|
|
* | U+00D5 | Õ | O | Latin capital letter O with tilde |
|
|
|
|
|
* | U+00D6 | Ö | O | Latin capital letter O with diaeresis |
|
|
|
|
|
* | U+00D8 | Ø | O | Latin capital letter O with stroke |
|
|
|
|
|
* | U+00D9 | Ù | U | Latin capital letter U with grave |
|
|
|
|
|
* | U+00DA | Ú | U | Latin capital letter U with acute |
|
|
|
|
|
* | U+00DB | Û | U | Latin capital letter U with circumflex |
|
|
|
|
|
* | U+00DC | Ü | U | Latin capital letter U with diaeresis |
|
|
|
|
|
* | U+00DD | Ý | Y | Latin capital letter Y with acute |
|
|
|
|
|
* | U+00DE | Þ | TH | Latin capital letter Thorn |
|
|
|
|
|
* | U+00DF | ß | s | Latin small letter sharp s |
|
|
|
|
|
* | U+00E0 | à | a | Latin small letter a with grave |
|
|
|
|
|
* | U+00E1 | á | a | Latin small letter a with acute |
|
|
|
|
|
* | U+00E2 | â | a | Latin small letter a with circumflex |
|
|
|
|
|
* | U+00E3 | ã | a | Latin small letter a with tilde |
|
|
|
|
|
* | U+00E4 | ä | a | Latin small letter a with diaeresis |
|
|
|
|
|
* | U+00E5 | å | a | Latin small letter a with ring above |
|
|
|
|
|
* | U+00E6 | æ | ae | Latin small letter ae |
|
|
|
|
|
* | U+00E7 | ç | c | Latin small letter c with cedilla |
|
|
|
|
|
* | U+00E8 | è | e | Latin small letter e with grave |
|
|
|
|
|
* | U+00E9 | é | e | Latin small letter e with acute |
|
|
|
|
|
* | U+00EA | ê | e | Latin small letter e with circumflex |
|
|
|
|
|
* | U+00EB | ë | e | Latin small letter e with diaeresis |
|
|
|
|
|
* | U+00EC | ì | i | Latin small letter i with grave |
|
|
|
|
|
* | U+00ED | í | i | Latin small letter i with acute |
|
|
|
|
|
* | U+00EE | î | i | Latin small letter i with circumflex |
|
|
|
|
|
* | U+00EF | ï | i | Latin small letter i with diaeresis |
|
|
|
|
|
* | U+00F0 | ð | d | Latin small letter Eth |
|
|
|
|
|
* | U+00F1 | ñ | n | Latin small letter n with tilde |
|
|
|
|
|
* | U+00F2 | ò | o | Latin small letter o with grave |
|
|
|
|
|
* | U+00F3 | ó | o | Latin small letter o with acute |
|
|
|
|
|
* | U+00F4 | ô | o | Latin small letter o with circumflex |
|
|
|
|
|
* | U+00F5 | õ | o | Latin small letter o with tilde |
|
|
|
|
|
* | U+00F6 | ö | o | Latin small letter o with diaeresis |
|
|
|
|
|
* | U+00F8 | ø | o | Latin small letter o with stroke |
|
|
|
|
|
* | U+00F9 | ù | u | Latin small letter u with grave |
|
|
|
|
|
* | U+00FA | ú | u | Latin small letter u with acute |
|
|
|
|
|
* | U+00FB | û | u | Latin small letter u with circumflex |
|
|
|
|
|
* | U+00FC | ü | u | Latin small letter u with diaeresis |
|
|
|
|
|
* | U+00FD | ý | y | Latin small letter y with acute |
|
|
|
|
|
* | U+00FE | þ | th | Latin small letter Thorn |
|
|
|
|
|
* | U+00FF | ÿ | y | Latin small letter y with diaeresis |
|
|
|
|
|
*
|
|
|
|
|
* Decompositions for Latin Extended-A:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | ------- | ----- | ----------- | ------------------------------------------------- |
|
|
|
|
|
* | U+0100 | Ā | A | Latin capital letter A with macron |
|
|
|
|
|
* | U+0101 | ā | a | Latin small letter a with macron |
|
|
|
|
|
* | U+0102 | Ă | A | Latin capital letter A with breve |
|
|
|
|
|
* | U+0103 | ă | a | Latin small letter a with breve |
|
|
|
|
|
* | U+0104 | Ą | A | Latin capital letter A with ogonek |
|
|
|
|
|
* | U+0105 | ą | a | Latin small letter a with ogonek |
|
|
|
|
|
* | U+01006 | Ć | C | Latin capital letter C with acute |
|
|
|
|
|
* | U+0107 | ć | c | Latin small letter c with acute |
|
|
|
|
|
* | U+0108 | Ĉ | C | Latin capital letter C with circumflex |
|
|
|
|
|
* | U+0109 | ĉ | c | Latin small letter c with circumflex |
|
|
|
|
|
* | U+010A | Ċ | C | Latin capital letter C with dot above |
|
|
|
|
|
* | U+010B | ċ | c | Latin small letter c with dot above |
|
|
|
|
|
* | U+010C | Č | C | Latin capital letter C with caron |
|
|
|
|
|
* | U+010D | č | c | Latin small letter c with caron |
|
|
|
|
|
* | U+010E | Ď | D | Latin capital letter D with caron |
|
|
|
|
|
* | U+010F | ď | d | Latin small letter d with caron |
|
|
|
|
|
* | U+0110 | Đ | D | Latin capital letter D with stroke |
|
|
|
|
|
* | U+0111 | đ | d | Latin small letter d with stroke |
|
|
|
|
|
* | U+0112 | Ē | E | Latin capital letter E with macron |
|
|
|
|
|
* | U+0113 | ē | e | Latin small letter e with macron |
|
|
|
|
|
* | U+0114 | Ĕ | E | Latin capital letter E with breve |
|
|
|
|
|
* | U+0115 | ĕ | e | Latin small letter e with breve |
|
|
|
|
|
* | U+0116 | Ė | E | Latin capital letter E with dot above |
|
|
|
|
|
* | U+0117 | ė | e | Latin small letter e with dot above |
|
|
|
|
|
* | U+0118 | Ę | E | Latin capital letter E with ogonek |
|
|
|
|
|
* | U+0119 | ę | e | Latin small letter e with ogonek |
|
|
|
|
|
* | U+011A | Ě | E | Latin capital letter E with caron |
|
|
|
|
|
* | U+011B | ě | e | Latin small letter e with caron |
|
|
|
|
|
* | U+011C | Ĝ | G | Latin capital letter G with circumflex |
|
|
|
|
|
* | U+011D | ĝ | g | Latin small letter g with circumflex |
|
|
|
|
|
* | U+011E | Ğ | G | Latin capital letter G with breve |
|
|
|
|
|
* | U+011F | ğ | g | Latin small letter g with breve |
|
|
|
|
|
* | U+0120 | Ġ | G | Latin capital letter G with dot above |
|
|
|
|
|
* | U+0121 | ġ | g | Latin small letter g with dot above |
|
|
|
|
|
* | U+0122 | Ģ | G | Latin capital letter G with cedilla |
|
|
|
|
|
* | U+0123 | ģ | g | Latin small letter g with cedilla |
|
|
|
|
|
* | U+0124 | Ĥ | H | Latin capital letter H with circumflex |
|
|
|
|
|
* | U+0125 | ĥ | h | Latin small letter h with circumflex |
|
|
|
|
|
* | U+0126 | Ħ | H | Latin capital letter H with stroke |
|
|
|
|
|
* | U+0127 | ħ | h | Latin small letter h with stroke |
|
|
|
|
|
* | U+0128 | Ĩ | I | Latin capital letter I with tilde |
|
|
|
|
|
* | U+0129 | ĩ | i | Latin small letter i with tilde |
|
|
|
|
|
* | U+012A | Ī | I | Latin capital letter I with macron |
|
|
|
|
|
* | U+012B | ī | i | Latin small letter i with macron |
|
|
|
|
|
* | U+012C | Ĭ | I | Latin capital letter I with breve |
|
|
|
|
|
* | U+012D | ĭ | i | Latin small letter i with breve |
|
|
|
|
|
* | U+012E | Į | I | Latin capital letter I with ogonek |
|
|
|
|
|
* | U+012F | į | i | Latin small letter i with ogonek |
|
|
|
|
|
* | U+0130 | İ | I | Latin capital letter I with dot above |
|
|
|
|
|
* | U+0131 | ı | i | Latin small letter dotless i |
|
|
|
|
|
* | U+0132 | IJ | IJ | Latin capital ligature IJ |
|
|
|
|
|
* | U+0133 | ij | ij | Latin small ligature ij |
|
|
|
|
|
* | U+0134 | Ĵ | J | Latin capital letter J with circumflex |
|
|
|
|
|
* | U+0135 | ĵ | j | Latin small letter j with circumflex |
|
|
|
|
|
* | U+0136 | Ķ | K | Latin capital letter K with cedilla |
|
|
|
|
|
* | U+0137 | ķ | k | Latin small letter k with cedilla |
|
|
|
|
|
* | U+0138 | ĸ | k | Latin small letter Kra |
|
|
|
|
|
* | U+0139 | Ĺ | L | Latin capital letter L with acute |
|
|
|
|
|
* | U+013A | ĺ | l | Latin small letter l with acute |
|
|
|
|
|
* | U+013B | Ļ | L | Latin capital letter L with cedilla |
|
|
|
|
|
* | U+013C | ļ | l | Latin small letter l with cedilla |
|
|
|
|
|
* | U+013D | Ľ | L | Latin capital letter L with caron |
|
|
|
|
|
* | U+013E | ľ | l | Latin small letter l with caron |
|
|
|
|
|
* | U+013F | Ŀ | L | Latin capital letter L with middle dot |
|
|
|
|
|
* | U+0140 | ŀ | l | Latin small letter l with middle dot |
|
|
|
|
|
* | U+0141 | Ł | L | Latin capital letter L with stroke |
|
|
|
|
|
* | U+0142 | ł | l | Latin small letter l with stroke |
|
|
|
|
|
* | U+0143 | Ń | N | Latin capital letter N with acute |
|
|
|
|
|
* | U+0144 | ń | n | Latin small letter N with acute |
|
|
|
|
|
* | U+0145 | Ņ | N | Latin capital letter N with cedilla |
|
|
|
|
|
* | U+0146 | ņ | n | Latin small letter n with cedilla |
|
|
|
|
|
* | U+0147 | Ň | N | Latin capital letter N with caron |
|
|
|
|
|
* | U+0148 | ň | n | Latin small letter n with caron |
|
2016-08-04 09:56:29 -04:00
|
|
|
|
* | U+0149 | ʼn | n | Latin small letter n preceded by apostrophe |
|
|
|
|
|
* | U+014A | Ŋ | N | Latin capital letter Eng |
|
|
|
|
|
* | U+014B | ŋ | n | Latin small letter Eng |
|
2016-06-09 15:14:30 -04:00
|
|
|
|
* | U+014C | Ō | O | Latin capital letter O with macron |
|
|
|
|
|
* | U+014D | ō | o | Latin small letter o with macron |
|
|
|
|
|
* | U+014E | Ŏ | O | Latin capital letter O with breve |
|
|
|
|
|
* | U+014F | ŏ | o | Latin small letter o with breve |
|
|
|
|
|
* | U+0150 | Ő | O | Latin capital letter O with double acute |
|
|
|
|
|
* | U+0151 | ő | o | Latin small letter o with double acute |
|
|
|
|
|
* | U+0152 | Œ | OE | Latin capital ligature OE |
|
|
|
|
|
* | U+0153 | œ | oe | Latin small ligature oe |
|
|
|
|
|
* | U+0154 | Ŕ | R | Latin capital letter R with acute |
|
|
|
|
|
* | U+0155 | ŕ | r | Latin small letter r with acute |
|
|
|
|
|
* | U+0156 | Ŗ | R | Latin capital letter R with cedilla |
|
|
|
|
|
* | U+0157 | ŗ | r | Latin small letter r with cedilla |
|
|
|
|
|
* | U+0158 | Ř | R | Latin capital letter R with caron |
|
|
|
|
|
* | U+0159 | ř | r | Latin small letter r with caron |
|
|
|
|
|
* | U+015A | Ś | S | Latin capital letter S with acute |
|
|
|
|
|
* | U+015B | ś | s | Latin small letter s with acute |
|
|
|
|
|
* | U+015C | Ŝ | S | Latin capital letter S with circumflex |
|
|
|
|
|
* | U+015D | ŝ | s | Latin small letter s with circumflex |
|
|
|
|
|
* | U+015E | Ş | S | Latin capital letter S with cedilla |
|
|
|
|
|
* | U+015F | ş | s | Latin small letter s with cedilla |
|
|
|
|
|
* | U+0160 | Š | S | Latin capital letter S with caron |
|
|
|
|
|
* | U+0161 | š | s | Latin small letter s with caron |
|
|
|
|
|
* | U+0162 | Ţ | T | Latin capital letter T with cedilla |
|
|
|
|
|
* | U+0163 | ţ | t | Latin small letter t with cedilla |
|
|
|
|
|
* | U+0164 | Ť | T | Latin capital letter T with caron |
|
|
|
|
|
* | U+0165 | ť | t | Latin small letter t with caron |
|
|
|
|
|
* | U+0166 | Ŧ | T | Latin capital letter T with stroke |
|
|
|
|
|
* | U+0167 | ŧ | t | Latin small letter t with stroke |
|
|
|
|
|
* | U+0168 | Ũ | U | Latin capital letter U with tilde |
|
|
|
|
|
* | U+0169 | ũ | u | Latin small letter u with tilde |
|
|
|
|
|
* | U+016A | Ū | U | Latin capital letter U with macron |
|
|
|
|
|
* | U+016B | ū | u | Latin small letter u with macron |
|
|
|
|
|
* | U+016C | Ŭ | U | Latin capital letter U with breve |
|
|
|
|
|
* | U+016D | ŭ | u | Latin small letter u with breve |
|
|
|
|
|
* | U+016E | Ů | U | Latin capital letter U with ring above |
|
|
|
|
|
* | U+016F | ů | u | Latin small letter u with ring above |
|
|
|
|
|
* | U+0170 | Ű | U | Latin capital letter U with double acute |
|
|
|
|
|
* | U+0171 | ű | u | Latin small letter u with double acute |
|
|
|
|
|
* | U+0172 | Ų | U | Latin capital letter U with ogonek |
|
|
|
|
|
* | U+0173 | ų | u | Latin small letter u with ogonek |
|
|
|
|
|
* | U+0174 | Ŵ | W | Latin capital letter W with circumflex |
|
|
|
|
|
* | U+0175 | ŵ | w | Latin small letter w with circumflex |
|
|
|
|
|
* | U+0176 | Ŷ | Y | Latin capital letter Y with circumflex |
|
|
|
|
|
* | U+0177 | ŷ | y | Latin small letter y with circumflex |
|
|
|
|
|
* | U+0178 | Ÿ | Y | Latin capital letter Y with diaeresis |
|
|
|
|
|
* | U+0179 | Ź | Z | Latin capital letter Z with acute |
|
|
|
|
|
* | U+017A | ź | z | Latin small letter z with acute |
|
|
|
|
|
* | U+017B | Ż | Z | Latin capital letter Z with dot above |
|
|
|
|
|
* | U+017C | ż | z | Latin small letter z with dot above |
|
|
|
|
|
* | U+017D | Ž | Z | Latin capital letter Z with caron |
|
|
|
|
|
* | U+017E | ž | z | Latin small letter z with caron |
|
|
|
|
|
* | U+017F | ſ | s | Latin small letter long s |
|
|
|
|
|
* | U+01A0 | Ơ | O | Latin capital letter O with horn |
|
|
|
|
|
* | U+01A1 | ơ | o | Latin small letter o with horn |
|
|
|
|
|
* | U+01AF | Ư | U | Latin capital letter U with horn |
|
|
|
|
|
* | U+01B0 | ư | u | Latin small letter u with horn |
|
|
|
|
|
* | U+01CD | Ǎ | A | Latin capital letter A with caron |
|
|
|
|
|
* | U+01CE | ǎ | a | Latin small letter a with caron |
|
|
|
|
|
* | U+01CF | Ǐ | I | Latin capital letter I with caron |
|
|
|
|
|
* | U+01D0 | ǐ | i | Latin small letter i with caron |
|
|
|
|
|
* | U+01D1 | Ǒ | O | Latin capital letter O with caron |
|
|
|
|
|
* | U+01D2 | ǒ | o | Latin small letter o with caron |
|
|
|
|
|
* | U+01D3 | Ǔ | U | Latin capital letter U with caron |
|
|
|
|
|
* | U+01D4 | ǔ | u | Latin small letter u with caron |
|
|
|
|
|
* | U+01D5 | Ǖ | U | Latin capital letter U with diaeresis and macron |
|
|
|
|
|
* | U+01D6 | ǖ | u | Latin small letter u with diaeresis and macron |
|
|
|
|
|
* | U+01D7 | Ǘ | U | Latin capital letter U with diaeresis and acute |
|
|
|
|
|
* | U+01D8 | ǘ | u | Latin small letter u with diaeresis and acute |
|
|
|
|
|
* | U+01D9 | Ǚ | U | Latin capital letter U with diaeresis and caron |
|
|
|
|
|
* | U+01DA | ǚ | u | Latin small letter u with diaeresis and caron |
|
|
|
|
|
* | U+01DB | Ǜ | U | Latin capital letter U with diaeresis and grave |
|
|
|
|
|
* | U+01DC | ǜ | u | Latin small letter u with diaeresis and grave |
|
|
|
|
|
*
|
|
|
|
|
* Decompositions for Latin Extended-B:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | ----------------------------------------- |
|
|
|
|
|
* | U+0218 | Ș | S | Latin capital letter S with comma below |
|
|
|
|
|
* | U+0219 | ș | s | Latin small letter s with comma below |
|
|
|
|
|
* | U+021A | Ț | T | Latin capital letter T with comma below |
|
|
|
|
|
* | U+021B | ț | t | Latin small letter t with comma below |
|
|
|
|
|
*
|
|
|
|
|
* Vowels with diacritic (Chinese, Hanyu Pinyin):
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | ----------------------------------------------------- |
|
|
|
|
|
* | U+0251 | ɑ | a | Latin small letter alpha |
|
|
|
|
|
* | U+1EA0 | Ạ | A | Latin capital letter A with dot below |
|
|
|
|
|
* | U+1EA1 | ạ | a | Latin small letter a with dot below |
|
|
|
|
|
* | U+1EA2 | Ả | A | Latin capital letter A with hook above |
|
|
|
|
|
* | U+1EA3 | ả | a | Latin small letter a with hook above |
|
|
|
|
|
* | U+1EA4 | Ấ | A | Latin capital letter A with circumflex and acute |
|
|
|
|
|
* | U+1EA5 | ấ | a | Latin small letter a with circumflex and acute |
|
|
|
|
|
* | U+1EA6 | Ầ | A | Latin capital letter A with circumflex and grave |
|
|
|
|
|
* | U+1EA7 | ầ | a | Latin small letter a with circumflex and grave |
|
|
|
|
|
* | U+1EA8 | Ẩ | A | Latin capital letter A with circumflex and hook above |
|
|
|
|
|
* | U+1EA9 | ẩ | a | Latin small letter a with circumflex and hook above |
|
|
|
|
|
* | U+1EAA | Ẫ | A | Latin capital letter A with circumflex and tilde |
|
|
|
|
|
* | U+1EAB | ẫ | a | Latin small letter a with circumflex and tilde |
|
|
|
|
|
* | U+1EA6 | Ậ | A | Latin capital letter A with circumflex and dot below |
|
|
|
|
|
* | U+1EAD | ậ | a | Latin small letter a with circumflex and dot below |
|
|
|
|
|
* | U+1EAE | Ắ | A | Latin capital letter A with breve and acute |
|
|
|
|
|
* | U+1EAF | ắ | a | Latin small letter a with breve and acute |
|
|
|
|
|
* | U+1EB0 | Ằ | A | Latin capital letter A with breve and grave |
|
|
|
|
|
* | U+1EB1 | ằ | a | Latin small letter a with breve and grave |
|
|
|
|
|
* | U+1EB2 | Ẳ | A | Latin capital letter A with breve and hook above |
|
|
|
|
|
* | U+1EB3 | ẳ | a | Latin small letter a with breve and hook above |
|
|
|
|
|
* | U+1EB4 | Ẵ | A | Latin capital letter A with breve and tilde |
|
|
|
|
|
* | U+1EB5 | ẵ | a | Latin small letter a with breve and tilde |
|
|
|
|
|
* | U+1EB6 | Ặ | A | Latin capital letter A with breve and dot below |
|
|
|
|
|
* | U+1EB7 | ặ | a | Latin small letter a with breve and dot below |
|
|
|
|
|
* | U+1EB8 | Ẹ | E | Latin capital letter E with dot below |
|
|
|
|
|
* | U+1EB9 | ẹ | e | Latin small letter e with dot below |
|
|
|
|
|
* | U+1EBA | Ẻ | E | Latin capital letter E with hook above |
|
|
|
|
|
* | U+1EBB | ẻ | e | Latin small letter e with hook above |
|
|
|
|
|
* | U+1EBC | Ẽ | E | Latin capital letter E with tilde |
|
|
|
|
|
* | U+1EBD | ẽ | e | Latin small letter e with tilde |
|
|
|
|
|
* | U+1EBE | Ế | E | Latin capital letter E with circumflex and acute |
|
|
|
|
|
* | U+1EBF | ế | e | Latin small letter e with circumflex and acute |
|
|
|
|
|
* | U+1EC0 | Ề | E | Latin capital letter E with circumflex and grave |
|
|
|
|
|
* | U+1EC1 | ề | e | Latin small letter e with circumflex and grave |
|
|
|
|
|
* | U+1EC2 | Ể | E | Latin capital letter E with circumflex and hook above |
|
|
|
|
|
* | U+1EC3 | ể | e | Latin small letter e with circumflex and hook above |
|
|
|
|
|
* | U+1EC4 | Ễ | E | Latin capital letter E with circumflex and tilde |
|
|
|
|
|
* | U+1EC5 | ễ | e | Latin small letter e with circumflex and tilde |
|
|
|
|
|
* | U+1EC6 | Ệ | E | Latin capital letter E with circumflex and dot below |
|
|
|
|
|
* | U+1EC7 | ệ | e | Latin small letter e with circumflex and dot below |
|
|
|
|
|
* | U+1EC8 | Ỉ | I | Latin capital letter I with hook above |
|
|
|
|
|
* | U+1EC9 | ỉ | i | Latin small letter i with hook above |
|
|
|
|
|
* | U+1ECA | Ị | I | Latin capital letter I with dot below |
|
|
|
|
|
* | U+1ECB | ị | i | Latin small letter i with dot below |
|
|
|
|
|
* | U+1ECC | Ọ | O | Latin capital letter O with dot below |
|
|
|
|
|
* | U+1ECD | ọ | o | Latin small letter o with dot below |
|
|
|
|
|
* | U+1ECE | Ỏ | O | Latin capital letter O with hook above |
|
|
|
|
|
* | U+1ECF | ỏ | o | Latin small letter o with hook above |
|
|
|
|
|
* | U+1ED0 | Ố | O | Latin capital letter O with circumflex and acute |
|
|
|
|
|
* | U+1ED1 | ố | o | Latin small letter o with circumflex and acute |
|
|
|
|
|
* | U+1ED2 | Ồ | O | Latin capital letter O with circumflex and grave |
|
|
|
|
|
* | U+1ED3 | ồ | o | Latin small letter o with circumflex and grave |
|
|
|
|
|
* | U+1ED4 | Ổ | O | Latin capital letter O with circumflex and hook above |
|
|
|
|
|
* | U+1ED5 | ổ | o | Latin small letter o with circumflex and hook above |
|
|
|
|
|
* | U+1ED6 | Ỗ | O | Latin capital letter O with circumflex and tilde |
|
|
|
|
|
* | U+1ED7 | ỗ | o | Latin small letter o with circumflex and tilde |
|
|
|
|
|
* | U+1ED8 | Ộ | O | Latin capital letter O with circumflex and dot below |
|
|
|
|
|
* | U+1ED9 | ộ | o | Latin small letter o with circumflex and dot below |
|
|
|
|
|
* | U+1EDA | Ớ | O | Latin capital letter O with horn and acute |
|
|
|
|
|
* | U+1EDB | ớ | o | Latin small letter o with horn and acute |
|
|
|
|
|
* | U+1EDC | Ờ | O | Latin capital letter O with horn and grave |
|
|
|
|
|
* | U+1EDD | ờ | o | Latin small letter o with horn and grave |
|
|
|
|
|
* | U+1EDE | Ở | O | Latin capital letter O with horn and hook above |
|
|
|
|
|
* | U+1EDF | ở | o | Latin small letter o with horn and hook above |
|
|
|
|
|
* | U+1EE0 | Ỡ | O | Latin capital letter O with horn and tilde |
|
|
|
|
|
* | U+1EE1 | ỡ | o | Latin small letter o with horn and tilde |
|
|
|
|
|
* | U+1EE2 | Ợ | O | Latin capital letter O with horn and dot below |
|
|
|
|
|
* | U+1EE3 | ợ | o | Latin small letter o with horn and dot below |
|
|
|
|
|
* | U+1EE4 | Ụ | U | Latin capital letter U with dot below |
|
|
|
|
|
* | U+1EE5 | ụ | u | Latin small letter u with dot below |
|
|
|
|
|
* | U+1EE6 | Ủ | U | Latin capital letter U with hook above |
|
|
|
|
|
* | U+1EE7 | ủ | u | Latin small letter u with hook above |
|
|
|
|
|
* | U+1EE8 | Ứ | U | Latin capital letter U with horn and acute |
|
|
|
|
|
* | U+1EE9 | ứ | u | Latin small letter u with horn and acute |
|
|
|
|
|
* | U+1EEA | Ừ | U | Latin capital letter U with horn and grave |
|
|
|
|
|
* | U+1EEB | ừ | u | Latin small letter u with horn and grave |
|
|
|
|
|
* | U+1EEC | Ử | U | Latin capital letter U with horn and hook above |
|
|
|
|
|
* | U+1EED | ử | u | Latin small letter u with horn and hook above |
|
|
|
|
|
* | U+1EEE | Ữ | U | Latin capital letter U with horn and tilde |
|
|
|
|
|
* | U+1EEF | ữ | u | Latin small letter u with horn and tilde |
|
|
|
|
|
* | U+1EF0 | Ự | U | Latin capital letter U with horn and dot below |
|
|
|
|
|
* | U+1EF1 | ự | u | Latin small letter u with horn and dot below |
|
|
|
|
|
* | U+1EF2 | Ỳ | Y | Latin capital letter Y with grave |
|
|
|
|
|
* | U+1EF3 | ỳ | y | Latin small letter y with grave |
|
|
|
|
|
* | U+1EF4 | Ỵ | Y | Latin capital letter Y with dot below |
|
|
|
|
|
* | U+1EF5 | ỵ | y | Latin small letter y with dot below |
|
|
|
|
|
* | U+1EF6 | Ỷ | Y | Latin capital letter Y with hook above |
|
|
|
|
|
* | U+1EF7 | ỷ | y | Latin small letter y with hook above |
|
|
|
|
|
* | U+1EF8 | Ỹ | Y | Latin capital letter Y with tilde |
|
|
|
|
|
* | U+1EF9 | ỹ | y | Latin small letter y with tilde |
|
|
|
|
|
*
|
2016-06-14 13:44:30 -04:00
|
|
|
|
* German (`de_DE`), German formal (`de_DE_formal`), German (Switzerland) formal (`de_CH`),
|
2021-01-17 10:46:08 -05:00
|
|
|
|
* German (Switzerland) informal (`de_CH_informal`), and German (Austria) (`de_AT`) locales:
|
2016-06-09 15:14:30 -04:00
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | --------------------------------------- |
|
|
|
|
|
* | U+00C4 | Ä | Ae | Latin capital letter A with diaeresis |
|
|
|
|
|
* | U+00E4 | ä | ae | Latin small letter a with diaeresis |
|
|
|
|
|
* | U+00D6 | Ö | Oe | Latin capital letter O with diaeresis |
|
|
|
|
|
* | U+00F6 | ö | oe | Latin small letter o with diaeresis |
|
|
|
|
|
* | U+00DC | Ü | Ue | Latin capital letter U with diaeresis |
|
|
|
|
|
* | U+00FC | ü | ue | Latin small letter u with diaeresis |
|
|
|
|
|
* | U+00DF | ß | ss | Latin small letter sharp s |
|
|
|
|
|
*
|
|
|
|
|
* Danish (`da_DK`) locale:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | --------------------------------------- |
|
|
|
|
|
* | U+00C6 | Æ | Ae | Latin capital letter AE |
|
|
|
|
|
* | U+00E6 | æ | ae | Latin small letter ae |
|
|
|
|
|
* | U+00D8 | Ø | Oe | Latin capital letter O with stroke |
|
|
|
|
|
* | U+00F8 | ø | oe | Latin small letter o with stroke |
|
|
|
|
|
* | U+00C5 | Å | Aa | Latin capital letter A with ring above |
|
|
|
|
|
* | U+00E5 | å | aa | Latin small letter a with ring above |
|
|
|
|
|
*
|
2016-06-26 10:26:29 -04:00
|
|
|
|
* Catalan (`ca`) locale:
|
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | --------------------------------------- |
|
|
|
|
|
* | U+00B7 | l·l | ll | Flown dot (between two Ls) |
|
|
|
|
|
*
|
2017-01-21 12:26:41 -05:00
|
|
|
|
* Serbian (`sr_RS`) and Bosnian (`bs_BA`) locales:
|
2016-09-22 20:07:29 -04:00
|
|
|
|
*
|
|
|
|
|
* | Code | Glyph | Replacement | Description |
|
|
|
|
|
* | -------- | ----- | ----------- | --------------------------------------- |
|
|
|
|
|
* | U+0110 | Đ | DJ | Latin capital letter D with stroke |
|
|
|
|
|
* | U+0111 | đ | dj | Latin small letter d with stroke |
|
|
|
|
|
*
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @since 1.2.1
|
2016-07-20 12:57:32 -04:00
|
|
|
|
* @since 4.6.0 Added locale support for `de_CH`, `de_CH_informal`, and `ca`.
|
2016-09-22 20:07:29 -04:00
|
|
|
|
* @since 4.7.0 Added locale support for `sr_RS`.
|
2017-01-21 12:16:43 -05:00
|
|
|
|
* @since 4.8.0 Added locale support for `bs_BA`.
|
2021-01-17 10:46:08 -05:00
|
|
|
|
* @since 5.7.0 Added locale support for `de_AT`.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @param string $string Text that might have accent characters
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string Filtered string with replaced "nice" characters.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function remove_accents( $string ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '/[\x80-\xff]/', $string ) ) {
|
2006-07-26 18:55:36 -04:00
|
|
|
|
return $string;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2006-07-26 18:55:36 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( seems_utf8( $string ) ) {
|
2005-03-28 20:38:29 -05:00
|
|
|
|
$chars = array(
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Decompositions for Latin-1 Supplement.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'ª' => 'a',
|
|
|
|
|
'º' => 'o',
|
|
|
|
|
'À' => 'A',
|
|
|
|
|
'Á' => 'A',
|
|
|
|
|
'Â' => 'A',
|
|
|
|
|
'Ã' => 'A',
|
|
|
|
|
'Ä' => 'A',
|
|
|
|
|
'Å' => 'A',
|
|
|
|
|
'Æ' => 'AE',
|
|
|
|
|
'Ç' => 'C',
|
|
|
|
|
'È' => 'E',
|
|
|
|
|
'É' => 'E',
|
|
|
|
|
'Ê' => 'E',
|
|
|
|
|
'Ë' => 'E',
|
|
|
|
|
'Ì' => 'I',
|
|
|
|
|
'Í' => 'I',
|
|
|
|
|
'Î' => 'I',
|
|
|
|
|
'Ï' => 'I',
|
|
|
|
|
'Ð' => 'D',
|
|
|
|
|
'Ñ' => 'N',
|
|
|
|
|
'Ò' => 'O',
|
|
|
|
|
'Ó' => 'O',
|
|
|
|
|
'Ô' => 'O',
|
|
|
|
|
'Õ' => 'O',
|
|
|
|
|
'Ö' => 'O',
|
|
|
|
|
'Ù' => 'U',
|
|
|
|
|
'Ú' => 'U',
|
|
|
|
|
'Û' => 'U',
|
|
|
|
|
'Ü' => 'U',
|
|
|
|
|
'Ý' => 'Y',
|
|
|
|
|
'Þ' => 'TH',
|
|
|
|
|
'ß' => 's',
|
|
|
|
|
'à' => 'a',
|
|
|
|
|
'á' => 'a',
|
|
|
|
|
'â' => 'a',
|
|
|
|
|
'ã' => 'a',
|
|
|
|
|
'ä' => 'a',
|
|
|
|
|
'å' => 'a',
|
|
|
|
|
'æ' => 'ae',
|
|
|
|
|
'ç' => 'c',
|
|
|
|
|
'è' => 'e',
|
|
|
|
|
'é' => 'e',
|
|
|
|
|
'ê' => 'e',
|
|
|
|
|
'ë' => 'e',
|
|
|
|
|
'ì' => 'i',
|
|
|
|
|
'í' => 'i',
|
|
|
|
|
'î' => 'i',
|
|
|
|
|
'ï' => 'i',
|
|
|
|
|
'ð' => 'd',
|
|
|
|
|
'ñ' => 'n',
|
|
|
|
|
'ò' => 'o',
|
|
|
|
|
'ó' => 'o',
|
|
|
|
|
'ô' => 'o',
|
|
|
|
|
'õ' => 'o',
|
|
|
|
|
'ö' => 'o',
|
|
|
|
|
'ø' => 'o',
|
|
|
|
|
'ù' => 'u',
|
|
|
|
|
'ú' => 'u',
|
|
|
|
|
'û' => 'u',
|
|
|
|
|
'ü' => 'u',
|
|
|
|
|
'ý' => 'y',
|
|
|
|
|
'þ' => 'th',
|
|
|
|
|
'ÿ' => 'y',
|
|
|
|
|
'Ø' => 'O',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Decompositions for Latin Extended-A.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ā' => 'A',
|
|
|
|
|
'ā' => 'a',
|
|
|
|
|
'Ă' => 'A',
|
|
|
|
|
'ă' => 'a',
|
|
|
|
|
'Ą' => 'A',
|
|
|
|
|
'ą' => 'a',
|
|
|
|
|
'Ć' => 'C',
|
|
|
|
|
'ć' => 'c',
|
|
|
|
|
'Ĉ' => 'C',
|
|
|
|
|
'ĉ' => 'c',
|
|
|
|
|
'Ċ' => 'C',
|
|
|
|
|
'ċ' => 'c',
|
|
|
|
|
'Č' => 'C',
|
|
|
|
|
'č' => 'c',
|
|
|
|
|
'Ď' => 'D',
|
|
|
|
|
'ď' => 'd',
|
|
|
|
|
'Đ' => 'D',
|
|
|
|
|
'đ' => 'd',
|
|
|
|
|
'Ē' => 'E',
|
|
|
|
|
'ē' => 'e',
|
|
|
|
|
'Ĕ' => 'E',
|
|
|
|
|
'ĕ' => 'e',
|
|
|
|
|
'Ė' => 'E',
|
|
|
|
|
'ė' => 'e',
|
|
|
|
|
'Ę' => 'E',
|
|
|
|
|
'ę' => 'e',
|
|
|
|
|
'Ě' => 'E',
|
|
|
|
|
'ě' => 'e',
|
|
|
|
|
'Ĝ' => 'G',
|
|
|
|
|
'ĝ' => 'g',
|
|
|
|
|
'Ğ' => 'G',
|
|
|
|
|
'ğ' => 'g',
|
|
|
|
|
'Ġ' => 'G',
|
|
|
|
|
'ġ' => 'g',
|
|
|
|
|
'Ģ' => 'G',
|
|
|
|
|
'ģ' => 'g',
|
|
|
|
|
'Ĥ' => 'H',
|
|
|
|
|
'ĥ' => 'h',
|
|
|
|
|
'Ħ' => 'H',
|
|
|
|
|
'ħ' => 'h',
|
|
|
|
|
'Ĩ' => 'I',
|
|
|
|
|
'ĩ' => 'i',
|
|
|
|
|
'Ī' => 'I',
|
|
|
|
|
'ī' => 'i',
|
|
|
|
|
'Ĭ' => 'I',
|
|
|
|
|
'ĭ' => 'i',
|
|
|
|
|
'Į' => 'I',
|
|
|
|
|
'į' => 'i',
|
|
|
|
|
'İ' => 'I',
|
|
|
|
|
'ı' => 'i',
|
|
|
|
|
'IJ' => 'IJ',
|
|
|
|
|
'ij' => 'ij',
|
|
|
|
|
'Ĵ' => 'J',
|
|
|
|
|
'ĵ' => 'j',
|
|
|
|
|
'Ķ' => 'K',
|
|
|
|
|
'ķ' => 'k',
|
|
|
|
|
'ĸ' => 'k',
|
|
|
|
|
'Ĺ' => 'L',
|
|
|
|
|
'ĺ' => 'l',
|
|
|
|
|
'Ļ' => 'L',
|
|
|
|
|
'ļ' => 'l',
|
|
|
|
|
'Ľ' => 'L',
|
|
|
|
|
'ľ' => 'l',
|
|
|
|
|
'Ŀ' => 'L',
|
|
|
|
|
'ŀ' => 'l',
|
|
|
|
|
'Ł' => 'L',
|
|
|
|
|
'ł' => 'l',
|
|
|
|
|
'Ń' => 'N',
|
|
|
|
|
'ń' => 'n',
|
|
|
|
|
'Ņ' => 'N',
|
|
|
|
|
'ņ' => 'n',
|
|
|
|
|
'Ň' => 'N',
|
|
|
|
|
'ň' => 'n',
|
|
|
|
|
'ʼn' => 'n',
|
|
|
|
|
'Ŋ' => 'N',
|
|
|
|
|
'ŋ' => 'n',
|
|
|
|
|
'Ō' => 'O',
|
|
|
|
|
'ō' => 'o',
|
|
|
|
|
'Ŏ' => 'O',
|
|
|
|
|
'ŏ' => 'o',
|
|
|
|
|
'Ő' => 'O',
|
|
|
|
|
'ő' => 'o',
|
|
|
|
|
'Œ' => 'OE',
|
|
|
|
|
'œ' => 'oe',
|
|
|
|
|
'Ŕ' => 'R',
|
|
|
|
|
'ŕ' => 'r',
|
|
|
|
|
'Ŗ' => 'R',
|
|
|
|
|
'ŗ' => 'r',
|
|
|
|
|
'Ř' => 'R',
|
|
|
|
|
'ř' => 'r',
|
|
|
|
|
'Ś' => 'S',
|
|
|
|
|
'ś' => 's',
|
|
|
|
|
'Ŝ' => 'S',
|
|
|
|
|
'ŝ' => 's',
|
|
|
|
|
'Ş' => 'S',
|
|
|
|
|
'ş' => 's',
|
|
|
|
|
'Š' => 'S',
|
|
|
|
|
'š' => 's',
|
|
|
|
|
'Ţ' => 'T',
|
|
|
|
|
'ţ' => 't',
|
|
|
|
|
'Ť' => 'T',
|
|
|
|
|
'ť' => 't',
|
|
|
|
|
'Ŧ' => 'T',
|
|
|
|
|
'ŧ' => 't',
|
|
|
|
|
'Ũ' => 'U',
|
|
|
|
|
'ũ' => 'u',
|
|
|
|
|
'Ū' => 'U',
|
|
|
|
|
'ū' => 'u',
|
|
|
|
|
'Ŭ' => 'U',
|
|
|
|
|
'ŭ' => 'u',
|
|
|
|
|
'Ů' => 'U',
|
|
|
|
|
'ů' => 'u',
|
|
|
|
|
'Ű' => 'U',
|
|
|
|
|
'ű' => 'u',
|
|
|
|
|
'Ų' => 'U',
|
|
|
|
|
'ų' => 'u',
|
|
|
|
|
'Ŵ' => 'W',
|
|
|
|
|
'ŵ' => 'w',
|
|
|
|
|
'Ŷ' => 'Y',
|
|
|
|
|
'ŷ' => 'y',
|
|
|
|
|
'Ÿ' => 'Y',
|
|
|
|
|
'Ź' => 'Z',
|
|
|
|
|
'ź' => 'z',
|
|
|
|
|
'Ż' => 'Z',
|
|
|
|
|
'ż' => 'z',
|
|
|
|
|
'Ž' => 'Z',
|
|
|
|
|
'ž' => 'z',
|
|
|
|
|
'ſ' => 's',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Decompositions for Latin Extended-B.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ș' => 'S',
|
|
|
|
|
'ș' => 's',
|
|
|
|
|
'Ț' => 'T',
|
|
|
|
|
'ț' => 't',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Euro sign.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'€' => 'E',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// GBP (Pound) sign.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'£' => '',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Vowels with diacritic (Vietnamese).
|
|
|
|
|
// Unmarked.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ơ' => 'O',
|
|
|
|
|
'ơ' => 'o',
|
|
|
|
|
'Ư' => 'U',
|
|
|
|
|
'ư' => 'u',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Grave accent.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ầ' => 'A',
|
|
|
|
|
'ầ' => 'a',
|
|
|
|
|
'Ằ' => 'A',
|
|
|
|
|
'ằ' => 'a',
|
|
|
|
|
'Ề' => 'E',
|
|
|
|
|
'ề' => 'e',
|
|
|
|
|
'Ồ' => 'O',
|
|
|
|
|
'ồ' => 'o',
|
|
|
|
|
'Ờ' => 'O',
|
|
|
|
|
'ờ' => 'o',
|
|
|
|
|
'Ừ' => 'U',
|
|
|
|
|
'ừ' => 'u',
|
|
|
|
|
'Ỳ' => 'Y',
|
|
|
|
|
'ỳ' => 'y',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Hook.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ả' => 'A',
|
|
|
|
|
'ả' => 'a',
|
|
|
|
|
'Ẩ' => 'A',
|
|
|
|
|
'ẩ' => 'a',
|
|
|
|
|
'Ẳ' => 'A',
|
|
|
|
|
'ẳ' => 'a',
|
|
|
|
|
'Ẻ' => 'E',
|
|
|
|
|
'ẻ' => 'e',
|
|
|
|
|
'Ể' => 'E',
|
|
|
|
|
'ể' => 'e',
|
|
|
|
|
'Ỉ' => 'I',
|
|
|
|
|
'ỉ' => 'i',
|
|
|
|
|
'Ỏ' => 'O',
|
|
|
|
|
'ỏ' => 'o',
|
|
|
|
|
'Ổ' => 'O',
|
|
|
|
|
'ổ' => 'o',
|
|
|
|
|
'Ở' => 'O',
|
|
|
|
|
'ở' => 'o',
|
|
|
|
|
'Ủ' => 'U',
|
|
|
|
|
'ủ' => 'u',
|
|
|
|
|
'Ử' => 'U',
|
|
|
|
|
'ử' => 'u',
|
|
|
|
|
'Ỷ' => 'Y',
|
|
|
|
|
'ỷ' => 'y',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Tilde.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ẫ' => 'A',
|
|
|
|
|
'ẫ' => 'a',
|
|
|
|
|
'Ẵ' => 'A',
|
|
|
|
|
'ẵ' => 'a',
|
|
|
|
|
'Ẽ' => 'E',
|
|
|
|
|
'ẽ' => 'e',
|
|
|
|
|
'Ễ' => 'E',
|
|
|
|
|
'ễ' => 'e',
|
|
|
|
|
'Ỗ' => 'O',
|
|
|
|
|
'ỗ' => 'o',
|
|
|
|
|
'Ỡ' => 'O',
|
|
|
|
|
'ỡ' => 'o',
|
|
|
|
|
'Ữ' => 'U',
|
|
|
|
|
'ữ' => 'u',
|
|
|
|
|
'Ỹ' => 'Y',
|
|
|
|
|
'ỹ' => 'y',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Acute accent.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ấ' => 'A',
|
|
|
|
|
'ấ' => 'a',
|
|
|
|
|
'Ắ' => 'A',
|
|
|
|
|
'ắ' => 'a',
|
|
|
|
|
'Ế' => 'E',
|
|
|
|
|
'ế' => 'e',
|
|
|
|
|
'Ố' => 'O',
|
|
|
|
|
'ố' => 'o',
|
|
|
|
|
'Ớ' => 'O',
|
|
|
|
|
'ớ' => 'o',
|
|
|
|
|
'Ứ' => 'U',
|
|
|
|
|
'ứ' => 'u',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Dot below.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ạ' => 'A',
|
|
|
|
|
'ạ' => 'a',
|
|
|
|
|
'Ậ' => 'A',
|
|
|
|
|
'ậ' => 'a',
|
|
|
|
|
'Ặ' => 'A',
|
|
|
|
|
'ặ' => 'a',
|
|
|
|
|
'Ẹ' => 'E',
|
|
|
|
|
'ẹ' => 'e',
|
|
|
|
|
'Ệ' => 'E',
|
|
|
|
|
'ệ' => 'e',
|
|
|
|
|
'Ị' => 'I',
|
|
|
|
|
'ị' => 'i',
|
|
|
|
|
'Ọ' => 'O',
|
|
|
|
|
'ọ' => 'o',
|
|
|
|
|
'Ộ' => 'O',
|
|
|
|
|
'ộ' => 'o',
|
|
|
|
|
'Ợ' => 'O',
|
|
|
|
|
'ợ' => 'o',
|
|
|
|
|
'Ụ' => 'U',
|
|
|
|
|
'ụ' => 'u',
|
|
|
|
|
'Ự' => 'U',
|
|
|
|
|
'ự' => 'u',
|
|
|
|
|
'Ỵ' => 'Y',
|
|
|
|
|
'ỵ' => 'y',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Vowels with diacritic (Chinese, Hanyu Pinyin).
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'ɑ' => 'a',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Macron.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ǖ' => 'U',
|
|
|
|
|
'ǖ' => 'u',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Acute accent.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ǘ' => 'U',
|
|
|
|
|
'ǘ' => 'u',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Caron.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ǎ' => 'A',
|
|
|
|
|
'ǎ' => 'a',
|
|
|
|
|
'Ǐ' => 'I',
|
|
|
|
|
'ǐ' => 'i',
|
|
|
|
|
'Ǒ' => 'O',
|
|
|
|
|
'ǒ' => 'o',
|
|
|
|
|
'Ǔ' => 'U',
|
|
|
|
|
'ǔ' => 'u',
|
|
|
|
|
'Ǚ' => 'U',
|
|
|
|
|
'ǚ' => 'u',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Grave accent.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ǜ' => 'U',
|
|
|
|
|
'ǜ' => 'u',
|
2012-05-02 12:55:16 -04:00
|
|
|
|
);
|
2006-02-12 02:53:23 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Used for locale-specific rules.
|
2013-01-30 20:55:09 -05:00
|
|
|
|
$locale = get_locale();
|
|
|
|
|
|
2021-01-17 10:46:08 -05:00
|
|
|
|
if ( in_array( $locale, array( 'de_DE', 'de_DE_formal', 'de_CH', 'de_CH_informal', 'de_AT' ), true ) ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$chars['Ä'] = 'Ae';
|
|
|
|
|
$chars['ä'] = 'ae';
|
|
|
|
|
$chars['Ö'] = 'Oe';
|
|
|
|
|
$chars['ö'] = 'oe';
|
|
|
|
|
$chars['Ü'] = 'Ue';
|
|
|
|
|
$chars['ü'] = 'ue';
|
|
|
|
|
$chars['ß'] = 'ss';
|
2013-12-03 15:39:09 -05:00
|
|
|
|
} elseif ( 'da_DK' === $locale ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$chars['Æ'] = 'Ae';
|
|
|
|
|
$chars['æ'] = 'ae';
|
|
|
|
|
$chars['Ø'] = 'Oe';
|
|
|
|
|
$chars['ø'] = 'oe';
|
|
|
|
|
$chars['Å'] = 'Aa';
|
|
|
|
|
$chars['å'] = 'aa';
|
2016-06-26 10:26:29 -04:00
|
|
|
|
} elseif ( 'ca' === $locale ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$chars['l·l'] = 'll';
|
2017-01-21 12:16:43 -05:00
|
|
|
|
} elseif ( 'sr_RS' === $locale || 'bs_BA' === $locale ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$chars['Đ'] = 'DJ';
|
|
|
|
|
$chars['đ'] = 'dj';
|
2013-01-30 20:55:09 -05:00
|
|
|
|
}
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$string = strtr( $string, $chars );
|
2004-09-10 04:36:54 -04:00
|
|
|
|
} else {
|
2014-12-20 17:47:22 -05:00
|
|
|
|
$chars = array();
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Assume ISO-8859-1 if not UTF-8.
|
2016-08-26 05:35:27 -04:00
|
|
|
|
$chars['in'] = "\x80\x83\x8a\x8e\x9a\x9e"
|
2017-11-30 18:11:00 -05:00
|
|
|
|
. "\x9f\xa2\xa5\xb5\xc0\xc1\xc2"
|
|
|
|
|
. "\xc3\xc4\xc5\xc7\xc8\xc9\xca"
|
|
|
|
|
. "\xcb\xcc\xcd\xce\xcf\xd1\xd2"
|
|
|
|
|
. "\xd3\xd4\xd5\xd6\xd8\xd9\xda"
|
|
|
|
|
. "\xdb\xdc\xdd\xe0\xe1\xe2\xe3"
|
|
|
|
|
. "\xe4\xe5\xe7\xe8\xe9\xea\xeb"
|
|
|
|
|
. "\xec\xed\xee\xef\xf1\xf2\xf3"
|
|
|
|
|
. "\xf4\xf5\xf6\xf8\xf9\xfa\xfb"
|
|
|
|
|
. "\xfc\xfd\xff";
|
|
|
|
|
|
|
|
|
|
$chars['out'] = 'EfSZszYcYuAAAAAACEEEEIIIINOOOOOOUUUUYaaaaaaceeeeiiiinoooooouuuuyy';
|
|
|
|
|
|
|
|
|
|
$string = strtr( $string, $chars['in'], $chars['out'] );
|
|
|
|
|
$double_chars = array();
|
|
|
|
|
$double_chars['in'] = array( "\x8c", "\x9c", "\xc6", "\xd0", "\xde", "\xdf", "\xe6", "\xf0", "\xfe" );
|
|
|
|
|
$double_chars['out'] = array( 'OE', 'oe', 'AE', 'DH', 'TH', 'ss', 'ae', 'dh', 'th' );
|
|
|
|
|
$string = str_replace( $double_chars['in'], $double_chars['out'], $string );
|
2004-05-22 10:34:09 -04:00
|
|
|
|
}
|
2004-09-10 04:36:54 -04:00
|
|
|
|
|
2004-05-22 10:34:09 -04:00
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Sanitizes a filename, replacing whitespace with dashes.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2009-05-24 19:47:49 -04:00
|
|
|
|
* Removes special characters that are illegal in filenames on certain
|
|
|
|
|
* operating systems and special characters requiring special escaping
|
|
|
|
|
* to manipulate at the command line. Replaces spaces and consecutive
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* dashes with a single dash. Trims period, dash and underscore from beginning
|
2016-06-21 09:44:31 -04:00
|
|
|
|
* and end of filename. It is not guaranteed that this function will return a
|
|
|
|
|
* filename that is allowed to be uploaded.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.1.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $filename The filename to be sanitized.
|
|
|
|
|
* @return string The sanitized filename.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2009-05-04 16:20:48 -04:00
|
|
|
|
function sanitize_file_name( $filename ) {
|
Media: Remove accents in `sanitize_file_name()`.
This brings some consistency with `sanitize_title()` and `sanitize_user()`.
Props tar.gz, NumidWasNotAvailable, juliobox, p_enrique, cristovaov, zodiac1978, mikeschroder, markoheijnen, chriscct7, swissspidy, DrProtocols, pento, gitlost, joemcgill, dustinbolton, programmin, Vayu, MaximeCulea, lucasbustamante, nilovelez, RavanH, audrasjb, SergeyBiryukov.
See #22363.
Built from https://develop.svn.wordpress.org/trunk@48603
git-svn-id: http://core.svn.wordpress.org/trunk@48365 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-24 14:03:02 -04:00
|
|
|
|
$filename_raw = $filename;
|
|
|
|
|
$filename = remove_accents( $filename );
|
|
|
|
|
|
2020-07-23 20:59:07 -04:00
|
|
|
|
$special_chars = array( '?', '[', ']', '/', '\\', '=', '<', '>', ':', ';', ',', "'", '"', '&', '$', '#', '*', '(', ')', '|', '~', '`', '!', '{', '}', '%', '+', '’', '«', '»', '”', '“', chr( 0 ) );
|
2020-04-29 11:40:07 -04:00
|
|
|
|
|
|
|
|
|
// Check for support for utf8 in the installed PCRE library once and store the result in a static.
|
|
|
|
|
static $utf8_pcre = null;
|
|
|
|
|
if ( ! isset( $utf8_pcre ) ) {
|
|
|
|
|
// phpcs:ignore WordPress.PHP.NoSilencedErrors.Discouraged
|
|
|
|
|
$utf8_pcre = @preg_match( '/^./u', 'a' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( ! seems_utf8( $filename ) ) {
|
|
|
|
|
$_ext = pathinfo( $filename, PATHINFO_EXTENSION );
|
|
|
|
|
$_name = pathinfo( $filename, PATHINFO_FILENAME );
|
|
|
|
|
$filename = sanitize_title_with_dashes( $_name ) . '.' . $_ext;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( $utf8_pcre ) {
|
|
|
|
|
$filename = preg_replace( "#\x{00a0}#siu", ' ', $filename );
|
|
|
|
|
}
|
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the list of characters to remove from a filename.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string[] $special_chars Array of characters to remove.
|
|
|
|
|
* @param string $filename_raw The original filename to be sanitized.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
|
|
|
|
$special_chars = apply_filters( 'sanitize_file_name_chars', $special_chars, $filename_raw );
|
Media: Remove accents in `sanitize_file_name()`.
This brings some consistency with `sanitize_title()` and `sanitize_user()`.
Props tar.gz, NumidWasNotAvailable, juliobox, p_enrique, cristovaov, zodiac1978, mikeschroder, markoheijnen, chriscct7, swissspidy, DrProtocols, pento, gitlost, joemcgill, dustinbolton, programmin, Vayu, MaximeCulea, lucasbustamante, nilovelez, RavanH, audrasjb, SergeyBiryukov.
See #22363.
Built from https://develop.svn.wordpress.org/trunk@48603
git-svn-id: http://core.svn.wordpress.org/trunk@48365 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-24 14:03:02 -04:00
|
|
|
|
|
|
|
|
|
$filename = str_replace( $special_chars, '', $filename );
|
|
|
|
|
$filename = str_replace( array( '%20', '+' ), '-', $filename );
|
|
|
|
|
$filename = preg_replace( '/[\r\n\t -]+/', '-', $filename );
|
|
|
|
|
$filename = trim( $filename, '.-_' );
|
2009-11-11 18:07:29 -05:00
|
|
|
|
|
2016-06-21 09:44:31 -04:00
|
|
|
|
if ( false === strpos( $filename, '.' ) ) {
|
|
|
|
|
$mime_types = wp_get_mime_types();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$filetype = wp_check_filetype( 'test.' . $filename, $mime_types );
|
2016-06-21 09:44:31 -04:00
|
|
|
|
if ( $filetype['ext'] === $filename ) {
|
|
|
|
|
$filename = 'unnamed-file.' . $filetype['ext'];
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Split the filename into a base and extension[s].
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$parts = explode( '.', $filename );
|
2009-11-11 18:07:29 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Return if only one extension.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
if ( count( $parts ) <= 2 ) {
|
2020-12-21 13:25:05 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2013-11-30 13:36:10 -05:00
|
|
|
|
return apply_filters( 'sanitize_file_name', $filename, $filename_raw );
|
|
|
|
|
}
|
2009-11-11 18:07:29 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Process multiple extensions.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$filename = array_shift( $parts );
|
|
|
|
|
$extension = array_pop( $parts );
|
|
|
|
|
$mimes = get_allowed_mime_types();
|
2009-11-11 18:07:29 -05:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/*
|
|
|
|
|
* Loop over any intermediate extensions. Postfix them with a trailing underscore
|
General: Remove “whitelist” and “blacklist” in favor of more clear and inclusive language.
“The WordPress open source community cares about diversity. We strive to maintain a welcoming environment where everyone can feel included.”
With this commit, all occurrences of “whitelist” and “blacklist” (with the single exception of the `$new_whitelist_options` global variable) are removed. A new ticket has been opened to explore renaming the `$new_whitelist_options` variable (#50434).
Changing to more specific names or rewording sentences containing these terms not only makes the code more inclusive, but also helps provide clarity. These terms are often ambiguous. What is being blocked or allowed is not always immediately clear. This can make it more difficult for non-native English speakers to read through the codebase.
Words matter. If one contributor feels more welcome because these terms are removed, this was worth the effort.
Props strangerstudios, jorbin, desrosj, joemcgill, timothyblynjacobs, ocean90, ayeshrajans, davidbaumwald, earnjam.
See #48900, #50434.
Fixes #50413.
Built from https://develop.svn.wordpress.org/trunk@48121
git-svn-id: http://core.svn.wordpress.org/trunk@47890 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-06-22 13:26:13 -04:00
|
|
|
|
* if they are a 2 - 5 character long alpha string not in the allowed extension list.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
foreach ( (array) $parts as $part ) {
|
2009-11-11 18:07:29 -05:00
|
|
|
|
$filename .= '.' . $part;
|
2010-01-15 17:11:12 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( preg_match( '/^[a-zA-Z]{2,5}\d?$/', $part ) ) {
|
2009-11-11 18:07:29 -05:00
|
|
|
|
$allowed = false;
|
|
|
|
|
foreach ( $mimes as $ext_preg => $mime_match ) {
|
2011-05-22 19:17:09 -04:00
|
|
|
|
$ext_preg = '!^(' . $ext_preg . ')$!i';
|
2009-11-11 18:07:29 -05:00
|
|
|
|
if ( preg_match( $ext_preg, $part ) ) {
|
|
|
|
|
$allowed = true;
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! $allowed ) {
|
2009-11-11 18:07:29 -05:00
|
|
|
|
$filename .= '_';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-11-11 18:07:29 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
Media: Remove accents in `sanitize_file_name()`.
This brings some consistency with `sanitize_title()` and `sanitize_user()`.
Props tar.gz, NumidWasNotAvailable, juliobox, p_enrique, cristovaov, zodiac1978, mikeschroder, markoheijnen, chriscct7, swissspidy, DrProtocols, pento, gitlost, joemcgill, dustinbolton, programmin, Vayu, MaximeCulea, lucasbustamante, nilovelez, RavanH, audrasjb, SergeyBiryukov.
See #22363.
Built from https://develop.svn.wordpress.org/trunk@48603
git-svn-id: http://core.svn.wordpress.org/trunk@48365 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-24 14:03:02 -04:00
|
|
|
|
|
2009-11-11 18:07:29 -05:00
|
|
|
|
$filename .= '.' . $extension;
|
Media: Remove accents in `sanitize_file_name()`.
This brings some consistency with `sanitize_title()` and `sanitize_user()`.
Props tar.gz, NumidWasNotAvailable, juliobox, p_enrique, cristovaov, zodiac1978, mikeschroder, markoheijnen, chriscct7, swissspidy, DrProtocols, pento, gitlost, joemcgill, dustinbolton, programmin, Vayu, MaximeCulea, lucasbustamante, nilovelez, RavanH, audrasjb, SergeyBiryukov.
See #22363.
Built from https://develop.svn.wordpress.org/trunk@48603
git-svn-id: http://core.svn.wordpress.org/trunk@48365 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-24 14:03:02 -04:00
|
|
|
|
|
2020-12-21 13:25:05 -05:00
|
|
|
|
/**
|
|
|
|
|
* Filters a sanitized filename string.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $filename Sanitized filename.
|
|
|
|
|
* @param string $filename_raw The filename prior to sanitization.
|
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return apply_filters( 'sanitize_file_name', $filename, $filename_raw );
|
2007-01-09 17:53:14 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Sanitizes a username, stripping out unsafe characters.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2010-10-24 16:33:54 -04:00
|
|
|
|
* Removes tags, octets, entities, and if strict is enabled, will only keep
|
2010-11-17 13:47:34 -05:00
|
|
|
|
* alphanumeric, _, space, ., -, @. After sanitizing, it passes the username,
|
2010-10-24 16:33:54 -04:00
|
|
|
|
* raw username (the username in the parameter), and the value of $strict as
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* parameters for the {@see 'sanitize_user'} filter.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.0.0
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $username The username to be sanitized.
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* @param bool $strict Optional. If set limits $username to specific characters.
|
|
|
|
|
* Default false.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The sanitized username, after passing through filters.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2006-01-24 22:09:16 -05:00
|
|
|
|
function sanitize_user( $username, $strict = false ) {
|
2006-01-18 00:37:26 -05:00
|
|
|
|
$raw_username = $username;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$username = wp_strip_all_tags( $username );
|
|
|
|
|
$username = remove_accents( $username );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Kill octets.
|
2010-05-03 19:46:42 -04:00
|
|
|
|
$username = preg_replace( '|%([a-fA-F0-9][a-fA-F0-9])|', '', $username );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Kill entities.
|
|
|
|
|
$username = preg_replace( '/&.+?;/', '', $username );
|
2006-01-24 22:09:16 -05:00
|
|
|
|
|
|
|
|
|
// If strict, reduce to ASCII for max portability.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $strict ) {
|
2010-05-03 19:46:42 -04:00
|
|
|
|
$username = preg_replace( '|[^a-z0-9 _.\-@]|i', '', $username );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2006-01-24 22:09:16 -05:00
|
|
|
|
|
2010-10-24 16:33:54 -04:00
|
|
|
|
$username = trim( $username );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Consolidate contiguous whitespace.
|
2010-05-03 19:46:42 -04:00
|
|
|
|
$username = preg_replace( '|\s+|', ' ', $username );
|
2008-08-21 18:58:29 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a sanitized username string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2013-11-30 14:05:10 -05:00
|
|
|
|
* @since 2.0.1
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $username Sanitized username.
|
|
|
|
|
* @param string $raw_username The username prior to sanitization.
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* @param bool $strict Whether to limit the sanitization to specific characters.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2010-05-03 19:46:42 -04:00
|
|
|
|
return apply_filters( 'sanitize_user', $username, $raw_username, $strict );
|
2005-06-12 19:14:52 -04:00
|
|
|
|
}
|
|
|
|
|
|
2010-03-16 15:19:32 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Sanitizes a string key.
|
2010-03-16 15:19:32 -04:00
|
|
|
|
*
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* Keys are used as internal identifiers. Lowercase alphanumeric characters,
|
|
|
|
|
* dashes, and underscores are allowed.
|
2010-03-16 15:19:32 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 3.0.0
|
2010-03-17 12:27:25 -04:00
|
|
|
|
*
|
2010-03-16 15:19:32 -04:00
|
|
|
|
* @param string $key String key
|
|
|
|
|
* @return string Sanitized key
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_key( $key ) {
|
|
|
|
|
$raw_key = $key;
|
2021-11-30 15:11:02 -05:00
|
|
|
|
|
|
|
|
|
if ( ! is_string( $key ) ) {
|
|
|
|
|
$key = '';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( '' !== $key ) {
|
|
|
|
|
$key = strtolower( $key );
|
|
|
|
|
$key = preg_replace( '/[^a-z0-9_\-]/', '', $key );
|
|
|
|
|
}
|
2013-11-30 13:36:10 -05:00
|
|
|
|
|
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a sanitized key string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 3.0.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $key Sanitized key.
|
|
|
|
|
* @param string $raw_key The key prior to sanitization.
|
|
|
|
|
*/
|
2010-10-24 16:33:54 -04:00
|
|
|
|
return apply_filters( 'sanitize_key', $key, $raw_key );
|
2010-03-16 15:19:32 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* Sanitizes a string into a slug, which can be used in URLs or HTML attributes.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* By default, converts accent characters to ASCII characters and further
|
|
|
|
|
* limits the output to alphanumeric characters, underscore (_) and dash (-)
|
|
|
|
|
* through the {@see 'sanitize_title'} filter.
|
|
|
|
|
*
|
|
|
|
|
* If `$title` is empty and `$fallback_title` is set, the latter will be used.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.0.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $title The string to be sanitized.
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* @param string $fallback_title Optional. A title to use if $title is empty. Default empty.
|
|
|
|
|
* @param string $context Optional. The operation for which the string is sanitized.
|
2020-11-02 15:20:07 -05:00
|
|
|
|
* When set to 'save', the string runs through remove_accents().
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* Default 'save'.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The sanitized string.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-02-01 13:07:08 -05:00
|
|
|
|
function sanitize_title( $title, $fallback_title = '', $context = 'save' ) {
|
2009-03-17 13:42:54 -04:00
|
|
|
|
$raw_title = $title;
|
2010-10-23 08:55:55 -04:00
|
|
|
|
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( 'save' === $context ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = remove_accents( $title );
|
|
|
|
|
}
|
2010-10-23 08:55:55 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a sanitized title string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2013-11-30 14:05:10 -05:00
|
|
|
|
* @since 1.2.0
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $title Sanitized title.
|
|
|
|
|
* @param string $raw_title The title prior to sanitization.
|
|
|
|
|
* @param string $context The context for which the title is being sanitized.
|
|
|
|
|
*/
|
|
|
|
|
$title = apply_filters( 'sanitize_title', $title, $raw_title, $context );
|
2004-08-05 21:28:51 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( '' === $title || false === $title ) {
|
2005-01-02 04:08:55 -05:00
|
|
|
|
$title = $fallback_title;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2004-05-21 04:37:55 -04:00
|
|
|
|
|
2005-01-02 04:08:55 -05:00
|
|
|
|
return $title;
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-02-01 13:07:08 -05:00
|
|
|
|
/**
|
|
|
|
|
* Sanitizes a title with the 'query' context.
|
|
|
|
|
*
|
|
|
|
|
* Used for querying the database for a value from URL.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.1.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $title The string to be sanitized.
|
|
|
|
|
* @return string The sanitized string.
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_title_for_query( $title ) {
|
|
|
|
|
return sanitize_title( $title, '', 'query' );
|
2010-10-23 08:55:55 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Sanitizes a title, replacing whitespace and a few other characters with dashes.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Limits the output to alphanumeric characters, underscore (_) and dash (-).
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Whitespace becomes a dash.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $title The title to be sanitized.
|
2020-07-11 21:13:02 -04:00
|
|
|
|
* @param string $raw_title Optional. Not used. Default empty.
|
2020-11-02 15:20:07 -05:00
|
|
|
|
* @param string $context Optional. The operation for which the string is sanitized.
|
|
|
|
|
* When set to 'save', additional entities are converted to hyphens
|
|
|
|
|
* or stripped entirely. Default 'display'.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The sanitized title.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-02-01 13:07:08 -05:00
|
|
|
|
function sanitize_title_with_dashes( $title, $raw_title = '', $context = 'display' ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = strip_tags( $title );
|
2005-02-01 03:31:13 -05:00
|
|
|
|
// Preserve escaped octets.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = preg_replace( '|%([a-fA-F0-9][a-fA-F0-9])|', '---$1---', $title );
|
2005-02-01 03:31:13 -05:00
|
|
|
|
// Remove percent signs that are not part of an octet.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = str_replace( '%', '', $title );
|
2005-02-01 03:31:13 -05:00
|
|
|
|
// Restore octets.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = preg_replace( '|---([a-fA-F0-9][a-fA-F0-9])---|', '%$1', $title );
|
2005-02-01 03:31:13 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( seems_utf8( $title ) ) {
|
|
|
|
|
if ( function_exists( 'mb_strtolower' ) ) {
|
|
|
|
|
$title = mb_strtolower( $title, 'UTF-8' );
|
2004-09-10 04:36:54 -04:00
|
|
|
|
}
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = utf8_uri_encode( $title, 200 );
|
2005-01-02 04:08:55 -05:00
|
|
|
|
}
|
2004-09-10 04:36:54 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = strtolower( $title );
|
2011-09-18 15:53:59 -04:00
|
|
|
|
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( 'save' === $context ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Convert  , &ndash, and &mdash to hyphens.
|
2011-09-18 15:53:59 -04:00
|
|
|
|
$title = str_replace( array( '%c2%a0', '%e2%80%93', '%e2%80%94' ), '-', $title );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Convert  , &ndash, and &mdash HTML entities to hyphens.
|
2016-02-28 23:42:27 -05:00
|
|
|
|
$title = str_replace( array( ' ', ' ', '–', '–', '—', '—' ), '-', $title );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Convert forward slash to hyphen.
|
2017-08-25 19:28:45 -04:00
|
|
|
|
$title = str_replace( '/', '-', $title );
|
2012-05-02 12:37:42 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Strip these characters entirely.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = str_replace(
|
|
|
|
|
array(
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Soft hyphens.
|
2019-01-14 00:39:51 -05:00
|
|
|
|
'%c2%ad',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// ¡ and ¿.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%c2%a1',
|
|
|
|
|
'%c2%bf',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Angle quotes.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%c2%ab',
|
|
|
|
|
'%c2%bb',
|
|
|
|
|
'%e2%80%b9',
|
|
|
|
|
'%e2%80%ba',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Curly quotes.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%e2%80%98',
|
|
|
|
|
'%e2%80%99',
|
|
|
|
|
'%e2%80%9c',
|
|
|
|
|
'%e2%80%9d',
|
|
|
|
|
'%e2%80%9a',
|
|
|
|
|
'%e2%80%9b',
|
|
|
|
|
'%e2%80%9e',
|
|
|
|
|
'%e2%80%9f',
|
2020-07-23 20:03:05 -04:00
|
|
|
|
// Bullet.
|
|
|
|
|
'%e2%80%a2',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// ©, ®, °, &hellip, and &trade.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%c2%a9',
|
|
|
|
|
'%c2%ae',
|
|
|
|
|
'%c2%b0',
|
|
|
|
|
'%e2%80%a6',
|
|
|
|
|
'%e2%84%a2',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Acute accents.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%c2%b4',
|
|
|
|
|
'%cb%8a',
|
|
|
|
|
'%cc%81',
|
|
|
|
|
'%cd%81',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Grave accent, macron, caron.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'%cc%80',
|
|
|
|
|
'%cc%84',
|
|
|
|
|
'%cc%8c',
|
2021-11-02 14:47:57 -04:00
|
|
|
|
// Non-visible characters that display without a width.
|
|
|
|
|
'%e2%80%8b',
|
|
|
|
|
'%e2%80%8c',
|
|
|
|
|
'%e2%80%8d',
|
|
|
|
|
'%e2%80%8e',
|
|
|
|
|
'%e2%80%8f',
|
|
|
|
|
'%e2%80%aa',
|
|
|
|
|
'%e2%80%ab',
|
|
|
|
|
'%e2%80%ac',
|
|
|
|
|
'%e2%80%ad',
|
|
|
|
|
'%e2%80%ae',
|
|
|
|
|
'%ef%bb%bf',
|
2018-08-16 21:51:36 -04:00
|
|
|
|
),
|
|
|
|
|
'',
|
|
|
|
|
$title
|
2017-11-30 18:11:00 -05:00
|
|
|
|
);
|
2012-05-02 12:37:42 -04:00
|
|
|
|
|
2021-11-02 14:47:57 -04:00
|
|
|
|
// Convert non-visible characters that display with a width to hyphen.
|
|
|
|
|
$title = str_replace(
|
|
|
|
|
array(
|
|
|
|
|
'%e2%80%80',
|
|
|
|
|
'%e2%80%81',
|
|
|
|
|
'%e2%80%82',
|
|
|
|
|
'%e2%80%83',
|
|
|
|
|
'%e2%80%84',
|
|
|
|
|
'%e2%80%85',
|
|
|
|
|
'%e2%80%86',
|
|
|
|
|
'%e2%80%87',
|
|
|
|
|
'%e2%80%88',
|
|
|
|
|
'%e2%80%89',
|
|
|
|
|
'%e2%80%8a',
|
|
|
|
|
'%e2%80%a8',
|
|
|
|
|
'%e2%80%a9',
|
|
|
|
|
'%e2%80%af',
|
|
|
|
|
),
|
|
|
|
|
'-',
|
|
|
|
|
$title
|
|
|
|
|
);
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Convert × to 'x'.
|
2012-05-02 12:37:42 -04:00
|
|
|
|
$title = str_replace( '%c3%97', 'x', $title );
|
2011-09-18 15:53:59 -04:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Kill entities.
|
|
|
|
|
$title = preg_replace( '/&.+?;/', '', $title );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = str_replace( '.', '-', $title );
|
2016-02-28 23:42:27 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$title = preg_replace( '/[^%a-z0-9 _-]/', '', $title );
|
|
|
|
|
$title = preg_replace( '/\s+/', '-', $title );
|
|
|
|
|
$title = preg_replace( '|-+|', '-', $title );
|
|
|
|
|
$title = trim( $title, '-' );
|
2004-05-16 18:14:14 -04:00
|
|
|
|
|
2005-01-02 04:08:55 -05:00
|
|
|
|
return $title;
|
2004-05-16 18:07:26 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2015-04-20 01:42:25 -04:00
|
|
|
|
* Ensures a string is a valid SQL 'order by' clause.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-04-20 01:42:25 -04:00
|
|
|
|
* Accepts one or more columns, with or without a sort order (ASC / DESC).
|
|
|
|
|
* e.g. 'column_1', 'column_1, column_2', 'column_1 ASC, column_2 DESC' etc.
|
|
|
|
|
*
|
|
|
|
|
* Also accepts 'RAND()'.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.5.1
|
|
|
|
|
*
|
2015-04-20 01:42:25 -04:00
|
|
|
|
* @param string $orderby Order by clause to be validated.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @return string|false Returns $orderby if valid, false otherwise.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-04-20 01:42:25 -04:00
|
|
|
|
function sanitize_sql_orderby( $orderby ) {
|
|
|
|
|
if ( preg_match( '/^\s*(([a-z0-9_]+|`[a-z0-9_]+`)(\s+(ASC|DESC))?\s*(,\s*(?=[a-z0-9_`])|$))+$/i', $orderby ) || preg_match( '/^\s*RAND\(\s*\)\s*$/i', $orderby ) ) {
|
|
|
|
|
return $orderby;
|
|
|
|
|
}
|
|
|
|
|
return false;
|
2008-04-02 23:05:49 -04:00
|
|
|
|
}
|
|
|
|
|
|
2009-05-22 13:44:26 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Sanitizes an HTML classname to ensure it only contains valid characters.
|
2009-05-24 19:47:49 -04:00
|
|
|
|
*
|
2011-04-06 17:28:52 -04:00
|
|
|
|
* Strips the string down to A-Z,a-z,0-9,_,-. If this results in an empty
|
2009-05-22 13:44:26 -04:00
|
|
|
|
* string then it will return the alternative value supplied.
|
2009-05-24 19:47:49 -04:00
|
|
|
|
*
|
2009-05-22 17:31:42 -04:00
|
|
|
|
* @todo Expand to support the full range of CDATA that a class attribute can contain.
|
2009-05-24 19:47:49 -04:00
|
|
|
|
*
|
2009-05-22 17:31:42 -04:00
|
|
|
|
* @since 2.8.0
|
2009-05-24 19:47:49 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $class The classname to be sanitized
|
2014-07-03 12:58:16 -04:00
|
|
|
|
* @param string $fallback Optional. The value to return if the sanitization ends up as an empty string.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* Defaults to an empty string.
|
2009-05-22 17:31:42 -04:00
|
|
|
|
* @return string The sanitized value
|
2009-05-22 13:44:26 -04:00
|
|
|
|
*/
|
2010-02-27 15:06:35 -05:00
|
|
|
|
function sanitize_html_class( $class, $fallback = '' ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Strip out any %-encoded octets.
|
2011-04-06 17:28:52 -04:00
|
|
|
|
$sanitized = preg_replace( '|%[a-fA-F0-9][a-fA-F0-9]|', '', $class );
|
2009-05-24 19:47:49 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Limit to A-Z, a-z, 0-9, '_', '-'.
|
2011-04-06 17:28:52 -04:00
|
|
|
|
$sanitized = preg_replace( '/[^A-Za-z0-9_-]/', '', $sanitized );
|
2009-05-24 19:47:49 -04:00
|
|
|
|
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $sanitized && $fallback ) {
|
2015-09-22 00:31:25 -04:00
|
|
|
|
return sanitize_html_class( $fallback );
|
|
|
|
|
}
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a sanitized HTML class string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $sanitized The sanitized HTML class.
|
|
|
|
|
* @param string $class HTML class before sanitization.
|
|
|
|
|
* @param string $fallback The fallback string.
|
|
|
|
|
*/
|
2010-02-27 15:06:35 -05:00
|
|
|
|
return apply_filters( 'sanitize_html_class', $sanitized, $class, $fallback );
|
2009-05-22 13:44:26 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2015-06-20 20:59:26 -04:00
|
|
|
|
* Converts lone & characters into `&` (a.k.a. `&`)
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $content String of characters to be converted.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $deprecated Not used.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @return string Converted string.
|
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function convert_chars( $content, $deprecated = '' ) {
|
2015-06-20 20:59:26 -04:00
|
|
|
|
if ( ! empty( $deprecated ) ) {
|
2010-01-09 05:03:55 -05:00
|
|
|
|
_deprecated_argument( __FUNCTION__, '0.71' );
|
2015-06-20 20:59:26 -04:00
|
|
|
|
}
|
2009-12-30 11:23:39 -05:00
|
|
|
|
|
2015-06-20 20:59:26 -04:00
|
|
|
|
if ( strpos( $content, '&' ) !== false ) {
|
|
|
|
|
$content = preg_replace( '/&([^#])(?![a-z1-4]{1,8};)/i', '&$1', $content );
|
|
|
|
|
}
|
2004-04-22 03:41:57 -04:00
|
|
|
|
|
2015-06-20 20:59:26 -04:00
|
|
|
|
return $content;
|
|
|
|
|
}
|
2004-04-22 03:41:57 -04:00
|
|
|
|
|
2015-06-20 20:59:26 -04:00
|
|
|
|
/**
|
|
|
|
|
* Converts invalid Unicode references range to valid range.
|
|
|
|
|
*
|
2015-06-21 07:41:26 -04:00
|
|
|
|
* @since 4.3.0
|
2015-06-20 20:59:26 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $content String with entities that need converting.
|
|
|
|
|
* @return string Converted string.
|
|
|
|
|
*/
|
|
|
|
|
function convert_invalid_entities( $content ) {
|
|
|
|
|
$wp_htmltranswinuni = array(
|
2020-01-28 19:45:18 -05:00
|
|
|
|
'€' => '€', // The Euro sign.
|
2015-06-20 20:59:26 -04:00
|
|
|
|
'' => '',
|
2020-01-28 19:45:18 -05:00
|
|
|
|
'‚' => '‚', // These are Windows CP1252 specific characters.
|
|
|
|
|
'ƒ' => 'ƒ', // They would look weird on non-Windows browsers.
|
2015-06-20 20:59:26 -04:00
|
|
|
|
'„' => '„',
|
|
|
|
|
'…' => '…',
|
|
|
|
|
'†' => '†',
|
|
|
|
|
'‡' => '‡',
|
|
|
|
|
'ˆ' => 'ˆ',
|
|
|
|
|
'‰' => '‰',
|
|
|
|
|
'Š' => 'Š',
|
|
|
|
|
'‹' => '‹',
|
|
|
|
|
'Œ' => 'Œ',
|
|
|
|
|
'' => '',
|
|
|
|
|
'Ž' => 'Ž',
|
|
|
|
|
'' => '',
|
|
|
|
|
'' => '',
|
|
|
|
|
'‘' => '‘',
|
|
|
|
|
'’' => '’',
|
|
|
|
|
'“' => '“',
|
|
|
|
|
'”' => '”',
|
|
|
|
|
'•' => '•',
|
|
|
|
|
'–' => '–',
|
|
|
|
|
'—' => '—',
|
|
|
|
|
'˜' => '˜',
|
|
|
|
|
'™' => '™',
|
|
|
|
|
'š' => 'š',
|
|
|
|
|
'›' => '›',
|
|
|
|
|
'œ' => 'œ',
|
|
|
|
|
'' => '',
|
|
|
|
|
'ž' => 'ž',
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'Ÿ' => 'Ÿ',
|
2015-06-20 20:59:26 -04:00
|
|
|
|
);
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2015-06-20 20:59:26 -04:00
|
|
|
|
if ( strpos( $content, '' ) !== false ) {
|
|
|
|
|
$content = strtr( $content, $wp_htmltranswinuni );
|
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
|
|
|
|
return $content;
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2013-02-01 17:20:06 -05:00
|
|
|
|
* Balances tags if forced to, or if the 'use_balanceTags' option is set to true.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $text Text to be balanced
|
|
|
|
|
* @param bool $force If true, forces balancing, ignoring the value of the option. Default false.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @return string Balanced text
|
|
|
|
|
*/
|
2019-07-01 04:01:57 -04:00
|
|
|
|
function balanceTags( $text, $force = false ) { // phpcs:ignore WordPress.NamingConventions.ValidFunctionName.FunctionNameInvalid
|
2019-09-02 06:25:56 -04:00
|
|
|
|
if ( $force || (int) get_option( 'use_balanceTags' ) === 1 ) {
|
2013-12-03 12:08:10 -05:00
|
|
|
|
return force_balance_tags( $text );
|
|
|
|
|
} else {
|
|
|
|
|
return $text;
|
2013-11-08 17:22:11 -05:00
|
|
|
|
}
|
2007-07-16 15:23:41 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
|
|
|
|
* Balances tags of string using a modified stack.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.0.4
|
2019-09-02 06:25:56 -04:00
|
|
|
|
* @since 5.3.0 Improve accuracy and add support for custom element tags.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @author Leonard Lin <leonard@acm.org>
|
2010-08-26 11:43:32 -04:00
|
|
|
|
* @license GPL
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @copyright November 4, 2001
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @version 1.1
|
|
|
|
|
* @todo Make better - change loop condition to $text in 1.2
|
|
|
|
|
* @internal Modified by Scott Reilly (coffee2code) 02 Aug 2004
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* 1.1 Fixed handling of append/stack pop order of end text
|
|
|
|
|
* Added Cleaning Hooks
|
|
|
|
|
* 1.0 First Version
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $text Text to be balanced.
|
|
|
|
|
* @return string Balanced text.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2007-07-16 15:23:41 -04:00
|
|
|
|
function force_balance_tags( $text ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tagstack = array();
|
2010-04-01 09:18:34 -04:00
|
|
|
|
$stacksize = 0;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tagqueue = '';
|
|
|
|
|
$newtext = '';
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Known single-entity/self-closing tags.
|
Formatting: Add additional support for single and nestable tags in `force_balance_tags()`.
Adds `track` and `wbr` support for single tags.
Adds `article`, `aside`, `details`, `figure`, and `section` for nestable tags.
Updates tests.
Follow-up to [5805], [21828], [45929].
Props glendaviesnz, costdev, talldanwp, ramonopoly, sergeybiryukov.
Fixes #50225.
Built from https://develop.svn.wordpress.org/trunk@52188
git-svn-id: http://core.svn.wordpress.org/trunk@51780 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2021-11-16 14:42:01 -05:00
|
|
|
|
$single_tags = array( 'area', 'base', 'basefont', 'br', 'col', 'command', 'embed', 'frame', 'hr', 'img', 'input', 'isindex', 'link', 'meta', 'param', 'source', 'track', 'wbr' );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Tags that can be immediately nested within themselves.
|
Formatting: Add additional support for single and nestable tags in `force_balance_tags()`.
Adds `track` and `wbr` support for single tags.
Adds `article`, `aside`, `details`, `figure`, and `section` for nestable tags.
Updates tests.
Follow-up to [5805], [21828], [45929].
Props glendaviesnz, costdev, talldanwp, ramonopoly, sergeybiryukov.
Fixes #50225.
Built from https://develop.svn.wordpress.org/trunk@52188
git-svn-id: http://core.svn.wordpress.org/trunk@51780 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2021-11-16 14:42:01 -05:00
|
|
|
|
$nestable_tags = array( 'article', 'aside', 'blockquote', 'details', 'div', 'figure', 'object', 'q', 'section', 'span' );
|
2010-04-01 09:18:34 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// WP bug fix for comments - in case you REALLY meant to type '< !--'.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text = str_replace( '< !--', '< !--', $text );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// WP bug fix for LOVE <3 (and other situations with '<' before a number).
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text = preg_replace( '#<([0-9]{1})#', '<$1', $text );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
/**
|
|
|
|
|
* Matches supported tags.
|
|
|
|
|
*
|
|
|
|
|
* To get the pattern as a string without the comments paste into a PHP
|
|
|
|
|
* REPL like `php -a`.
|
|
|
|
|
*
|
|
|
|
|
* @see https://html.spec.whatwg.org/#elements-2
|
|
|
|
|
* @see https://w3c.github.io/webcomponents/spec/custom/#valid-custom-element-name
|
|
|
|
|
*
|
|
|
|
|
* @example
|
|
|
|
|
* ~# php -a
|
|
|
|
|
* php > $s = [paste copied contents of expression below including parentheses];
|
|
|
|
|
* php > echo $s;
|
|
|
|
|
*/
|
|
|
|
|
$tag_pattern = (
|
|
|
|
|
'#<' . // Start with an opening bracket.
|
|
|
|
|
'(/?)' . // Group 1 - If it's a closing tag it'll have a leading slash.
|
|
|
|
|
'(' . // Group 2 - Tag name.
|
|
|
|
|
// Custom element tags have more lenient rules than HTML tag names.
|
|
|
|
|
'(?:[a-z](?:[a-z0-9._]*)-(?:[a-z0-9._-]+)+)' .
|
|
|
|
|
'|' .
|
|
|
|
|
// Traditional tag rules approximate HTML tag names.
|
|
|
|
|
'(?:[\w:]+)' .
|
|
|
|
|
')' .
|
|
|
|
|
'(?:' .
|
|
|
|
|
// We either immediately close the tag with its '>' and have nothing here.
|
|
|
|
|
'\s*' .
|
|
|
|
|
'(/?)' . // Group 3 - "attributes" for empty tag.
|
|
|
|
|
'|' .
|
|
|
|
|
// Or we must start with space characters to separate the tag name from the attributes (or whitespace).
|
|
|
|
|
'(\s+)' . // Group 4 - Pre-attribute whitespace.
|
|
|
|
|
'([^>]*)' . // Group 5 - Attributes.
|
|
|
|
|
')' .
|
|
|
|
|
'>#' // End with a closing bracket.
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
while ( preg_match( $tag_pattern, $text, $regex ) ) {
|
|
|
|
|
$full_match = $regex[0];
|
|
|
|
|
$has_leading_slash = ! empty( $regex[1] );
|
|
|
|
|
$tag_name = $regex[2];
|
|
|
|
|
$tag = strtolower( $tag_name );
|
|
|
|
|
$is_single_tag = in_array( $tag, $single_tags, true );
|
|
|
|
|
$pre_attribute_ws = isset( $regex[4] ) ? $regex[4] : '';
|
|
|
|
|
$attributes = trim( isset( $regex[5] ) ? $regex[5] : $regex[3] );
|
|
|
|
|
$has_self_closer = '/' === substr( $attributes, -1 );
|
|
|
|
|
|
2005-01-06 05:24:11 -05:00
|
|
|
|
$newtext .= $tagqueue;
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
$i = strpos( $text, $full_match );
|
|
|
|
|
$l = strlen( $full_match );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// Clear the shifter.
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$tagqueue = '';
|
2020-01-28 19:45:18 -05:00
|
|
|
|
if ( $has_leading_slash ) { // End tag.
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// If too many closing tags.
|
2015-06-16 16:01:25 -04:00
|
|
|
|
if ( $stacksize <= 0 ) {
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$tag = '';
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// Or close to be safe $tag = '/' . $tag.
|
2019-01-11 01:40:50 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// If stacktop value = tag close value, then pop.
|
|
|
|
|
} elseif ( $tagstack[ $stacksize - 1 ] === $tag ) { // Found closing tag.
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$tag = '</' . $tag . '>'; // Close tag.
|
2010-04-01 09:18:34 -04:00
|
|
|
|
array_pop( $tagstack );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$stacksize--;
|
2019-09-02 06:25:56 -04:00
|
|
|
|
} else { // Closing tag not at top, search for it.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
for ( $j = $stacksize - 1; $j >= 0; $j-- ) {
|
2019-09-02 06:25:56 -04:00
|
|
|
|
if ( $tagstack[ $j ] === $tag ) {
|
|
|
|
|
// Add tag to tagqueue.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
for ( $k = $stacksize - 1; $k >= $j; $k-- ) {
|
2010-04-01 09:18:34 -04:00
|
|
|
|
$tagqueue .= '</' . array_pop( $tagstack ) . '>';
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$stacksize--;
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
$tag = '';
|
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
} else { // Begin tag.
|
2019-09-02 06:25:56 -04:00
|
|
|
|
if ( $has_self_closer ) { // If it presents itself as a self-closing tag...
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// ...but it isn't a known single-entity self-closing tag, then don't let it be treated as such
|
|
|
|
|
// and immediately close it with a closing tag (the tag will encapsulate no text as a result).
|
2019-09-02 06:25:56 -04:00
|
|
|
|
if ( ! $is_single_tag ) {
|
|
|
|
|
$attributes = trim( substr( $attributes, 0, -1 ) ) . "></$tag";
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
} elseif ( $is_single_tag ) { // Else if it's a known single-entity tag but it doesn't close itself, do so.
|
2019-09-02 06:25:56 -04:00
|
|
|
|
$pre_attribute_ws = ' ';
|
|
|
|
|
$attributes .= '/';
|
|
|
|
|
} else { // It's not a single-entity tag.
|
|
|
|
|
// If the top of the stack is the same as the tag we want to push, close previous tag.
|
|
|
|
|
if ( $stacksize > 0 && ! in_array( $tag, $nestable_tags, true ) && $tagstack[ $stacksize - 1 ] === $tag ) {
|
2012-09-13 12:39:06 -04:00
|
|
|
|
$tagqueue = '</' . array_pop( $tagstack ) . '>';
|
2005-01-06 05:24:11 -05:00
|
|
|
|
$stacksize--;
|
|
|
|
|
}
|
2012-09-13 12:39:06 -04:00
|
|
|
|
$stacksize = array_push( $tagstack, $tag );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// Attributes.
|
|
|
|
|
if ( $has_self_closer && $is_single_tag ) {
|
|
|
|
|
// We need some space - avoid <br/> and prefer <br />.
|
|
|
|
|
$pre_attribute_ws = ' ';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2010-04-01 09:18:34 -04:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
$tag = '<' . $tag . $pre_attribute_ws . $attributes . '>';
|
|
|
|
|
// If already queuing a close tag, then put this tag on too.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! empty( $tagqueue ) ) {
|
2005-01-06 05:24:11 -05:00
|
|
|
|
$tagqueue .= $tag;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tag = '';
|
2005-01-06 05:24:11 -05:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$newtext .= substr( $text, 0, $i ) . $tag;
|
|
|
|
|
$text = substr( $text, $i + $l );
|
2006-11-19 02:56:05 -05:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Clear tag queue.
|
2005-01-06 05:24:11 -05:00
|
|
|
|
$newtext .= $tagqueue;
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// Add remaining text.
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$newtext .= $text;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
while ( $x = array_pop( $tagstack ) ) {
|
2019-09-02 06:25:56 -04:00
|
|
|
|
$newtext .= '</' . $x . '>'; // Add remaining tags to close.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2019-09-02 06:25:56 -04:00
|
|
|
|
// WP fix for the bug with HTML comments.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$newtext = str_replace( '< !--', '<!--', $newtext );
|
|
|
|
|
$newtext = str_replace( '< !--', '< !--', $newtext );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
|
|
|
|
return $newtext;
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Acts on text which is about to be edited.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2012-02-23 20:58:18 -05:00
|
|
|
|
* The $content is run through esc_textarea(), which uses htmlspecialchars()
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* to convert special characters to HTML entities. If `$richedit` is set to true,
|
|
|
|
|
* it is simply a holder for the {@see 'format_to_edit'} filter.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
2015-09-30 22:01:26 -04:00
|
|
|
|
* @since 4.4.0 The `$richedit` parameter was renamed to `$rich_text` for clarity.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-09-30 22:01:26 -04:00
|
|
|
|
* @param string $content The text about to be edited.
|
|
|
|
|
* @param bool $rich_text Optional. Whether `$content` should be considered rich text,
|
|
|
|
|
* in which case it would not be passed through esc_textarea().
|
|
|
|
|
* Default false.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The text after the filter (and possibly htmlspecialchars()) has been run.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-09-30 22:01:26 -04:00
|
|
|
|
function format_to_edit( $content, $rich_text = false ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the text to be formatted for editing.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2013-11-30 14:05:10 -05:00
|
|
|
|
* @since 1.2.0
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $content The text, prior to formatting for editing.
|
|
|
|
|
*/
|
2010-12-25 13:10:59 -05:00
|
|
|
|
$content = apply_filters( 'format_to_edit', $content );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! $rich_text ) {
|
2010-12-25 13:10:59 -05:00
|
|
|
|
$content = esc_textarea( $content );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
return $content;
|
|
|
|
|
}
|
2004-03-28 22:54:57 -05:00
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Add leading zeros when necessary.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* If you set the threshold to '4' and the number is '10', then you will get
|
2011-10-04 12:02:33 -04:00
|
|
|
|
* back '0010'. If you set the threshold to '4' and the number is '5000', then you
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* will get back '5000'.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Uses sprintf to append the amount of zeros based on the $threshold parameter
|
|
|
|
|
* and the size of the number. If the number is large enough, then no zeros will
|
|
|
|
|
* be appended.
|
|
|
|
|
*
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param int $number Number to append zeros to if not greater than threshold.
|
|
|
|
|
* @param int $threshold Digit places number needs to be to not have zeros added.
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @return string Adds leading zeros to number if needed.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function zeroise( $number, $threshold ) {
|
|
|
|
|
return sprintf( '%0' . $threshold . 's', $number );
|
2006-06-07 23:17:01 -04:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
|
|
|
|
* Adds backslashes before letters and before a number at the start of a string.
|
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
|
|
|
|
* @param string $string Value to which backslashes will be added.
|
|
|
|
|
* @return string String with backslashes inserted.
|
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function backslashit( $string ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( isset( $string[0] ) && $string[0] >= '0' && $string[0] <= '9' ) {
|
2013-04-22 16:01:57 -04:00
|
|
|
|
$string = '\\\\' . $string;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2013-04-22 16:01:57 -04:00
|
|
|
|
return addcslashes( $string, 'A..Za..z' );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Appends a trailing slash.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2014-03-01 16:45:15 -05:00
|
|
|
|
* Will remove trailing forward and backslashes if it exists already before adding
|
|
|
|
|
* a trailing forward slash. This prevents double slashing a string or path.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* The primary use of this is for paths and thus should be used for paths. It is
|
|
|
|
|
* not restricted to paths and offers no specific path support.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $string What to add the trailing slash to.
|
|
|
|
|
* @return string String with trailing slash added.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2014-03-01 16:45:15 -05:00
|
|
|
|
function trailingslashit( $string ) {
|
|
|
|
|
return untrailingslashit( $string ) . '/';
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2014-03-01 16:45:15 -05:00
|
|
|
|
* Removes trailing forward slashes and backslashes if they exist.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* The primary use of this is for paths and thus should be used for paths. It is
|
|
|
|
|
* not restricted to paths and offers no specific path support.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.2.0
|
|
|
|
|
*
|
2014-03-01 16:45:15 -05:00
|
|
|
|
* @param string $string What to remove the trailing slashes from.
|
|
|
|
|
* @return string String without the trailing slashes.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2014-03-01 16:45:15 -05:00
|
|
|
|
function untrailingslashit( $string ) {
|
|
|
|
|
return rtrim( $string, '/\\' );
|
2007-03-10 01:25:33 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2021-12-07 07:20:02 -05:00
|
|
|
|
* Adds slashes to a string or recursively adds slashes to strings within an array.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Slashes will first be removed if magic_quotes_gpc is set, see {@link
|
2020-01-19 22:14:06 -05:00
|
|
|
|
* https://www.php.net/magic_quotes} for more details.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2021-12-07 07:20:02 -05:00
|
|
|
|
* @param string|array $gpc String or array of data to slash.
|
|
|
|
|
* @return string|array Slashed `$gpc`.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
function addslashes_gpc( $gpc ) {
|
|
|
|
|
return wp_slash( $gpc );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* Navigates through an array, object, or scalar, and removes slashes from the values.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.0.0
|
|
|
|
|
*
|
2012-07-20 11:14:26 -04:00
|
|
|
|
* @param mixed $value The value to be stripped.
|
|
|
|
|
* @return mixed Stripped value.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function stripslashes_deep( $value ) {
|
2015-10-17 19:26:24 -04:00
|
|
|
|
return map_deep( $value, 'stripslashes_from_strings_only' );
|
2007-04-12 18:00:22 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* Callback function for `stripslashes_deep()` which strips slashes from strings.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param mixed $value The array or string to be stripped.
|
2020-06-19 18:55:12 -04:00
|
|
|
|
* @return mixed The stripped value.
|
2015-10-17 19:26:24 -04:00
|
|
|
|
*/
|
|
|
|
|
function stripslashes_from_strings_only( $value ) {
|
|
|
|
|
return is_string( $value ) ? stripslashes( $value ) : $value;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Navigates through an array, object, or scalar, and encodes the values to be used in a URL.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.2.0
|
|
|
|
|
*
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* @param mixed $value The array or string to be encoded.
|
2020-06-19 18:55:12 -04:00
|
|
|
|
* @return mixed The encoded value.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function urlencode_deep( $value ) {
|
2015-10-17 19:26:24 -04:00
|
|
|
|
return map_deep( $value, 'urlencode' );
|
2005-07-05 21:12:38 -04:00
|
|
|
|
}
|
|
|
|
|
|
2012-04-27 11:40:00 -04:00
|
|
|
|
/**
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* Navigates through an array, object, or scalar, and raw-encodes the values to be used in a URL.
|
2012-04-27 11:40:00 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* @param mixed $value The array or string to be encoded.
|
2020-06-19 18:55:12 -04:00
|
|
|
|
* @return mixed The encoded value.
|
2012-04-27 11:40:00 -04:00
|
|
|
|
*/
|
|
|
|
|
function rawurlencode_deep( $value ) {
|
2015-10-17 19:26:24 -04:00
|
|
|
|
return map_deep( $value, 'rawurlencode' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Navigates through an array, object, or scalar, and decodes URL-encoded values
|
|
|
|
|
*
|
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param mixed $value The array or string to be decoded.
|
2020-06-19 18:55:12 -04:00
|
|
|
|
* @return mixed The decoded value.
|
2015-10-17 19:26:24 -04:00
|
|
|
|
*/
|
|
|
|
|
function urldecode_deep( $value ) {
|
|
|
|
|
return map_deep( $value, 'urldecode' );
|
2012-04-27 11:40:00 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Converts email addresses characters to HTML entities to block spam bots.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2013-08-20 02:08:09 -04:00
|
|
|
|
* @param string $email_address Email address.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param int $hex_encoding Optional. Set to 1 to enable hex encoding.
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @return string Converted email address.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-08-27 21:47:09 -04:00
|
|
|
|
function antispambot( $email_address, $hex_encoding = 0 ) {
|
2013-08-20 02:08:09 -04:00
|
|
|
|
$email_no_spam_address = '';
|
2015-03-08 19:01:26 -04:00
|
|
|
|
for ( $i = 0, $len = strlen( $email_address ); $i < $len; $i++ ) {
|
2013-08-27 21:47:09 -04:00
|
|
|
|
$j = rand( 0, 1 + $hex_encoding );
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( 0 == $j ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$email_no_spam_address .= '&#' . ord( $email_address[ $i ] ) . ';';
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( 1 == $j ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$email_no_spam_address .= $email_address[ $i ];
|
2020-02-09 11:55:09 -05:00
|
|
|
|
} elseif ( 2 == $j ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$email_no_spam_address .= '%' . zeroise( dechex( ord( $email_address[ $i ] ) ), 2 );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
2013-08-20 02:08:09 -04:00
|
|
|
|
|
2015-05-25 02:25:25 -04:00
|
|
|
|
return str_replace( '@', '@', $email_no_spam_address );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Callback to convert URI match to HTML A element.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-05-22 13:39:28 -04:00
|
|
|
|
* This function was backported from 2.5.0 to 2.3.2. Regex callback for make_clickable().
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.3.2
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @access private
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @param array $matches Single Regex Match.
|
|
|
|
|
* @return string HTML A element with URI address.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function _make_url_clickable_cb( $matches ) {
|
2007-12-20 22:14:22 -05:00
|
|
|
|
$url = $matches[2];
|
2011-01-05 23:11:14 -05:00
|
|
|
|
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( ')' === $matches[3] && strpos( $url, '(' ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If the trailing character is a closing parethesis, and the URL has an opening parenthesis in it,
|
|
|
|
|
// add the closing parenthesis to the URL. Then we can let the parenthesis balancer do its thing below.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$url .= $matches[3];
|
2012-02-10 08:42:15 -05:00
|
|
|
|
$suffix = '';
|
|
|
|
|
} else {
|
|
|
|
|
$suffix = $matches[3];
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Include parentheses in the URL only if paired.
|
2010-12-15 08:43:30 -05:00
|
|
|
|
while ( substr_count( $url, '(' ) < substr_count( $url, ')' ) ) {
|
2011-01-05 23:11:14 -05:00
|
|
|
|
$suffix = strrchr( $url, ')' ) . $suffix;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$url = substr( $url, 0, strrpos( $url, ')' ) );
|
2010-12-15 08:43:30 -05:00
|
|
|
|
}
|
2009-08-19 19:56:10 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$url = esc_url( $url );
|
|
|
|
|
if ( empty( $url ) ) {
|
2007-12-20 22:14:22 -05:00
|
|
|
|
return $matches[0];
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-08-19 19:56:10 -04:00
|
|
|
|
|
2019-10-21 16:41:04 -04:00
|
|
|
|
if ( 'comment_text' === current_filter() ) {
|
|
|
|
|
$rel = 'nofollow ugc';
|
|
|
|
|
} else {
|
|
|
|
|
$rel = 'nofollow';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Filters the rel value that is added to URL matches converted to links.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.3.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $rel The rel value.
|
|
|
|
|
* @param string $url The matched URL being converted to a link tag.
|
|
|
|
|
*/
|
|
|
|
|
$rel = apply_filters( 'make_clickable_rel', $rel, $url );
|
|
|
|
|
$rel = esc_attr( $rel );
|
|
|
|
|
|
|
|
|
|
return $matches[1] . "<a href=\"$url\" rel=\"$rel\">$url</a>" . $suffix;
|
2007-12-20 22:14:22 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Callback to convert URL match to HTML A element.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-05-22 13:39:28 -04:00
|
|
|
|
* This function was backported from 2.5.0 to 2.3.2. Regex callback for make_clickable().
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.3.2
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @access private
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @param array $matches Single Regex Match.
|
|
|
|
|
* @return string HTML A element with URL address.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function _make_web_ftp_clickable_cb( $matches ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$ret = '';
|
2007-12-20 22:14:22 -05:00
|
|
|
|
$dest = $matches[2];
|
|
|
|
|
$dest = 'http://' . $dest;
|
2009-08-19 19:56:10 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Removed trailing [.,;:)] from URL.
|
2020-04-04 23:02:11 -04:00
|
|
|
|
$last_char = substr( $dest, -1 );
|
|
|
|
|
if ( in_array( $last_char, array( '.', ',', ';', ':', ')' ), true ) === true ) {
|
|
|
|
|
$ret = $last_char;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dest = substr( $dest, 0, strlen( $dest ) - 1 );
|
2008-03-21 12:29:59 -04:00
|
|
|
|
}
|
2015-10-07 19:39:23 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$dest = esc_url( $dest );
|
|
|
|
|
if ( empty( $dest ) ) {
|
2015-10-07 19:39:23 -04:00
|
|
|
|
return $matches[0];
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2015-10-07 19:39:23 -04:00
|
|
|
|
|
2019-10-21 16:41:04 -04:00
|
|
|
|
if ( 'comment_text' === current_filter() ) {
|
|
|
|
|
$rel = 'nofollow ugc';
|
|
|
|
|
} else {
|
|
|
|
|
$rel = 'nofollow';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
|
|
|
|
$rel = apply_filters( 'make_clickable_rel', $rel, $dest );
|
|
|
|
|
$rel = esc_attr( $rel );
|
|
|
|
|
|
|
|
|
|
return $matches[1] . "<a href=\"$dest\" rel=\"$rel\">$dest</a>$ret";
|
2007-12-20 22:14:22 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Callback to convert email address match to HTML A element.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-05-22 13:39:28 -04:00
|
|
|
|
* This function was backported from 2.5.0 to 2.3.2. Regex callback for make_clickable().
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.3.2
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @access private
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @param array $matches Single Regex Match.
|
|
|
|
|
* @return string HTML A element with email address.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function _make_email_clickable_cb( $matches ) {
|
2007-12-20 22:14:22 -05:00
|
|
|
|
$email = $matches[2] . '@' . $matches[3];
|
|
|
|
|
return $matches[1] . "<a href=\"mailto:$email\">$email</a>";
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Convert plaintext URI to HTML links.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Converts URI, www and ftp, and email addresses. Finishes by fixing links
|
|
|
|
|
* within links.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2012-04-11 17:14:13 -04:00
|
|
|
|
* @param string $text Content to convert URIs.
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @return string Content with converted URIs.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2012-04-11 17:14:13 -04:00
|
|
|
|
function make_clickable( $text ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$r = '';
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$textarr = preg_split( '/(<[^<>]+>)/', $text, -1, PREG_SPLIT_DELIM_CAPTURE ); // Split out HTML tags.
|
|
|
|
|
$nested_code_pre = 0; // Keep track of how many levels link is nested inside <pre> or <code>.
|
2012-04-11 17:14:13 -04:00
|
|
|
|
foreach ( $textarr as $piece ) {
|
2013-11-08 17:38:10 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( preg_match( '|^<code[\s>]|i', $piece ) || preg_match( '|^<pre[\s>]|i', $piece ) || preg_match( '|^<script[\s>]|i', $piece ) || preg_match( '|^<style[\s>]|i', $piece ) ) {
|
2013-11-08 17:38:10 -05:00
|
|
|
|
$nested_code_pre++;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
} elseif ( $nested_code_pre && ( '</code>' === strtolower( $piece ) || '</pre>' === strtolower( $piece ) || '</script>' === strtolower( $piece ) || '</style>' === strtolower( $piece ) ) ) {
|
2013-11-08 17:38:10 -05:00
|
|
|
|
$nested_code_pre--;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2013-11-08 17:38:10 -05:00
|
|
|
|
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( $nested_code_pre || empty( $piece ) || ( '<' === $piece[0] && ! preg_match( '|^<\s*[\w]{1,20}+://|', $piece ) ) ) {
|
2012-04-11 17:14:13 -04:00
|
|
|
|
$r .= $piece;
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Long strings might contain expensive edge cases...
|
2012-04-11 17:14:13 -04:00
|
|
|
|
if ( 10000 < strlen( $piece ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// ...break it up.
|
|
|
|
|
foreach ( _split_str_by_whitespace( $piece, 2100 ) as $chunk ) { // 2100: Extra room for scheme and leading and trailing paretheses.
|
2012-04-11 17:14:13 -04:00
|
|
|
|
if ( 2101 < strlen( $chunk ) ) {
|
|
|
|
|
$r .= $chunk; // Too big, no whitespace: bail.
|
|
|
|
|
} else {
|
|
|
|
|
$r .= make_clickable( $chunk );
|
|
|
|
|
}
|
2012-02-10 08:42:15 -05:00
|
|
|
|
}
|
2012-04-11 17:14:13 -04:00
|
|
|
|
} else {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$ret = " $piece "; // Pad with whitespace to simplify the regexes.
|
2012-04-11 17:14:13 -04:00
|
|
|
|
|
|
|
|
|
$url_clickable = '~
|
2020-01-28 19:45:18 -05:00
|
|
|
|
([\\s(<.,;:!?]) # 1: Leading whitespace, or punctuation.
|
|
|
|
|
( # 2: URL.
|
|
|
|
|
[\\w]{1,20}+:// # Scheme and hier-part prefix.
|
|
|
|
|
(?=\S{1,2000}\s) # Limit to URLs less than about 2000 characters long.
|
|
|
|
|
[\\w\\x80-\\xff#%\\~/@\\[\\]*(+=&$-]*+ # Non-punctuation URL character.
|
|
|
|
|
(?: # Unroll the Loop: Only allow puctuation URL character if followed by a non-punctuation URL character.
|
|
|
|
|
[\'.,;:!?)] # Punctuation URL character.
|
|
|
|
|
[\\w\\x80-\\xff#%\\~/@\\[\\]*(+=&$-]++ # Non-punctuation URL character.
|
2012-04-11 17:14:13 -04:00
|
|
|
|
)*
|
|
|
|
|
)
|
2020-01-28 19:45:18 -05:00
|
|
|
|
(\)?) # 3: Trailing closing parenthesis (for parethesis balancing post processing).
|
2019-07-05 01:21:56 -04:00
|
|
|
|
~xS';
|
|
|
|
|
// The regex is a non-anchored pattern and does not have a single fixed starting character.
|
|
|
|
|
// Tell PCRE to spend more time optimizing since, when used on a page load, it will probably be used several times.
|
2012-04-11 17:14:13 -04:00
|
|
|
|
|
|
|
|
|
$ret = preg_replace_callback( $url_clickable, '_make_url_clickable_cb', $ret );
|
|
|
|
|
|
|
|
|
|
$ret = preg_replace_callback( '#([\s>])((www|ftp)\.[\w\\x80-\\xff\#$%&~/.\-;:=,?@\[\]+]+)#is', '_make_web_ftp_clickable_cb', $ret );
|
|
|
|
|
$ret = preg_replace_callback( '#([\s>])([.0-9a-z_+-]+)@(([0-9a-z-]+\.)+[0-9a-z]{2,})#i', '_make_email_clickable_cb', $ret );
|
|
|
|
|
|
|
|
|
|
$ret = substr( $ret, 1, -1 ); // Remove our whitespace padding.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$r .= $ret;
|
2012-02-10 08:42:15 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Cleanup of accidental links within links.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return preg_replace( '#(<a([ \r\n\t]+[^>]+?>|>))<a [^>]+?>([^>]+?)</a></a>#i', '$1$3</a>', $r );
|
2012-02-10 08:42:15 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Breaks a string into chunks by splitting at whitespace characters.
|
|
|
|
|
* The length of each returned chunk is as close to the specified length goal as possible,
|
|
|
|
|
* with the caveat that each chunk includes its trailing delimiter.
|
|
|
|
|
* Chunks longer than the goal are guaranteed to not have any inner whitespace.
|
|
|
|
|
*
|
|
|
|
|
* Joining the returned chunks with empty delimiters reconstructs the input string losslessly.
|
|
|
|
|
*
|
|
|
|
|
* Input string must have no null characters (or eventual transformations on output chunks must not care about null characters)
|
|
|
|
|
*
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* _split_str_by_whitespace( "1234 67890 1234 67890a cd 1234 890 123456789 1234567890a 45678 1 3 5 7 90 ", 10 ) ==
|
|
|
|
|
* array (
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* 0 => '1234 67890 ', // 11 characters: Perfect split.
|
|
|
|
|
* 1 => '1234 ', // 5 characters: '1234 67890a' was too long.
|
|
|
|
|
* 2 => '67890a cd ', // 10 characters: '67890a cd 1234' was too long.
|
|
|
|
|
* 3 => '1234 890 ', // 11 characters: Perfect split.
|
|
|
|
|
* 4 => '123456789 ', // 10 characters: '123456789 1234567890a' was too long.
|
|
|
|
|
* 5 => '1234567890a ', // 12 characters: Too long, but no inner whitespace on which to split.
|
|
|
|
|
* 6 => ' 45678 ', // 11 characters: Perfect split.
|
|
|
|
|
* 7 => '1 3 5 7 90 ', // 11 characters: End of $string.
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* );
|
2012-02-10 08:42:15 -05:00
|
|
|
|
*
|
2012-02-10 08:57:21 -05:00
|
|
|
|
* @since 3.4.0
|
|
|
|
|
* @access private
|
|
|
|
|
*
|
2012-07-09 01:03:53 -04:00
|
|
|
|
* @param string $string The string to split.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param int $goal The desired chunk length.
|
2012-02-10 08:42:15 -05:00
|
|
|
|
* @return array Numeric array of chunks.
|
|
|
|
|
*/
|
|
|
|
|
function _split_str_by_whitespace( $string, $goal ) {
|
|
|
|
|
$chunks = array();
|
|
|
|
|
|
|
|
|
|
$string_nullspace = strtr( $string, "\r\n\t\v\f ", "\000\000\000\000\000\000" );
|
|
|
|
|
|
|
|
|
|
while ( $goal < strlen( $string_nullspace ) ) {
|
|
|
|
|
$pos = strrpos( substr( $string_nullspace, 0, $goal + 1 ), "\000" );
|
|
|
|
|
|
|
|
|
|
if ( false === $pos ) {
|
|
|
|
|
$pos = strpos( $string_nullspace, "\000", $goal + 1 );
|
|
|
|
|
if ( false === $pos ) {
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$chunks[] = substr( $string, 0, $pos + 1 );
|
|
|
|
|
$string = substr( $string, $pos + 1 );
|
2012-02-10 08:42:15 -05:00
|
|
|
|
$string_nullspace = substr( $string_nullspace, $pos + 1 );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( $string ) {
|
|
|
|
|
$chunks[] = $string;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $chunks;
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2019-09-29 21:30:58 -04:00
|
|
|
|
* Callback to add a rel attribute to HTML A element.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-09-29 21:30:58 -04:00
|
|
|
|
* Will remove already existing string before adding to prevent invalidating (X)HTML.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-09-29 21:30:58 -04:00
|
|
|
|
* @since 5.3.0
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-09-29 21:30:58 -04:00
|
|
|
|
* @param array $matches Single match.
|
|
|
|
|
* @param string $rel The rel attribute to add.
|
|
|
|
|
* @return string HTML A element with the added rel attribute.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2019-09-29 21:30:58 -04:00
|
|
|
|
function wp_rel_callback( $matches, $rel ) {
|
2007-09-13 00:51:33 -04:00
|
|
|
|
$text = $matches[1];
|
2019-09-04 13:37:55 -04:00
|
|
|
|
$atts = wp_kses_hair( $matches[1], wp_allowed_protocols() );
|
2015-12-30 18:20:25 -05:00
|
|
|
|
|
2019-03-12 18:15:50 -04:00
|
|
|
|
if ( ! empty( $atts['href'] ) ) {
|
2019-09-04 13:37:55 -04:00
|
|
|
|
if ( in_array( strtolower( wp_parse_url( $atts['href']['value'], PHP_URL_SCHEME ) ), array( 'http', 'https' ), true ) ) {
|
|
|
|
|
if ( strtolower( wp_parse_url( $atts['href']['value'], PHP_URL_HOST ) ) === strtolower( wp_parse_url( home_url(), PHP_URL_HOST ) ) ) {
|
2019-03-12 18:15:50 -04:00
|
|
|
|
return "<a $text>";
|
|
|
|
|
}
|
|
|
|
|
}
|
2015-12-30 18:20:25 -05:00
|
|
|
|
}
|
|
|
|
|
|
2015-09-18 00:36:24 -04:00
|
|
|
|
if ( ! empty( $atts['rel'] ) ) {
|
2019-09-29 21:30:58 -04:00
|
|
|
|
$parts = array_map( 'trim', explode( ' ', $atts['rel']['value'] ) );
|
|
|
|
|
$rel_array = array_map( 'trim', explode( ' ', $rel ) );
|
|
|
|
|
$parts = array_unique( array_merge( $parts, $rel_array ) );
|
|
|
|
|
$rel = implode( ' ', $parts );
|
2015-09-18 00:36:24 -04:00
|
|
|
|
unset( $atts['rel'] );
|
|
|
|
|
|
|
|
|
|
$html = '';
|
|
|
|
|
foreach ( $atts as $name => $value ) {
|
2019-09-04 13:37:55 -04:00
|
|
|
|
if ( isset( $value['vless'] ) && 'y' === $value['vless'] ) {
|
|
|
|
|
$html .= $name . ' ';
|
|
|
|
|
} else {
|
|
|
|
|
$html .= "{$name}=\"" . esc_attr( $value['value'] ) . '" ';
|
|
|
|
|
}
|
2015-09-18 00:36:24 -04:00
|
|
|
|
}
|
|
|
|
|
$text = trim( $html );
|
|
|
|
|
}
|
2019-03-12 18:56:49 -04:00
|
|
|
|
return "<a $text rel=\"" . esc_attr( $rel ) . '">';
|
2007-09-13 00:51:33 -04:00
|
|
|
|
}
|
|
|
|
|
|
2019-09-29 21:30:58 -04:00
|
|
|
|
/**
|
|
|
|
|
* Adds `rel="nofollow"` string to all HTML A elements in content.
|
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text Content that may contain HTML A elements.
|
|
|
|
|
* @return string Converted content.
|
|
|
|
|
*/
|
|
|
|
|
function wp_rel_nofollow( $text ) {
|
2019-10-04 20:56:57 -04:00
|
|
|
|
// This is a pre-save filter, so text is already escaped.
|
2019-09-29 21:30:58 -04:00
|
|
|
|
$text = stripslashes( $text );
|
|
|
|
|
$text = preg_replace_callback(
|
|
|
|
|
'|<a (.+?)>|i',
|
2021-08-26 08:59:02 -04:00
|
|
|
|
static function( $matches ) {
|
2019-10-04 20:56:57 -04:00
|
|
|
|
return wp_rel_callback( $matches, 'nofollow' );
|
2019-09-29 21:30:58 -04:00
|
|
|
|
},
|
|
|
|
|
$text
|
|
|
|
|
);
|
|
|
|
|
return wp_slash( $text );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Callback to add `rel="nofollow"` string to HTML A element.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.3.0
|
|
|
|
|
* @deprecated 5.3.0 Use wp_rel_callback()
|
|
|
|
|
*
|
|
|
|
|
* @param array $matches Single match.
|
|
|
|
|
* @return string HTML A Element with `rel="nofollow"`.
|
|
|
|
|
*/
|
|
|
|
|
function wp_rel_nofollow_callback( $matches ) {
|
|
|
|
|
return wp_rel_callback( $matches, 'nofollow' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Adds `rel="nofollow ugc"` string to all HTML A elements in content.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.3.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text Content that may contain HTML A elements.
|
|
|
|
|
* @return string Converted content.
|
|
|
|
|
*/
|
|
|
|
|
function wp_rel_ugc( $text ) {
|
2019-10-04 20:56:57 -04:00
|
|
|
|
// This is a pre-save filter, so text is already escaped.
|
2019-09-29 21:30:58 -04:00
|
|
|
|
$text = stripslashes( $text );
|
|
|
|
|
$text = preg_replace_callback(
|
|
|
|
|
'|<a (.+?)>|i',
|
2021-08-26 08:59:02 -04:00
|
|
|
|
static function( $matches ) {
|
2019-10-04 20:56:57 -04:00
|
|
|
|
return wp_rel_callback( $matches, 'nofollow ugc' );
|
2019-09-29 21:30:58 -04:00
|
|
|
|
},
|
|
|
|
|
$text
|
|
|
|
|
);
|
|
|
|
|
return wp_slash( $text );
|
|
|
|
|
}
|
|
|
|
|
|
2018-03-02 09:42:31 -05:00
|
|
|
|
/**
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* Adds `rel="noopener"` to all HTML A elements that have a target.
|
2018-03-02 09:42:31 -05:00
|
|
|
|
*
|
2019-04-11 17:16:51 -04:00
|
|
|
|
* @since 5.1.0
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* @since 5.6.0 Removed 'noreferrer' relationship.
|
2019-04-11 17:16:51 -04:00
|
|
|
|
*
|
2018-03-02 09:42:31 -05:00
|
|
|
|
* @param string $text Content that may contain HTML A elements.
|
|
|
|
|
* @return string Converted content.
|
|
|
|
|
*/
|
|
|
|
|
function wp_targeted_link_rel( $text ) {
|
|
|
|
|
// Don't run (more expensive) regex if no links with targets.
|
2019-12-12 12:54:02 -05:00
|
|
|
|
if ( stripos( $text, 'target' ) === false || stripos( $text, '<a ' ) === false || is_serialized( $text ) ) {
|
|
|
|
|
return $text;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$script_and_style_regex = '/<(script|style).*?<\/\\1>/si';
|
|
|
|
|
|
|
|
|
|
preg_match_all( $script_and_style_regex, $text, $matches );
|
|
|
|
|
$extra_parts = $matches[0];
|
|
|
|
|
$html_parts = preg_split( $script_and_style_regex, $text );
|
|
|
|
|
|
|
|
|
|
foreach ( $html_parts as &$part ) {
|
|
|
|
|
$part = preg_replace_callback( '|<a\s([^>]*target\s*=[^>]*)>|i', 'wp_targeted_link_rel_callback', $part );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$text = '';
|
|
|
|
|
for ( $i = 0; $i < count( $html_parts ); $i++ ) {
|
|
|
|
|
$text .= $html_parts[ $i ];
|
|
|
|
|
if ( isset( $extra_parts[ $i ] ) ) {
|
|
|
|
|
$text .= $extra_parts[ $i ];
|
2019-05-25 08:05:52 -04:00
|
|
|
|
}
|
2018-03-02 09:42:31 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $text;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* Callback to add `rel="noopener"` string to HTML A element.
|
2018-03-02 09:42:31 -05:00
|
|
|
|
*
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* Will not duplicate an existing 'noopener' value to avoid invalidating the HTML.
|
2018-03-02 09:42:31 -05:00
|
|
|
|
*
|
2019-04-11 17:16:51 -04:00
|
|
|
|
* @since 5.1.0
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* @since 5.6.0 Removed 'noreferrer' relationship.
|
2019-04-11 17:16:51 -04:00
|
|
|
|
*
|
2020-10-19 19:39:04 -04:00
|
|
|
|
* @param array $matches Single match.
|
|
|
|
|
* @return string HTML A Element with `rel="noopener"` in addition to any existing values.
|
2018-03-02 09:42:31 -05:00
|
|
|
|
*/
|
|
|
|
|
function wp_targeted_link_rel_callback( $matches ) {
|
2019-12-12 12:54:02 -05:00
|
|
|
|
$link_html = $matches[1];
|
|
|
|
|
$original_link_html = $link_html;
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Consider the HTML escaped if there are no unescaped quotes.
|
2019-12-12 12:54:02 -05:00
|
|
|
|
$is_escaped = ! preg_match( '/(^|[^\\\\])[\'"]/', $link_html );
|
|
|
|
|
if ( $is_escaped ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Replace only the quotes so that they are parsable by wp_kses_hair(), leave the rest as is.
|
2019-12-12 12:54:02 -05:00
|
|
|
|
$link_html = preg_replace( '/\\\\([\'"])/', '$1', $link_html );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$atts = wp_kses_hair( $link_html, wp_allowed_protocols() );
|
2018-03-02 09:42:31 -05:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Filters the rel values that are added to links with `target` attribute.
|
|
|
|
|
*
|
2019-01-17 01:46:50 -05:00
|
|
|
|
* @since 5.1.0
|
2018-03-02 09:42:31 -05:00
|
|
|
|
*
|
2019-10-21 16:41:04 -04:00
|
|
|
|
* @param string $rel The rel values.
|
2018-03-02 09:42:31 -05:00
|
|
|
|
* @param string $link_html The matched content of the link tag including all HTML attributes.
|
|
|
|
|
*/
|
2020-10-19 19:39:04 -04:00
|
|
|
|
$rel = apply_filters( 'wp_targeted_link_rel', 'noopener', $link_html );
|
2018-03-02 09:42:31 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Return early if no rel values to be added or if no actual target attribute.
|
2019-12-12 12:54:02 -05:00
|
|
|
|
if ( ! $rel || ! isset( $atts['target'] ) ) {
|
|
|
|
|
return "<a $original_link_html>";
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $atts['rel'] ) ) {
|
|
|
|
|
$all_parts = preg_split( '/\s/', "{$atts['rel']['value']} $rel", -1, PREG_SPLIT_NO_EMPTY );
|
|
|
|
|
$rel = implode( ' ', array_unique( $all_parts ) );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$atts['rel']['whole'] = 'rel="' . esc_attr( $rel ) . '"';
|
2020-10-18 13:27:06 -04:00
|
|
|
|
$link_html = implode( ' ', array_column( $atts, 'whole' ) );
|
2019-12-12 12:54:02 -05:00
|
|
|
|
|
|
|
|
|
if ( $is_escaped ) {
|
|
|
|
|
$link_html = preg_replace( '/[\'"]/', '\\\\$0', $link_html );
|
2018-03-02 09:42:31 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return "<a $link_html>";
|
|
|
|
|
}
|
|
|
|
|
|
2019-01-29 16:29:50 -05:00
|
|
|
|
/**
|
|
|
|
|
* Adds all filters modifying the rel attribute of targeted links.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.1.0
|
|
|
|
|
*/
|
|
|
|
|
function wp_init_targeted_link_rel_filters() {
|
|
|
|
|
$filters = array(
|
|
|
|
|
'title_save_pre',
|
|
|
|
|
'content_save_pre',
|
|
|
|
|
'excerpt_save_pre',
|
|
|
|
|
'content_filtered_save_pre',
|
|
|
|
|
'pre_comment_content',
|
|
|
|
|
'pre_term_description',
|
|
|
|
|
'pre_link_description',
|
|
|
|
|
'pre_link_notes',
|
|
|
|
|
'pre_user_description',
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
foreach ( $filters as $filter ) {
|
|
|
|
|
add_filter( $filter, 'wp_targeted_link_rel' );
|
2021-08-05 09:15:55 -04:00
|
|
|
|
}
|
2019-01-29 16:29:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Removes all filters modifying the rel attribute of targeted links.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.1.0
|
|
|
|
|
*/
|
|
|
|
|
function wp_remove_targeted_link_rel_filters() {
|
|
|
|
|
$filters = array(
|
|
|
|
|
'title_save_pre',
|
|
|
|
|
'content_save_pre',
|
|
|
|
|
'excerpt_save_pre',
|
|
|
|
|
'content_filtered_save_pre',
|
|
|
|
|
'pre_comment_content',
|
|
|
|
|
'pre_term_description',
|
|
|
|
|
'pre_link_description',
|
|
|
|
|
'pre_link_notes',
|
|
|
|
|
'pre_user_description',
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
foreach ( $filters as $filter ) {
|
|
|
|
|
remove_filter( $filter, 'wp_targeted_link_rel' );
|
2021-08-05 09:15:55 -04:00
|
|
|
|
}
|
2019-01-29 16:29:50 -05:00
|
|
|
|
}
|
|
|
|
|
|
2009-01-06 13:20:47 -05:00
|
|
|
|
/**
|
|
|
|
|
* Convert one smiley code to the icon graphic file equivalent.
|
|
|
|
|
*
|
2016-05-22 13:39:28 -04:00
|
|
|
|
* Callback handler for convert_smilies().
|
|
|
|
|
*
|
2009-01-06 13:20:47 -05:00
|
|
|
|
* Looks up one smiley code in the $wpsmiliestrans global array and returns an
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* `<img>` string for that smiley.
|
2009-01-06 13:20:47 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global array $wpsmiliestrans
|
|
|
|
|
*
|
2013-09-29 06:08:10 -04:00
|
|
|
|
* @param array $matches Single match. Smiley code to convert to image.
|
2009-01-06 13:20:47 -05:00
|
|
|
|
* @return string Image string for smiley.
|
|
|
|
|
*/
|
2013-09-29 06:08:10 -04:00
|
|
|
|
function translate_smiley( $matches ) {
|
2009-01-06 13:20:47 -05:00
|
|
|
|
global $wpsmiliestrans;
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( count( $matches ) == 0 ) {
|
2009-01-06 13:20:47 -05:00
|
|
|
|
return '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2009-01-06 13:20:47 -05:00
|
|
|
|
|
2013-09-29 06:08:10 -04:00
|
|
|
|
$smiley = trim( reset( $matches ) );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$img = $wpsmiliestrans[ $smiley ];
|
2009-09-14 10:03:32 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$matches = array();
|
|
|
|
|
$ext = preg_match( '/\.([^.]+)$/', $img, $matches ) ? strtolower( $matches[1] ) : false;
|
Images: enable WebP support.
Add support for uploading, editing and saving WebP images when supported by the server.
Add 'image/webp' to supported mime types. Correctly identify WebP images and sizes even when PHP doesn't support WebP. Resize uploaded WebP files (when supported) and use for front end markup.
Props markoheijne, blobfolio, Clorith, joemcgill, atjn, desrosj, spacedmonkey, marylauc, mikeschroder, hellofromtonya, flixos90.
Fixes #35725.
Built from https://develop.svn.wordpress.org/trunk@50810
git-svn-id: http://core.svn.wordpress.org/trunk@50419 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2021-05-04 10:44:58 -04:00
|
|
|
|
$image_exts = array( 'jpg', 'jpeg', 'jpe', 'gif', 'png', 'webp' );
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
|
|
|
|
// Don't convert smilies that aren't images - they're probably emoji.
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( ! in_array( $ext, $image_exts, true ) ) {
|
2015-03-11 18:49:28 -04:00
|
|
|
|
return $img;
|
|
|
|
|
}
|
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the Smiley image URL before it's used in the image element.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $smiley_url URL for the smiley image.
|
|
|
|
|
* @param string $img Filename for the smiley image.
|
|
|
|
|
* @param string $site_url Site URL, as returned by site_url().
|
2013-12-11 14:49:11 -05:00
|
|
|
|
*/
|
2013-09-29 06:08:10 -04:00
|
|
|
|
$src_url = apply_filters( 'smilies_src', includes_url( "images/smilies/$img" ), $img, site_url() );
|
2009-01-06 13:20:47 -05:00
|
|
|
|
|
2015-03-26 22:12:28 -04:00
|
|
|
|
return sprintf( '<img src="%s" alt="%s" class="wp-smiley" style="height: 1em; max-height: 1em;" />', esc_url( $src_url ), esc_attr( $smiley ) );
|
2009-01-06 13:20:47 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Convert text equivalent of smilies to images.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2009-01-06 13:20:47 -05:00
|
|
|
|
* Will only convert smilies if the option 'use_smilies' is true and the global
|
|
|
|
|
* used in the function isn't empty.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
|
|
|
|
* @global string|array $wp_smiliessearch
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @param string $text Content to convert smilies from text.
|
|
|
|
|
* @return string Converted content with text smilies replaced with images.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-11-14 21:46:10 -05:00
|
|
|
|
function convert_smilies( $text ) {
|
2009-01-06 13:20:47 -05:00
|
|
|
|
global $wp_smiliessearch;
|
2008-08-17 07:29:43 -04:00
|
|
|
|
$output = '';
|
2013-11-14 21:46:10 -05:00
|
|
|
|
if ( get_option( 'use_smilies' ) && ! empty( $wp_smiliessearch ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// HTML loop taken from texturize function, could possible be consolidated.
|
|
|
|
|
$textarr = preg_split( '/(<.*>)/U', $text, -1, PREG_SPLIT_DELIM_CAPTURE ); // Capture the tags as well as in between.
|
|
|
|
|
$stop = count( $textarr ); // Loop stuff.
|
2013-11-14 21:46:10 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Ignore proessing of specific tags.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tags_to_ignore = 'code|pre|style|script|textarea';
|
2013-11-14 21:46:10 -05:00
|
|
|
|
$ignore_block_element = '';
|
|
|
|
|
|
|
|
|
|
for ( $i = 0; $i < $stop; $i++ ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$content = $textarr[ $i ];
|
2013-11-14 21:46:10 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If we're in an ignore block, wait until we find its closing tag.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $ignore_block_element && preg_match( '/^<(' . $tags_to_ignore . ')[^>]*>/', $content, $matches ) ) {
|
2013-11-14 21:46:10 -05:00
|
|
|
|
$ignore_block_element = $matches[1];
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If it's not a tag and not in ignore block.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $ignore_block_element && strlen( $content ) > 0 && '<' !== $content[0] ) {
|
2013-11-14 21:46:10 -05:00
|
|
|
|
$content = preg_replace_callback( $wp_smiliessearch, 'translate_smiley', $content );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Did we exit ignore block?
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' !== $ignore_block_element && '</' . $ignore_block_element . '>' === $content ) {
|
2013-11-14 21:46:10 -05:00
|
|
|
|
$ignore_block_element = '';
|
2007-09-03 19:32:58 -04:00
|
|
|
|
}
|
2013-11-14 21:46:10 -05:00
|
|
|
|
|
2007-09-03 19:32:58 -04:00
|
|
|
|
$output .= $content;
|
2006-10-12 06:14:14 -04:00
|
|
|
|
}
|
2004-02-09 01:57:02 -05:00
|
|
|
|
} else {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Return default text.
|
2004-02-09 01:57:02 -05:00
|
|
|
|
$output = $text;
|
|
|
|
|
}
|
|
|
|
|
return $output;
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2009-03-11 11:26:34 -04:00
|
|
|
|
* Verifies that an email is valid.
|
|
|
|
|
*
|
|
|
|
|
* Does not grok i18n domains. Not RFC compliant.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 0.71
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $email Email address to verify.
|
|
|
|
|
* @param bool $deprecated Deprecated.
|
2019-07-30 21:26:54 -04:00
|
|
|
|
* @return string|false Valid email address on success, false on failure.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2010-05-03 14:54:37 -04:00
|
|
|
|
function is_email( $email, $deprecated = false ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! empty( $deprecated ) ) {
|
2016-07-06 08:40:29 -04:00
|
|
|
|
_deprecated_argument( __FUNCTION__, '3.0.0' );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2010-05-03 14:54:37 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for the minimum length the email can be.
|
2017-05-14 00:20:43 -04:00
|
|
|
|
if ( strlen( $email ) < 6 ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters whether an email address is valid.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* This filter is evaluated under several different contexts, such as 'email_too_short',
|
|
|
|
|
* 'email_no_at', 'local_invalid_chars', 'domain_period_sequence', 'domain_period_limits',
|
|
|
|
|
* 'domain_no_periods', 'sub_hyphen_limits', 'sub_invalid_chars', or no specific context.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-07-30 21:26:54 -04:00
|
|
|
|
* @param string|false $is_email The email address if successfully passed the is_email() checks, false otherwise.
|
|
|
|
|
* @param string $email The email address being checked.
|
|
|
|
|
* @param string $context Context under which the email was tested.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'email_too_short' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for an @ character after the first position.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( strpos( $email, '@', 1 ) === false ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'email_no_at' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Split out the local and domain parts.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
list( $local, $domain ) = explode( '@', $email, 2 );
|
|
|
|
|
|
|
|
|
|
// LOCAL PART
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for invalid characters.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '/^[a-zA-Z0-9!#$%&\'*+\/=?^_`{|}~\.-]+$/', $local ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'local_invalid_chars' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// DOMAIN PART
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for sequences of periods.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( preg_match( '/\.{2,}/', $domain ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'domain_period_sequence' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for leading and trailing periods and whitespace.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( trim( $domain, " \t\n\r\0\x0B." ) !== $domain ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'domain_period_limits' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Split the domain into subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$subs = explode( '.', $domain );
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Assume the domain will have at least two subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( 2 > count( $subs ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'domain_no_periods' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Loop through each sub.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
foreach ( $subs as $sub ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for leading and trailing hyphens and whitespace.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( trim( $sub, " \t\n\r\0\x0B-" ) !== $sub ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'sub_hyphen_limits' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for invalid characters.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '/^[a-z0-9-]+$/i', $sub ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', false, $email, 'sub_invalid_chars' );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
}
|
2009-03-11 11:26:34 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Congratulations, your email made it!
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'is_email', $email, $email, null );
|
2004-02-09 01:57:02 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* Convert to ASCII from email subjects.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
|
|
|
|
*
|
2008-08-31 16:58:19 -04:00
|
|
|
|
* @param string $string Subject line
|
|
|
|
|
* @return string Converted string to ASCII
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function wp_iso_descrambler( $string ) {
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/* this may only work with iso-8859-1, I'm afraid */
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '#\=\?(.+)\?Q\?(.+)\?\=#i', $string, $matches ) ) {
|
2008-08-17 07:29:43 -04:00
|
|
|
|
return $string;
|
|
|
|
|
} else {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$subject = str_replace( '_', ' ', $matches[2] );
|
2015-05-25 02:25:25 -04:00
|
|
|
|
return preg_replace_callback( '#\=([0-9a-f]{2})#i', '_wp_iso_convert', $subject );
|
2008-08-17 07:29:43 -04:00
|
|
|
|
}
|
2004-02-21 19:31:25 -05:00
|
|
|
|
}
|
|
|
|
|
|
2010-10-28 03:38:00 -04:00
|
|
|
|
/**
|
2012-07-09 01:03:53 -04:00
|
|
|
|
* Helper function to convert hex encoded chars to ASCII
|
2010-11-17 13:47:34 -05:00
|
|
|
|
*
|
2010-10-28 03:38:00 -04:00
|
|
|
|
* @since 3.1.0
|
|
|
|
|
* @access private
|
2013-02-01 13:07:08 -05:00
|
|
|
|
*
|
2012-07-09 01:03:53 -04:00
|
|
|
|
* @param array $match The preg_replace_callback matches array
|
2014-11-30 20:34:24 -05:00
|
|
|
|
* @return string Converted chars
|
2010-10-28 03:38:00 -04:00
|
|
|
|
*/
|
2010-11-17 13:47:34 -05:00
|
|
|
|
function _wp_iso_convert( $match ) {
|
|
|
|
|
return chr( hexdec( strtolower( $match[1] ) ) );
|
|
|
|
|
}
|
2010-10-28 03:38:00 -04:00
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* Given a date in the timezone of the site, returns that date in UTC.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-08-23 07:03:56 -04:00
|
|
|
|
* Requires and returns a date in the Y-m-d H:i:s format.
|
|
|
|
|
* Return format can be overridden using the $format parameter.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
|
|
|
|
*
|
2019-12-13 16:45:02 -05:00
|
|
|
|
* @param string $string The date to be converted, in the timezone of the site.
|
2019-08-23 07:03:56 -04:00
|
|
|
|
* @param string $format The format string for the returned date. Default 'Y-m-d H:i:s'.
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* @return string Formatted version of the date, in UTC.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-03-05 11:14:14 -05:00
|
|
|
|
function get_gmt_from_date( $string, $format = 'Y-m-d H:i:s' ) {
|
2019-08-23 07:03:56 -04:00
|
|
|
|
$datetime = date_create( $string, wp_timezone() );
|
|
|
|
|
|
|
|
|
|
if ( false === $datetime ) {
|
|
|
|
|
return gmdate( $format, 0 );
|
2011-05-18 14:56:42 -04:00
|
|
|
|
}
|
2019-08-23 07:03:56 -04:00
|
|
|
|
|
|
|
|
|
return $datetime->setTimezone( new DateTimeZone( 'UTC' ) )->format( $format );
|
2004-02-22 22:04:55 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* Given a date in UTC or GMT timezone, returns that date in the timezone of the site.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2021-10-29 19:13:05 -04:00
|
|
|
|
* Requires a date in the Y-m-d H:i:s format.
|
|
|
|
|
* Default return format of 'Y-m-d H:i:s' can be overridden using the `$format` parameter.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
|
|
|
|
*
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* @param string $string The date to be converted, in UTC or GMT timezone.
|
2019-08-23 07:03:56 -04:00
|
|
|
|
* @param string $format The format string for the returned date. Default 'Y-m-d H:i:s'.
|
2019-12-13 16:45:02 -05:00
|
|
|
|
* @return string Formatted version of the date, in the site's timezone.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2013-03-05 11:14:14 -05:00
|
|
|
|
function get_date_from_gmt( $string, $format = 'Y-m-d H:i:s' ) {
|
2019-08-23 07:03:56 -04:00
|
|
|
|
$datetime = date_create( $string, new DateTimeZone( 'UTC' ) );
|
|
|
|
|
|
|
|
|
|
if ( false === $datetime ) {
|
|
|
|
|
return gmdate( $format, 0 );
|
2013-03-05 11:14:14 -05:00
|
|
|
|
}
|
2019-08-23 07:03:56 -04:00
|
|
|
|
|
|
|
|
|
return $datetime->setTimezone( wp_timezone() )->format( $format );
|
2004-02-22 23:37:11 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* Given an ISO 8601 timezone, returns its UTC offset in seconds.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $timezone Either 'Z' for 0 offset or '±hhmm'.
|
2008-12-09 13:03:31 -05:00
|
|
|
|
* @return int|float The offset in seconds.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function iso8601_timezone_to_offset( $timezone ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// $timezone is either 'Z' or '[+|-]hhmm'.
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( 'Z' === $timezone ) {
|
2008-08-17 07:29:43 -04:00
|
|
|
|
$offset = 0;
|
|
|
|
|
} else {
|
2020-05-16 14:42:12 -04:00
|
|
|
|
$sign = ( '+' === substr( $timezone, 0, 1 ) ) ? 1 : -1;
|
2020-10-08 17:15:13 -04:00
|
|
|
|
$hours = (int) substr( $timezone, 1, 2 );
|
|
|
|
|
$minutes = (int) substr( $timezone, 3, 4 ) / 60;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$offset = $sign * HOUR_IN_SECONDS * ( $hours + $minutes );
|
2008-08-17 07:29:43 -04:00
|
|
|
|
}
|
|
|
|
|
return $offset;
|
2004-05-31 13:02:09 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2020-03-16 14:40:07 -04:00
|
|
|
|
* Given an ISO 8601 (Ymd\TH:i:sO) date, returns a MySQL DateTime (Y-m-d H:i:s) format used by post_date[_gmt].
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
|
|
|
|
*
|
2016-06-10 00:50:33 -04:00
|
|
|
|
* @param string $date_string Date and time in ISO 8601 format {@link https://en.wikipedia.org/wiki/ISO_8601}.
|
2019-08-23 07:03:56 -04:00
|
|
|
|
* @param string $timezone Optional. If set to 'gmt' returns the result in UTC. Default 'user'.
|
2021-01-03 17:04:04 -05:00
|
|
|
|
* @return string|false The date and time in MySQL DateTime format - Y-m-d H:i:s, or false on failure.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function iso8601_to_datetime( $date_string, $timezone = 'user' ) {
|
2019-08-23 07:03:56 -04:00
|
|
|
|
$timezone = strtolower( $timezone );
|
|
|
|
|
$wp_timezone = wp_timezone();
|
|
|
|
|
$datetime = date_create( $date_string, $wp_timezone ); // Timezone is ignored if input has one.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
|
2019-08-23 07:03:56 -04:00
|
|
|
|
if ( false === $datetime ) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
2008-08-17 07:29:43 -04:00
|
|
|
|
|
2019-08-23 07:03:56 -04:00
|
|
|
|
if ( 'gmt' === $timezone ) {
|
|
|
|
|
return $datetime->setTimezone( new DateTimeZone( 'UTC' ) )->format( 'Y-m-d H:i:s' );
|
|
|
|
|
}
|
2008-08-17 07:29:43 -04:00
|
|
|
|
|
2019-08-23 07:03:56 -04:00
|
|
|
|
if ( 'user' === $timezone ) {
|
|
|
|
|
return $datetime->setTimezone( $wp_timezone )->format( 'Y-m-d H:i:s' );
|
2008-08-17 07:29:43 -04:00
|
|
|
|
}
|
2019-08-23 07:03:56 -04:00
|
|
|
|
|
|
|
|
|
return false;
|
2004-05-31 13:02:09 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Strips out all characters that are not allowable in an email.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $email Email address to filter.
|
|
|
|
|
* @return string Filtered email address.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2009-03-11 11:26:34 -04:00
|
|
|
|
function sanitize_email( $email ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for the minimum length the email can be.
|
2017-05-14 00:20:43 -04:00
|
|
|
|
if ( strlen( $email ) < 6 ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a sanitized email address.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* This filter is evaluated under several contexts, including 'email_too_short',
|
|
|
|
|
* 'email_no_at', 'local_invalid_chars', 'domain_period_sequence', 'domain_period_limits',
|
|
|
|
|
* 'domain_no_periods', 'domain_no_valid_subs', or no context.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-01-16 01:16:49 -05:00
|
|
|
|
* @param string $sanitized_email The sanitized email address.
|
|
|
|
|
* @param string $email The email address, as provided to sanitize_email().
|
|
|
|
|
* @param string|null $message A message to pass to the user. null if email is sanitized.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'email_too_short' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for an @ character after the first position.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( strpos( $email, '@', 1 ) === false ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'email_no_at' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Split out the local and domain parts.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
list( $local, $domain ) = explode( '@', $email, 2 );
|
|
|
|
|
|
|
|
|
|
// LOCAL PART
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for invalid characters.
|
2009-03-13 21:35:47 -04:00
|
|
|
|
$local = preg_replace( '/[^a-zA-Z0-9!#$%&\'*+\/=?^_`{|}~\.-]/', '', $local );
|
|
|
|
|
if ( '' === $local ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'local_invalid_chars' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// DOMAIN PART
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for sequences of periods.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$domain = preg_replace( '/\.{2,}/', '', $domain );
|
|
|
|
|
if ( '' === $domain ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'domain_period_sequence' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for leading and trailing periods and whitespace.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$domain = trim( $domain, " \t\n\r\0\x0B." );
|
|
|
|
|
if ( '' === $domain ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'domain_period_limits' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Split the domain into subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$subs = explode( '.', $domain );
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Assume the domain will have at least two subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( 2 > count( $subs ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'domain_no_periods' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Create an array that will contain valid subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$new_subs = array();
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Loop through each sub.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
foreach ( $subs as $sub ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for leading and trailing hyphens.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
$sub = trim( $sub, " \t\n\r\0\x0B-" );
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Test for invalid characters.
|
2010-11-05 11:29:50 -04:00
|
|
|
|
$sub = preg_replace( '/[^a-z0-9-]+/i', '', $sub );
|
2009-03-11 11:26:34 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If there's anything left, add it to the valid subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( '' !== $sub ) {
|
|
|
|
|
$new_subs[] = $sub;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// If there aren't 2 or more valid subs.
|
2009-03-11 11:26:34 -04:00
|
|
|
|
if ( 2 > count( $new_subs ) ) {
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2009-03-11 11:26:34 -04:00
|
|
|
|
return apply_filters( 'sanitize_email', '', $email, 'domain_no_valid_subs' );
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Join valid subs into the new domain.
|
2020-10-18 13:27:06 -04:00
|
|
|
|
$domain = implode( '.', $new_subs );
|
2009-03-11 11:26:34 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Put the email back together.
|
2019-01-16 01:16:49 -05:00
|
|
|
|
$sanitized_email = $local . '@' . $domain;
|
2009-03-11 11:26:34 -04:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Congratulations, your email made it!
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2019-01-16 01:16:49 -05:00
|
|
|
|
return apply_filters( 'sanitize_email', $sanitized_email, $email, null );
|
2004-12-15 21:57:05 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Determines the difference between two timestamps.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* The difference is returned in a human readable format such as "1 hour",
|
|
|
|
|
* "5 mins", "2 days".
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.0
|
2019-06-28 02:44:57 -04:00
|
|
|
|
* @since 5.3.0 Added support for showing a difference in seconds.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param int $from Unix timestamp from which the difference begins.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param int $to Optional. Unix timestamp to end the time difference. Default becomes time() if not set.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string Human readable time difference.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2019-07-01 21:45:58 -04:00
|
|
|
|
function human_time_diff( $from, $to = 0 ) {
|
2014-06-04 20:39:14 -04:00
|
|
|
|
if ( empty( $to ) ) {
|
2004-12-18 19:10:10 -05:00
|
|
|
|
$to = time();
|
2014-06-04 20:39:14 -04:00
|
|
|
|
}
|
2013-07-08 09:00:34 -04:00
|
|
|
|
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$diff = (int) abs( $to - $from );
|
2013-07-08 09:00:34 -04:00
|
|
|
|
|
2019-06-28 02:44:57 -04:00
|
|
|
|
if ( $diff < MINUTE_IN_SECONDS ) {
|
|
|
|
|
$secs = $diff;
|
|
|
|
|
if ( $secs <= 1 ) {
|
|
|
|
|
$secs = 1;
|
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in seconds. %s: Number of seconds. */
|
2019-06-28 02:44:57 -04:00
|
|
|
|
$since = sprintf( _n( '%s second', '%s seconds', $secs ), $secs );
|
|
|
|
|
} elseif ( $diff < HOUR_IN_SECONDS && $diff >= MINUTE_IN_SECONDS ) {
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$mins = round( $diff / MINUTE_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $mins <= 1 ) {
|
2006-12-21 18:06:18 -05:00
|
|
|
|
$mins = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in minutes (min=minute). %s: Number of minutes. */
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$since = sprintf( _n( '%s min', '%s mins', $mins ), $mins );
|
2013-07-08 09:00:34 -04:00
|
|
|
|
} elseif ( $diff < DAY_IN_SECONDS && $diff >= HOUR_IN_SECONDS ) {
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$hours = round( $diff / HOUR_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $hours <= 1 ) {
|
2007-12-06 14:49:33 -05:00
|
|
|
|
$hours = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in hours. %s: Number of hours. */
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$since = sprintf( _n( '%s hour', '%s hours', $hours ), $hours );
|
2013-07-08 09:00:34 -04:00
|
|
|
|
} elseif ( $diff < WEEK_IN_SECONDS && $diff >= DAY_IN_SECONDS ) {
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$days = round( $diff / DAY_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $days <= 1 ) {
|
2006-12-21 18:06:18 -05:00
|
|
|
|
$days = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in days. %s: Number of days. */
|
2012-09-25 01:26:19 -04:00
|
|
|
|
$since = sprintf( _n( '%s day', '%s days', $days ), $days );
|
2015-11-06 11:34:26 -05:00
|
|
|
|
} elseif ( $diff < MONTH_IN_SECONDS && $diff >= WEEK_IN_SECONDS ) {
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$weeks = round( $diff / WEEK_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $weeks <= 1 ) {
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$weeks = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in weeks. %s: Number of weeks. */
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$since = sprintf( _n( '%s week', '%s weeks', $weeks ), $weeks );
|
2015-11-06 11:34:26 -05:00
|
|
|
|
} elseif ( $diff < YEAR_IN_SECONDS && $diff >= MONTH_IN_SECONDS ) {
|
|
|
|
|
$months = round( $diff / MONTH_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $months <= 1 ) {
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$months = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in months. %s: Number of months. */
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$since = sprintf( _n( '%s month', '%s months', $months ), $months );
|
|
|
|
|
} elseif ( $diff >= YEAR_IN_SECONDS ) {
|
|
|
|
|
$years = round( $diff / YEAR_IN_SECONDS );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $years <= 1 ) {
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$years = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Time difference between two dates, in years. %s: Number of years. */
|
2013-07-08 09:00:34 -04:00
|
|
|
|
$since = sprintf( _n( '%s year', '%s years', $years ), $years );
|
2004-12-18 19:10:10 -05:00
|
|
|
|
}
|
2013-07-08 09:00:34 -04:00
|
|
|
|
|
2014-06-04 20:39:14 -04:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the human readable difference between two timestamps.
|
2014-06-04 20:39:14 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.0.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $since The difference in human readable text.
|
|
|
|
|
* @param int $diff The difference in seconds.
|
|
|
|
|
* @param int $from Unix timestamp from which the difference begins.
|
|
|
|
|
* @param int $to Unix timestamp to end the time difference.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'human_time_diff', $since, $diff, $from, $to );
|
2004-12-18 19:10:10 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Generates an excerpt from the content, if needed.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-06-08 14:42:52 -04:00
|
|
|
|
* Returns a maximum of 55 words with an ellipsis appended if necessary.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* The 55 word limit can be modified by plugins/themes using the {@see 'excerpt_length'} filter
|
|
|
|
|
* The ' […]' string can be modified by plugins/themes using the {@see 'excerpt_more'} filter
|
2009-09-09 12:34:44 -04:00
|
|
|
|
*
|
2008-08-17 07:29:43 -04:00
|
|
|
|
* @since 1.5.0
|
2019-03-20 11:49:49 -04:00
|
|
|
|
* @since 5.2.0 Added the `$post` parameter.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2019-03-20 11:49:49 -04:00
|
|
|
|
* @param string $text Optional. The excerpt. If set to empty, an excerpt is generated.
|
2020-06-26 05:30:11 -04:00
|
|
|
|
* @param WP_Post|object|int $post Optional. WP_Post instance or Post ID/object. Default null.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The excerpt.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2019-03-20 11:49:49 -04:00
|
|
|
|
function wp_trim_excerpt( $text = '', $post = null ) {
|
2009-04-17 02:59:33 -04:00
|
|
|
|
$raw_excerpt = $text;
|
2020-05-16 14:42:12 -04:00
|
|
|
|
|
2020-08-18 11:10:04 -04:00
|
|
|
|
if ( '' === trim( $text ) ) {
|
2019-03-20 11:49:49 -04:00
|
|
|
|
$post = get_post( $post );
|
|
|
|
|
$text = get_the_content( '', false, $post );
|
2008-08-09 01:36:14 -04:00
|
|
|
|
|
|
|
|
|
$text = strip_shortcodes( $text );
|
2018-12-16 23:52:00 -05:00
|
|
|
|
$text = excerpt_remove_blocks( $text );
|
2008-08-09 01:36:14 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/** This filter is documented in wp-includes/post-template.php */
|
|
|
|
|
$text = apply_filters( 'the_content', $text );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text = str_replace( ']]>', ']]>', $text );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
|
2019-06-08 14:42:52 -04:00
|
|
|
|
/* translators: Maximum number of words used in a post excerpt. */
|
2020-10-08 17:15:13 -04:00
|
|
|
|
$excerpt_length = (int) _x( '55', 'excerpt_length' );
|
2019-06-08 14:42:52 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2019-06-08 14:42:52 -04:00
|
|
|
|
* Filters the maximum number of words in a post excerpt.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.7.0
|
|
|
|
|
*
|
2019-06-08 14:42:52 -04:00
|
|
|
|
* @param int $number The maximum number of words. Default 55.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2019-08-14 13:18:55 -04:00
|
|
|
|
$excerpt_length = (int) apply_filters( 'excerpt_length', $excerpt_length );
|
2019-06-08 14:42:52 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the string in the "more" link displayed after a trimmed excerpt.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $more_string The string shown within the more link.
|
|
|
|
|
*/
|
|
|
|
|
$excerpt_more = apply_filters( 'excerpt_more', ' ' . '[…]' );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text = wp_trim_words( $text, $excerpt_length, $excerpt_more );
|
2005-03-13 20:02:04 -05:00
|
|
|
|
}
|
2019-06-08 14:42:52 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the trimmed excerpt string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text The trimmed text.
|
|
|
|
|
* @param string $raw_excerpt The text prior to trimming.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'wp_trim_excerpt', $text, $raw_excerpt );
|
2005-02-14 19:21:21 -05:00
|
|
|
|
}
|
|
|
|
|
|
2011-09-20 13:14:23 -04:00
|
|
|
|
/**
|
|
|
|
|
* Trims text to a certain number of words.
|
|
|
|
|
*
|
2012-05-23 17:04:35 -04:00
|
|
|
|
* This function is localized. For languages that count 'words' by the individual
|
|
|
|
|
* character (such as East Asian languages), the $num_words argument will apply
|
|
|
|
|
* to the number of individual characters.
|
|
|
|
|
*
|
2011-09-20 13:14:23 -04:00
|
|
|
|
* @since 3.3.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $text Text to trim.
|
|
|
|
|
* @param int $num_words Number of words. Default 55.
|
|
|
|
|
* @param string $more Optional. What to append if $text needs to be trimmed. Default '…'.
|
2011-09-20 13:14:23 -04:00
|
|
|
|
* @return string Trimmed text.
|
|
|
|
|
*/
|
|
|
|
|
function wp_trim_words( $text, $num_words = 55, $more = null ) {
|
2015-07-27 07:19:26 -04:00
|
|
|
|
if ( null === $more ) {
|
2011-09-20 13:14:23 -04:00
|
|
|
|
$more = __( '…' );
|
2015-07-27 07:19:26 -04:00
|
|
|
|
}
|
|
|
|
|
|
2011-09-20 13:14:23 -04:00
|
|
|
|
$original_text = $text;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text = wp_strip_all_tags( $text );
|
2019-08-14 13:18:55 -04:00
|
|
|
|
$num_words = (int) $num_words;
|
2015-07-27 07:19:26 -04:00
|
|
|
|
|
2015-07-30 13:08:24 -04:00
|
|
|
|
/*
|
|
|
|
|
* translators: If your word count is based on single characters (e.g. East Asian characters),
|
|
|
|
|
* enter 'characters_excluding_spaces' or 'characters_including_spaces'. Otherwise, enter 'words'.
|
|
|
|
|
* Do not translate into your own language.
|
|
|
|
|
*/
|
2015-07-27 07:19:26 -04:00
|
|
|
|
if ( strpos( _x( 'words', 'Word count type. Do not translate!' ), 'characters' ) === 0 && preg_match( '/^utf\-?8$/i', get_option( 'blog_charset' ) ) ) {
|
2012-05-23 17:04:35 -04:00
|
|
|
|
$text = trim( preg_replace( "/[\n\r\t ]+/", ' ', $text ), ' ' );
|
|
|
|
|
preg_match_all( '/./u', $text, $words_array );
|
|
|
|
|
$words_array = array_slice( $words_array[0], 0, $num_words + 1 );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$sep = '';
|
2012-05-23 17:04:35 -04:00
|
|
|
|
} else {
|
|
|
|
|
$words_array = preg_split( "/[\n\r\t ]+/", $text, $num_words + 1, PREG_SPLIT_NO_EMPTY );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$sep = ' ';
|
2012-05-23 17:04:35 -04:00
|
|
|
|
}
|
2015-07-27 07:19:26 -04:00
|
|
|
|
|
2011-09-20 13:14:23 -04:00
|
|
|
|
if ( count( $words_array ) > $num_words ) {
|
|
|
|
|
array_pop( $words_array );
|
2012-05-23 17:04:35 -04:00
|
|
|
|
$text = implode( $sep, $words_array );
|
2011-09-20 13:14:23 -04:00
|
|
|
|
$text = $text . $more;
|
|
|
|
|
} else {
|
2012-05-23 17:04:35 -04:00
|
|
|
|
$text = implode( $sep, $words_array );
|
2011-09-20 13:14:23 -04:00
|
|
|
|
}
|
2015-07-27 07:19:26 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the text content after words have been trimmed.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 3.3.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text The trimmed text.
|
2017-03-23 20:58:41 -04:00
|
|
|
|
* @param int $num_words The number of words to trim the text to. Default 55.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
* @param string $more An optional string to append to the end of the trimmed text, e.g. ….
|
|
|
|
|
* @param string $original_text The text before it was trimmed.
|
|
|
|
|
*/
|
2011-09-20 13:14:23 -04:00
|
|
|
|
return apply_filters( 'wp_trim_words', $text, $num_words, $more, $original_text );
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Converts named entities into numbered entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.5.1
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $text The text within which entities will be converted.
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @return string Text with converted entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function ent2ncr( $text ) {
|
2011-07-21 17:41:21 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters text before named entities are converted into numbered entities.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* A non-null string must be returned for the filter to be evaluated.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.3.0
|
|
|
|
|
*
|
2019-09-21 13:41:57 -04:00
|
|
|
|
* @param string|null $converted_text The text to be converted. Default null.
|
|
|
|
|
* @param string $text The text prior to entity conversion.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2011-07-25 09:20:07 -04:00
|
|
|
|
$filtered = apply_filters( 'pre_ent2ncr', null, $text );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( null !== $filtered ) {
|
2011-07-21 17:41:21 -04:00
|
|
|
|
return $filtered;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2011-07-21 17:41:21 -04:00
|
|
|
|
|
2005-04-05 13:25:57 -04:00
|
|
|
|
$to_ncr = array(
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'"' => '"',
|
|
|
|
|
'&' => '&',
|
|
|
|
|
'<' => '<',
|
|
|
|
|
'>' => '>',
|
|
|
|
|
'|' => '|',
|
|
|
|
|
' ' => ' ',
|
|
|
|
|
'¡' => '¡',
|
|
|
|
|
'¢' => '¢',
|
|
|
|
|
'£' => '£',
|
|
|
|
|
'¤' => '¤',
|
|
|
|
|
'¥' => '¥',
|
|
|
|
|
'¦' => '¦',
|
|
|
|
|
'&brkbar;' => '¦',
|
|
|
|
|
'§' => '§',
|
|
|
|
|
'¨' => '¨',
|
|
|
|
|
'¨' => '¨',
|
|
|
|
|
'©' => '©',
|
|
|
|
|
'ª' => 'ª',
|
|
|
|
|
'«' => '«',
|
|
|
|
|
'¬' => '¬',
|
|
|
|
|
'­' => '­',
|
|
|
|
|
'®' => '®',
|
|
|
|
|
'¯' => '¯',
|
|
|
|
|
'&hibar;' => '¯',
|
|
|
|
|
'°' => '°',
|
|
|
|
|
'±' => '±',
|
|
|
|
|
'²' => '²',
|
|
|
|
|
'³' => '³',
|
|
|
|
|
'´' => '´',
|
|
|
|
|
'µ' => 'µ',
|
|
|
|
|
'¶' => '¶',
|
|
|
|
|
'·' => '·',
|
|
|
|
|
'¸' => '¸',
|
|
|
|
|
'¹' => '¹',
|
|
|
|
|
'º' => 'º',
|
|
|
|
|
'»' => '»',
|
|
|
|
|
'¼' => '¼',
|
|
|
|
|
'½' => '½',
|
|
|
|
|
'¾' => '¾',
|
|
|
|
|
'¿' => '¿',
|
|
|
|
|
'À' => 'À',
|
|
|
|
|
'Á' => 'Á',
|
|
|
|
|
'Â' => 'Â',
|
|
|
|
|
'Ã' => 'Ã',
|
|
|
|
|
'Ä' => 'Ä',
|
|
|
|
|
'Å' => 'Å',
|
|
|
|
|
'Æ' => 'Æ',
|
|
|
|
|
'Ç' => 'Ç',
|
|
|
|
|
'È' => 'È',
|
|
|
|
|
'É' => 'É',
|
|
|
|
|
'Ê' => 'Ê',
|
|
|
|
|
'Ë' => 'Ë',
|
|
|
|
|
'Ì' => 'Ì',
|
|
|
|
|
'Í' => 'Í',
|
|
|
|
|
'Î' => 'Î',
|
|
|
|
|
'Ï' => 'Ï',
|
|
|
|
|
'Ð' => 'Ð',
|
|
|
|
|
'Ñ' => 'Ñ',
|
|
|
|
|
'Ò' => 'Ò',
|
|
|
|
|
'Ó' => 'Ó',
|
|
|
|
|
'Ô' => 'Ô',
|
|
|
|
|
'Õ' => 'Õ',
|
|
|
|
|
'Ö' => 'Ö',
|
|
|
|
|
'×' => '×',
|
|
|
|
|
'Ø' => 'Ø',
|
|
|
|
|
'Ù' => 'Ù',
|
|
|
|
|
'Ú' => 'Ú',
|
|
|
|
|
'Û' => 'Û',
|
|
|
|
|
'Ü' => 'Ü',
|
|
|
|
|
'Ý' => 'Ý',
|
|
|
|
|
'Þ' => 'Þ',
|
|
|
|
|
'ß' => 'ß',
|
|
|
|
|
'à' => 'à',
|
|
|
|
|
'á' => 'á',
|
|
|
|
|
'â' => 'â',
|
|
|
|
|
'ã' => 'ã',
|
|
|
|
|
'ä' => 'ä',
|
|
|
|
|
'å' => 'å',
|
|
|
|
|
'æ' => 'æ',
|
|
|
|
|
'ç' => 'ç',
|
|
|
|
|
'è' => 'è',
|
|
|
|
|
'é' => 'é',
|
|
|
|
|
'ê' => 'ê',
|
|
|
|
|
'ë' => 'ë',
|
|
|
|
|
'ì' => 'ì',
|
|
|
|
|
'í' => 'í',
|
|
|
|
|
'î' => 'î',
|
|
|
|
|
'ï' => 'ï',
|
|
|
|
|
'ð' => 'ð',
|
|
|
|
|
'ñ' => 'ñ',
|
|
|
|
|
'ò' => 'ò',
|
|
|
|
|
'ó' => 'ó',
|
|
|
|
|
'ô' => 'ô',
|
|
|
|
|
'õ' => 'õ',
|
|
|
|
|
'ö' => 'ö',
|
|
|
|
|
'÷' => '÷',
|
|
|
|
|
'ø' => 'ø',
|
|
|
|
|
'ù' => 'ù',
|
|
|
|
|
'ú' => 'ú',
|
|
|
|
|
'û' => 'û',
|
|
|
|
|
'ü' => 'ü',
|
|
|
|
|
'ý' => 'ý',
|
|
|
|
|
'þ' => 'þ',
|
|
|
|
|
'ÿ' => 'ÿ',
|
|
|
|
|
'Œ' => 'Œ',
|
|
|
|
|
'œ' => 'œ',
|
|
|
|
|
'Š' => 'Š',
|
|
|
|
|
'š' => 'š',
|
|
|
|
|
'Ÿ' => 'Ÿ',
|
|
|
|
|
'ƒ' => 'ƒ',
|
|
|
|
|
'ˆ' => 'ˆ',
|
|
|
|
|
'˜' => '˜',
|
|
|
|
|
'Α' => 'Α',
|
|
|
|
|
'Β' => 'Β',
|
|
|
|
|
'Γ' => 'Γ',
|
|
|
|
|
'Δ' => 'Δ',
|
|
|
|
|
'Ε' => 'Ε',
|
|
|
|
|
'Ζ' => 'Ζ',
|
|
|
|
|
'Η' => 'Η',
|
|
|
|
|
'Θ' => 'Θ',
|
|
|
|
|
'Ι' => 'Ι',
|
|
|
|
|
'Κ' => 'Κ',
|
|
|
|
|
'Λ' => 'Λ',
|
|
|
|
|
'Μ' => 'Μ',
|
|
|
|
|
'Ν' => 'Ν',
|
|
|
|
|
'Ξ' => 'Ξ',
|
|
|
|
|
'Ο' => 'Ο',
|
|
|
|
|
'Π' => 'Π',
|
|
|
|
|
'Ρ' => 'Ρ',
|
|
|
|
|
'Σ' => 'Σ',
|
|
|
|
|
'Τ' => 'Τ',
|
|
|
|
|
'Υ' => 'Υ',
|
|
|
|
|
'Φ' => 'Φ',
|
|
|
|
|
'Χ' => 'Χ',
|
|
|
|
|
'Ψ' => 'Ψ',
|
|
|
|
|
'Ω' => 'Ω',
|
|
|
|
|
'α' => 'α',
|
|
|
|
|
'β' => 'β',
|
|
|
|
|
'γ' => 'γ',
|
|
|
|
|
'δ' => 'δ',
|
|
|
|
|
'ε' => 'ε',
|
|
|
|
|
'ζ' => 'ζ',
|
|
|
|
|
'η' => 'η',
|
|
|
|
|
'θ' => 'θ',
|
|
|
|
|
'ι' => 'ι',
|
|
|
|
|
'κ' => 'κ',
|
|
|
|
|
'λ' => 'λ',
|
|
|
|
|
'μ' => 'μ',
|
|
|
|
|
'ν' => 'ν',
|
|
|
|
|
'ξ' => 'ξ',
|
|
|
|
|
'ο' => 'ο',
|
|
|
|
|
'π' => 'π',
|
|
|
|
|
'ρ' => 'ρ',
|
|
|
|
|
'ς' => 'ς',
|
|
|
|
|
'σ' => 'σ',
|
|
|
|
|
'τ' => 'τ',
|
|
|
|
|
'υ' => 'υ',
|
|
|
|
|
'φ' => 'φ',
|
|
|
|
|
'χ' => 'χ',
|
|
|
|
|
'ψ' => 'ψ',
|
|
|
|
|
'ω' => 'ω',
|
2005-07-02 19:44:35 -04:00
|
|
|
|
'ϑ' => 'ϑ',
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'ϒ' => 'ϒ',
|
|
|
|
|
'ϖ' => 'ϖ',
|
|
|
|
|
' ' => ' ',
|
|
|
|
|
' ' => ' ',
|
|
|
|
|
' ' => ' ',
|
|
|
|
|
'‌' => '‌',
|
|
|
|
|
'‍' => '‍',
|
|
|
|
|
'‎' => '‎',
|
|
|
|
|
'‏' => '‏',
|
|
|
|
|
'–' => '–',
|
|
|
|
|
'—' => '—',
|
|
|
|
|
'‘' => '‘',
|
|
|
|
|
'’' => '’',
|
|
|
|
|
'‚' => '‚',
|
|
|
|
|
'“' => '“',
|
|
|
|
|
'”' => '”',
|
|
|
|
|
'„' => '„',
|
|
|
|
|
'†' => '†',
|
|
|
|
|
'‡' => '‡',
|
|
|
|
|
'•' => '•',
|
|
|
|
|
'…' => '…',
|
|
|
|
|
'‰' => '‰',
|
|
|
|
|
'′' => '′',
|
|
|
|
|
'″' => '″',
|
|
|
|
|
'‹' => '‹',
|
|
|
|
|
'›' => '›',
|
|
|
|
|
'‾' => '‾',
|
|
|
|
|
'⁄' => '⁄',
|
|
|
|
|
'€' => '€',
|
|
|
|
|
'ℑ' => 'ℑ',
|
|
|
|
|
'℘' => '℘',
|
|
|
|
|
'ℜ' => 'ℜ',
|
|
|
|
|
'™' => '™',
|
|
|
|
|
'ℵ' => 'ℵ',
|
|
|
|
|
'↵' => '↵',
|
|
|
|
|
'⇐' => '⇐',
|
|
|
|
|
'⇑' => '⇑',
|
|
|
|
|
'⇒' => '⇒',
|
|
|
|
|
'⇓' => '⇓',
|
|
|
|
|
'⇔' => '⇔',
|
|
|
|
|
'∀' => '∀',
|
|
|
|
|
'∂' => '∂',
|
|
|
|
|
'∃' => '∃',
|
|
|
|
|
'∅' => '∅',
|
|
|
|
|
'∇' => '∇',
|
|
|
|
|
'∈' => '∈',
|
|
|
|
|
'∉' => '∉',
|
|
|
|
|
'∋' => '∋',
|
|
|
|
|
'∏' => '∏',
|
|
|
|
|
'∑' => '∑',
|
|
|
|
|
'−' => '−',
|
|
|
|
|
'∗' => '∗',
|
|
|
|
|
'√' => '√',
|
|
|
|
|
'∝' => '∝',
|
|
|
|
|
'∞' => '∞',
|
|
|
|
|
'∠' => '∠',
|
|
|
|
|
'∧' => '∧',
|
|
|
|
|
'∨' => '∨',
|
|
|
|
|
'∩' => '∩',
|
|
|
|
|
'∪' => '∪',
|
|
|
|
|
'∫' => '∫',
|
|
|
|
|
'∴' => '∴',
|
|
|
|
|
'∼' => '∼',
|
|
|
|
|
'≅' => '≅',
|
|
|
|
|
'≈' => '≈',
|
|
|
|
|
'≠' => '≠',
|
|
|
|
|
'≡' => '≡',
|
|
|
|
|
'≤' => '≤',
|
|
|
|
|
'≥' => '≥',
|
|
|
|
|
'⊂' => '⊂',
|
|
|
|
|
'⊃' => '⊃',
|
|
|
|
|
'⊄' => '⊄',
|
|
|
|
|
'⊆' => '⊆',
|
|
|
|
|
'⊇' => '⊇',
|
|
|
|
|
'⊕' => '⊕',
|
|
|
|
|
'⊗' => '⊗',
|
|
|
|
|
'⊥' => '⊥',
|
|
|
|
|
'⋅' => '⋅',
|
|
|
|
|
'⌈' => '⌈',
|
|
|
|
|
'⌉' => '⌉',
|
|
|
|
|
'⌊' => '⌊',
|
|
|
|
|
'⌋' => '⌋',
|
|
|
|
|
'⟨' => '〈',
|
|
|
|
|
'⟩' => '〉',
|
|
|
|
|
'←' => '←',
|
|
|
|
|
'↑' => '↑',
|
|
|
|
|
'→' => '→',
|
|
|
|
|
'↓' => '↓',
|
|
|
|
|
'↔' => '↔',
|
|
|
|
|
'◊' => '◊',
|
|
|
|
|
'♠' => '♠',
|
|
|
|
|
'♣' => '♣',
|
|
|
|
|
'♥' => '♥',
|
|
|
|
|
'♦' => '♦',
|
2005-04-05 13:25:57 -04:00
|
|
|
|
);
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return str_replace( array_keys( $to_ncr ), array_values( $to_ncr ), $text );
|
2005-04-05 13:25:57 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2015-06-21 18:01:28 -04:00
|
|
|
|
* Formats text for the editor.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-06-21 18:01:28 -04:00
|
|
|
|
* Generally the browsers treat everything inside a textarea as text, but
|
|
|
|
|
* it is still a good idea to HTML entity encode `<`, `>` and `&` in the content.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-07-13 17:30:24 -04:00
|
|
|
|
* The filter {@see 'format_for_editor'} is applied here. If `$text` is empty the
|
|
|
|
|
* filter will be applied to an empty string.
|
2015-06-21 18:01:28 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.3.0
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2015-12-13 14:22:26 -05:00
|
|
|
|
* @see _WP_Editors::editor()
|
|
|
|
|
*
|
|
|
|
|
* @param string $text The text to be formatted.
|
|
|
|
|
* @param string $default_editor The default editor for the current user.
|
|
|
|
|
* It is usually either 'html' or 'tinymce'.
|
2015-06-21 18:08:28 -04:00
|
|
|
|
* @return string The formatted text after filter is applied.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-06-21 18:01:28 -04:00
|
|
|
|
function format_for_editor( $text, $default_editor = null ) {
|
2015-07-12 23:19:24 -04:00
|
|
|
|
if ( $text ) {
|
2015-06-21 18:01:28 -04:00
|
|
|
|
$text = htmlspecialchars( $text, ENT_NOQUOTES, get_option( 'blog_charset' ) );
|
|
|
|
|
}
|
2008-02-09 02:29:36 -05:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the text after it is formatted for the editor.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2015-06-21 18:01:28 -04:00
|
|
|
|
* @since 4.3.0
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2015-12-13 14:22:26 -05:00
|
|
|
|
* @param string $text The formatted text.
|
|
|
|
|
* @param string $default_editor The default editor for the current user.
|
|
|
|
|
* It is usually either 'html' or 'tinymce'.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2015-06-21 18:01:28 -04:00
|
|
|
|
return apply_filters( 'format_for_editor', $text, $default_editor );
|
2008-02-09 02:29:36 -05:00
|
|
|
|
}
|
|
|
|
|
|
2009-06-20 13:42:24 -04:00
|
|
|
|
/**
|
|
|
|
|
* Perform a deep string replace operation to ensure the values in $search are no longer present
|
2009-09-14 10:03:32 -04:00
|
|
|
|
*
|
2009-06-20 13:42:24 -04:00
|
|
|
|
* Repeats the replacement operation until it no longer replaces anything so as to remove "nested" values
|
|
|
|
|
* e.g. $subject = '%0%0%0DDD', $search ='%0D', $result ='' rather than the '%0%0DD' that
|
|
|
|
|
* str_replace would return
|
2009-09-14 10:03:32 -04:00
|
|
|
|
*
|
2009-06-20 13:42:24 -04:00
|
|
|
|
* @since 2.8.1
|
|
|
|
|
* @access private
|
2009-09-14 10:03:32 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string|array $search The value being searched for, otherwise known as the needle.
|
|
|
|
|
* An array may be used to designate multiple needles.
|
|
|
|
|
* @param string $subject The string being searched and replaced on, otherwise known as the haystack.
|
2018-01-20 08:32:32 -05:00
|
|
|
|
* @return string The string with the replaced values.
|
2009-06-20 13:42:24 -04:00
|
|
|
|
*/
|
2010-04-03 23:07:14 -04:00
|
|
|
|
function _deep_replace( $search, $subject ) {
|
|
|
|
|
$subject = (string) $subject;
|
2013-08-20 01:57:10 -04:00
|
|
|
|
|
|
|
|
|
$count = 1;
|
|
|
|
|
while ( $count ) {
|
|
|
|
|
$subject = str_replace( $search, '', $subject, $count );
|
2009-06-20 13:42:24 -04:00
|
|
|
|
}
|
2009-09-14 10:03:32 -04:00
|
|
|
|
|
2009-06-20 13:42:24 -04:00
|
|
|
|
return $subject;
|
|
|
|
|
}
|
|
|
|
|
|
2009-05-29 16:31:52 -04:00
|
|
|
|
/**
|
2013-07-16 13:44:42 -04:00
|
|
|
|
* Escapes data for use in a MySQL query.
|
2009-05-29 16:31:52 -04:00
|
|
|
|
*
|
2013-07-16 13:44:42 -04:00
|
|
|
|
* Usually you should prepare queries using wpdb::prepare().
|
|
|
|
|
* Sometimes, spot-escaping is required or useful. One example
|
|
|
|
|
* is preparing an array for use in an IN clause.
|
2009-05-29 16:31:52 -04:00
|
|
|
|
*
|
2017-10-31 08:00:49 -04:00
|
|
|
|
* NOTE: Since 4.8.3, '%' characters will be replaced with a placeholder string,
|
|
|
|
|
* this prevents certain SQLi attacks from taking place. This change in behaviour
|
|
|
|
|
* may cause issues for code that expects the return value of esc_sql() to be useable
|
|
|
|
|
* for other purposes.
|
|
|
|
|
*
|
2009-05-29 16:31:52 -04:00
|
|
|
|
* @since 2.8.0
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2015-10-14 19:44:25 -04:00
|
|
|
|
* @global wpdb $wpdb WordPress database abstraction object.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2013-08-05 18:11:30 -04:00
|
|
|
|
* @param string|array $data Unescaped data
|
|
|
|
|
* @return string|array Escaped data
|
2009-05-29 16:31:52 -04:00
|
|
|
|
*/
|
2013-07-16 13:44:42 -04:00
|
|
|
|
function esc_sql( $data ) {
|
2009-05-29 16:31:52 -04:00
|
|
|
|
global $wpdb;
|
2013-07-16 13:44:42 -04:00
|
|
|
|
return $wpdb->_escape( $data );
|
2009-05-29 16:31:52 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2009-05-18 12:00:33 -04:00
|
|
|
|
* Checks and cleans a URL.
|
|
|
|
|
*
|
|
|
|
|
* A number of characters are removed from the URL. If the URL is for displaying
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* (the default behaviour) ampersands are also replaced. The {@see 'clean_url'} filter
|
2009-05-18 12:00:33 -04:00
|
|
|
|
* is applied to the returned cleaned URL.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $url The URL to be cleaned.
|
|
|
|
|
* @param string[] $protocols Optional. An array of acceptable protocols.
|
2020-05-11 16:34:13 -04:00
|
|
|
|
* Defaults to return value of wp_allowed_protocols().
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $_context Private. Use esc_url_raw() for database usage.
|
2020-05-11 16:34:13 -04:00
|
|
|
|
* @return string The cleaned URL after the {@see 'clean_url'} filter is applied.
|
2020-11-06 09:03:06 -05:00
|
|
|
|
* An empty string is returned if `$url` specifies a protocol other than
|
|
|
|
|
* those in `$protocols`, or if `$url` contains an empty string.
|
2009-05-18 12:00:33 -04:00
|
|
|
|
*/
|
2010-02-22 13:25:51 -05:00
|
|
|
|
function esc_url( $url, $protocols = null, $_context = 'display' ) {
|
|
|
|
|
$original_url = $url;
|
|
|
|
|
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $url ) {
|
2010-04-25 04:16:10 -04:00
|
|
|
|
return $url;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2015-09-02 13:20:21 -04:00
|
|
|
|
|
2019-06-30 23:29:57 -04:00
|
|
|
|
$url = str_replace( ' ', '%20', ltrim( $url ) );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$url = preg_replace( '|[^a-z0-9-~+_.?#=!&;,/:%@$\|*\'()\[\]\\x80-\\xff]|i', '', $url );
|
2015-09-05 17:29:25 -04:00
|
|
|
|
|
|
|
|
|
if ( '' === $url ) {
|
|
|
|
|
return $url;
|
|
|
|
|
}
|
|
|
|
|
|
2015-07-03 10:28:23 -04:00
|
|
|
|
if ( 0 !== stripos( $url, 'mailto:' ) ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$strip = array( '%0d', '%0a', '%0D', '%0A' );
|
|
|
|
|
$url = _deep_replace( $strip, $url );
|
2015-07-03 10:28:23 -04:00
|
|
|
|
}
|
2015-09-02 13:20:21 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$url = str_replace( ';//', '://', $url );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
/*
|
|
|
|
|
* If the URL doesn't appear to contain a scheme, we presume
|
|
|
|
|
* it needs http:// prepended (unless it's a relative link
|
|
|
|
|
* starting with /, # or ?, or a PHP file).
|
2010-02-22 13:25:51 -05:00
|
|
|
|
*/
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( strpos( $url, ':' ) === false && ! in_array( $url[0], array( '/', '#', '?' ), true ) &&
|
2017-11-30 18:11:00 -05:00
|
|
|
|
! preg_match( '/^[a-z0-9-]+?\.php/i', $url ) ) {
|
2010-02-22 13:25:51 -05:00
|
|
|
|
$url = 'http://' . $url;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2010-02-22 13:25:51 -05:00
|
|
|
|
|
|
|
|
|
// Replace ampersands and single quotes only when displaying.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( 'display' === $_context ) {
|
2010-12-29 15:45:37 -05:00
|
|
|
|
$url = wp_kses_normalize_entities( $url );
|
|
|
|
|
$url = str_replace( '&', '&', $url );
|
2010-02-22 13:25:51 -05:00
|
|
|
|
$url = str_replace( "'", ''', $url );
|
|
|
|
|
}
|
|
|
|
|
|
2015-10-07 19:39:23 -04:00
|
|
|
|
if ( ( false !== strpos( $url, '[' ) ) || ( false !== strpos( $url, ']' ) ) ) {
|
|
|
|
|
|
2015-10-23 01:57:24 -04:00
|
|
|
|
$parsed = wp_parse_url( $url );
|
2015-10-07 19:39:23 -04:00
|
|
|
|
$front = '';
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['scheme'] ) ) {
|
|
|
|
|
$front .= $parsed['scheme'] . '://';
|
|
|
|
|
} elseif ( '/' === $url[0] ) {
|
|
|
|
|
$front .= '//';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['user'] ) ) {
|
|
|
|
|
$front .= $parsed['user'];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['pass'] ) ) {
|
|
|
|
|
$front .= ':' . $parsed['pass'];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['user'] ) || isset( $parsed['pass'] ) ) {
|
|
|
|
|
$front .= '@';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['host'] ) ) {
|
|
|
|
|
$front .= $parsed['host'];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( isset( $parsed['port'] ) ) {
|
|
|
|
|
$front .= ':' . $parsed['port'];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$end_dirty = str_replace( $front, '', $url );
|
|
|
|
|
$end_clean = str_replace( array( '[', ']' ), array( '%5B', '%5D' ), $end_dirty );
|
|
|
|
|
$url = str_replace( $end_dirty, $end_clean, $url );
|
|
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
2013-07-10 09:45:22 -04:00
|
|
|
|
if ( '/' === $url[0] ) {
|
|
|
|
|
$good_protocol_url = $url;
|
|
|
|
|
} else {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! is_array( $protocols ) ) {
|
2013-07-10 09:45:22 -04:00
|
|
|
|
$protocols = wp_allowed_protocols();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2013-07-10 09:45:22 -04:00
|
|
|
|
$good_protocol_url = wp_kses_bad_protocol( $url, $protocols );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( strtolower( $good_protocol_url ) != strtolower( $url ) ) {
|
2013-07-10 09:45:22 -04:00
|
|
|
|
return '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2013-07-10 09:45:22 -04:00
|
|
|
|
}
|
2010-02-22 13:25:51 -05:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output as a URL.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.3.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $good_protocol_url The cleaned URL to be returned.
|
|
|
|
|
* @param string $original_url The URL prior to cleaning.
|
|
|
|
|
* @param string $_context If 'display', replace ampersands and single quotes only.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'clean_url', $good_protocol_url, $original_url, $_context );
|
2009-05-18 12:00:33 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2021-08-10 15:44:59 -04:00
|
|
|
|
* Performs esc_url() for database or redirect usage.
|
2009-05-18 12:00:33 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2020-11-06 09:16:07 -05:00
|
|
|
|
* @see esc_url()
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $url The URL to be cleaned.
|
2020-05-11 16:34:13 -04:00
|
|
|
|
* @param string[] $protocols Optional. An array of acceptable protocols.
|
|
|
|
|
* Defaults to return value of wp_allowed_protocols().
|
2020-11-06 09:03:06 -05:00
|
|
|
|
* @return string The cleaned URL after esc_url() is run with the 'db' context.
|
2009-05-18 12:00:33 -04:00
|
|
|
|
*/
|
|
|
|
|
function esc_url_raw( $url, $protocols = null ) {
|
2010-02-22 13:25:51 -05:00
|
|
|
|
return esc_url( $url, $protocols, 'db' );
|
2009-05-18 12:00:33 -04:00
|
|
|
|
}
|
|
|
|
|
|
2021-08-10 15:44:59 -04:00
|
|
|
|
/**
|
|
|
|
|
* Performs esc_url() for database or redirect usage.
|
|
|
|
|
*
|
|
|
|
|
* This function is an alias for esc_url_raw().
|
|
|
|
|
*
|
|
|
|
|
* @since 2.3.1
|
|
|
|
|
* @since 2.8.0 Deprecated in favor of esc_url_raw().
|
|
|
|
|
* @since 5.9.0 Restored (un-deprecated).
|
|
|
|
|
*
|
|
|
|
|
* @see esc_url_raw()
|
|
|
|
|
*
|
|
|
|
|
* @param string $url The URL to be cleaned.
|
|
|
|
|
* @param string[] $protocols Optional. An array of acceptable protocols.
|
|
|
|
|
* Defaults to return value of wp_allowed_protocols().
|
|
|
|
|
* @return string The cleaned URL after esc_url() is run with the 'db' context.
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_url( $url, $protocols = null ) {
|
|
|
|
|
return esc_url_raw( $url, $protocols );
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Convert entities, while preserving already-encoded entities.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2020-01-19 22:14:06 -05:00
|
|
|
|
* @link https://www.php.net/htmlentities Borrowed from the PHP Manual user notes.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.2
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $myHTML The text to be converted.
|
|
|
|
|
* @return string Converted text.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function htmlentities2( $myHTML ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$translation_table = get_html_translation_table( HTML_ENTITIES, ENT_QUOTES );
|
|
|
|
|
$translation_table[ chr( 38 ) ] = '&';
|
|
|
|
|
return preg_replace( '/&(?![A-Za-z]{0,4}\w{2,3};|#[0-9]{2,3};)/', '&', strtr( $myHTML, $translation_table ) );
|
2006-04-18 23:03:27 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2009-09-15 06:11:59 -04:00
|
|
|
|
* Escape single quotes, htmlspecialchar " < > &, and fix line endings.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2010-02-12 21:54:54 -05:00
|
|
|
|
* Escapes text strings for echoing in JS. It is intended to be used for inline JS
|
|
|
|
|
* (in a tag attribute, for example onclick="..."). Note that the strings have to
|
2016-05-23 15:01:27 -04:00
|
|
|
|
* be in single quotes. The {@see 'js_escape'} filter is also applied here.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2009-05-09 03:27:22 -04:00
|
|
|
|
* @since 2.8.0
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $text The text to be escaped.
|
|
|
|
|
* @return string Escaped text.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2009-05-09 03:27:22 -04:00
|
|
|
|
function esc_js( $text ) {
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$safe_text = wp_check_invalid_utf8( $text );
|
2009-05-18 11:11:07 -04:00
|
|
|
|
$safe_text = _wp_specialchars( $safe_text, ENT_COMPAT );
|
2009-01-04 18:37:47 -05:00
|
|
|
|
$safe_text = preg_replace( '/&#(x)?0*(?(1)27|39);?/i', "'", stripslashes( $safe_text ) );
|
2009-09-15 06:11:59 -04:00
|
|
|
|
$safe_text = str_replace( "\r", '', $safe_text );
|
|
|
|
|
$safe_text = str_replace( "\n", '\\n', addslashes( $safe_text ) );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output in JavaScript.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* Text passed to esc_js() is stripped of invalid or special characters,
|
|
|
|
|
* and properly slashed for output.
|
|
|
|
|
*
|
2013-11-30 14:05:10 -05:00
|
|
|
|
* @since 2.0.6
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $safe_text The text after it has been escaped.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* @param string $text The text prior to being escaped.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2009-01-04 18:37:47 -05:00
|
|
|
|
return apply_filters( 'js_escape', $safe_text, $text );
|
2006-05-05 03:49:05 -04:00
|
|
|
|
}
|
2006-06-23 21:28:08 -04:00
|
|
|
|
|
2009-05-18 11:11:07 -04:00
|
|
|
|
/**
|
|
|
|
|
* Escaping for HTML blocks.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
|
|
|
|
function esc_html( $text ) {
|
|
|
|
|
$safe_text = wp_check_invalid_utf8( $text );
|
|
|
|
|
$safe_text = _wp_specialchars( $safe_text, ENT_QUOTES );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output in HTML.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* Text passed to esc_html() is stripped of invalid or special characters
|
|
|
|
|
* before output.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $safe_text The text after it has been escaped.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* @param string $text The text prior to being escaped.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2009-05-18 11:11:07 -04:00
|
|
|
|
return apply_filters( 'esc_html', $safe_text, $text );
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
|
|
|
|
* Escaping for HTML attributes.
|
|
|
|
|
*
|
2009-04-27 17:58:04 -04:00
|
|
|
|
* @since 2.8.0
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $text
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
2009-05-05 15:43:53 -04:00
|
|
|
|
function esc_attr( $text ) {
|
2009-01-04 17:25:50 -05:00
|
|
|
|
$safe_text = wp_check_invalid_utf8( $text );
|
2009-05-18 11:11:07 -04:00
|
|
|
|
$safe_text = _wp_specialchars( $safe_text, ENT_QUOTES );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output in an HTML attribute.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* Text passed to esc_attr() is stripped of invalid or special characters
|
|
|
|
|
* before output.
|
|
|
|
|
*
|
2013-11-30 14:05:10 -05:00
|
|
|
|
* @since 2.0.6
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $safe_text The text after it has been escaped.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* @param string $text The text prior to being escaped.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2009-01-04 17:25:50 -05:00
|
|
|
|
return apply_filters( 'attribute_escape', $safe_text, $text );
|
2006-12-21 05:10:04 -05:00
|
|
|
|
}
|
2008-03-24 01:15:28 -04:00
|
|
|
|
|
2010-11-17 12:12:01 -05:00
|
|
|
|
/**
|
|
|
|
|
* Escaping for textarea values.
|
|
|
|
|
*
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* @since 3.1.0
|
2010-11-17 12:12:01 -05:00
|
|
|
|
*
|
|
|
|
|
* @param string $text
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
|
|
|
|
function esc_textarea( $text ) {
|
2013-03-13 11:24:38 -04:00
|
|
|
|
$safe_text = htmlspecialchars( $text, ENT_QUOTES, get_option( 'blog_charset' ) );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output in a textarea element.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 3.1.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $safe_text The text after it has been escaped.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* @param string $text The text prior to being escaped.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2010-11-17 12:12:01 -05:00
|
|
|
|
return apply_filters( 'esc_textarea', $safe_text, $text );
|
|
|
|
|
}
|
|
|
|
|
|
Sitemaps: Add XML sitemaps functionality to WordPress.
While web crawlers are able to discover pages from links within the site and from other sites, XML sitemaps supplement this approach by allowing crawlers to quickly and comprehensively identify all URLs included in the sitemap and learn other signals about those URLs using the associated metadata.
See https://make.wordpress.org/core/2020/06/10/merge-announcement-extensible-core-sitemaps/ for more details.
This feature exposes the sitemap index via `/wp-sitemap.xml` and exposes a variety of new filters and hooks for developers to modify the behavior. Users can disable sitemaps completely by turning off search engine visibility in WordPress admin.
This change also introduces a new `esc_xml()` function to escape strings for output in XML, as well as XML support to `wp_kses_normalize_entities()`.
Props Adrian McShane, afragen, adamsilverstein, casiepa, flixos90, garrett-eclipse, joemcgill, kburgoine, kraftbj, milana_cap, pacifika, pbiron, pfefferle, Ruxandra Gradina, swissspidy, szepeviktor, tangrufus, tweetythierry.
Fixes #50117.
See #3670. See #19998.
Built from https://develop.svn.wordpress.org/trunk@48072
git-svn-id: http://core.svn.wordpress.org/trunk@47839 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-06-17 11:24:07 -04:00
|
|
|
|
/**
|
|
|
|
|
* Escaping for XML blocks.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $text Text to escape.
|
|
|
|
|
* @return string Escaped text.
|
|
|
|
|
*/
|
|
|
|
|
function esc_xml( $text ) {
|
|
|
|
|
$safe_text = wp_check_invalid_utf8( $text );
|
|
|
|
|
|
|
|
|
|
$cdata_regex = '\<\!\[CDATA\[.*?\]\]\>';
|
|
|
|
|
$regex = <<<EOF
|
|
|
|
|
/
|
|
|
|
|
(?=.*?{$cdata_regex}) # lookahead that will match anything followed by a CDATA Section
|
|
|
|
|
(?<non_cdata_followed_by_cdata>(.*?)) # the "anything" matched by the lookahead
|
|
|
|
|
(?<cdata>({$cdata_regex})) # the CDATA Section matched by the lookahead
|
|
|
|
|
|
|
|
|
|
| # alternative
|
|
|
|
|
|
|
|
|
|
(?<non_cdata>(.*)) # non-CDATA Section
|
|
|
|
|
/sx
|
|
|
|
|
EOF;
|
|
|
|
|
|
|
|
|
|
$safe_text = (string) preg_replace_callback(
|
|
|
|
|
$regex,
|
|
|
|
|
static function( $matches ) {
|
|
|
|
|
if ( ! $matches[0] ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( ! empty( $matches['non_cdata'] ) ) {
|
|
|
|
|
// escape HTML entities in the non-CDATA Section.
|
|
|
|
|
return _wp_specialchars( $matches['non_cdata'], ENT_XML1 );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// Return the CDATA Section unchanged, escape HTML entities in the rest.
|
|
|
|
|
return _wp_specialchars( $matches['non_cdata_followed_by_cdata'], ENT_XML1 ) . $matches['cdata'];
|
|
|
|
|
},
|
|
|
|
|
$safe_text
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Filters a string cleaned and escaped for output in XML.
|
|
|
|
|
*
|
|
|
|
|
* Text passed to esc_xml() is stripped of invalid or special characters
|
|
|
|
|
* before output. HTML named character references are converted to their
|
|
|
|
|
* equivalent code points.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $safe_text The text after it has been escaped.
|
|
|
|
|
* @param string $text The text prior to being escaped.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'esc_xml', $safe_text, $text );
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
2013-02-01 13:07:08 -05:00
|
|
|
|
* Escape an HTML tag name.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.5.0
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $tag_name
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function tag_escape( $tag_name ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$safe_tag = strtolower( preg_replace( '/[^a-zA-Z0-9_:]/', '', $tag_name ) );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a string cleaned and escaped for output as an HTML tag.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.8.0
|
2013-12-04 15:03:09 -05:00
|
|
|
|
*
|
2013-11-30 13:36:10 -05:00
|
|
|
|
* @param string $safe_tag The tag name after it has been escaped.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
* @param string $tag_name The text before it was escaped.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'tag_escape', $safe_tag, $tag_name );
|
2008-03-24 01:15:28 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Convert full URL paths to absolute paths.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Removes the http or https protocols and the domain. Keeps the path '/' at the
|
|
|
|
|
* beginning, so it isn't a true relative link, but from the web root base.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.1.0
|
2014-11-20 22:44:23 -05:00
|
|
|
|
* @since 4.1.0 Support was added for relative URLs.
|
2008-08-30 17:28:11 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $link Full URL path.
|
|
|
|
|
* @return string Absolute path.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*/
|
2006-10-06 18:43:21 -04:00
|
|
|
|
function wp_make_link_relative( $link ) {
|
2015-11-03 16:36:25 -05:00
|
|
|
|
return preg_replace( '|^(https?:)?//[^/]+(/?.*)|i', '$2', $link );
|
2006-10-05 20:34:58 -04:00
|
|
|
|
}
|
2006-10-06 18:43:21 -04:00
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
|
|
|
|
* Sanitises various option values based on the nature of the option.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* This is basically a switch statement which will pass $value through a number
|
2008-12-09 13:03:31 -05:00
|
|
|
|
* of functions depending on the $option.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.0.5
|
|
|
|
|
*
|
2015-10-14 19:44:25 -04:00
|
|
|
|
* @global wpdb $wpdb WordPress database abstraction object.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $option The name of the option.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $value The unsanitised value.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string Sanitized value.
|
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function sanitize_option( $option, $value ) {
|
2015-01-06 23:15:23 -05:00
|
|
|
|
global $wpdb;
|
2007-05-24 22:22:30 -04:00
|
|
|
|
|
2015-05-21 14:00:26 -04:00
|
|
|
|
$original_value = $value;
|
2021-11-30 16:03:00 -05:00
|
|
|
|
$error = null;
|
2015-05-21 14:00:26 -04:00
|
|
|
|
|
2010-04-25 04:16:10 -04:00
|
|
|
|
switch ( $option ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
case 'admin_email':
|
|
|
|
|
case 'new_admin_email':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
|
|
|
|
$value = sanitize_email( $value );
|
|
|
|
|
if ( ! is_email( $value ) ) {
|
|
|
|
|
$error = __( 'The email address entered did not appear to be a valid email address. Please enter a valid email address.' );
|
|
|
|
|
}
|
2011-06-27 11:56:42 -04:00
|
|
|
|
}
|
|
|
|
|
break;
|
2011-09-21 15:05:06 -04:00
|
|
|
|
|
2008-11-13 02:54:27 -05:00
|
|
|
|
case 'thumbnail_size_w':
|
|
|
|
|
case 'thumbnail_size_h':
|
|
|
|
|
case 'medium_size_w':
|
|
|
|
|
case 'medium_size_h':
|
2015-10-31 16:50:25 -04:00
|
|
|
|
case 'medium_large_size_w':
|
|
|
|
|
case 'medium_large_size_h':
|
2008-11-13 02:54:27 -05:00
|
|
|
|
case 'large_size_w':
|
|
|
|
|
case 'large_size_h':
|
2007-05-24 22:22:30 -04:00
|
|
|
|
case 'mailserver_port':
|
|
|
|
|
case 'comment_max_links':
|
2007-08-22 13:57:36 -04:00
|
|
|
|
case 'page_on_front':
|
2010-06-11 13:04:06 -04:00
|
|
|
|
case 'page_for_posts':
|
2007-08-22 13:57:36 -04:00
|
|
|
|
case 'rss_excerpt_length':
|
|
|
|
|
case 'default_category':
|
|
|
|
|
case 'default_email_category':
|
|
|
|
|
case 'default_link_category':
|
2008-09-23 17:11:27 -04:00
|
|
|
|
case 'close_comments_days_old':
|
|
|
|
|
case 'comments_per_page':
|
|
|
|
|
case 'thread_comments_depth':
|
2009-08-04 17:28:42 -04:00
|
|
|
|
case 'users_can_register':
|
2010-02-13 01:08:15 -05:00
|
|
|
|
case 'start_of_week':
|
Introducing Site Icon, favicon management for WordPress.
This v1 marries Jetpack's Site Icon module with the Media Modal, reusing code
from the Custom Header admin. For now, the core-provided icons will be limited
to a favicon, an iOS app icon, and a Windows tile icon, leaving `.ico` support
and additional icons to plugins to add.
Props obenland, tyxla, flixos90, jancbeck, markjaquith, scruffian.
See #16434.
Built from https://develop.svn.wordpress.org/trunk@32994
git-svn-id: http://core.svn.wordpress.org/trunk@32965 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2015-06-29 08:58:25 -04:00
|
|
|
|
case 'site_icon':
|
2009-08-04 17:28:42 -04:00
|
|
|
|
$value = absint( $value );
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'posts_per_page':
|
|
|
|
|
case 'posts_per_rss':
|
|
|
|
|
$value = (int) $value;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( empty( $value ) ) {
|
2010-04-25 04:16:10 -04:00
|
|
|
|
$value = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
|
|
|
|
if ( $value < -1 ) {
|
|
|
|
|
$value = abs( $value );
|
|
|
|
|
}
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'default_ping_status':
|
|
|
|
|
case 'default_comment_status':
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Options that if not there have 0 value but need to be something like "closed".
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '0' == $value || '' === $value ) {
|
2007-05-24 22:22:30 -04:00
|
|
|
|
$value = 'closed';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'blogdescription':
|
|
|
|
|
case 'blogname':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2016-05-20 00:54:27 -04:00
|
|
|
|
if ( $value !== $original_value ) {
|
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', wp_encode_emoji( $original_value ) );
|
|
|
|
|
}
|
|
|
|
|
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
|
|
|
|
$value = esc_html( $value );
|
|
|
|
|
}
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'blog_charset':
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$value = preg_replace( '/[^a-zA-Z0-9_-]/', '', $value ); // Strips slashes.
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
2012-09-14 16:26:20 -04:00
|
|
|
|
case 'blog_public':
|
|
|
|
|
// This is the value if the settings checkbox is not checked on POST. Don't rely on this.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( null === $value ) {
|
2012-09-14 16:26:20 -04:00
|
|
|
|
$value = 1;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
} else {
|
2020-10-08 17:15:13 -04:00
|
|
|
|
$value = (int) $value;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2012-09-14 16:26:20 -04:00
|
|
|
|
break;
|
|
|
|
|
|
2007-05-24 22:22:30 -04:00
|
|
|
|
case 'date_format':
|
|
|
|
|
case 'time_format':
|
|
|
|
|
case 'mailserver_url':
|
|
|
|
|
case 'mailserver_login':
|
|
|
|
|
case 'mailserver_pass':
|
|
|
|
|
case 'upload_path':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
|
|
|
|
$value = strip_tags( $value );
|
|
|
|
|
$value = wp_kses_data( $value );
|
|
|
|
|
}
|
2012-10-17 13:44:40 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'ping_sites':
|
|
|
|
|
$value = explode( "\n", $value );
|
|
|
|
|
$value = array_filter( array_map( 'trim', $value ) );
|
|
|
|
|
$value = array_filter( array_map( 'esc_url_raw', $value ) );
|
|
|
|
|
$value = implode( "\n", $value );
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'gmt_offset':
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$value = preg_replace( '/[^0-9:.-]/', '', $value ); // Strips slashes.
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'siteurl':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
2010-04-25 04:16:10 -04:00
|
|
|
|
} else {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( preg_match( '#http(s?)://(.+)#i', $value ) ) {
|
|
|
|
|
$value = esc_url_raw( $value );
|
|
|
|
|
} else {
|
|
|
|
|
$error = __( 'The WordPress address you entered did not appear to be a valid URL. Please enter a valid URL.' );
|
|
|
|
|
}
|
2010-04-25 04:16:10 -04:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
2007-05-24 22:22:30 -04:00
|
|
|
|
case 'home':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
2010-04-25 04:16:10 -04:00
|
|
|
|
} else {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( preg_match( '#http(s?)://(.+)#i', $value ) ) {
|
|
|
|
|
$value = esc_url_raw( $value );
|
|
|
|
|
} else {
|
|
|
|
|
$error = __( 'The Site address you entered did not appear to be a valid URL. Please enter a valid URL.' );
|
|
|
|
|
}
|
2010-04-25 04:16:10 -04:00
|
|
|
|
}
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
2011-09-21 15:05:06 -04:00
|
|
|
|
|
2011-06-27 11:56:42 -04:00
|
|
|
|
case 'WPLANG':
|
|
|
|
|
$allowed = get_available_languages();
|
2014-09-03 04:03:16 -04:00
|
|
|
|
if ( ! is_multisite() && defined( 'WPLANG' ) && '' !== WPLANG && 'en_US' !== WPLANG ) {
|
|
|
|
|
$allowed[] = WPLANG;
|
|
|
|
|
}
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( ! in_array( $value, $allowed, true ) && ! empty( $value ) ) {
|
2011-06-27 11:56:42 -04:00
|
|
|
|
$value = get_option( $option );
|
2014-09-03 04:03:16 -04:00
|
|
|
|
}
|
2011-06-27 11:56:42 -04:00
|
|
|
|
break;
|
2010-04-25 04:16:10 -04:00
|
|
|
|
|
2012-09-24 21:54:12 -04:00
|
|
|
|
case 'illegal_names':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! is_array( $value ) ) {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = explode( ' ', $value );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2012-09-24 21:54:12 -04:00
|
|
|
|
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = array_values( array_filter( array_map( 'trim', $value ) ) );
|
2012-09-24 21:54:12 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! $value ) {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2015-06-15 21:29:27 -04:00
|
|
|
|
}
|
2012-09-24 21:54:12 -04:00
|
|
|
|
break;
|
|
|
|
|
|
|
|
|
|
case 'limited_email_domains':
|
|
|
|
|
case 'banned_email_domains':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! is_array( $value ) ) {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = explode( "\n", $value );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2012-09-24 21:54:12 -04:00
|
|
|
|
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$domains = array_values( array_filter( array_map( 'trim', $value ) ) );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$value = array();
|
2012-09-24 21:54:12 -04:00
|
|
|
|
|
2015-06-15 21:29:27 -04:00
|
|
|
|
foreach ( $domains as $domain ) {
|
|
|
|
|
if ( ! preg_match( '/(--|\.\.)/', $domain ) && preg_match( '|^([a-zA-Z0-9-\.])+$|', $domain ) ) {
|
|
|
|
|
$value[] = $domain;
|
|
|
|
|
}
|
|
|
|
|
}
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! $value ) {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2012-09-24 21:54:12 -04:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
2011-06-20 10:58:50 -04:00
|
|
|
|
case 'timezone_string':
|
|
|
|
|
$allowed_zones = timezone_identifiers_list();
|
2020-04-04 23:02:11 -04:00
|
|
|
|
if ( ! in_array( $value, $allowed_zones, true ) && ! empty( $value ) ) {
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$error = __( 'The timezone you have entered is not valid. Please select a valid timezone.' );
|
2011-06-20 10:58:50 -04:00
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
|
2011-09-21 15:05:06 -04:00
|
|
|
|
case 'permalink_structure':
|
|
|
|
|
case 'category_base':
|
|
|
|
|
case 'tag_base':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
|
|
|
|
$value = esc_url_raw( $value );
|
|
|
|
|
$value = str_replace( 'http://', '', $value );
|
|
|
|
|
}
|
2016-06-19 08:02:29 -04:00
|
|
|
|
|
2021-11-30 16:03:00 -05:00
|
|
|
|
if ( 'permalink_structure' === $option && null === $error
|
|
|
|
|
&& '' !== $value && ! preg_match( '/%[^\/%]+%/', $value )
|
|
|
|
|
) {
|
2016-06-19 08:02:29 -04:00
|
|
|
|
$error = sprintf(
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: %s: Documentation URL. */
|
2016-06-19 08:02:29 -04:00
|
|
|
|
__( 'A structure tag is required when using custom permalinks. <a href="%s">Learn more</a>' ),
|
2019-07-25 18:45:57 -04:00
|
|
|
|
__( 'https://wordpress.org/support/article/using-permalinks/#choosing-your-permalink-structure' )
|
2016-06-19 08:02:29 -04:00
|
|
|
|
);
|
|
|
|
|
}
|
2007-05-24 22:22:30 -04:00
|
|
|
|
break;
|
2013-10-06 06:56:09 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
case 'default_role':
|
|
|
|
|
if ( ! get_role( $value ) && get_role( 'subscriber' ) ) {
|
2013-10-06 06:56:09 -04:00
|
|
|
|
$value = 'subscriber';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2013-10-06 06:56:09 -04:00
|
|
|
|
break;
|
2014-05-16 07:10:14 -04:00
|
|
|
|
|
|
|
|
|
case 'moderation_keys':
|
General: Update code for readability and inclusion
There are two pieces in here:
1) The update to change blacklist to blocklist is moved to disallowed_list. "Block" has a meaning in our code, and there could be ambiguity between this code and code related to blocks.
2) This improves backwards compatibility for code that was accessing the now deprecated code.
Previously: [48477], [48405], [48400], [48121], [48122], [48124], [48142], [48566]
Props: desrosj, SergeyBiryukov, johnjamesjacoby
Fixes: #50413
Built from https://develop.svn.wordpress.org/trunk@48575
git-svn-id: http://core.svn.wordpress.org/trunk@48337 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-22 23:14:06 -04:00
|
|
|
|
case 'disallowed_keys':
|
2015-01-06 23:15:23 -05:00
|
|
|
|
$value = $wpdb->strip_invalid_text_for_column( $wpdb->options, 'option_value', $value );
|
2015-06-15 21:29:27 -04:00
|
|
|
|
if ( is_wp_error( $value ) ) {
|
|
|
|
|
$error = $value->get_error_message();
|
|
|
|
|
} else {
|
|
|
|
|
$value = explode( "\n", $value );
|
|
|
|
|
$value = array_filter( array_map( 'trim', $value ) );
|
|
|
|
|
$value = array_unique( $value );
|
|
|
|
|
$value = implode( "\n", $value );
|
|
|
|
|
}
|
2014-05-16 07:10:14 -04:00
|
|
|
|
break;
|
2007-05-24 22:22:30 -04:00
|
|
|
|
}
|
|
|
|
|
|
2021-11-30 16:03:00 -05:00
|
|
|
|
if ( null !== $error ) {
|
|
|
|
|
if ( '' === $error && is_wp_error( $value ) ) {
|
|
|
|
|
/* translators: 1: Option name, 2: Error code. */
|
|
|
|
|
$error = sprintf( __( 'Could not sanitize the %1$s option. Error code: %2$s' ), $option, $value->get_error_code() );
|
|
|
|
|
}
|
|
|
|
|
|
2015-06-15 21:29:27 -04:00
|
|
|
|
$value = get_option( $option );
|
|
|
|
|
if ( function_exists( 'add_settings_error' ) ) {
|
|
|
|
|
add_settings_error( $option, "invalid_{$option}", $error );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters an option value following sanitization.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 2.3.0
|
2015-05-21 14:00:26 -04:00
|
|
|
|
* @since 4.3.0 Added the `$original_value` parameter.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2015-05-21 14:00:26 -04:00
|
|
|
|
* @param string $value The sanitized option value.
|
|
|
|
|
* @param string $option The option name.
|
|
|
|
|
* @param string $original_value The original value passed to the function.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
return apply_filters( "sanitize_option_{$option}", $value, $option, $original_value );
|
2007-05-24 22:22:30 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-10-17 19:26:24 -04:00
|
|
|
|
/**
|
|
|
|
|
* Maps a function to all non-iterable elements of an array or an object.
|
|
|
|
|
*
|
|
|
|
|
* This is similar to `array_walk_recursive()` but acts upon objects too.
|
|
|
|
|
*
|
2015-10-20 02:08:25 -04:00
|
|
|
|
* @since 4.4.0
|
|
|
|
|
*
|
2015-10-17 19:26:24 -04:00
|
|
|
|
* @param mixed $value The array, object, or scalar.
|
2015-10-20 02:08:25 -04:00
|
|
|
|
* @param callable $callback The function to map onto $value.
|
2016-02-06 19:15:27 -05:00
|
|
|
|
* @return mixed The value with the callback applied to all non-arrays and non-objects inside it.
|
2015-10-17 19:26:24 -04:00
|
|
|
|
*/
|
|
|
|
|
function map_deep( $value, $callback ) {
|
2015-12-26 00:22:26 -05:00
|
|
|
|
if ( is_array( $value ) ) {
|
|
|
|
|
foreach ( $value as $index => $item ) {
|
|
|
|
|
$value[ $index ] = map_deep( $item, $callback );
|
|
|
|
|
}
|
|
|
|
|
} elseif ( is_object( $value ) ) {
|
|
|
|
|
$object_vars = get_object_vars( $value );
|
|
|
|
|
foreach ( $object_vars as $property_name => $property_value ) {
|
|
|
|
|
$value->$property_name = map_deep( $property_value, $callback );
|
2015-10-17 19:26:24 -04:00
|
|
|
|
}
|
|
|
|
|
} else {
|
2015-12-26 00:22:26 -05:00
|
|
|
|
$value = call_user_func( $callback, $value );
|
2015-10-17 19:26:24 -04:00
|
|
|
|
}
|
2015-12-26 00:22:26 -05:00
|
|
|
|
|
|
|
|
|
return $value;
|
2015-10-17 19:26:24 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-17 07:29:43 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Parses a string into variables to be stored in an array.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.2.1
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $string The string to be parsed.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param array $array Variables will be stored in this array.
|
2008-08-17 07:29:43 -04:00
|
|
|
|
*/
|
2007-06-14 18:46:59 -04:00
|
|
|
|
function wp_parse_str( $string, &$array ) {
|
Code Modernization: Correct handling of `null` in `wp_parse_str()`.
This fixes `parse_str(): Passing null to parameter #1 ($string) of type string is deprecated` notices on PHP 8.1, without change in behaviour.
Impact: 311 of the pre-existing tests are affected by this issue.
The PHP native `parse_str()` function expects a string, however, based on the failing tests, it is clear there are functions in WordPress which passes a non-string – including `null` – value to the `wp_parse_str()` function, which would subsequently pass it onto the PHP native function without further input validation.
Most notable offender is the `wp_parse_args()` function which special cases arrays and objects, but passes everything else off to `wp_parse_str()`.
Several ways to fix this issue have been explored, including checking the received value with `is_string()` or `is_scalar()` before passing it off to the PHP native `parse_str()` function.
In the end it was decided against these in favor of a string cast as:
* `is_string()` would significantly change the behavior for anything non-string.
* `is_scalar()` up to a point as well, as it does not take objects with a `__toString()` method into account.
Executing a string cast on the received value before passing it on maintains the pre-existing behavior while still preventing the deprecation notice coming from PHP 8.1.
Reference: [https://www.php.net/manual/en/function.parse-str.php PHP Manual: parse_str()]
Follow-up to [5709].
Props jrf, hellofromTonya, lucatume, SergeyBiryukov.
See #53635.
Built from https://develop.svn.wordpress.org/trunk@51624
git-svn-id: http://core.svn.wordpress.org/trunk@51230 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2021-08-16 18:18:02 -04:00
|
|
|
|
parse_str( (string) $string, $array );
|
2019-09-13 18:21:01 -04:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the array of variables derived from a parsed string.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
2021-08-13 11:50:58 -04:00
|
|
|
|
* @since 2.2.1
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @param array $array The array populated with variables.
|
|
|
|
|
*/
|
2007-06-14 18:46:59 -04:00
|
|
|
|
$array = apply_filters( 'wp_parse_str', $array );
|
|
|
|
|
}
|
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
|
|
|
|
* Convert lone less than signs.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* KSES already converts lone greater than signs.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.3.0
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $text Text to be converted.
|
|
|
|
|
* @return string Converted text.
|
|
|
|
|
*/
|
2007-07-06 08:53:15 -04:00
|
|
|
|
function wp_pre_kses_less_than( $text ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return preg_replace_callback( '%<[^>]*?((?=<)|>|$)%', 'wp_pre_kses_less_than_callback', $text );
|
2007-07-06 08:53:15 -04:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-27 02:49:21 -04:00
|
|
|
|
/**
|
|
|
|
|
* Callback function used by preg_replace.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.3.0
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2021-11-08 05:48:59 -05:00
|
|
|
|
* @param string[] $matches Populated by matches to preg_replace.
|
2009-05-18 11:11:07 -04:00
|
|
|
|
* @return string The text returned after esc_html if needed.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*/
|
2007-07-06 08:53:15 -04:00
|
|
|
|
function wp_pre_kses_less_than_callback( $matches ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( false === strpos( $matches[0], '>' ) ) {
|
|
|
|
|
return esc_html( $matches[0] );
|
|
|
|
|
}
|
2007-07-06 08:53:15 -04:00
|
|
|
|
return $matches[0];
|
|
|
|
|
}
|
|
|
|
|
|
2019-12-12 13:02:03 -05:00
|
|
|
|
/**
|
|
|
|
|
* Remove non-allowable HTML from parsed block attribute values when filtering
|
|
|
|
|
* in the post context.
|
|
|
|
|
*
|
|
|
|
|
* @since 5.3.1
|
|
|
|
|
*
|
|
|
|
|
* @param string $string Content to be run through KSES.
|
|
|
|
|
* @param array[]|string $allowed_html An array of allowed HTML elements
|
|
|
|
|
* and attributes, or a context name
|
|
|
|
|
* such as 'post'.
|
|
|
|
|
* @param string[] $allowed_protocols Array of allowed URL protocols.
|
|
|
|
|
* @return string Filtered text to run through KSES.
|
|
|
|
|
*/
|
|
|
|
|
function wp_pre_kses_block_attributes( $string, $allowed_html, $allowed_protocols ) {
|
|
|
|
|
/*
|
|
|
|
|
* `filter_block_content` is expected to call `wp_kses`. Temporarily remove
|
|
|
|
|
* the filter to avoid recursion.
|
|
|
|
|
*/
|
|
|
|
|
remove_filter( 'pre_kses', 'wp_pre_kses_block_attributes', 10 );
|
|
|
|
|
$string = filter_block_content( $string, $allowed_html, $allowed_protocols );
|
|
|
|
|
add_filter( 'pre_kses', 'wp_pre_kses_block_attributes', 10, 3 );
|
|
|
|
|
|
|
|
|
|
return $string;
|
|
|
|
|
}
|
|
|
|
|
|
2008-02-22 00:53:47 -05:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* WordPress implementation of PHP sprintf() with filters.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.5.0
|
2019-10-09 00:28:02 -04:00
|
|
|
|
* @since 5.3.0 Formalized the existing and already documented `...$args` parameter
|
|
|
|
|
* by adding it to the function signature.
|
|
|
|
|
*
|
2020-01-19 22:14:06 -05:00
|
|
|
|
* @link https://www.php.net/sprintf
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2019-05-25 17:59:51 -04:00
|
|
|
|
* @param string $pattern The string which formatted args are inserted.
|
|
|
|
|
* @param mixed ...$args Arguments to be formatted into the $pattern string.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The formatted string.
|
2008-02-22 00:53:47 -05:00
|
|
|
|
*/
|
2019-09-15 07:06:55 -04:00
|
|
|
|
function wp_sprintf( $pattern, ...$args ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$len = strlen( $pattern );
|
|
|
|
|
$start = 0;
|
|
|
|
|
$result = '';
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$arg_index = 0;
|
|
|
|
|
while ( $len > $start ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Last character: append and break.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( strlen( $pattern ) - 1 == $start ) {
|
|
|
|
|
$result .= substr( $pattern, -1 );
|
2008-02-22 00:53:47 -05:00
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Literal %: append and continue.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '%%' === substr( $pattern, $start, 2 ) ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$start += 2;
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$result .= '%';
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Get fragment before next %.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$end = strpos( $pattern, '%', $start + 1 );
|
|
|
|
|
if ( false === $end ) {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$end = $len;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
|
|
|
|
$fragment = substr( $pattern, $start, $end - $start );
|
2008-02-22 00:53:47 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Fragment has a specifier.
|
2020-02-09 11:55:09 -05:00
|
|
|
|
if ( '%' === $pattern[ $start ] ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Find numbered arguments or take the next one in order.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( preg_match( '/^%(\d+)\$/', $fragment, $matches ) ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
$index = $matches[1] - 1; // 0-based array vs 1-based sprintf() arguments.
|
2019-09-15 07:06:55 -04:00
|
|
|
|
$arg = isset( $args[ $index ] ) ? $args[ $index ] : '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$fragment = str_replace( "%{$matches[1]}$", '%', $fragment );
|
2008-02-22 00:53:47 -05:00
|
|
|
|
} else {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$arg = isset( $args[ $arg_index ] ) ? $args[ $arg_index ] : '';
|
2019-09-15 07:06:55 -04:00
|
|
|
|
++$arg_index;
|
2008-02-22 00:53:47 -05:00
|
|
|
|
}
|
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a fragment from the pattern passed to wp_sprintf().
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* If the fragment is unchanged, then sprintf() will be run on the fragment.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $fragment A fragment from the pattern.
|
|
|
|
|
* @param string $arg The argument.
|
|
|
|
|
*/
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$_fragment = apply_filters( 'wp_sprintf', $fragment, $arg );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $_fragment != $fragment ) {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$fragment = $_fragment;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
} else {
|
2020-10-08 17:15:13 -04:00
|
|
|
|
$fragment = sprintf( $fragment, (string) $arg );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2008-02-22 00:53:47 -05:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Append to result and move to next fragment.
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$result .= $fragment;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$start = $end;
|
2008-02-22 00:53:47 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
2008-02-22 00:53:47 -05:00
|
|
|
|
return $result;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* Localize list items before the rest of the content.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* The '%l' must be at the first characters can then contain the rest of the
|
|
|
|
|
* content. The list items will have ', ', ', and', and ' and ' added depending
|
|
|
|
|
* on the amount of list items in the $args parameter.
|
2008-02-22 00:53:47 -05:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $pattern Content containing '%l' at the beginning.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param array $args List items to prepend to the content and replace '%l'.
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @return string Localized list items and rest of the content.
|
2008-02-22 00:53:47 -05:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function wp_sprintf_l( $pattern, $args ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Not a match.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '%l' !== substr( $pattern, 0, 2 ) ) {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
return $pattern;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2008-02-22 00:53:47 -05:00
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Nothing to work with.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( empty( $args ) ) {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
return '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2008-02-22 00:53:47 -05:00
|
|
|
|
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the translated delimiters used by wp_sprintf_l().
|
2014-02-26 11:50:15 -05:00
|
|
|
|
* Placeholders (%s) are included to assist translators and then
|
|
|
|
|
* removed before the array of strings reaches the filter.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* Please note: Ampersands and entities should be avoided here.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.5.0
|
|
|
|
|
*
|
|
|
|
|
* @param array $delimiters An array of translated delimiters.
|
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$l = apply_filters(
|
2018-08-16 21:51:36 -04:00
|
|
|
|
'wp_sprintf_l',
|
|
|
|
|
array(
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Used to join items in a list with more than 2 items. */
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'between' => sprintf( __( '%1$s, %2$s' ), '', '' ),
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Used to join last two items in a list with more than 2 times. */
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'between_last_two' => sprintf( __( '%1$s, and %2$s' ), '', '' ),
|
2019-09-02 20:41:05 -04:00
|
|
|
|
/* translators: Used to join items in a list with only 2 items. */
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'between_only_two' => sprintf( __( '%1$s and %2$s' ), '', '' ),
|
|
|
|
|
)
|
|
|
|
|
);
|
|
|
|
|
|
|
|
|
|
$args = (array) $args;
|
|
|
|
|
$result = array_shift( $args );
|
|
|
|
|
if ( count( $args ) == 1 ) {
|
|
|
|
|
$result .= $l['between_only_two'] . array_shift( $args );
|
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
|
|
|
|
// Loop when more than two args.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$i = count( $args );
|
2008-10-15 16:47:56 -04:00
|
|
|
|
while ( $i ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$arg = array_shift( $args );
|
2008-10-15 16:47:56 -04:00
|
|
|
|
$i--;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( 0 == $i ) {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$result .= $l['between_last_two'] . $arg;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
} else {
|
2008-02-22 00:53:47 -05:00
|
|
|
|
$result .= $l['between'] . $arg;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2008-02-22 00:53:47 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
return $result . substr( $pattern, 2 );
|
2008-02-22 00:53:47 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-03-03 16:05:23 -05:00
|
|
|
|
/**
|
2020-06-28 10:02:06 -04:00
|
|
|
|
* Safely extracts not more than the first $count characters from HTML string.
|
2008-03-03 16:05:23 -05:00
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* UTF-8, tags and entities safe prefix extraction. Entities inside will *NOT*
|
|
|
|
|
* be counted as one character. For example & will be counted as 4, < as
|
|
|
|
|
* 3, etc.
|
2008-03-03 16:05:23 -05:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.5.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $str String to get the excerpt from.
|
|
|
|
|
* @param int $count Maximum number of characters to take.
|
|
|
|
|
* @param string $more Optional. What to append if $str needs to be trimmed. Defaults to empty string.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The excerpt.
|
2008-03-03 16:05:23 -05:00
|
|
|
|
*/
|
2013-05-08 20:22:02 -04:00
|
|
|
|
function wp_html_excerpt( $str, $count, $more = null ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( null === $more ) {
|
2013-05-08 20:22:02 -04:00
|
|
|
|
$more = '';
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$str = wp_strip_all_tags( $str, true );
|
2013-05-08 20:22:02 -04:00
|
|
|
|
$excerpt = mb_substr( $str, 0, $count );
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
|
|
|
|
// Remove part of an entity at the end.
|
2013-05-08 20:22:02 -04:00
|
|
|
|
$excerpt = preg_replace( '/&[^;\s]{0,6}$/', '', $excerpt );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $str != $excerpt ) {
|
2013-05-08 20:22:02 -04:00
|
|
|
|
$excerpt = trim( $excerpt ) . $more;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
|
2013-05-08 20:22:02 -04:00
|
|
|
|
return $excerpt;
|
2008-03-03 16:05:23 -05:00
|
|
|
|
}
|
|
|
|
|
|
2008-08-04 17:01:09 -04:00
|
|
|
|
/**
|
|
|
|
|
* Add a Base url to relative links in passed content.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* By default it supports the 'src' and 'href' attributes. However this can be
|
|
|
|
|
* changed via the 3rd param.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.7.0
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global string $_links_add_base
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $content String to search for links in.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $base The base URL to prefix to links.
|
|
|
|
|
* @param array $attrs The attributes which should be processed.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The processed content.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
function links_add_base_url( $content, $base, $attrs = array( 'src', 'href' ) ) {
|
2011-02-16 14:24:18 -05:00
|
|
|
|
global $_links_add_base;
|
|
|
|
|
$_links_add_base = $base;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$attrs = implode( '|', (array) $attrs );
|
2011-02-16 14:24:18 -05:00
|
|
|
|
return preg_replace_callback( "!($attrs)=(['\"])(.+?)\\2!i", '_links_add_base', $content );
|
2008-08-04 17:01:09 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Callback to add a base url to relative links in passed content.
|
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.7.0
|
|
|
|
|
* @access private
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global string $_links_add_base
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $m The matched link.
|
|
|
|
|
* @return string The processed link.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function _links_add_base( $m ) {
|
2011-02-16 14:24:18 -05:00
|
|
|
|
global $_links_add_base;
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// 1 = attribute name 2 = quotation mark 3 = URL.
|
2008-08-09 01:36:14 -04:00
|
|
|
|
return $m[1] . '=' . $m[2] .
|
2020-04-04 23:02:11 -04:00
|
|
|
|
( preg_match( '#^(\w{1,20}):#', $m[3], $protocol ) && in_array( $protocol[1], wp_allowed_protocols(), true ) ?
|
2012-04-14 15:14:10 -04:00
|
|
|
|
$m[3] :
|
2015-09-14 13:37:25 -04:00
|
|
|
|
WP_Http::make_absolute_url( $m[3], $_links_add_base )
|
2014-12-06 22:19:23 -05:00
|
|
|
|
)
|
2008-08-04 17:01:09 -04:00
|
|
|
|
. $m[2];
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Adds a Target attribute to all links in passed content.
|
|
|
|
|
*
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* This function by default only applies to `<a>` tags, however this can be
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* modified by the 3rd param.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* *NOTE:* Any current target attributed will be stripped and replaced.
|
2008-08-30 17:28:11 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.7.0
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global string $_links_add_target
|
|
|
|
|
*
|
2019-10-26 17:09:04 -04:00
|
|
|
|
* @param string $content String to search for links in.
|
|
|
|
|
* @param string $target The Target to add to the links.
|
|
|
|
|
* @param string[] $tags An array of tags to apply to.
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @return string The processed content.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
function links_add_target( $content, $target = '_blank', $tags = array( 'a' ) ) {
|
2011-02-16 14:24:18 -05:00
|
|
|
|
global $_links_add_target;
|
|
|
|
|
$_links_add_target = $target;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tags = implode( '|', (array) $tags );
|
2020-09-17 06:14:07 -04:00
|
|
|
|
return preg_replace_callback( "!<($tags)((\s[^>]*)?)>!i", '_links_add_target', $content );
|
2008-08-04 17:01:09 -04:00
|
|
|
|
}
|
2009-09-14 09:57:48 -04:00
|
|
|
|
|
2008-08-04 17:01:09 -04:00
|
|
|
|
/**
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* Callback to add a target attribute to all links in passed content.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2008-08-30 17:28:11 -04:00
|
|
|
|
* @since 2.7.0
|
|
|
|
|
* @access private
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @global string $_links_add_target
|
|
|
|
|
*
|
2008-08-27 02:49:21 -04:00
|
|
|
|
* @param string $m The matched link.
|
|
|
|
|
* @return string The processed link.
|
2008-08-04 17:01:09 -04:00
|
|
|
|
*/
|
2011-02-16 14:24:18 -05:00
|
|
|
|
function _links_add_target( $m ) {
|
|
|
|
|
global $_links_add_target;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tag = $m[1];
|
|
|
|
|
$link = preg_replace( '|( target=([\'"])(.*?)\2)|i', '', $m[2] );
|
2011-02-16 14:24:18 -05:00
|
|
|
|
return '<' . $tag . $link . ' target="' . esc_attr( $_links_add_target ) . '">';
|
2008-08-04 17:01:09 -04:00
|
|
|
|
}
|
|
|
|
|
|
2013-02-01 13:07:08 -05:00
|
|
|
|
/**
|
|
|
|
|
* Normalize EOL characters and strip duplicate whitespace.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.7.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $str The string to normalize.
|
|
|
|
|
* @return string The normalized string.
|
|
|
|
|
*/
|
2008-10-23 16:03:16 -04:00
|
|
|
|
function normalize_whitespace( $str ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$str = trim( $str );
|
|
|
|
|
$str = str_replace( "\r", "\n", $str );
|
|
|
|
|
$str = preg_replace( array( '/\n+/', '/[ \t]+/' ), array( "\n", ' ' ), $str );
|
2008-10-23 16:03:16 -04:00
|
|
|
|
return $str;
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-14 09:57:48 -04:00
|
|
|
|
/**
|
|
|
|
|
* Properly strip all HTML tags including script and style
|
2014-02-04 20:43:12 -05:00
|
|
|
|
*
|
|
|
|
|
* This differs from strip_tags() because it removes the contents of
|
2014-11-24 00:30:25 -05:00
|
|
|
|
* the `<script>` and `<style>` tags. E.g. `strip_tags( '<script>something</script>' )`
|
2014-01-26 22:16:11 -05:00
|
|
|
|
* will return 'something'. wp_strip_all_tags will return ''
|
2009-09-14 09:57:48 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $string String containing HTML tags
|
|
|
|
|
* @param bool $remove_breaks Optional. Whether to remove left over line breaks and white space chars
|
2009-09-14 09:57:48 -04:00
|
|
|
|
* @return string The processed string.
|
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
function wp_strip_all_tags( $string, $remove_breaks = false ) {
|
2009-09-14 09:57:48 -04:00
|
|
|
|
$string = preg_replace( '@<(script|style)[^>]*?>.*?</\\1>@si', '', $string );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$string = strip_tags( $string );
|
2009-09-14 09:57:48 -04:00
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( $remove_breaks ) {
|
|
|
|
|
$string = preg_replace( '/[\r\n\t ]+/', ' ', $string );
|
|
|
|
|
}
|
2009-09-14 09:57:48 -04:00
|
|
|
|
|
2012-05-01 17:05:02 -04:00
|
|
|
|
return trim( $string );
|
2009-09-14 09:57:48 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2016-06-26 10:26:29 -04:00
|
|
|
|
* Sanitizes a string from user input or from the database.
|
2009-09-14 09:57:48 -04:00
|
|
|
|
*
|
2016-06-26 10:26:29 -04:00
|
|
|
|
* - Checks for invalid UTF-8,
|
|
|
|
|
* - Converts single `<` characters to entities
|
|
|
|
|
* - Strips all tags
|
|
|
|
|
* - Removes line breaks, tabs, and extra whitespace
|
|
|
|
|
* - Strips octets
|
2009-09-14 09:57:48 -04:00
|
|
|
|
*
|
2010-03-26 15:23:39 -04:00
|
|
|
|
* @since 2.9.0
|
2009-09-14 09:57:48 -04:00
|
|
|
|
*
|
2016-10-26 01:17:35 -04:00
|
|
|
|
* @see sanitize_textarea_field()
|
2016-06-26 10:26:29 -04:00
|
|
|
|
* @see wp_check_invalid_utf8()
|
|
|
|
|
* @see wp_strip_all_tags()
|
|
|
|
|
*
|
|
|
|
|
* @param string $str String to sanitize.
|
|
|
|
|
* @return string Sanitized string.
|
2009-09-14 09:57:48 -04:00
|
|
|
|
*/
|
2015-05-25 02:25:25 -04:00
|
|
|
|
function sanitize_text_field( $str ) {
|
2016-10-26 01:17:35 -04:00
|
|
|
|
$filtered = _sanitize_text_fields( $str, false );
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Filters a sanitized text field string.
|
|
|
|
|
*
|
|
|
|
|
* @since 2.9.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $filtered The sanitized string.
|
|
|
|
|
* @param string $str The string prior to being sanitized.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'sanitize_text_field', $filtered, $str );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Sanitizes a multiline string from user input or from the database.
|
|
|
|
|
*
|
|
|
|
|
* The function is like sanitize_text_field(), but preserves
|
|
|
|
|
* new lines (\n) and other whitespace, which are legitimate
|
|
|
|
|
* input in textarea elements.
|
|
|
|
|
*
|
|
|
|
|
* @see sanitize_text_field()
|
|
|
|
|
*
|
|
|
|
|
* @since 4.7.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $str String to sanitize.
|
|
|
|
|
* @return string Sanitized string.
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_textarea_field( $str ) {
|
|
|
|
|
$filtered = _sanitize_text_fields( $str, true );
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Filters a sanitized textarea field string.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.7.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $filtered The sanitized string.
|
|
|
|
|
* @param string $str The string prior to being sanitized.
|
|
|
|
|
*/
|
|
|
|
|
return apply_filters( 'sanitize_textarea_field', $filtered, $str );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Internal helper function to sanitize a string from user input or from the db
|
|
|
|
|
*
|
|
|
|
|
* @since 4.7.0
|
|
|
|
|
* @access private
|
|
|
|
|
*
|
2020-07-23 17:11:05 -04:00
|
|
|
|
* @param string $str String to sanitize.
|
|
|
|
|
* @param bool $keep_newlines Optional. Whether to keep newlines. Default: false.
|
2016-10-26 01:17:35 -04:00
|
|
|
|
* @return string Sanitized string.
|
|
|
|
|
*/
|
|
|
|
|
function _sanitize_text_fields( $str, $keep_newlines = false ) {
|
2019-02-07 18:35:49 -05:00
|
|
|
|
if ( is_object( $str ) || is_array( $str ) ) {
|
2019-01-16 01:05:49 -05:00
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
2019-02-07 18:35:49 -05:00
|
|
|
|
$str = (string) $str;
|
|
|
|
|
|
2009-09-14 09:57:48 -04:00
|
|
|
|
$filtered = wp_check_invalid_utf8( $str );
|
|
|
|
|
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( strpos( $filtered, '<' ) !== false ) {
|
2009-09-14 09:57:48 -04:00
|
|
|
|
$filtered = wp_pre_kses_less_than( $filtered );
|
2009-12-23 04:52:48 -05:00
|
|
|
|
// This will strip extra whitespace for us.
|
2016-10-26 01:17:35 -04:00
|
|
|
|
$filtered = wp_strip_all_tags( $filtered, false );
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Use HTML entities in a special case to make sure no later
|
|
|
|
|
// newline stripping stage could lead to a functional tag.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$filtered = str_replace( "<\n", "<\n", $filtered );
|
2016-10-26 01:17:35 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( ! $keep_newlines ) {
|
|
|
|
|
$filtered = preg_replace( '/[\r\n\t ]+/', ' ', $filtered );
|
2009-09-14 09:57:48 -04:00
|
|
|
|
}
|
2016-10-26 01:17:35 -04:00
|
|
|
|
$filtered = trim( $filtered );
|
2009-09-14 09:57:48 -04:00
|
|
|
|
|
2009-12-23 06:00:29 -05:00
|
|
|
|
$found = false;
|
2017-11-30 18:11:00 -05:00
|
|
|
|
while ( preg_match( '/%[a-f0-9]{2}/i', $filtered, $match ) ) {
|
|
|
|
|
$filtered = str_replace( $match[0], '', $filtered );
|
|
|
|
|
$found = true;
|
2009-12-23 06:00:29 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( $found ) {
|
|
|
|
|
// Strip out the whitespace that may now exist after removing the octets.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$filtered = trim( preg_replace( '/ +/', ' ', $filtered ) );
|
2009-12-23 04:52:48 -05:00
|
|
|
|
}
|
2009-09-14 09:57:48 -04:00
|
|
|
|
|
2016-10-26 01:17:35 -04:00
|
|
|
|
return $filtered;
|
2009-09-14 09:57:48 -04:00
|
|
|
|
}
|
|
|
|
|
|
2010-11-02 13:19:55 -04:00
|
|
|
|
/**
|
|
|
|
|
* i18n friendly version of basename()
|
|
|
|
|
*
|
|
|
|
|
* @since 3.1.0
|
|
|
|
|
*
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @param string $path A path.
|
2010-11-02 13:19:55 -04:00
|
|
|
|
* @param string $suffix If the filename ends in suffix this will also be cut off.
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
|
|
|
|
function wp_basename( $path, $suffix = '' ) {
|
2012-10-25 18:31:17 -04:00
|
|
|
|
return urldecode( basename( str_replace( array( '%2F', '%5C' ), '/', urlencode( $path ) ), $suffix ) );
|
2010-11-02 13:19:55 -04:00
|
|
|
|
}
|
|
|
|
|
|
2018-01-08 05:36:51 -05:00
|
|
|
|
// phpcs:disable WordPress.WP.CapitalPDangit.Misspelled, WordPress.NamingConventions.ValidFunctionName.FunctionNameInvalid -- 8-)
|
2010-05-27 12:11:27 -04:00
|
|
|
|
/**
|
2018-01-08 05:36:51 -05:00
|
|
|
|
* Forever eliminate "Wordpress" from the planet (or at least the little bit we can influence).
|
2010-05-27 12:11:27 -04:00
|
|
|
|
*
|
|
|
|
|
* Violating our coding standards for a good function name.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.0.0
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2015-12-06 17:02:27 -05:00
|
|
|
|
* @param string $text The text to be modified.
|
|
|
|
|
* @return string The modified text.
|
2010-05-27 12:11:27 -04:00
|
|
|
|
*/
|
|
|
|
|
function capital_P_dangit( $text ) {
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Simple replacement for titles.
|
2013-11-12 22:56:09 -05:00
|
|
|
|
$current_filter = current_filter();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( 'the_title' === $current_filter || 'wp_title' === $current_filter ) {
|
2018-01-08 05:36:51 -05:00
|
|
|
|
return str_replace( 'Wordpress', 'WordPress', $text );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
}
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Still here? Use the more judicious replacement.
|
2010-07-08 15:35:29 -04:00
|
|
|
|
static $dblq = false;
|
2015-05-29 11:43:29 -04:00
|
|
|
|
if ( false === $dblq ) {
|
2012-07-09 01:08:43 -04:00
|
|
|
|
$dblq = _x( '“', 'opening curly double quote' );
|
2015-05-29 11:43:29 -04:00
|
|
|
|
}
|
2010-07-08 15:35:29 -04:00
|
|
|
|
return str_replace(
|
|
|
|
|
array( ' Wordpress', '‘Wordpress', $dblq . 'Wordpress', '>Wordpress', '(Wordpress' ),
|
|
|
|
|
array( ' WordPress', '‘WordPress', $dblq . 'WordPress', '>WordPress', '(WordPress' ),
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$text
|
|
|
|
|
);
|
2010-05-27 12:11:27 -04:00
|
|
|
|
}
|
2018-01-08 05:36:51 -05:00
|
|
|
|
// phpcs:enable
|
2010-05-27 12:11:27 -04:00
|
|
|
|
|
2011-05-22 19:19:42 -04:00
|
|
|
|
/**
|
|
|
|
|
* Sanitize a mime type
|
|
|
|
|
*
|
2011-05-25 11:47:17 -04:00
|
|
|
|
* @since 3.1.3
|
2011-05-22 19:19:42 -04:00
|
|
|
|
*
|
|
|
|
|
* @param string $mime_type Mime type
|
|
|
|
|
* @return string Sanitized mime type
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_mime_type( $mime_type ) {
|
2011-06-20 16:05:57 -04:00
|
|
|
|
$sani_mime_type = preg_replace( '/[^-+*.a-zA-Z0-9\/]/', '', $mime_type );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a mime type following sanitization.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* @since 3.1.3
|
|
|
|
|
*
|
|
|
|
|
* @param string $sani_mime_type The sanitized mime type.
|
|
|
|
|
* @param string $mime_type The mime type prior to sanitization.
|
|
|
|
|
*/
|
2011-05-22 19:19:42 -04:00
|
|
|
|
return apply_filters( 'sanitize_mime_type', $sani_mime_type, $mime_type );
|
|
|
|
|
}
|
|
|
|
|
|
2012-01-04 14:45:13 -05:00
|
|
|
|
/**
|
|
|
|
|
* Sanitize space or carriage return separated URLs that are used to send trackbacks.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $to_ping Space or carriage return separated URLs
|
|
|
|
|
* @return string URLs starting with the http or https protocol, separated by a carriage return.
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_trackback_urls( $to_ping ) {
|
2012-09-03 23:36:19 -04:00
|
|
|
|
$urls_to_ping = preg_split( '/[\r\n\t ]/', trim( $to_ping ), -1, PREG_SPLIT_NO_EMPTY );
|
2012-01-04 14:45:13 -05:00
|
|
|
|
foreach ( $urls_to_ping as $k => $url ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( ! preg_match( '#^https?://.#i', $url ) ) {
|
|
|
|
|
unset( $urls_to_ping[ $k ] );
|
|
|
|
|
}
|
2012-01-04 14:45:13 -05:00
|
|
|
|
}
|
|
|
|
|
$urls_to_ping = array_map( 'esc_url_raw', $urls_to_ping );
|
|
|
|
|
$urls_to_ping = implode( "\n", $urls_to_ping );
|
2013-11-30 13:36:10 -05:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters a list of trackback URLs following sanitization.
|
2013-11-30 13:36:10 -05:00
|
|
|
|
*
|
|
|
|
|
* The string returned here consists of a space or carriage return-delimited list
|
|
|
|
|
* of trackback URLs.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $urls_to_ping Sanitized space or carriage return separated URLs.
|
|
|
|
|
* @param string $to_ping Space or carriage return separated URLs before sanitization.
|
|
|
|
|
*/
|
2012-01-04 14:45:13 -05:00
|
|
|
|
return apply_filters( 'sanitize_trackback_urls', $urls_to_ping, $to_ping );
|
|
|
|
|
}
|
2013-03-01 11:34:48 -05:00
|
|
|
|
|
|
|
|
|
/**
|
2021-01-17 11:38:06 -05:00
|
|
|
|
* Adds slashes to a string or recursively adds slashes to strings within an array.
|
2013-03-01 11:34:48 -05:00
|
|
|
|
*
|
|
|
|
|
* This should be used when preparing data for core API that expects slashed data.
|
|
|
|
|
* This should not be used to escape data going directly into an SQL query.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.6.0
|
2020-07-11 18:48:07 -04:00
|
|
|
|
* @since 5.5.0 Non-string values are left untouched.
|
2013-03-01 11:34:48 -05:00
|
|
|
|
*
|
2021-01-17 11:38:06 -05:00
|
|
|
|
* @param string|array $value String or array of data to slash.
|
2021-12-07 07:20:02 -05:00
|
|
|
|
* @return string|array Slashed `$value`.
|
2013-03-01 11:34:48 -05:00
|
|
|
|
*/
|
|
|
|
|
function wp_slash( $value ) {
|
|
|
|
|
if ( is_array( $value ) ) {
|
Formatting: Prevent wp_slash from returning non-strings as strings.
If a bool/float/int is passed into wp_slash it will be coerced into a string.
This changes the behavior to only slash strings. At the same time, handles recursion a little nicer by calling array_map for arrays.
Fixes #42195, #24106.
Props johnbillion, andizer, jrf, ryotasakamoto, SergeyBiryukov, donmhico, TobiasBg, markoheijnen, ryan, nacin, devesine, whyisjake.
Built from https://develop.svn.wordpress.org/trunk@48433
git-svn-id: http://core.svn.wordpress.org/trunk@48202 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2020-07-10 20:13:04 -04:00
|
|
|
|
$value = array_map( 'wp_slash', $value );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( is_string( $value ) ) {
|
|
|
|
|
return addslashes( $value );
|
2013-03-01 11:34:48 -05:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $value;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2021-01-17 11:38:06 -05:00
|
|
|
|
* Removes slashes from a string or recursively removes slashes from strings within an array.
|
2013-03-01 11:34:48 -05:00
|
|
|
|
*
|
|
|
|
|
* This should be used to remove slashes from data passed to core API that
|
|
|
|
|
* expects data to be unslashed.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.6.0
|
|
|
|
|
*
|
2021-01-17 11:38:06 -05:00
|
|
|
|
* @param string|array $value String or array of data to unslash.
|
2021-12-07 07:20:02 -05:00
|
|
|
|
* @return string|array Unslashed `$value`.
|
2013-03-01 11:34:48 -05:00
|
|
|
|
*/
|
|
|
|
|
function wp_unslash( $value ) {
|
|
|
|
|
return stripslashes_deep( $value );
|
2013-07-12 15:38:37 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Extract and return the first URL from passed content.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.6.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $content A string which might contain a URL.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
* @return string|false The found URL.
|
2013-07-12 15:38:37 -04:00
|
|
|
|
*/
|
|
|
|
|
function get_url_in_content( $content ) {
|
2014-01-17 02:47:10 -05:00
|
|
|
|
if ( empty( $content ) ) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
2013-07-12 15:38:37 -04:00
|
|
|
|
|
2014-01-17 02:47:10 -05:00
|
|
|
|
if ( preg_match( '/<a\s[^>]*?href=([\'"])(.+?)\1/is', $content, $matches ) ) {
|
2013-07-12 15:38:37 -04:00
|
|
|
|
return esc_url_raw( $matches[2] );
|
2014-01-17 02:47:10 -05:00
|
|
|
|
}
|
2013-07-12 15:38:37 -04:00
|
|
|
|
|
|
|
|
|
return false;
|
|
|
|
|
}
|
2014-06-09 15:30:14 -04:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Returns the regexp for common whitespace characters.
|
|
|
|
|
*
|
|
|
|
|
* By default, spaces include new lines, tabs, nbsp entities, and the UTF-8 nbsp.
|
2020-01-28 19:45:18 -05:00
|
|
|
|
* This is designed to replace the PCRE \s sequence. In ticket #22692, that
|
2014-06-09 15:30:14 -04:00
|
|
|
|
* sequence was found to be unreliable due to random inclusion of the A0 byte.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.0.0
|
|
|
|
|
*
|
|
|
|
|
* @return string The spaces regexp.
|
|
|
|
|
*/
|
|
|
|
|
function wp_spaces_regexp() {
|
2015-05-29 11:43:29 -04:00
|
|
|
|
static $spaces = '';
|
2014-06-09 15:30:14 -04:00
|
|
|
|
|
|
|
|
|
if ( empty( $spaces ) ) {
|
2014-06-09 21:55:15 -04:00
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the regexp for common whitespace characters.
|
2014-06-09 21:55:15 -04:00
|
|
|
|
*
|
2014-06-10 02:46:15 -04:00
|
|
|
|
* This string is substituted for the \s sequence as needed in regular
|
|
|
|
|
* expressions. For websites not written in English, different characters
|
|
|
|
|
* may represent whitespace. For websites not encoded in UTF-8, the 0xC2 0xA0
|
|
|
|
|
* sequence may not be in use.
|
2014-06-09 21:55:15 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.0.0
|
|
|
|
|
*
|
2014-06-10 02:46:15 -04:00
|
|
|
|
* @param string $spaces Regexp pattern for matching common whitespace characters.
|
2014-06-09 21:55:15 -04:00
|
|
|
|
*/
|
2014-06-09 15:30:14 -04:00
|
|
|
|
$spaces = apply_filters( 'wp_spaces_regexp', '[\r\n\t ]|\xC2\xA0| ' );
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $spaces;
|
2014-06-09 21:55:15 -04:00
|
|
|
|
}
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Print the important emoji-related styles.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.2.0
|
|
|
|
|
*/
|
|
|
|
|
function print_emoji_styles() {
|
2015-03-24 19:33:32 -04:00
|
|
|
|
static $printed = false;
|
|
|
|
|
|
|
|
|
|
if ( $printed ) {
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$printed = true;
|
2019-09-18 10:50:56 -04:00
|
|
|
|
|
|
|
|
|
$type_attr = current_theme_supports( 'html5', 'style' ) ? '' : ' type="text/css"';
|
2018-08-16 21:51:36 -04:00
|
|
|
|
?>
|
2019-09-18 10:50:56 -04:00
|
|
|
|
<style<?php echo $type_attr; ?>>
|
2015-03-11 18:49:28 -04:00
|
|
|
|
img.wp-smiley,
|
|
|
|
|
img.emoji {
|
2015-03-13 14:45:27 -04:00
|
|
|
|
display: inline !important;
|
2015-03-11 18:49:28 -04:00
|
|
|
|
border: none !important;
|
|
|
|
|
box-shadow: none !important;
|
|
|
|
|
height: 1em !important;
|
|
|
|
|
width: 1em !important;
|
2021-10-18 12:53:57 -04:00
|
|
|
|
margin: 0 0.07em !important;
|
2015-03-11 18:49:28 -04:00
|
|
|
|
vertical-align: -0.1em !important;
|
|
|
|
|
background: none !important;
|
|
|
|
|
padding: 0 !important;
|
|
|
|
|
}
|
|
|
|
|
</style>
|
2018-08-16 21:51:36 -04:00
|
|
|
|
<?php
|
2015-03-11 18:49:28 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-05-25 02:25:25 -04:00
|
|
|
|
/**
|
2016-05-20 02:03:27 -04:00
|
|
|
|
* Print the inline Emoji detection script if it is not already printed.
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*
|
2016-05-20 02:03:27 -04:00
|
|
|
|
* @since 4.2.0
|
2015-05-25 02:25:25 -04:00
|
|
|
|
*/
|
2015-03-24 19:33:32 -04:00
|
|
|
|
function print_emoji_detection_script() {
|
|
|
|
|
static $printed = false;
|
|
|
|
|
|
|
|
|
|
if ( $printed ) {
|
|
|
|
|
return;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$printed = true;
|
|
|
|
|
|
2016-05-20 02:03:27 -04:00
|
|
|
|
_print_emoji_detection_script();
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2019-10-12 22:48:01 -04:00
|
|
|
|
* Prints inline Emoji detection script.
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*
|
|
|
|
|
* @ignore
|
|
|
|
|
* @since 4.6.0
|
|
|
|
|
* @access private
|
|
|
|
|
*/
|
|
|
|
|
function _print_emoji_detection_script() {
|
2015-03-24 19:33:32 -04:00
|
|
|
|
$settings = array(
|
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the URL where emoji png images are hosted.
|
2015-03-24 19:33:32 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.2.0
|
|
|
|
|
*
|
2019-10-27 15:11:02 -04:00
|
|
|
|
* @param string $url The emoji base URL for png images.
|
2015-03-24 19:33:32 -04:00
|
|
|
|
*/
|
2021-06-08 18:15:12 -04:00
|
|
|
|
'baseUrl' => apply_filters( 'emoji_url', 'https://s.w.org/images/core/emoji/13.1.0/72x72/' ),
|
2015-03-24 19:33:32 -04:00
|
|
|
|
|
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the extension of the emoji png files.
|
2015-03-24 19:33:32 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.2.0
|
|
|
|
|
*
|
2019-10-27 15:11:02 -04:00
|
|
|
|
* @param string $extension The emoji extension for png files. Default .png.
|
2015-03-24 19:33:32 -04:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'ext' => apply_filters( 'emoji_ext', '.png' ),
|
2016-05-20 02:03:27 -04:00
|
|
|
|
|
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the URL where emoji SVG images are hosted.
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*
|
2016-05-20 02:15:27 -04:00
|
|
|
|
* @since 4.6.0
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*
|
2019-10-27 15:11:02 -04:00
|
|
|
|
* @param string $url The emoji base URL for svg images.
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*/
|
2021-06-08 18:15:12 -04:00
|
|
|
|
'svgUrl' => apply_filters( 'emoji_svg_url', 'https://s.w.org/images/core/emoji/13.1.0/svg/' ),
|
2016-05-20 02:03:27 -04:00
|
|
|
|
|
|
|
|
|
/**
|
2016-05-22 14:45:28 -04:00
|
|
|
|
* Filters the extension of the emoji SVG files.
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*
|
2016-05-20 02:15:27 -04:00
|
|
|
|
* @since 4.6.0
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*
|
2019-10-27 15:11:02 -04:00
|
|
|
|
* @param string $extension The emoji extension for svg files. Default .svg.
|
2016-05-20 02:03:27 -04:00
|
|
|
|
*/
|
2017-11-30 18:11:00 -05:00
|
|
|
|
'svgExt' => apply_filters( 'emoji_svg_ext', '.svg' ),
|
2015-03-24 19:33:32 -04:00
|
|
|
|
);
|
|
|
|
|
|
2021-11-10 21:49:18 -05:00
|
|
|
|
$version = 'ver=' . get_bloginfo( 'version' );
|
2015-03-24 19:33:32 -04:00
|
|
|
|
|
2015-06-24 22:29:31 -04:00
|
|
|
|
if ( SCRIPT_DEBUG ) {
|
2015-03-24 19:33:32 -04:00
|
|
|
|
$settings['source'] = array(
|
2015-04-09 07:07:28 -04:00
|
|
|
|
/** This filter is documented in wp-includes/class.wp-scripts.php */
|
|
|
|
|
'wpemoji' => apply_filters( 'script_loader_src', includes_url( "js/wp-emoji.js?$version" ), 'wpemoji' ),
|
|
|
|
|
/** This filter is documented in wp-includes/class.wp-scripts.php */
|
|
|
|
|
'twemoji' => apply_filters( 'script_loader_src', includes_url( "js/twemoji.js?$version" ), 'twemoji' ),
|
2015-03-24 19:33:32 -04:00
|
|
|
|
);
|
|
|
|
|
} else {
|
|
|
|
|
$settings['source'] = array(
|
2015-04-09 07:07:28 -04:00
|
|
|
|
/** This filter is documented in wp-includes/class.wp-scripts.php */
|
|
|
|
|
'concatemoji' => apply_filters( 'script_loader_src', includes_url( "js/wp-emoji-release.min.js?$version" ), 'concatemoji' ),
|
2015-03-24 19:33:32 -04:00
|
|
|
|
);
|
|
|
|
|
}
|
2021-11-10 21:49:18 -05:00
|
|
|
|
|
|
|
|
|
wp_print_inline_script_tag(
|
2021-12-06 05:14:06 -05:00
|
|
|
|
sprintf( 'window._wpemojiSettings = %s;', wp_json_encode( $settings ) ) . "\n" .
|
2021-11-10 21:49:18 -05:00
|
|
|
|
file_get_contents( sprintf( ABSPATH . WPINC . '/js/wp-emoji-loader' . wp_scripts_get_suffix() . '.js' ) )
|
|
|
|
|
);
|
2015-03-24 19:33:32 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-03-11 18:49:28 -04:00
|
|
|
|
/**
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
* Convert emoji characters to their equivalent HTML entity.
|
2015-03-11 18:49:28 -04:00
|
|
|
|
*
|
|
|
|
|
* This allows us to store emoji in a DB using the utf8 character set.
|
|
|
|
|
*
|
|
|
|
|
* @since 4.2.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $content The content to encode.
|
|
|
|
|
* @return string The encoded content.
|
|
|
|
|
*/
|
|
|
|
|
function wp_encode_emoji( $content ) {
|
2019-09-20 18:02:57 -04:00
|
|
|
|
$emoji = _wp_emoji_list( 'partials' );
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
|
2017-10-03 03:12:50 -04:00
|
|
|
|
foreach ( $emoji as $emojum ) {
|
2019-09-20 18:02:57 -04:00
|
|
|
|
$emoji_char = html_entity_decode( $emojum );
|
2017-10-03 03:12:50 -04:00
|
|
|
|
if ( false !== strpos( $content, $emoji_char ) ) {
|
|
|
|
|
$content = preg_replace( "/$emoji_char/", $emojum, $content );
|
2015-03-11 18:49:28 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $content;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
2015-03-15 21:43:28 -04:00
|
|
|
|
* Convert emoji to a static img element.
|
2015-03-11 18:49:28 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 4.2.0
|
|
|
|
|
*
|
2015-03-12 09:17:26 -04:00
|
|
|
|
* @param string $text The content to encode.
|
2015-03-11 18:49:28 -04:00
|
|
|
|
* @return string The encoded content.
|
|
|
|
|
*/
|
2015-03-12 09:17:26 -04:00
|
|
|
|
function wp_staticize_emoji( $text ) {
|
2017-10-03 03:12:50 -04:00
|
|
|
|
if ( false === strpos( $text, '&#x' ) ) {
|
|
|
|
|
if ( ( function_exists( 'mb_check_encoding' ) && mb_check_encoding( $text, 'ASCII' ) ) || ! preg_match( '/[^\x00-\x7F]/', $text ) ) {
|
|
|
|
|
// The text doesn't contain anything that might be emoji, so we can return early.
|
|
|
|
|
return $text;
|
|
|
|
|
} else {
|
|
|
|
|
$encoded_text = wp_encode_emoji( $text );
|
|
|
|
|
if ( $encoded_text === $text ) {
|
|
|
|
|
return $encoded_text;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$text = $encoded_text;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$emoji = _wp_emoji_list( 'entities' );
|
|
|
|
|
|
|
|
|
|
// Quickly narrow down the list of emoji that might be in the text and need replacing.
|
|
|
|
|
$possible_emoji = array();
|
2017-11-30 18:11:00 -05:00
|
|
|
|
foreach ( $emoji as $emojum ) {
|
2017-10-03 03:12:50 -04:00
|
|
|
|
if ( false !== strpos( $text, $emojum ) ) {
|
2019-09-20 18:02:57 -04:00
|
|
|
|
$possible_emoji[ $emojum ] = html_entity_decode( $emojum );
|
2017-10-03 03:12:50 -04:00
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
if ( ! $possible_emoji ) {
|
|
|
|
|
return $text;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
2021-06-08 18:15:12 -04:00
|
|
|
|
$cdn_url = apply_filters( 'emoji_url', 'https://s.w.org/images/core/emoji/13.1.0/72x72/' );
|
2017-10-03 03:12:50 -04:00
|
|
|
|
|
|
|
|
|
/** This filter is documented in wp-includes/formatting.php */
|
|
|
|
|
$ext = apply_filters( 'emoji_ext', '.png' );
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2015-03-12 09:17:26 -04:00
|
|
|
|
$output = '';
|
2015-03-15 21:43:28 -04:00
|
|
|
|
/*
|
2015-03-15 21:56:27 -04:00
|
|
|
|
* HTML loop taken from smiley function, which was taken from texturize function.
|
2015-03-15 21:43:28 -04:00
|
|
|
|
* It'll never be consolidated.
|
|
|
|
|
*
|
|
|
|
|
* First, capture the tags as well as in between.
|
|
|
|
|
*/
|
|
|
|
|
$textarr = preg_split( '/(<.*>)/U', $text, -1, PREG_SPLIT_DELIM_CAPTURE );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$stop = count( $textarr );
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2015-03-15 21:43:28 -04:00
|
|
|
|
// Ignore processing of specific tags.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$tags_to_ignore = 'code|pre|style|script|textarea';
|
2015-03-12 09:17:26 -04:00
|
|
|
|
$ignore_block_element = '';
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2015-03-12 09:17:26 -04:00
|
|
|
|
for ( $i = 0; $i < $stop; $i++ ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$content = $textarr[ $i ];
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2015-03-15 21:43:28 -04:00
|
|
|
|
// If we're in an ignore block, wait until we find its closing tag.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $ignore_block_element && preg_match( '/^<(' . $tags_to_ignore . ')>/', $content, $matches ) ) {
|
2015-03-12 09:17:26 -04:00
|
|
|
|
$ignore_block_element = $matches[1];
|
|
|
|
|
}
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2015-03-15 21:43:28 -04:00
|
|
|
|
// If it's not a tag and not in ignore block.
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' === $ignore_block_element && strlen( $content ) > 0 && '<' !== $content[0] && false !== strpos( $content, '&#x' ) ) {
|
2017-10-03 03:12:50 -04:00
|
|
|
|
foreach ( $possible_emoji as $emojum => $emoji_char ) {
|
|
|
|
|
if ( false === strpos( $content, $emojum ) ) {
|
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
$file = str_replace( ';&#x', '-', $emojum );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$file = str_replace( array( '&#x', ';' ), '', $file );
|
2017-10-03 03:12:50 -04:00
|
|
|
|
|
|
|
|
|
$entity = sprintf( '<img src="%s" alt="%s" class="wp-smiley" style="height: 1em; max-height: 1em;" />', $cdn_url . $file . $ext, $emoji_char );
|
|
|
|
|
|
|
|
|
|
$content = str_replace( $emojum, $entity, $content );
|
|
|
|
|
}
|
2015-03-11 18:49:28 -04:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Did we exit ignore block?
|
2020-05-16 14:42:12 -04:00
|
|
|
|
if ( '' !== $ignore_block_element && '</' . $ignore_block_element . '>' === $content ) {
|
2015-03-12 09:17:26 -04:00
|
|
|
|
$ignore_block_element = '';
|
2015-03-11 18:49:28 -04:00
|
|
|
|
}
|
2015-03-12 09:17:26 -04:00
|
|
|
|
|
|
|
|
|
$output .= $content;
|
2015-03-11 18:49:28 -04:00
|
|
|
|
}
|
|
|
|
|
|
2020-01-28 19:45:18 -05:00
|
|
|
|
// Finally, remove any stray U+FE0F characters.
|
2017-10-03 03:12:50 -04:00
|
|
|
|
$output = str_replace( '️', '', $output );
|
2015-03-11 18:49:28 -04:00
|
|
|
|
|
2017-10-03 03:12:50 -04:00
|
|
|
|
return $output;
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-03-11 18:49:28 -04:00
|
|
|
|
/**
|
|
|
|
|
* Convert emoji in emails into static images.
|
|
|
|
|
*
|
2015-03-15 21:43:28 -04:00
|
|
|
|
* @since 4.2.0
|
2015-03-11 18:49:28 -04:00
|
|
|
|
*
|
2015-03-15 21:43:28 -04:00
|
|
|
|
* @param array $mail The email data array.
|
2015-03-11 18:49:28 -04:00
|
|
|
|
* @return array The email data array, with emoji in the message staticized.
|
|
|
|
|
*/
|
2015-04-20 00:15:26 -04:00
|
|
|
|
function wp_staticize_emoji_for_email( $mail ) {
|
2015-03-22 19:16:28 -04:00
|
|
|
|
if ( ! isset( $mail['message'] ) ) {
|
|
|
|
|
return $mail;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/*
|
2021-08-10 08:53:59 -04:00
|
|
|
|
* We can only transform the emoji into images if it's a `text/html` email.
|
2015-03-22 19:16:28 -04:00
|
|
|
|
* To do that, here's a cut down version of the same process that happens
|
2021-08-10 08:53:59 -04:00
|
|
|
|
* in wp_mail() - get the `Content-Type` from the headers, if there is one,
|
|
|
|
|
* then pass it through the {@see 'wp_mail_content_type'} filter, in case
|
|
|
|
|
* a plugin is handling changing the `Content-Type`.
|
2015-03-22 19:16:28 -04:00
|
|
|
|
*/
|
|
|
|
|
$headers = array();
|
|
|
|
|
if ( isset( $mail['headers'] ) ) {
|
|
|
|
|
if ( is_array( $mail['headers'] ) ) {
|
|
|
|
|
$headers = $mail['headers'];
|
|
|
|
|
} else {
|
|
|
|
|
$headers = explode( "\n", str_replace( "\r\n", "\n", $mail['headers'] ) );
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
foreach ( $headers as $header ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( strpos( $header, ':' ) === false ) {
|
2015-03-22 19:16:28 -04:00
|
|
|
|
continue;
|
|
|
|
|
}
|
|
|
|
|
|
2015-04-05 11:51:27 -04:00
|
|
|
|
// Explode them out.
|
2015-03-22 19:16:28 -04:00
|
|
|
|
list( $name, $content ) = explode( ':', trim( $header ), 2 );
|
|
|
|
|
|
2015-04-05 11:51:27 -04:00
|
|
|
|
// Cleanup crew.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$name = trim( $name );
|
2015-03-22 19:16:28 -04:00
|
|
|
|
$content = trim( $content );
|
|
|
|
|
|
|
|
|
|
if ( 'content-type' === strtolower( $name ) ) {
|
|
|
|
|
if ( strpos( $content, ';' ) !== false ) {
|
|
|
|
|
list( $type, $charset ) = explode( ';', $content );
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$content_type = trim( $type );
|
2015-03-22 19:16:28 -04:00
|
|
|
|
} else {
|
|
|
|
|
$content_type = trim( $content );
|
|
|
|
|
}
|
|
|
|
|
break;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
2015-04-05 11:51:27 -04:00
|
|
|
|
// Set Content-Type if we don't have a content-type from the input headers.
|
2015-03-22 19:16:28 -04:00
|
|
|
|
if ( ! isset( $content_type ) ) {
|
|
|
|
|
$content_type = 'text/plain';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/** This filter is documented in wp-includes/pluggable.php */
|
|
|
|
|
$content_type = apply_filters( 'wp_mail_content_type', $content_type );
|
|
|
|
|
|
|
|
|
|
if ( 'text/html' === $content_type ) {
|
2015-04-20 00:15:26 -04:00
|
|
|
|
$mail['message'] = wp_staticize_emoji( $mail['message'] );
|
2015-03-20 08:32:26 -04:00
|
|
|
|
}
|
2015-03-22 19:16:28 -04:00
|
|
|
|
|
2015-03-11 18:49:28 -04:00
|
|
|
|
return $mail;
|
|
|
|
|
}
|
2015-10-20 23:48:24 -04:00
|
|
|
|
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
/**
|
2018-03-09 20:50:30 -05:00
|
|
|
|
* Returns arrays of emoji data.
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
*
|
2018-03-09 20:50:30 -05:00
|
|
|
|
* These arrays are automatically built from the regex in twemoji.js - if they need to be updated,
|
2019-05-26 15:35:51 -04:00
|
|
|
|
* you should update the regex there, then run the `npm run grunt precommit:emoji` job.
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
*
|
2017-10-03 03:12:50 -04:00
|
|
|
|
* @since 4.9.0
|
|
|
|
|
* @access private
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
*
|
2017-10-03 03:12:50 -04:00
|
|
|
|
* @param string $type Optional. Which array type to return. Accepts 'partials' or 'entities', default 'entities'.
|
|
|
|
|
* @return array An array to match all emoji that WordPress recognises.
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
*/
|
2017-10-03 03:12:50 -04:00
|
|
|
|
function _wp_emoji_list( $type = 'entities' ) {
|
|
|
|
|
// Do not remove the START/END comments - they're used to find where to insert the arrays.
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
|
2017-10-03 03:12:50 -04:00
|
|
|
|
// START: emoji arrays
|
2021-06-08 18:15:12 -04:00
|
|
|
|
$entities = array( '👨🏻‍❤️‍💋‍👨🏻', '👨🏻‍❤️‍💋‍👨🏼', '👨🏻‍❤️‍💋‍👨🏽', '👨🏻‍❤️‍💋‍👨🏾', '👨🏻‍❤️‍💋‍👨🏿', '👨🏼‍❤️‍💋‍👨🏻', '👨🏼‍❤️‍💋‍👨🏼', '👨🏼‍❤️‍💋‍👨🏽', '👨🏼‍❤️‍💋‍👨🏾', '👨🏼‍❤️‍💋‍👨🏿', '👨🏽‍❤️‍💋‍👨🏻', '👨🏽‍❤️‍💋‍👨🏼', '👨🏽‍❤️‍💋‍👨🏽', '👨🏽‍❤️‍💋‍👨🏾', '👨🏽‍❤️‍💋‍👨🏿', '👨🏾‍❤️‍💋‍👨🏻', '👨🏾‍❤️‍💋‍👨🏼', '👨🏾‍❤️‍💋‍👨🏽', '👨🏾‍❤️‍💋‍👨🏾', '👨🏾‍❤️‍💋‍👨🏿', '👨🏿‍❤️‍💋‍👨🏻', '👨🏿‍❤️‍💋‍👨🏼', '👨🏿‍❤️‍💋‍👨🏽', '👨🏿‍❤️‍💋‍👨🏾', '👨🏿‍❤️‍💋‍👨🏿', '👩🏻‍❤️‍💋‍👨🏻', '👩🏻‍❤️‍💋‍👨🏼', '👩🏻‍❤️‍💋‍👨🏽', '👩🏻‍❤️‍💋‍👨🏾', '👩🏻‍❤️‍💋‍👨🏿', '👩🏻‍❤️‍💋‍👩🏻', '👩🏻‍❤️‍💋‍👩🏼', '👩🏻‍❤️‍💋‍👩🏽', '👩🏻‍❤️‍💋‍👩🏾', '👩🏻‍❤️‍💋‍👩🏿', '👩🏼‍❤️‍💋‍👨🏻', '👩🏼‍❤️‍💋‍👨🏼', '👩🏼‍❤️‍💋‍👨🏽', '👩🏼‍❤️‍💋‍👨🏾', '👩🏼‍❤️‍💋‍👨🏿', '👩🏼‍❤️‍💋‍👩🏻', '👩🏼‍❤️‍💋‍👩🏼', '👩🏼‍❤️‍💋‍👩🏽', '👩🏼‍❤️‍💋‍👩🏾', '👩🏼‍❤️‍💋‍👩🏿', '👩🏽‍❤️‍💋‍&#
|
|
|
|
|
$partials = array( '🀄', '🃏', '🅰', '🅱', '🅾', '🅿', '🆎', '🆑', '🆒', '🆓', '🆔', '🆕', '🆖', '🆗', '🆘', '🆙', '🆚', '🇦', '🇨', '🇩', '🇪', '🇫', '🇬', '🇮', '🇱', '🇲', '🇴', '🇶', '🇷', '🇸', '🇹', '🇺', '🇼', '🇽', '🇿', '🇧', '🇭', '🇯', '🇳', '🇻', '🇾', '🇰', '🇵', '🈁', '🈂', '🈚', '🈯', '🈲', '🈳', '🈴', '🈵', '🈶', '🈷', '🈸', '🈹', '🈺', '🉐', '🉑', '🌀', '🌁', '🌂', '🌃', '🌄', '🌅', '🌆', '🌇', '🌈', '🌉', '🌊', '🌋', '🌌', '🌍', '🌎', '🌏', '🌐', '🌑', '🌒', '🌓', '🌔', '🌕', '🌖', '🌗', '🌘', '🌙', '🌚', '🌛', '🌜', '🌝', '🌞', '🌟', '🌠', '🌡', '🌤', '🌥', '🌦', '🌧', '🌨', '🌩', '🌪', '🌫', '🌬', '🌭', '🌮', '🌯', '🌰', '🌱', '🌲', '🌳', '🌴', '🌵', '🌶', '🌷', '🌸', '🌹', '🌺', '🌻', '🌼', '🌽', '🌾', '🌿', '🍀', '🍁', '🍂', '🍃', '🍄', '🍅', '🍆', '🍇', '🍈', '🍉', '🍊', '🍋', '🍌', '🍍', '🍎', '🍏', '🍐', '🍑', '🍒', '🍓', '🍔', '🍕', '🍖', '🍗', '🍘', '🍙', '🍚', '🍛', '🍜', '🍝', '🍞', '🍟', '🍠', '🍡', '🍢', '🍣', '🍤', '🍥', '🍦', '🍧', '🍨', '🍩', '🍪', '🍫', '🍬', '🍭', '🍮', '🍯', '🍰', '🍱', '🍲', '🍳', '🍴', '🍵', '🍶', '🍷', '🍸', '🍹', '🍺', '🍻', '🍼', '🍽', '🍾', '🍿', '🎀', '🎁', '🎂', '🎃', '🎄', '🎅', '🏻', '🏼', '🏽', '🏾', '🏿', '🎆', '🎇', '🎈', '🎉', '🎊', '🎋', '🎌', '🎍', '🎎', '🎏', '🎐', '🎑', '🎒', '🎓', '🎖', '🎗', '🎙', '🎚', '🎛', '🎞', '🎟', '🎠', '🎡', '🎢', '🎣', '🎤', '🎥', '🎦', '🎧', '🎨', '🎩', '🎪', '🎫', '🎬', '🎭', '🎮', '🎯', '🎰', '🎱', '🎲', '🎳', '🎴', '🎵', '🎶', '🎷', '🎸', '🎹', '🎺', '🎻', '🎼', '🎽', '🎾', '🎿', '🏀', '🏁', '🏂', '🏃', '‍', '♀', '️', '♂', '🏄', '🏅', '🏆', '🏇', '🏈', '🏉', '🏊', '🏋', '🏌', '🏍', '🏎', '🏏', '🏐', '🏑', '🏒', '🏓', '🏔', '🏕', '🏖', '🏗', '🏘', '🏙', '🏚', '🏛', '🏜', '🏝', '🏞', '🏟', '🏠', '🏡', '🏢', '🏣', '🏤', '🏥', '🏦', '🏧', '🏨', '🏩', '🏪', '🏫', '🏬', '🏭', '🏮', '🏯', '🏰', '🏳', '⚧', '🏴', '☠', '󠁧', '󠁢', '󠁥', '󠁮', '󠁿', '󠁳', '󠁣', '󠁴', '󠁷',
|
2017-10-03 03:12:50 -04:00
|
|
|
|
// END: emoji arrays
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
|
|
|
|
|
if ( 'entities' === $type ) {
|
|
|
|
|
return $entities;
|
|
|
|
|
}
|
|
|
|
|
|
2017-10-03 03:12:50 -04:00
|
|
|
|
return $partials;
|
Emoji: Port the Twemoji regex to PHP.
Previously, `wp_encode_emoji()` and `wp_staticize_emoji()` used inaccurate regular expressions to find emoji, and transform then into HTML entities or `<img>`s, respectively. This would result in emoji not being correctly transformed, or occasionally, non-emoji being incorrectly transformed.
This commit adds a new `grunt` task - `grunt precommit:emoji`. It finds the regex in `twemoji.js`, transforms it into a PHP-friendly version, and adds it to `formatting.php`. This task is also automatically run by `grunt precommit`, when it detects that `twemoji.js` has changed.
The new regex requires features introduced in PCRE 8.32, which was introduced in PHP 5.4.14, though it was also backported to later releases of the PHP 5.3 series. For versions of PHP that don't support this, it will fall back to an updated version of the loose-matching regex.
For short posts, the performance difference between the old and new regex is negligible. As the posts get longer, however, the new method is exponentially faster.
Fixes #35293.
Built from https://develop.svn.wordpress.org/trunk@41043
git-svn-id: http://core.svn.wordpress.org/trunk@40893 1a063a9b-81f0-0310-95a4-ce76da25c4cd
2017-07-14 01:47:49 -04:00
|
|
|
|
}
|
|
|
|
|
|
2015-10-20 23:48:24 -04:00
|
|
|
|
/**
|
2016-03-12 07:39:27 -05:00
|
|
|
|
* Shorten a URL, to be used as link text.
|
2015-10-20 23:48:24 -04:00
|
|
|
|
*
|
|
|
|
|
* @since 1.2.0
|
2015-12-07 11:39:25 -05:00
|
|
|
|
* @since 4.4.0 Moved to wp-includes/formatting.php from wp-admin/includes/misc.php and added $length param.
|
2015-10-20 23:48:24 -04:00
|
|
|
|
*
|
2015-12-07 11:39:25 -05:00
|
|
|
|
* @param string $url URL to shorten.
|
|
|
|
|
* @param int $length Optional. Maximum length of the shortened URL. Default 35 characters.
|
|
|
|
|
* @return string Shortened URL.
|
|
|
|
|
*/
|
2015-10-20 23:48:24 -04:00
|
|
|
|
function url_shorten( $url, $length = 35 ) {
|
2017-11-30 18:11:00 -05:00
|
|
|
|
$stripped = str_replace( array( 'https://', 'http://', 'www.' ), '', $url );
|
2015-10-20 23:48:24 -04:00
|
|
|
|
$short_url = untrailingslashit( $stripped );
|
|
|
|
|
|
|
|
|
|
if ( strlen( $short_url ) > $length ) {
|
|
|
|
|
$short_url = substr( $short_url, 0, $length - 3 ) . '…';
|
|
|
|
|
}
|
|
|
|
|
return $short_url;
|
2015-12-07 11:39:25 -05:00
|
|
|
|
}
|
2016-04-21 15:22:27 -04:00
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Sanitizes a hex color.
|
|
|
|
|
*
|
|
|
|
|
* Returns either '', a 3 or 6 digit hex color (with #), or nothing.
|
|
|
|
|
* For sanitizing values without a #, see sanitize_hex_color_no_hash().
|
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $color
|
|
|
|
|
* @return string|void
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_hex_color( $color ) {
|
|
|
|
|
if ( '' === $color ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// 3 or 6 hex digits, or the empty string.
|
2017-11-30 18:11:00 -05:00
|
|
|
|
if ( preg_match( '|^#([A-Fa-f0-9]{3}){1,2}$|', $color ) ) {
|
2016-04-21 15:22:27 -04:00
|
|
|
|
return $color;
|
|
|
|
|
}
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Sanitizes a hex color without a hash. Use sanitize_hex_color() when possible.
|
|
|
|
|
*
|
|
|
|
|
* Saving hex colors without a hash puts the burden of adding the hash on the
|
|
|
|
|
* UI, which makes it difficult to use or upgrade to other color types such as
|
2020-06-28 10:02:06 -04:00
|
|
|
|
* rgba, hsl, rgb, and HTML color names.
|
2016-04-21 15:22:27 -04:00
|
|
|
|
*
|
|
|
|
|
* Returns either '', a 3 or 6 digit hex color (without a #), or null.
|
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $color
|
|
|
|
|
* @return string|null
|
|
|
|
|
*/
|
|
|
|
|
function sanitize_hex_color_no_hash( $color ) {
|
|
|
|
|
$color = ltrim( $color, '#' );
|
|
|
|
|
|
|
|
|
|
if ( '' === $color ) {
|
|
|
|
|
return '';
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return sanitize_hex_color( '#' . $color ) ? $color : null;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* Ensures that any hex color is properly hashed.
|
|
|
|
|
* Otherwise, returns value untouched.
|
|
|
|
|
*
|
|
|
|
|
* This method should only be necessary if using sanitize_hex_color_no_hash().
|
|
|
|
|
*
|
|
|
|
|
* @since 3.4.0
|
|
|
|
|
*
|
|
|
|
|
* @param string $color
|
|
|
|
|
* @return string
|
|
|
|
|
*/
|
|
|
|
|
function maybe_hash_hex_color( $color ) {
|
2019-07-02 19:42:58 -04:00
|
|
|
|
$unhashed = sanitize_hex_color_no_hash( $color );
|
|
|
|
|
if ( $unhashed ) {
|
2016-04-21 15:22:27 -04:00
|
|
|
|
return '#' . $unhashed;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
return $color;
|
|
|
|
|
}
|