* * @return string */ public function get_output_charset() { return $this->output_charset; } /** * Set a custom stylesheet for this sitemap. Set to empty to just remove the default stylesheet. * * @param string $stylesheet Full XML-stylesheet declaration. */ public function set_stylesheet( $stylesheet ) { $this->stylesheet = $stylesheet; } /** * Build the `` tag for a given URL. * * @param array $url Array of parts that make up this entry. * * @return string */ protected function sitemap_index_url( $url ) { $date = null; if ( ! empty( $url['lastmod'] ) ) { $date = $this->timezone->format_date( $url['lastmod'] ); } $url['loc'] = htmlspecialchars( $url['loc'], ENT_COMPAT, $this->output_charset, false ); $output = "\t\n"; $output .= "\t\t" . $url['loc'] . "\n"; $output .= empty( $date ) ? '' : "\t\t" . htmlspecialchars( $date, ENT_COMPAT, $this->output_charset, false ) . "\n"; $output .= "\t\n"; return $output; } /** * Build the `` tag for a given URL. * * Public access for backwards compatibility reasons. * * @param array $url Array of parts that make up this entry. * * @return string */ public function sitemap_url( $url ) { $date = null; if ( ! empty( $url['mod'] ) ) { // Create a DateTime object date in the correct timezone. $date = $this->timezone->format_date( $url['mod'] ); } $url['loc'] = htmlspecialchars( $url['loc'], ENT_COMPAT, $this->output_charset, false ); $output = "\t\n"; $output .= "\t\t" . $this->encode_url_rfc3986( $url['loc'] ) . "\n"; $output .= empty( $date ) ? '' : "\t\t" . htmlspecialchars( $date, ENT_COMPAT, $this->output_charset, false ) . "\n"; if ( empty( $url['images'] ) ) { $url['images'] = array(); } foreach ( $url['images'] as $img ) { if ( empty( $img['src'] ) ) { continue; } $output .= "\t\t\n"; $output .= "\t\t\t" . esc_html( $this->encode_url_rfc3986( $img['src'] ) ) . "\n"; if ( ! empty( $img['title'] ) ) { $title = $img['title']; if ( $this->needs_conversion ) { $title = mb_convert_encoding( $title, $this->output_charset, $this->charset ); } $title = _wp_specialchars( html_entity_decode( $title, ENT_QUOTES, $this->output_charset ) ); $output .= "\t\t\t\n"; } if ( ! empty( $img['alt'] ) ) { $alt = $img['alt']; if ( $this->needs_conversion ) { $alt = mb_convert_encoding( $alt, $this->output_charset, $this->charset ); } $alt = _wp_specialchars( html_entity_decode( $alt, ENT_QUOTES, $this->output_charset ) ); $output .= "\t\t\t\n"; } $output .= "\t\t\n"; } unset( $img, $title, $alt ); $output .= "\t\n"; /** * Filters the output for the sitemap URL tag. * * @api string $output The output for the sitemap url tag. * * @param array $url The sitemap URL array on which the output is based. */ return apply_filters( 'wpseo_sitemap_url', $output, $url ); } /** * Apply some best effort conversion to comply with RFC3986. * * @param string $url URL to encode. * * @return string */ protected function encode_url_rfc3986( $url ) { if ( filter_var( $url, FILTER_VALIDATE_URL ) ) { return $url; } $path = wp_parse_url( $url, PHP_URL_PATH ); if ( ! empty( $path ) && '/' !== $path ) { $encoded_path = explode( '/', $path ); // First decode the path, to prevent double encoding. $encoded_path = array_map( 'rawurldecode', $encoded_path ); $encoded_path = array_map( 'rawurlencode', $encoded_path ); $encoded_path = implode( '/', $encoded_path ); $encoded_path = str_replace( '%7E', '~', $encoded_path ); // PHP < 5.3. $url = str_replace( $path, $encoded_path, $url ); } $query = wp_parse_url( $url, PHP_URL_QUERY ); if ( ! empty( $query ) ) { parse_str( $query, $parsed_query ); if ( defined( 'PHP_QUERY_RFC3986' ) ) { // PHP 5.4+. $parsed_query = http_build_query( $parsed_query, null, '&', PHP_QUERY_RFC3986 ); } else { $parsed_query = http_build_query( $parsed_query, null, '&' ); $parsed_query = str_replace( '+', '%20', $parsed_query ); $parsed_query = str_replace( '%7E', '~', $parsed_query ); } $url = str_replace( $query, $parsed_query, $url ); } return $url; } /** * Retrieves the XSL URL that should be used in the current environment * * When home_url and site_url are not the same, the home_url should be used. * This is because the XSL needs to be served from the same domain, protocol and port * as the XML file that is loading it. * * @return string The XSL URL that needs to be used. */ protected function get_xsl_url() { if ( home_url() !== site_url() ) { return home_url( 'main-sitemap.xsl' ); } /* * Fallback to circumvent a cross-domain security problem when the XLS file is * loaded from a different (sub)domain. */ if ( strpos( plugins_url(), home_url() ) !== 0 ) { return home_url( 'main-sitemap.xsl' ); } return plugin_dir_url( WPSEO_FILE ) . 'css/main-sitemap.xsl'; } /** * Adds debugging information to the output. * * @param bool $transient Transient cache was used or not. * * @return string Information about the functionality used to build the sitemap. */ protected function get_debug( $transient ) { $debug = defined( 'YOAST_SEO_DEBUG_SITEMAPS' ) && YOAST_SEO_DEBUG_SITEMAPS === true; if ( ! $debug ) { return ''; } $memory_used = number_format( ( memory_get_peak_usage() / 1048576 ), 2 ); $queries_run = ( $transient ) ? 'Served from transient cache' : 'Queries executed ' . absint( $GLOBALS['wpdb']->num_queries ); $output = "\n"; if ( defined( 'SAVEQUERIES' ) && SAVEQUERIES ) { $queries = print_r( $GLOBALS['wpdb']->queries, true ); $output .= "\n"; } return $output; } }