diff options
Diffstat (limited to 'plugins/jetpack/modules/sitemaps/sitemap-builder.php')
-rw-r--r-- | plugins/jetpack/modules/sitemaps/sitemap-builder.php | 1468 |
1 files changed, 0 insertions, 1468 deletions
diff --git a/plugins/jetpack/modules/sitemaps/sitemap-builder.php b/plugins/jetpack/modules/sitemaps/sitemap-builder.php deleted file mode 100644 index e04f58d5..00000000 --- a/plugins/jetpack/modules/sitemaps/sitemap-builder.php +++ /dev/null @@ -1,1468 +0,0 @@ -<?php -/** - * Build the sitemap tree. - * - * @package Jetpack - * @since 4.8.0 - * @author Automattic - */ - -/* Include sitemap subclasses, if not already, and include proper buffer based on phpxml's availability. */ -require_once dirname( __FILE__ ) . '/sitemap-constants.php'; -require_once dirname( __FILE__ ) . '/sitemap-buffer.php'; - -if ( ! class_exists( 'DOMDocument' ) ) { - require_once dirname( __FILE__ ) . '/sitemap-buffer-fallback.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-image-fallback.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-master-fallback.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-news-fallback.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-page-fallback.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-video-fallback.php'; -} else { - require_once dirname( __FILE__ ) . '/sitemap-buffer-image.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-master.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-news.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-page.php'; - require_once dirname( __FILE__ ) . '/sitemap-buffer-video.php'; -} - -require_once dirname( __FILE__ ) . '/sitemap-librarian.php'; -require_once dirname( __FILE__ ) . '/sitemap-finder.php'; -require_once dirname( __FILE__ ) . '/sitemap-state.php'; - -if ( defined( 'WP_DEBUG' ) && WP_DEBUG ) { - require_once dirname( __FILE__ ) . '/sitemap-logger.php'; -} - -/** - * Simple class for rendering an empty sitemap with a short TTL - */ -class Jetpack_Sitemap_Buffer_Empty extends Jetpack_Sitemap_Buffer { - - public function __construct() { - parent::__construct( JP_SITEMAP_MAX_ITEMS, JP_SITEMAP_MAX_BYTES, '1970-01-01 00:00:00' ); - - $this->doc->appendChild( - $this->doc->createComment( "generator='jetpack-" . JETPACK__VERSION . "'" ) - ); - - $this->doc->appendChild( - $this->doc->createProcessingInstruction( - 'xml-stylesheet', - 'type="text/xsl" href="' . $this->finder->construct_sitemap_url( 'sitemap-index.xsl' ) . '"' - ) - ); - } - - protected function get_root_element() { - if ( ! isset( $this->root ) ) { - $this->root = $this->doc->createElement( 'sitemapindex' ); - $this->root->setAttribute( 'xmlns', 'http://www.sitemaps.org/schemas/sitemap/0.9' ); - $this->doc->appendChild( $this->root ); - $this->byte_capacity -= strlen( $this->doc->saveXML( $this->root ) ); - } - - return $this->root; - } -} - -/** - * The Jetpack_Sitemap_Builder object handles the construction of - * all sitemap files (except the XSL files, which are handled by - * Jetpack_Sitemap_Stylist.) Other than the constructor, there are - * only two public functions: build_all_sitemaps and news_sitemap_xml. - * - * @since 4.8.0 - */ -class Jetpack_Sitemap_Builder { - - /** - * Librarian object for storing and retrieving sitemap data. - * - * @access private - * @since 4.8.0 - * @var $librarian Jetpack_Sitemap_Librarian - */ - private $librarian; - - /** - * Logger object for reporting debug messages. - * - * @access private - * @since 4.8.0 - * @var $logger Jetpack_Sitemap_Logger - */ - private $logger = false; - - /** - * Finder object for dealing with sitemap URIs. - * - * @access private - * @since 4.8.0 - * @var $finder Jetpack_Sitemap_Finder - */ - private $finder; - - /** - * Construct a new Jetpack_Sitemap_Builder object. - * - * @access public - * @since 4.8.0 - */ - public function __construct() { - $this->librarian = new Jetpack_Sitemap_Librarian(); - $this->finder = new Jetpack_Sitemap_Finder(); - - if ( defined( 'WP_DEBUG' ) && WP_DEBUG ) { - $this->logger = new Jetpack_Sitemap_Logger(); - } - - update_option( - 'jetpack_sitemap_post_types', - /** - * The array of post types to be included in the sitemap. - * - * Add your custom post type name to the array to have posts of - * that type included in the sitemap. The default array includes - * 'page' and 'post'. - * - * The result of this filter is cached in an option, 'jetpack_sitemap_post_types', - * so this filter only has to be applied once per generation. - * - * @since 4.8.0 - */ - apply_filters( - 'jetpack_sitemap_post_types', - array( 'post', 'page' ) - ) - ); - } - - /** - * Update the sitemap. - * - * All we do here is call build_next_sitemap_file a bunch of times. - * - * @since 4.8.0 - */ - public function update_sitemap() { - if ( $this->logger ) { - $this->logger->report( '-- Updating...' ); - if ( ! class_exists( 'DOMDocument' ) ) { - $this->logger->report( - __( - 'Jetpack can not load necessary XML manipulation libraries. Please ask your hosting provider to refer to our server requirements at https://jetpack.com/support/server-requirements/ .', - 'jetpack' - ), - true - ); - } - } - - for ( $i = 1; $i <= JP_SITEMAP_UPDATE_SIZE; $i++ ) { - if ( true === $this->build_next_sitemap_file() ) { - break; // All finished! - } - } - - if ( $this->logger ) { - $this->logger->report( '-- ...done for now.' ); - $this->logger->time(); - } - } - - /** - * Generate the next sitemap file. - * - * Reads the most recent state of the sitemap generation phase, - * constructs the next file, and updates the state. - * - * @since 4.8.0 - * - * @return bool True when finished. - */ - private function build_next_sitemap_file() { - $finished = false; // Initialize finished flag. - - // Get the most recent state, and lock the state. - $state = Jetpack_Sitemap_State::check_out(); - - // Do nothing if the state was locked. - if ( false === $state ) { - return false; - } - - // Otherwise, branch on the sitemap-type key of $state. - switch ( $state['sitemap-type'] ) { - case JP_PAGE_SITEMAP_TYPE: - $this->build_next_sitemap_of_type( - JP_PAGE_SITEMAP_TYPE, - array( $this, 'build_one_page_sitemap' ), - $state - ); - break; - - case JP_PAGE_SITEMAP_INDEX_TYPE: - $this->build_next_sitemap_index_of_type( - JP_PAGE_SITEMAP_INDEX_TYPE, - JP_IMAGE_SITEMAP_TYPE, - $state - ); - break; - - case JP_IMAGE_SITEMAP_TYPE: - $this->build_next_sitemap_of_type( - JP_IMAGE_SITEMAP_TYPE, - array( $this, 'build_one_image_sitemap' ), - $state - ); - break; - - case JP_IMAGE_SITEMAP_INDEX_TYPE: - $this->build_next_sitemap_index_of_type( - JP_IMAGE_SITEMAP_INDEX_TYPE, - JP_VIDEO_SITEMAP_TYPE, - $state - ); - break; - - case JP_VIDEO_SITEMAP_TYPE: - $this->build_next_sitemap_of_type( - JP_VIDEO_SITEMAP_TYPE, - array( $this, 'build_one_video_sitemap' ), - $state - ); - break; - - case JP_VIDEO_SITEMAP_INDEX_TYPE: - $this->build_next_sitemap_index_of_type( - JP_VIDEO_SITEMAP_INDEX_TYPE, - JP_MASTER_SITEMAP_TYPE, - $state - ); - break; - - case JP_MASTER_SITEMAP_TYPE: - $this->build_master_sitemap( $state['max'] ); - - // Reset the state and quit. - Jetpack_Sitemap_State::reset( - JP_PAGE_SITEMAP_TYPE - ); - - if ( $this->logger ) { - $this->logger->report( '-- Finished.' ); - $this->logger->time(); - } - $finished = true; - - break; - - default: - Jetpack_Sitemap_State::reset( - JP_PAGE_SITEMAP_TYPE - ); - $finished = true; - - break; - } // End switch. - - // Unlock the state. - Jetpack_Sitemap_State::unlock(); - - return $finished; - } - - /** - * Build the next sitemap of a given type and update the sitemap state. - * - * @since 4.8.0 - * - * @param string $sitemap_type The type of the sitemap being generated. - * @param callback $build_one A callback which builds a single sitemap file. - * @param array $state A sitemap state. - */ - private function build_next_sitemap_of_type( $sitemap_type, $build_one, $state ) { - $index_type = jp_sitemap_index_type_of( $sitemap_type ); - - // Try to build a sitemap. - $result = call_user_func_array( - $build_one, - array( - $state['number'] + 1, - $state['last-added'], - ) - ); - - if ( false === $result ) { - // If no sitemap was generated, advance to the next type. - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $index_type, - 'last-added' => 0, - 'number' => 0, - 'last-modified' => '1970-01-01 00:00:00', - ) - ); - - if ( $this->logger ) { - $this->logger->report( "-- Cleaning Up $sitemap_type" ); - } - - // Clean up old files. - $this->librarian->delete_numbered_sitemap_rows_after( - $state['number'], - $sitemap_type - ); - - return; - } - - // Otherwise, update the state. - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $state['sitemap-type'], - 'last-added' => $result['last_id'], - 'number' => $state['number'] + 1, - 'last-modified' => $result['last_modified'], - ) - ); - - if ( true === $result['any_left'] ) { - // If there's more work to be done with this type, return. - return; - } - - // Otherwise, advance state to the next sitemap type. - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $index_type, - 'last-added' => 0, - 'number' => 0, - 'last-modified' => '1970-01-01 00:00:00', - ) - ); - - if ( $this->logger ) { - $this->logger->report( "-- Cleaning Up $sitemap_type" ); - } - - // Clean up old files. - $this->librarian->delete_numbered_sitemap_rows_after( - $state['number'] + 1, - $sitemap_type - ); - } - - /** - * Build the next sitemap index of a given type and update the state. - * - * @since 4.8.0 - * - * @param string $index_type The type of index being generated. - * @param string $next_type The next type to generate after this one. - * @param array $state A sitemap state. - */ - private function build_next_sitemap_index_of_type( $index_type, $next_type, $state ) { - $sitemap_type = jp_sitemap_child_type_of( $index_type ); - - // If only 0 or 1 sitemaps were built, advance to the next type and return. - if ( 1 >= $state['max'][ $sitemap_type ]['number'] ) { - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $next_type, - 'last-added' => 0, - 'number' => 0, - 'last-modified' => '1970-01-01 00:00:00', - ) - ); - - if ( $this->logger ) { - $this->logger->report( "-- Cleaning Up $index_type" ); - } - - // There are no indices of this type. - $this->librarian->delete_numbered_sitemap_rows_after( - 0, - $index_type - ); - - return; - } - - // Otherwise, try to build a sitemap index. - $result = $this->build_one_sitemap_index( - $state['number'] + 1, - $state['last-added'], - $state['last-modified'], - $index_type - ); - - // If no index was built, advance to the next type and return. - if ( false === $result ) { - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $next_type, - 'last-added' => 0, - 'number' => 0, - 'last-modified' => '1970-01-01 00:00:00', - ) - ); - - if ( $this->logger ) { - $this->logger->report( "-- Cleaning Up $index_type" ); - } - - // Clean up old files. - $this->librarian->delete_numbered_sitemap_rows_after( - $state['number'], - $index_type - ); - - return; - } - - // Otherwise, check in the state. - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $index_type, - 'last-added' => $result['last_id'], - 'number' => $state['number'] + 1, - 'last-modified' => $result['last_modified'], - ) - ); - - // If there are still sitemaps left to index, return. - if ( true === $result['any_left'] ) { - return; - } - - // Otherwise, advance to the next type. - Jetpack_Sitemap_State::check_in( - array( - 'sitemap-type' => $next_type, - 'last-added' => 0, - 'number' => 0, - 'last-modified' => '1970-01-01 00:00:00', - ) - ); - - if ( $this->logger ) { - $this->logger->report( "-- Cleaning Up $index_type" ); - } - - // We're done generating indices of this type. - $this->librarian->delete_numbered_sitemap_rows_after( - $state['number'] + 1, - $index_type - ); - } - - /** - * Builds the master sitemap index. - * - * @param array $max Array of sitemap types with max index and datetime. - * - * @since 4.8.0 - */ - private function build_master_sitemap( $max ) { - $page = array(); - $image = array(); - $video = array(); - if ( $this->logger ) { - $this->logger->report( '-- Building Master Sitemap.' ); - } - - $buffer = new Jetpack_Sitemap_Buffer_Master( - JP_SITEMAP_MAX_ITEMS, - JP_SITEMAP_MAX_BYTES - ); - - if ( 0 < $max[ JP_PAGE_SITEMAP_TYPE ]['number'] ) { - if ( 1 === $max[ JP_PAGE_SITEMAP_TYPE ]['number'] ) { - $page['filename'] = jp_sitemap_filename( JP_PAGE_SITEMAP_TYPE, 1 ); - $page['last_modified'] = jp_sitemap_datetime( $max[ JP_PAGE_SITEMAP_TYPE ]['lastmod'] ); - } else { - $page['filename'] = jp_sitemap_filename( - JP_PAGE_SITEMAP_INDEX_TYPE, - $max[ JP_PAGE_SITEMAP_INDEX_TYPE ]['number'] - ); - $page['last_modified'] = jp_sitemap_datetime( $max[ JP_PAGE_SITEMAP_INDEX_TYPE ]['lastmod'] ); - } - - $buffer->append( - array( - 'sitemap' => array( - 'loc' => $this->finder->construct_sitemap_url( $page['filename'] ), - 'lastmod' => $page['last_modified'], - ), - ) - ); - } - - if ( 0 < $max[ JP_IMAGE_SITEMAP_TYPE ]['number'] ) { - if ( 1 === $max[ JP_IMAGE_SITEMAP_TYPE ]['number'] ) { - $image['filename'] = jp_sitemap_filename( JP_IMAGE_SITEMAP_TYPE, 1 ); - $image['last_modified'] = jp_sitemap_datetime( $max[ JP_IMAGE_SITEMAP_TYPE ]['lastmod'] ); - } else { - $image['filename'] = jp_sitemap_filename( - JP_IMAGE_SITEMAP_INDEX_TYPE, - $max[ JP_IMAGE_SITEMAP_INDEX_TYPE ]['number'] - ); - $image['last_modified'] = jp_sitemap_datetime( $max[ JP_IMAGE_SITEMAP_INDEX_TYPE ]['lastmod'] ); - } - - $buffer->append( - array( - 'sitemap' => array( - 'loc' => $this->finder->construct_sitemap_url( $image['filename'] ), - 'lastmod' => $image['last_modified'], - ), - ) - ); - } - - if ( 0 < $max[ JP_VIDEO_SITEMAP_TYPE ]['number'] ) { - if ( 1 === $max[ JP_VIDEO_SITEMAP_TYPE ]['number'] ) { - $video['filename'] = jp_sitemap_filename( JP_VIDEO_SITEMAP_TYPE, 1 ); - $video['last_modified'] = jp_sitemap_datetime( $max[ JP_VIDEO_SITEMAP_TYPE ]['lastmod'] ); - } else { - $video['filename'] = jp_sitemap_filename( - JP_VIDEO_SITEMAP_INDEX_TYPE, - $max[ JP_VIDEO_SITEMAP_INDEX_TYPE ]['number'] - ); - $video['last_modified'] = jp_sitemap_datetime( $max[ JP_VIDEO_SITEMAP_INDEX_TYPE ]['lastmod'] ); - } - - $buffer->append( - array( - 'sitemap' => array( - 'loc' => $this->finder->construct_sitemap_url( $video['filename'] ), - 'lastmod' => $video['last_modified'], - ), - ) - ); - } - - $this->librarian->store_sitemap_data( - 0, - JP_MASTER_SITEMAP_TYPE, - $buffer->contents(), - '' - ); - } - - /** - * Build and store a single page sitemap. Returns false if no sitemap is built. - * - * Side effect: Create/update a sitemap row. - * - * @access private - * @since 4.8.0 - * - * @param int $number The number of the current sitemap. - * @param int $from_id The greatest lower bound of the IDs of the posts to be included. - * - * @return bool|array @args { - * @type int $last_id The ID of the last item to be successfully added to the buffer. - * @type bool $any_left 'true' if there are items which haven't been saved to a sitemap, 'false' otherwise. - * @type string $last_modified The most recent timestamp to appear on the sitemap. - * } - */ - public function build_one_page_sitemap( $number, $from_id ) { - $last_post_id = $from_id; - $any_posts_left = true; - - if ( $this->logger ) { - $debug_name = jp_sitemap_filename( JP_PAGE_SITEMAP_TYPE, $number ); - $this->logger->report( "-- Building $debug_name" ); - } - - $buffer = new Jetpack_Sitemap_Buffer_Page( - JP_SITEMAP_MAX_ITEMS, - JP_SITEMAP_MAX_BYTES - ); - - // Add entry for the main page (only if we're at the first one) and it isn't already going to be included as a page. - if ( 1 === $number && 'page' !== get_option( 'show_on_front' ) ) { - $item_array = array( - 'url' => array( - 'loc' => home_url(), - ), - ); - - /** - * Filter associative array with data to build <url> node - * and its descendants for site home. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param array $blog_home Data to build parent and children nodes for site home. - */ - $item_array = apply_filters( 'jetpack_sitemap_url_home', $item_array ); - - $buffer->append( $item_array ); - } - - // Add as many items to the buffer as possible. - while ( $last_post_id >= 0 && false === $buffer->is_full() ) { - $posts = $this->librarian->query_posts_after_id( - $last_post_id, - JP_SITEMAP_BATCH_SIZE - ); - - if ( null == $posts ) { // WPCS: loose comparison ok. - $any_posts_left = false; - break; - } - - foreach ( $posts as $post ) { - $current_item = $this->post_to_sitemap_item( $post ); - - if ( true === $buffer->append( $current_item['xml'] ) ) { - $last_post_id = $post->ID; - $buffer->view_time( $current_item['last_modified'] ); - } else { - break; - } - } - } - - // Handle other page sitemap URLs. - if ( false === $any_posts_left || $last_post_id < 0 ) { - // Negative IDs are used to track URL indexes. - $last_post_id = min( 0, $last_post_id ); - $any_posts_left = true; // Reinitialize. - - /** - * Filter other page sitemap URLs. - * - * @module sitemaps - * - * @since 6.1.0 - * - * @param array $urls An array of other URLs. - */ - $other_urls = apply_filters( 'jetpack_page_sitemap_other_urls', array() ); - - if ( $other_urls ) { // Start with index [1]. - $other_urls = array_values( $other_urls ); - array_unshift( $other_urls, $other_urls[0] ); - unset( $other_urls[0] ); - } - - // Add as many items to the buffer as possible. - while ( false === $buffer->is_full() ) { - $last_post_id_index = abs( $last_post_id ); - $start_from_post_id_index = $last_post_id_index ? $last_post_id_index + 1 : 0; - $urls = array_slice( - $other_urls, - $start_from_post_id_index, - JP_SITEMAP_BATCH_SIZE, - true - ); - - if ( ! $urls ) { - $any_posts_left = false; - break; - } - - foreach ( $urls as $index => $url ) { - if ( ! is_array( $url ) ) { - $url = array( 'loc' => $url ); - } - $item = array( 'xml' => compact( 'url' ) ); - - if ( true === $buffer->append( $item['xml'] ) ) { - $last_post_id = -$index; - } else { - break; - } - } - } - } - - // If no items were added, return false. - if ( true === $buffer->is_empty() ) { - return false; - } - - /** - * Filter sitemap before rendering it as XML. - * - * @module sitemaps - * - * @since 3.9.0 - * @since 5.3.0 returns an element of DOMDocument type instead of SimpleXMLElement - * - * @param DOMDocument $doc Data tree for sitemap. - * @param string $last_modified Date of last modification. - */ - $tree = apply_filters( - 'jetpack_print_sitemap', - $buffer->get_document(), - $buffer->last_modified() - ); - - // Store the buffer as the content of a sitemap row. - $this->librarian->store_sitemap_data( - $number, - JP_PAGE_SITEMAP_TYPE, - $buffer->contents(), - $buffer->last_modified() - ); - - /* - * Now report back with the ID of the last post ID to be - * successfully added and whether there are any posts left. - */ - return array( - 'last_id' => $last_post_id, - 'any_left' => $any_posts_left, - 'last_modified' => $buffer->last_modified(), - ); - } - - /** - * Build and store a single image sitemap. Returns false if no sitemap is built. - * - * Side effect: Create/update an image sitemap row. - * - * @access private - * @since 4.8.0 - * - * @param int $number The number of the current sitemap. - * @param int $from_id The greatest lower bound of the IDs of the posts to be included. - * - * @return bool|array @args { - * @type int $last_id The ID of the last item to be successfully added to the buffer. - * @type bool $any_left 'true' if there are items which haven't been saved to a sitemap, 'false' otherwise. - * @type string $last_modified The most recent timestamp to appear on the sitemap. - * } - */ - public function build_one_image_sitemap( $number, $from_id ) { - $last_post_id = $from_id; - $any_posts_left = true; - - if ( $this->logger ) { - $debug_name = jp_sitemap_filename( JP_IMAGE_SITEMAP_TYPE, $number ); - $this->logger->report( "-- Building $debug_name" ); - } - - $buffer = new Jetpack_Sitemap_Buffer_Image( - JP_SITEMAP_MAX_ITEMS, - JP_SITEMAP_MAX_BYTES - ); - - // Add as many items to the buffer as possible. - while ( false === $buffer->is_full() ) { - $posts = $this->librarian->query_images_after_id( - $last_post_id, - JP_SITEMAP_BATCH_SIZE - ); - - if ( null == $posts ) { // WPCS: loose comparison ok. - $any_posts_left = false; - break; - } - - foreach ( $posts as $post ) { - $current_item = $this->image_post_to_sitemap_item( $post ); - - if ( true === $buffer->append( $current_item['xml'] ) ) { - $last_post_id = $post->ID; - $buffer->view_time( $current_item['last_modified'] ); - } else { - break; - } - } - } - - // If no items were added, return false. - if ( true === $buffer->is_empty() ) { - return false; - } - - // Store the buffer as the content of a jp_sitemap post. - $this->librarian->store_sitemap_data( - $number, - JP_IMAGE_SITEMAP_TYPE, - $buffer->contents(), - $buffer->last_modified() - ); - - /* - * Now report back with the ID of the last post to be - * successfully added and whether there are any posts left. - */ - return array( - 'last_id' => $last_post_id, - 'any_left' => $any_posts_left, - 'last_modified' => $buffer->last_modified(), - ); - } - - /** - * Build and store a single video sitemap. Returns false if no sitemap is built. - * - * Side effect: Create/update an video sitemap row. - * - * @access private - * @since 4.8.0 - * - * @param int $number The number of the current sitemap. - * @param int $from_id The greatest lower bound of the IDs of the posts to be included. - * - * @return bool|array @args { - * @type int $last_id The ID of the last item to be successfully added to the buffer. - * @type bool $any_left 'true' if there are items which haven't been saved to a sitemap, 'false' otherwise. - * @type string $last_modified The most recent timestamp to appear on the sitemap. - * } - */ - public function build_one_video_sitemap( $number, $from_id ) { - $last_post_id = $from_id; - $any_posts_left = true; - - if ( $this->logger ) { - $debug_name = jp_sitemap_filename( JP_VIDEO_SITEMAP_TYPE, $number ); - $this->logger->report( "-- Building $debug_name" ); - } - - $buffer = new Jetpack_Sitemap_Buffer_Video( - JP_SITEMAP_MAX_ITEMS, - JP_SITEMAP_MAX_BYTES - ); - - // Add as many items to the buffer as possible. - while ( false === $buffer->is_full() ) { - $posts = $this->librarian->query_videos_after_id( - $last_post_id, - JP_SITEMAP_BATCH_SIZE - ); - - if ( null == $posts ) { // WPCS: loose comparison ok. - $any_posts_left = false; - break; - } - - foreach ( $posts as $post ) { - $current_item = $this->video_post_to_sitemap_item( $post ); - - if ( true === $buffer->append( $current_item['xml'] ) ) { - $last_post_id = $post->ID; - $buffer->view_time( $current_item['last_modified'] ); - } else { - break; - } - } - } - - // If no items were added, return false. - if ( true === $buffer->is_empty() ) { - return false; - } - - if ( false === $buffer->is_empty() ) { - $this->librarian->store_sitemap_data( - $number, - JP_VIDEO_SITEMAP_TYPE, - $buffer->contents(), - $buffer->last_modified() - ); - } - - /* - * Now report back with the ID of the last post to be - * successfully added and whether there are any posts left. - */ - return array( - 'last_id' => $last_post_id, - 'any_left' => $any_posts_left, - 'last_modified' => $buffer->last_modified(), - ); - } - - /** - * Build and store a single page sitemap index. Return false if no index is built. - * - * Side effect: Create/update a sitemap index row. - * - * @access private - * @since 4.8.0 - * - * @param int $number The number of the current sitemap index. - * @param int $from_id The greatest lower bound of the IDs of the sitemaps to be included. - * @param string $datetime Datetime of previous sitemap in 'YYYY-MM-DD hh:mm:ss' format. - * @param string $index_type Sitemap index type. - * - * @return bool|array @args { - * @type int $last_id The ID of the last item to be successfully added to the buffer. - * @type bool $any_left 'true' if there are items which haven't been saved to a sitemap, 'false' otherwise. - * @type string $last_modified The most recent timestamp to appear on the sitemap. - * } - */ - private function build_one_sitemap_index( $number, $from_id, $datetime, $index_type ) { - $last_sitemap_id = $from_id; - $any_sitemaps_left = true; - - // Check the datetime format. - $datetime = jp_sitemap_datetime( $datetime ); - - $sitemap_type = jp_sitemap_child_type_of( $index_type ); - - if ( $this->logger ) { - $index_debug_name = jp_sitemap_filename( $index_type, $number ); - $this->logger->report( "-- Building $index_debug_name" ); - } - - $buffer = new Jetpack_Sitemap_Buffer_Master( - JP_SITEMAP_MAX_ITEMS, - JP_SITEMAP_MAX_BYTES, - $datetime - ); - - // Add pointer to the previous sitemap index (unless we're at the first one). - if ( 1 !== $number ) { - $i = $number - 1; - $prev_index_url = $this->finder->construct_sitemap_url( - jp_sitemap_filename( $index_type, $i ) - ); - - $item_array = array( - 'sitemap' => array( - 'loc' => $prev_index_url, - 'lastmod' => $datetime, - ), - ); - - $buffer->append( $item_array ); - } - - // Add as many items to the buffer as possible. - while ( false === $buffer->is_full() ) { - // Retrieve a batch of posts (in order). - $posts = $this->librarian->query_sitemaps_after_id( - $sitemap_type, - $last_sitemap_id, - JP_SITEMAP_BATCH_SIZE - ); - - // If there were no posts to get, make a note. - if ( null == $posts ) { // WPCS: loose comparison ok. - $any_sitemaps_left = false; - break; - } - - // Otherwise, loop through each post in the batch. - foreach ( $posts as $post ) { - // Generate the sitemap XML for the post. - $current_item = $this->sitemap_row_to_index_item( (array) $post ); - - // Try adding this item to the buffer. - if ( true === $buffer->append( $current_item['xml'] ) ) { - $last_sitemap_id = $post['ID']; - $buffer->view_time( $current_item['last_modified'] ); - } else { - // Otherwise stop looping through posts. - break; - } - } - } - - // If no items were added, return false. - if ( true === $buffer->is_empty() ) { - return false; - } - - $this->librarian->store_sitemap_data( - $number, - $index_type, - $buffer->contents(), - $buffer->last_modified() - ); - - /* - * Now report back with the ID of the last sitemap post ID to - * be successfully added, whether there are any sitemap posts - * left, and the most recent modification time seen. - */ - return array( - 'last_id' => $last_sitemap_id, - 'any_left' => $any_sitemaps_left, - 'last_modified' => $buffer->last_modified(), - ); - } - - /** - * Construct the sitemap index url entry for a sitemap row. - * - * @link http://www.sitemaps.org/protocol.html#sitemapIndex_sitemap - * - * @access private - * @since 4.8.0 - * - * @param array $row The sitemap data to be processed. - * - * @return string An XML fragment representing the post URL. - */ - private function sitemap_row_to_index_item( $row ) { - $url = $this->finder->construct_sitemap_url( $row['post_title'] ); - - $item_array = array( - 'sitemap' => array( - 'loc' => $url, - 'lastmod' => jp_sitemap_datetime( $row['post_date'] ), - ), - ); - - return array( - 'xml' => $item_array, - 'last_modified' => $row['post_date'], - ); - } - - - /** - * This is served instead of a 404 when the master sitemap is requested - * but not yet generated. - * - * @access public - * @since 6.7.0 - * - * @return string The empty sitemap xml. - */ - public function empty_sitemap_xml() { - $empty_sitemap = new Jetpack_Sitemap_Buffer_Empty(); - return $empty_sitemap->contents(); - } - - /** - * Build and return the news sitemap xml. Note that the result of this - * function is cached in the transient 'jetpack_news_sitemap_xml'. - * - * @access public - * @since 4.8.0 - * - * @return string The news sitemap xml. - */ - public function news_sitemap_xml() { - $the_stored_news_sitemap = get_transient( 'jetpack_news_sitemap_xml' ); - - if ( false === $the_stored_news_sitemap ) { - - if ( $this->logger ) { - $this->logger->report( 'Beginning news sitemap generation.' ); - } - - /** - * Filter limit of entries to include in news sitemap. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param int $count Number of entries to include in news sitemap. - */ - $item_limit = apply_filters( - 'jetpack_sitemap_news_sitemap_count', - JP_NEWS_SITEMAP_MAX_ITEMS - ); - - $buffer = new Jetpack_Sitemap_Buffer_News( - min( $item_limit, JP_NEWS_SITEMAP_MAX_ITEMS ), - JP_SITEMAP_MAX_BYTES - ); - - $posts = $this->librarian->query_most_recent_posts( JP_NEWS_SITEMAP_MAX_ITEMS ); - - foreach ( $posts as $post ) { - $current_item = $this->post_to_news_sitemap_item( $post ); - - if ( false === $buffer->append( $current_item['xml'] ) ) { - break; - } - } - - if ( $this->logger ) { - $this->logger->time( 'End news sitemap generation.' ); - } - - $the_stored_news_sitemap = $buffer->contents(); - - set_transient( - 'jetpack_news_sitemap_xml', - $the_stored_news_sitemap, - JP_NEWS_SITEMAP_INTERVAL - ); - } // End if. - - return $the_stored_news_sitemap; - } - - /** - * Construct the sitemap url entry for a WP_Post. - * - * @link http://www.sitemaps.org/protocol.html#urldef - * @access private - * @since 4.8.0 - * - * @param WP_Post $post The post to be processed. - * - * @return array - * @type array $xml An XML fragment representing the post URL. - * @type string $last_modified Date post was last modified. - */ - private function post_to_sitemap_item( $post ) { - - /** - * Filter condition to allow skipping specific posts in sitemap. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param bool $skip Current boolean. False by default, so no post is skipped. - * @param object $post Current post in the form of a $wpdb result object. Not WP_Post. - */ - if ( true === apply_filters( 'jetpack_sitemap_skip_post', false, $post ) ) { - return array( - 'xml' => null, - 'last_modified' => null, - ); - } - - $url = esc_url( get_permalink( $post ) ); - - /* - * Spec requires the URL to be <=2048 bytes. - * In practice this constraint is unlikely to be violated. - */ - if ( 2048 < strlen( $url ) ) { - $url = home_url() . '/?p=' . $post->ID; - } - - $last_modified = $post->post_modified_gmt; - - // Check for more recent comments. - // Note that 'Y-m-d h:i:s' strings sort lexicographically. - if ( 0 < $post->comment_count ) { - $last_modified = max( - $last_modified, - $this->librarian->query_latest_approved_comment_time_on_post( $post->ID ) - ); - } - - $item_array = array( - 'url' => array( - 'loc' => $url, - 'lastmod' => jp_sitemap_datetime( $last_modified ), - ), - ); - - /** - * Filter sitemap URL item before rendering it as XML. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param array $tree Associative array representing sitemap URL element. - * @param int $post_id ID of the post being processed. - */ - $item_array = apply_filters( 'jetpack_sitemap_url', $item_array, $post->ID ); - - return array( - 'xml' => $item_array, - 'last_modified' => $last_modified, - ); - } - - /** - * Construct the image sitemap url entry for a WP_Post of image type. - * - * @link http://www.sitemaps.org/protocol.html#urldef - * - * @access private - * @since 4.8.0 - * - * @param WP_Post $post The image post to be processed. - * - * @return array - * @type array $xml An XML fragment representing the post URL. - * @type string $last_modified Date post was last modified. - */ - private function image_post_to_sitemap_item( $post ) { - - /** - * Filter condition to allow skipping specific image posts in the sitemap. - * - * @module sitemaps - * - * @since 4.8.0 - * - * @param bool $skip Current boolean. False by default, so no post is skipped. - * @param WP_POST $post Current post object. - */ - if ( apply_filters( 'jetpack_sitemap_image_skip_post', false, $post ) ) { - return array( - 'xml' => null, - 'last_modified' => null, - ); - } - - $url = wp_get_attachment_url( $post->ID ); - - // Do not include the image if the attached parent is not published. - // Unattached will be published. Otherwise, will inherit parent status. - if ( 'publish' !== get_post_status( $post ) ) { - return array( - 'xml' => null, - 'last_modified' => null, - ); - } - - $parent_url = get_permalink( get_post( $post->post_parent ) ); - if ( '' == $parent_url ) { // WPCS: loose comparison ok. - $parent_url = get_permalink( $post ); - } - - $item_array = array( - 'url' => array( - 'loc' => $parent_url, - 'lastmod' => jp_sitemap_datetime( $post->post_modified_gmt ), - 'image:image' => array( - 'image:loc' => $url, - ), - ), - ); - - $item_array['url']['image:image']['image:title'] = $post->post_title; - $item_array['url']['image:image']['image:caption'] = $post->post_excerpt; - - /** - * Filter associative array with data to build <url> node - * and its descendants for current post in image sitemap. - * - * @module sitemaps - * - * @since 4.8.0 - * - * @param array $item_array Data to build parent and children nodes for current post. - * @param int $post_id Current image post ID. - */ - $item_array = apply_filters( - 'jetpack_sitemap_image_sitemap_item', - $item_array, - $post->ID - ); - - return array( - 'xml' => $item_array, - 'last_modified' => $post->post_modified_gmt, - ); - } - - /** - * Construct the video sitemap url entry for a WP_Post of video type. - * - * @link http://www.sitemaps.org/protocol.html#urldef - * @link https://developers.google.com/webmasters/videosearch/sitemaps - * - * @access private - * @since 4.8.0 - * - * @param WP_Post $post The video post to be processed. - * - * @return array - * @type array $xml An XML fragment representing the post URL. - * @type string $last_modified Date post was last modified. - */ - private function video_post_to_sitemap_item( $post ) { - - /** - * Filter condition to allow skipping specific image posts in the sitemap. - * - * @module sitemaps - * - * @since 4.8.0 - * - * @param bool $skip Current boolean. False by default, so no post is skipped. - * @param WP_POST $post Current post object. - */ - if ( apply_filters( 'jetpack_sitemap_video_skip_post', false, $post ) ) { - return array( - 'xml' => null, - 'last_modified' => null, - ); - } - - // Do not include the video if the attached parent is not published. - // Unattached will be published. Otherwise, will inherit parent status. - if ( 'publish' !== get_post_status( $post ) ) { - return array( - 'xml' => null, - 'last_modified' => null, - ); - } - - $parent_url = esc_url( get_permalink( get_post( $post->post_parent ) ) ); - if ( '' == $parent_url ) { // WPCS: loose comparison ok. - $parent_url = esc_url( get_permalink( $post ) ); - } - - // Prepare the content like get_the_content_feed(). - $content = $post->post_content; - /** This filter is already documented in core/wp-includes/post-template.php */ - $content = apply_filters( 'the_content', $content ); - - /** This filter is already documented in core/wp-includes/feed.php */ - $content = apply_filters( 'the_content_feed', $content, 'rss2' ); - - // Include thumbnails for VideoPress videos, use blank image for others - if ( 'complete' === get_post_meta( $post->ID, 'videopress_status', true ) && has_post_thumbnail( $post ) ) { - $video_thumbnail_url = get_the_post_thumbnail_url( $post ); - } else { - /** - * Filter the thumbnail image used in the video sitemap for non-VideoPress videos. - * - * @since 7.2.0 - * - * @param string $str Image URL. - */ - $video_thumbnail_url = apply_filters( 'jetpack_video_sitemap_default_thumbnail', 'https://s0.wp.com/i/blank.jpg' ); - } - - $item_array = array( - 'url' => array( - 'loc' => $parent_url, - 'lastmod' => jp_sitemap_datetime( $post->post_modified_gmt ), - 'video:video' => array( - /** This filter is already documented in core/wp-includes/feed.php */ - 'video:title' => apply_filters( 'the_title_rss', $post->post_title ), - 'video:thumbnail_loc' => esc_url( $video_thumbnail_url ), - 'video:description' => $content, - 'video:content_loc' => esc_url( wp_get_attachment_url( $post->ID ) ), - ), - ), - ); - - // TODO: Integrate with VideoPress here. - // cf. video:player_loc tag in video sitemap spec. - - /** - * Filter associative array with data to build <url> node - * and its descendants for current post in video sitemap. - * - * @module sitemaps - * - * @since 4.8.0 - * - * @param array $item_array Data to build parent and children nodes for current post. - * @param int $post_id Current video post ID. - */ - $item_array = apply_filters( - 'jetpack_sitemap_video_sitemap_item', - $item_array, - $post->ID - ); - - return array( - 'xml' => $item_array, - 'last_modified' => $post->post_modified_gmt, - ); - } - - /** - * Construct the news sitemap url entry for a WP_Post. - * - * @link http://www.sitemaps.org/protocol.html#urldef - * - * @access private - * @since 4.8.0 - * - * @param WP_Post $post The post to be processed. - * - * @return string An XML fragment representing the post URL. - */ - private function post_to_news_sitemap_item( $post ) { - - /** - * Filter condition to allow skipping specific posts in news sitemap. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param bool $skip Current boolean. False by default, so no post is skipped. - * @param WP_POST $post Current post object. - */ - if ( apply_filters( 'jetpack_sitemap_news_skip_post', false, $post ) ) { - return array( - 'xml' => null, - ); - } - - $url = get_permalink( $post ); - - /* - * Spec requires the URL to be <=2048 bytes. - * In practice this constraint is unlikely to be violated. - */ - if ( 2048 < strlen( $url ) ) { - $url = home_url() . '/?p=' . $post->ID; - } - - /* - * Trim the locale to an ISO 639 language code as required by Google. - * Special cases are zh-cn (Simplified Chinese) and zh-tw (Traditional Chinese). - * @link http://www.loc.gov/standards/iso639-2/php/code_list.php - */ - $language = strtolower( get_locale() ); - - if ( in_array( $language, array( 'zh_tw', 'zh_cn' ), true ) ) { - $language = str_replace( '_', '-', $language ); - } else { - $language = preg_replace( '/(_.*)$/i', '', $language ); - } - - $item_array = array( - 'url' => array( - 'loc' => $url, - 'lastmod' => jp_sitemap_datetime( $post->post_modified_gmt ), - 'news:news' => array( - 'news:publication' => array( - 'news:name' => html_entity_decode( get_bloginfo( 'name' ) ), - 'news:language' => $language, - ), - /** This filter is already documented in core/wp-includes/feed.php */ - 'news:title' => apply_filters( 'the_title_rss', $post->post_title ), - 'news:publication_date' => jp_sitemap_datetime( $post->post_date_gmt ), - 'news:genres' => 'Blog', - ), - ), - ); - - /** - * Filter associative array with data to build <url> node - * and its descendants for current post in news sitemap. - * - * @module sitemaps - * - * @since 3.9.0 - * - * @param array $item_array Data to build parent and children nodes for current post. - * @param int $post_id Current post ID. - */ - $item_array = apply_filters( - 'jetpack_sitemap_news_sitemap_item', - $item_array, - $post->ID - ); - - return array( - 'xml' => $item_array, - ); - } -} |