mirror of
https://github.com/WordPress/WordPress.git
synced 2025-01-05 16:08:12 +01:00
ee1ba7f2f3
Exporter overhaul: * Add author information to export * Greater usage of slug identifiers * Don't export auto-drafts, spam comments, or edit lock/last meta keys * Inline documentation improvements * Remove filtering for now (@todo) * Bump WXR version to 1.1, but remain back compat in the importer Importer overhaul (http://plugins.trac.wordpress.org/changeset/304249): * Use an XML parser where available (SimpleXML, XML Parser) * Proper import support for navigation menus * Many bug fixes, specifically improvements to category and custom taxonomy handling * Better author/user mapping Fixes #5447 #5460 #7400 #7973 #8471 #9237 #10319 #11118 #11144 #11354 #11574 #12685 #13364 #13394 #13453 #13454 #13627 #14306 #14442 #14524 #14750 #15055 #15091 #15108. See #15197. git-svn-id: http://svn.automattic.com/wordpress/trunk@15961 1a063a9b-81f0-0310-95a4-ce76da25c4cd
367 lines
13 KiB
PHP
367 lines
13 KiB
PHP
<?php
|
|
/**
|
|
* WordPress Export Administration API
|
|
*
|
|
* @package WordPress
|
|
* @subpackage Administration
|
|
*/
|
|
|
|
/**
 * Version number for the export format.
 *
 * Bump this when something changes that might affect compatibility.
 *
 * The value is written into the export as the wp:wxr_version element and is
 * embedded in the "excerpt" and "wp" XML namespace URLs of the rss element.
 *
 * @since 2.5.0
 */
|
|
define( 'WXR_VERSION', '1.1' );
|
|
|
|
/**
 * Generates the WXR export file for download.
 *
 * Fires the 'export_wp' action, sends the file-download headers, then collects
 * the post ID snapshot and the category, tag and custom taxonomy term lists
 * that are written out further down.
 *
 * @since 2.1.0
 *
 * @param array $args Filters defining what should be included in the export.
 *                    Currently unused by the export.
 */
function export_wp( $args = array() ) {
	global $wpdb, $post;

	do_action( 'export_wp' );

	// Download name: sanitized site name (when not empty), "wordpress", and today's date.
	$sitename = sanitize_key( get_bloginfo( 'name' ) );
	if ( ! empty( $sitename ) )
		$sitename .= '.';
	$filename = $sitename . 'wordpress.' . date( 'Y-m-d' ) . '.xml';

	header( 'Content-Description: File Transfer' );
	header( 'Content-Disposition: attachment; filename=' . $filename );
	header( 'Content-Type: text/xml; charset=' . get_option( 'blog_charset' ), true );

	// grab a snapshot of post IDs, just in case it changes during the export
	$post_ids = $wpdb->get_col( "SELECT ID FROM $wpdb->posts WHERE post_type != 'revision' AND post_status != 'auto-draft' ORDER BY post_date_gmt ASC" );

	$categories = (array) get_categories( array( 'get' => 'all' ) );
	$tags = (array) get_tags( array( 'get' => 'all' ) );

	$custom_taxonomies = get_taxonomies( array( '_builtin' => false ) );
	$taxonomy_terms = (array) get_terms( $custom_taxonomies, array( 'get' => 'all' ) );

	// put categories in order with no child going before its parent
	$known_cats = array();
	foreach ( $categories as $cat )
		$known_cats[$cat->term_id] = true;

	$cats = array();
	$stalled = 0; // consecutive categories pushed back without any being placed
	while ( $cat = array_shift( $categories ) ) {
		// A parent that was never fetched, or a full pass over the queue without
		// progress (parents pointing at each other), would keep this loop running
		// forever. Such a category is exported as top-level instead.
		if ( $cat->parent != 0 && ( ! isset( $known_cats[$cat->parent] ) || $stalled > count( $categories ) ) ) {
			$cat = clone $cat; // leave the object handed back by get_categories() untouched
			$cat->parent = 0;
		}

		if ( $cat->parent == 0 || isset( $cats[$cat->parent] ) ) {
			$cats[$cat->term_id] = $cat;
			$stalled = 0;
		} else {
			$categories[] = $cat;
			$stalled++;
		}
	}

	// put terms in order with no child going before its parent
	$known_terms = array();
	foreach ( $taxonomy_terms as $t )
		$known_terms[$t->term_id] = true;

	$terms = array();
	$stalled = 0; // consecutive terms pushed back without any being placed
	while ( $t = array_shift( $taxonomy_terms ) ) {
		// Same guard as for categories: never wait on a parent that cannot show up.
		if ( $t->parent != 0 && ( ! isset( $known_terms[$t->parent] ) || $stalled > count( $taxonomy_terms ) ) ) {
			$t = clone $t; // leave the object handed back by get_terms() untouched
			$t->parent = 0;
		}

		if ( $t->parent == 0 || isset( $terms[$t->parent] ) ) {
			$terms[$t->term_id] = $t;
			$stalled = 0;
		} else {
			$taxonomy_terms[] = $t;
			$stalled++;
		}
	}
|
|
|
|
/**
 * Wrap given string in XML CDATA tag.
 *
 * Input that seems_utf8() rejects is converted with utf8_encode() first.
 * Every "]]>" inside the string is split across two CDATA sections so that it
 * cannot close the section early; the wrapped text itself is left unchanged.
 *
 * @since 2.1.0
 *
 * @param string $str String to wrap in XML CDATA tag.
 * @return string The string enclosed in one or more CDATA sections.
 */
function wxr_cdata( $str ) {
	if ( seems_utf8( $str ) == false )
		$str = utf8_encode( $str );

	// "]]>" is the CDATA terminator: end the section after "]]" and reopen it
	// before ">" so the sequence survives without terminating the data.
	$str = '<![CDATA[' . str_replace( ']]>', ']]]]><![CDATA[>', $str ) . ']]>';

	return $str;
}
|
|
|
|
/**
 * Return the URL of the site.
 *
 * On multisite this is the network home URL; otherwise it is the blog URL as
 * reported by get_bloginfo_rss( 'url' ).
 *
 * @since 2.5.0
 *
 * @return string Site URL.
 */
function wxr_site_url() {
	return is_multisite() ? network_home_url() : get_bloginfo_rss( 'url' );
}
|
|
|
|
/**
 * Echo a wp:cat_name element holding the category's name as CDATA.
 *
 * Nothing is printed when the category has no name.
 *
 * @since 2.1.0
 *
 * @param object $category Category Object
 */
function wxr_cat_name( $category ) {
	if ( ! empty( $category->name ) ) {
		$name = wxr_cdata( $category->name );
		echo '<wp:cat_name>' . $name . '</wp:cat_name>';
	}
}
|
|
|
|
/**
 * Echo a wp:category_description element holding the category's description as CDATA.
 *
 * Nothing is printed when the category has no description.
 *
 * @since 2.1.0
 *
 * @param object $category Category Object
 */
function wxr_category_description( $category ) {
	if ( ! empty( $category->description ) ) {
		$description = wxr_cdata( $category->description );
		echo '<wp:category_description>' . $description . '</wp:category_description>';
	}
}
|
|
|
|
/**
 * Echo a wp:tag_name element holding the tag's name as CDATA.
 *
 * Nothing is printed when the tag has no name.
 *
 * @since 2.3.0
 *
 * @param object $tag Tag Object
 */
function wxr_tag_name( $tag ) {
	if ( ! empty( $tag->name ) ) {
		$name = wxr_cdata( $tag->name );
		echo '<wp:tag_name>' . $name . '</wp:tag_name>';
	}
}
|
|
|
|
/**
 * Echo a wp:tag_description element holding the tag's description as CDATA.
 *
 * Nothing is printed when the tag has no description.
 *
 * @since 2.3.0
 *
 * @param object $tag Tag Object
 */
function wxr_tag_description( $tag ) {
	if ( ! empty( $tag->description ) ) {
		$description = wxr_cdata( $tag->description );
		echo '<wp:tag_description>' . $description . '</wp:tag_description>';
	}
}
|
|
|
|
/**
 * Echo a wp:term_name element holding the term's name as CDATA.
 *
 * Nothing is printed when the term has no name.
 *
 * @since 2.9.0
 *
 * @param object $term Term Object
 */
function wxr_term_name( $term ) {
	if ( ! empty( $term->name ) ) {
		$name = wxr_cdata( $term->name );
		echo '<wp:term_name>' . $name . '</wp:term_name>';
	}
}
|
|
|
|
/**
 * Echo a wp:term_description element holding the term's description as CDATA.
 *
 * Nothing is printed when the term has no description.
 *
 * @since 2.9.0
 *
 * @param object $term Term Object
 */
function wxr_term_description( $term ) {
	if ( ! empty( $term->description ) ) {
		$description = wxr_cdata( $term->description );
		echo '<wp:term_description>' . $description . '</wp:term_description>';
	}
}
|
|
|
|
/**
 * Output list of authors with posts
 *
 * Echoes one wp:author element per distinct post_author found in the posts
 * table, ignoring auto-drafts (which the export leaves out as well). Authors
 * whose user record cannot be loaded are skipped, and every text field is
 * wrapped in CDATA so characters such as "&" cannot break the XML.
 *
 * @since 3.1.0
 */
function wxr_authors_list() {
	global $wpdb;

	$results = $wpdb->get_results( "SELECT DISTINCT post_author FROM $wpdb->posts WHERE post_status != 'auto-draft'" );

	foreach ( (array) $results as $result ) {
		$author = get_userdata( $result->post_author );

		// No user record for this ID (e.g. the account was deleted): there is
		// nothing to describe, so do not emit an empty author element.
		if ( ! $author )
			continue;

		echo "\t<wp:author>";
		echo '<wp:author_login>' . wxr_cdata( $author->user_login ) . '</wp:author_login>';
		echo '<wp:author_email>' . wxr_cdata( $author->user_email ) . '</wp:author_email>';
		echo '<wp:author_display_name>' . wxr_cdata( $author->display_name ) . '</wp:author_display_name>';
		echo '<wp:author_first_name>' . wxr_cdata( $author->user_firstname ) . '</wp:author_first_name>';
		echo '<wp:author_last_name>' . wxr_cdata( $author->user_lastname ) . '</wp:author_last_name>';
		echo "</wp:author>\n";
	}
}
|
|
|
|
/**
 * Output all navigation menu terms
 *
 * Echoes one wp:term element (taxonomy "nav_menu") for every menu returned by
 * wp_get_nav_menus(). Prints nothing when that call yields no menus.
 *
 * @since 3.1.0
 */
function wxr_nav_menu_terms() {
	$menus = wp_get_nav_menus();

	if ( is_array( $menus ) && ! empty( $menus ) ) {
		foreach ( $menus as $menu ) {
			echo "\t" . '<wp:term><wp:term_id>' . $menu->term_id . '</wp:term_id><wp:term_taxonomy>nav_menu</wp:term_taxonomy><wp:term_slug>' . $menu->slug . '</wp:term_slug>';
			wxr_term_name( $menu );
			echo '</wp:term>' . "\n";
		}
	}
}
|
|
|
|
/**
 * Output list of taxonomy terms, in XML tag format, associated with a post
 *
 * Works on the global $post: looks up the taxonomies of its post type and
 * echoes one category element per term attached to the post.
 *
 * @since 2.3.0
 */
function wxr_post_taxonomy() {
	global $post;

	$taxonomies = get_object_taxonomies( $post->post_type );

	if ( ! empty( $taxonomies ) ) {
		$object_terms = (array) wp_get_object_terms( $post->ID, $taxonomies );

		foreach ( $object_terms as $term ) {
			$element  = "\t\t" . '<category domain="' . $term->taxonomy . '" nicename="' . $term->slug . '">';
			$element .= wxr_cdata( $term->name );
			$element .= '</category>' . "\n";

			echo $element;
		}
	}
}
|
|
|
|
// XML declaration, using the charset reported by get_bloginfo().
echo '<?xml version="1.0" encoding="' . get_bloginfo( 'charset' ) . '" ?>' . "\n";

?>
<!-- This is a WordPress eXtended RSS file generated by WordPress as an export of your site. -->
<!-- It contains information about your site's posts, pages, comments, categories, and other content. -->
<!-- You may use this file to transfer that content from one site to another. -->
<!-- This file is not intended to serve as a complete backup of your site. -->

<!-- To import this information into a WordPress site follow these steps: -->
<!-- 1. Log in to that site as an administrator. -->
<!-- 2. Go to Tools: Import in the WordPress admin panel. -->
<!-- 3. Install the "WordPress" importer from the list. -->
<!-- 4. Activate & Run Importer. -->
<!-- 5. Upload this file using the form provided on that page. -->
<!-- 6. You will first be asked to map the authors in this export file to users -->
<!-- on the site. For each author, you may choose to map to an -->
<!-- existing user on the site or to create a new user. -->
<!-- 7. WordPress will then import each of the posts, pages, comments, categories, etc. -->
<!-- contained in this file into your site. -->

<?php the_generator( 'export' ); ?>
<rss version="2.0"
xmlns:excerpt="http://wordpress.org/export/<?php echo WXR_VERSION; ?>/excerpt/"
xmlns:content="http://purl.org/rss/1.0/modules/content/"
xmlns:wfw="http://wellformedweb.org/CommentAPI/"
xmlns:dc="http://purl.org/dc/elements/1.1/"
xmlns:wp="http://wordpress.org/export/<?php echo WXR_VERSION; ?>/"
>

<channel>
<title><?php bloginfo_rss( 'name' ); ?></title>
<link><?php bloginfo_rss( 'url' ); ?></link>
<description><?php bloginfo_rss( 'description' ); ?></description>
<pubDate><?php echo mysql2date( 'D, d M Y H:i:s +0000', get_lastpostmodified( 'GMT' ), false ); ?></pubDate>
<language><?php echo get_option( 'rss_language' ); ?></language>
<wp:wxr_version><?php echo WXR_VERSION; ?></wp:wxr_version>
<wp:base_site_url><?php echo wxr_site_url(); ?></wp:base_site_url>
<wp:base_blog_url><?php bloginfo_rss( 'url' ); ?></wp:base_blog_url>

<?php wxr_authors_list(); ?>

<?php
// Categories: parents were queued ahead of their children, so the parent slug can be looked up in $cats.
foreach ( $cats as $c ) {
	$parent_slug = $c->parent ? $cats[$c->parent]->slug : '';
?>
<wp:category><wp:term_id><?php echo $c->term_id; ?></wp:term_id><wp:category_nicename><?php echo $c->slug; ?></wp:category_nicename><wp:category_parent><?php echo $parent_slug; ?></wp:category_parent><?php wxr_cat_name( $c ); wxr_category_description( $c ); ?></wp:category>
<?php } ?>
<?php
// Tags carry no hierarchy, so they are written in the order they were fetched.
foreach ( $tags as $t ) {
?>
<wp:tag><wp:term_id><?php echo $t->term_id; ?></wp:term_id><wp:tag_slug><?php echo $t->slug; ?></wp:tag_slug><?php wxr_tag_name( $t ); wxr_tag_description( $t ); ?></wp:tag>
<?php } ?>
<?php
// Custom taxonomy terms: same parent lookup as for categories, against $terms.
foreach ( $terms as $t ) {
	$parent_slug = $t->parent ? $terms[$t->parent]->slug : '';
?>
<wp:term><wp:term_id><?php echo $t->term_id; ?></wp:term_id><wp:term_taxonomy><?php echo $t->taxonomy; ?></wp:term_taxonomy><wp:term_slug><?php echo $t->slug; ?></wp:term_slug><wp:term_parent><?php echo $parent_slug; ?></wp:term_parent><?php wxr_term_name( $t ); wxr_term_description( $t ); ?></wp:term>
<?php } ?>
<?php wxr_nav_menu_terms(); ?>

<?php do_action( 'rss2_head' ); ?>
|
|
|
|
<?php if ( $post_ids ) {
	global $wp_query;
	$wp_query->in_the_loop = true; // Fake being in the loop.

	// fetch 20 posts at a time rather than loading the entire table into memory
	while ( $next_posts = array_splice( $post_ids, 0, 20 ) ) {
		$where = "WHERE ID IN (" . join( ',', $next_posts ) . ")";
		$posts = $wpdb->get_results( "SELECT * FROM $wpdb->posts $where ORDER BY post_date_gmt ASC" );

		// Begin Loop
		foreach ( $posts as $post ) {
			setup_postdata( $post );
			$is_sticky = is_sticky( $post->ID ) ? 1 : 0;

			// One item element per post follows. Free-text values (password,
			// attachment URL, meta keys and values, comment author details and
			// content) go through wxr_cdata() so "&" or "<" in them cannot break
			// the XML. the_guid() prints the GUID itself, so it is called directly.
?>
<item>
<title><?php echo apply_filters( 'the_title_rss', $post->post_title ); ?></title>
<link><?php the_permalink_rss() ?></link>
<pubDate><?php echo mysql2date( 'D, d M Y H:i:s +0000', get_post_time( 'Y-m-d H:i:s', true ), false ); ?></pubDate>
<dc:creator><?php echo get_the_author_meta( 'login' ); ?></dc:creator>
<guid isPermaLink="false"><?php the_guid(); ?></guid>
<description></description>
<content:encoded><?php echo wxr_cdata( apply_filters( 'the_content_export', $post->post_content ) ); ?></content:encoded>
<excerpt:encoded><?php echo wxr_cdata( apply_filters( 'the_excerpt_export', $post->post_excerpt ) ); ?></excerpt:encoded>
<wp:post_id><?php echo $post->ID; ?></wp:post_id>
<wp:post_date><?php echo $post->post_date; ?></wp:post_date>
<wp:post_date_gmt><?php echo $post->post_date_gmt; ?></wp:post_date_gmt>
<wp:comment_status><?php echo $post->comment_status; ?></wp:comment_status>
<wp:ping_status><?php echo $post->ping_status; ?></wp:ping_status>
<wp:post_name><?php echo $post->post_name; ?></wp:post_name>
<wp:status><?php echo $post->post_status; ?></wp:status>
<wp:post_parent><?php echo $post->post_parent; ?></wp:post_parent>
<wp:menu_order><?php echo $post->menu_order; ?></wp:menu_order>
<wp:post_type><?php echo $post->post_type; ?></wp:post_type>
<wp:post_password><?php echo wxr_cdata( $post->post_password ); ?></wp:post_password>
<wp:is_sticky><?php echo $is_sticky; ?></wp:is_sticky>
<?php if ( $post->post_type == 'attachment' ) : ?>
<wp:attachment_url><?php echo wxr_cdata( wp_get_attachment_url( $post->ID ) ); ?></wp:attachment_url>
<?php endif; ?>
<?php wxr_post_taxonomy(); ?>
<?php $postmeta = $wpdb->get_results( $wpdb->prepare( "SELECT * FROM $wpdb->postmeta WHERE post_id = %d", $post->ID ) );
// The edit lock / last-editor bookkeeping keys are left out of the export.
if ( $postmeta ) : foreach( $postmeta as $meta ) : if ( $meta->meta_key != '_edit_lock' && $meta->meta_key != '_edit_last' ) : ?>
<wp:postmeta>
<wp:meta_key><?php echo wxr_cdata( $meta->meta_key ); ?></wp:meta_key>
<wp:meta_value><?php echo wxr_cdata( $meta->meta_value ); ?></wp:meta_value>
</wp:postmeta>
<?php endif; endforeach; endif; ?>
<?php $comments = $wpdb->get_results( $wpdb->prepare( "SELECT * FROM $wpdb->comments WHERE comment_post_ID = %d AND comment_approved <> 'spam'", $post->ID ) );
// Every comment on the post except those marked as spam.
if ( $comments ) : foreach ( $comments as $c ) : ?>
<wp:comment>
<wp:comment_id><?php echo $c->comment_ID; ?></wp:comment_id>
<wp:comment_author><?php echo wxr_cdata( $c->comment_author ); ?></wp:comment_author>
<wp:comment_author_email><?php echo wxr_cdata( $c->comment_author_email ); ?></wp:comment_author_email>
<wp:comment_author_url><?php echo esc_url_raw( $c->comment_author_url ); ?></wp:comment_author_url>
<wp:comment_author_IP><?php echo $c->comment_author_IP; ?></wp:comment_author_IP>
<wp:comment_date><?php echo $c->comment_date; ?></wp:comment_date>
<wp:comment_date_gmt><?php echo $c->comment_date_gmt; ?></wp:comment_date_gmt>
<wp:comment_content><?php echo wxr_cdata( $c->comment_content ) ?></wp:comment_content>
<wp:comment_approved><?php echo $c->comment_approved; ?></wp:comment_approved>
<wp:comment_type><?php echo $c->comment_type; ?></wp:comment_type>
<wp:comment_parent><?php echo $c->comment_parent; ?></wp:comment_parent>
<wp:comment_user_id><?php echo $c->user_id; ?></wp:comment_user_id>
</wp:comment>
<?php endforeach; endif; ?>
</item>
<?php
		}
	}
} ?>
</channel>
</rss>
<?php
}
|