2005-08-21 09:03:23 +02:00
< ? php
2005-09-11 00:45:32 +02:00
2005-08-21 09:03:23 +02:00
class RSS_Import {
var $posts = array ();
2005-11-16 00:39:32 +01:00
var $file ;
2005-08-21 09:03:23 +02:00
function header () {
echo '<div class="wrap">' ;
echo '<h2>' . __ ( 'Import RSS' ) . '</h2>' ;
}
function footer () {
echo '</div>' ;
}
2005-09-11 00:45:32 +02:00
function unhtmlentities ( $string ) { // From php.net for < 4.3 compat
$trans_tbl = get_html_translation_table ( HTML_ENTITIES );
$trans_tbl = array_flip ( $trans_tbl );
return strtr ( $string , $trans_tbl );
}
2006-02-12 08:53:23 +01:00
2005-08-21 09:03:23 +02:00
function greet () {
2006-10-06 03:14:47 +02:00
echo '<div class="narrow">' ;
2006-12-05 08:15:12 +01:00
echo '<p>' . __ ( 'Howdy! This importer allows you to extract posts from an RSS 2.0 file into your blog. This is useful if you want to import your posts from a system that is not handled by a custom import tool. Pick an RSS file to upload and click Import.' ) . '</p>' ;
2005-11-16 00:39:32 +01:00
wp_import_upload_form ( " admin.php?import=rss&step=1 " );
2006-10-06 03:14:47 +02:00
echo '</div>' ;
2005-08-21 09:03:23 +02:00
}
function get_posts () {
2005-09-11 00:45:32 +02:00
global $wpdb ;
2006-02-12 08:53:23 +01:00
2005-08-21 09:03:23 +02:00
set_magic_quotes_runtime ( 0 );
2005-11-16 00:39:32 +01:00
$datalines = file ( $this -> file ); // Read the file into an array
2005-08-21 09:03:23 +02:00
$importdata = implode ( '' , $datalines ); // squish it
$importdata = str_replace ( array ( " \r \n " , " \r " ), " \n " , $importdata );
2005-09-11 00:45:32 +02:00
preg_match_all ( '|<item>(.*?)</item>|is' , $importdata , $this -> posts );
$this -> posts = $this -> posts [ 1 ];
$index = 0 ;
foreach ( $this -> posts as $post ) {
preg_match ( '|<title>(.*?)</title>|is' , $post , $post_title );
2006-08-31 19:36:35 +02:00
$post_title = str_replace ( array ( '<![CDATA[' , ']]>' ), '' , $wpdb -> escape ( trim ( $post_title [ 1 ]) ));
2005-09-11 00:45:32 +02:00
2006-08-31 19:34:56 +02:00
preg_match ( '|<pubdate>(.*?)</pubdate>|is' , $post , $post_date_gmt );
2005-09-11 00:45:32 +02:00
2006-08-31 19:34:56 +02:00
if ( $post_date_gmt ) {
$post_date_gmt = strtotime ( $post_date_gmt [ 1 ]);
2005-09-11 00:45:32 +02:00
} else {
// if we don't already have something from pubDate
2006-08-31 19:34:56 +02:00
preg_match ( '|<dc:date>(.*?)</dc:date>|is' , $post , $post_date_gmt );
$post_date_gmt = preg_replace ( '|([-+])([0-9]+):([0-9]+)$|' , '\1\2\3' , $post_date_gmt [ 1 ]);
$post_date_gmt = str_replace ( 'T' , ' ' , $post_date_gmt );
$post_date_gmt = strtotime ( $post_date_gmt );
2005-09-11 00:45:32 +02:00
}
2006-08-31 19:34:56 +02:00
$post_date_gmt = gmdate ( 'Y-m-d H:i:s' , $post_date_gmt );
$post_date = get_date_from_gmt ( $post_date_gmt );
2005-09-11 00:45:32 +02:00
preg_match_all ( '|<category>(.*?)</category>|is' , $post , $categories );
$categories = $categories [ 1 ];
if ( ! $categories ) {
preg_match_all ( '|<dc:subject>(.*?)</dc:subject>|is' , $post , $categories );
$categories = $categories [ 1 ];
}
$cat_index = 0 ;
foreach ( $categories as $category ) {
$categories [ $cat_index ] = $wpdb -> escape ( $this -> unhtmlentities ( $category ));
$cat_index ++ ;
}
preg_match ( '|<guid.+?>(.*?)</guid>|is' , $post , $guid );
if ( $guid )
$guid = $wpdb -> escape ( trim ( $guid [ 1 ]));
else
$guid = '' ;
preg_match ( '|<content:encoded>(.*?)</content:encoded>|is' , $post , $post_content );
$post_content = str_replace ( array ( '<![CDATA[' , ']]>' ), '' , $wpdb -> escape ( trim ( $post_content [ 1 ])));
if ( ! $post_content ) {
// This is for feeds that put content in description
preg_match ( '|<description>(.*?)</description>|is' , $post , $post_content );
$post_content = $wpdb -> escape ( $this -> unhtmlentities ( trim ( $post_content [ 1 ])));
}
// Clean up content
$post_content = preg_replace ( '|<(/?[A-Z]+)|e' , " '<' . strtolower(' $ 1') " , $post_content );
$post_content = str_replace ( '<br>' , '<br />' , $post_content );
$post_content = str_replace ( '<hr>' , '<hr />' , $post_content );
$post_author = 1 ;
$post_status = 'publish' ;
2006-08-31 19:34:56 +02:00
$this -> posts [ $index ] = compact ( 'post_author' , 'post_date' , 'post_date_gmt' , 'post_content' , 'post_title' , 'post_status' , 'guid' , 'categories' );
2005-09-11 00:45:32 +02:00
$index ++ ;
}
2005-08-21 09:03:23 +02:00
}
function import_posts () {
echo '<ol>' ;
2005-09-11 00:45:32 +02:00
foreach ( $this -> posts as $post ) {
echo " <li> " . __ ( 'Importing post...' );
2005-08-21 09:03:23 +02:00
2005-09-11 00:45:32 +02:00
extract ( $post );
2005-08-21 09:03:23 +02:00
2005-09-11 00:45:32 +02:00
if ( $post_id = post_exists ( $post_title , $post_content , $post_date )) {
2005-12-02 23:37:02 +01:00
_e ( 'Post already imported' );
2005-09-11 00:45:32 +02:00
} else {
$post_id = wp_insert_post ( $post );
2007-09-18 18:32:22 +02:00
if ( is_wp_error ( $post_id ) )
return $post_id ;
2005-11-16 00:39:32 +01:00
if ( ! $post_id ) {
2005-12-02 23:37:02 +01:00
_e ( " Couldn't get post ID " );
2005-11-16 00:39:32 +01:00
return ;
}
2005-09-11 00:45:32 +02:00
if ( 0 != count ( $categories ))
wp_create_categories ( $categories , $post_id );
2005-12-02 23:37:02 +01:00
_e ( 'Done !' );
2005-09-11 00:45:32 +02:00
}
echo '</li>' ;
2005-08-21 09:03:23 +02:00
}
echo '</ol>' ;
}
2005-09-11 00:45:32 +02:00
2005-08-21 09:03:23 +02:00
function import () {
2005-11-16 00:39:32 +01:00
$file = wp_import_handle_upload ();
if ( isset ( $file [ 'error' ]) ) {
echo $file [ 'error' ];
return ;
}
2005-09-11 00:45:32 +02:00
2005-11-16 00:39:32 +01:00
$this -> file = $file [ 'file' ];
2005-08-21 09:03:23 +02:00
$this -> get_posts ();
2007-09-18 18:32:22 +02:00
$result = $this -> import_posts ();
if ( is_wp_error ( $result ) )
return $result ;
2005-11-16 03:07:56 +01:00
wp_import_cleanup ( $file [ 'id' ]);
2007-12-23 02:10:29 +01:00
do_action ( 'import_done' , 'rss' );
2006-02-12 08:53:23 +01:00
2005-12-02 23:37:02 +01:00
echo '<h3>' ;
printf ( __ ( 'All done. <a href="%s">Have fun!</a>' ), get_option ( 'home' ));
echo '</h3>' ;
2005-08-21 09:03:23 +02:00
}
2005-09-11 00:45:32 +02:00
2005-08-21 09:03:23 +02:00
function dispatch () {
2005-09-11 00:45:32 +02:00
if ( empty ( $_GET [ 'step' ]))
2005-08-21 09:03:23 +02:00
$step = 0 ;
else
$step = ( int ) $_GET [ 'step' ];
2005-09-11 00:45:32 +02:00
2005-09-11 02:00:18 +02:00
$this -> header ();
2006-02-12 08:53:23 +01:00
2005-08-21 09:03:23 +02:00
switch ( $step ) {
2005-09-11 00:45:32 +02:00
case 0 :
2005-08-21 09:03:23 +02:00
$this -> greet ();
break ;
2005-09-11 00:45:32 +02:00
case 1 :
2007-05-07 17:56:53 +02:00
check_admin_referer ( 'import-upload' );
2007-09-18 18:32:22 +02:00
$result = $this -> import ();
if ( is_wp_error ( $result ) )
echo $result -> get_error_message ();
2005-08-21 09:03:23 +02:00
break ;
}
2006-02-12 08:53:23 +01:00
2005-09-11 02:00:18 +02:00
$this -> footer ();
2005-08-21 09:03:23 +02:00
}
2005-09-11 00:45:32 +02:00
2005-08-21 09:03:23 +02:00
function RSS_Import () {
2006-02-12 08:53:23 +01:00
// Nothing.
2005-08-21 09:03:23 +02:00
}
}
$rss_import = new RSS_Import ();
2006-09-05 20:52:24 +02:00
register_importer ( 'rss' , __ ( 'RSS' ), __ ( 'Import posts from an RSS feed' ), array ( $rss_import , 'dispatch' ));
2005-12-02 23:37:02 +01:00
?>