2005-08-21 03:03:23 -04:00
< ? php
class MT_Import {
2005-09-14 01:17:20 -04:00
var $posts = array ();
2005-11-15 21:07:56 -05:00
var $file ;
var $id ;
2005-09-14 01:17:20 -04:00
var $mtnames = array ();
var $newauthornames = array ();
var $j = - 1 ;
2005-08-21 03:03:23 -04:00
function header () {
echo '<div class="wrap">' ;
2005-09-14 01:17:20 -04:00
echo '<h2>' . __ ( 'Import Movable Type' ) . '</h2>' ;
2005-08-21 03:03:23 -04:00
}
function footer () {
2005-09-14 01:17:20 -04:00
echo '</div>' ;
2005-08-21 03:03:23 -04:00
}
2005-09-14 01:17:20 -04:00
2005-08-21 03:03:23 -04:00
function greet () {
$this -> header ();
?>
2005-12-02 17:37:02 -05:00
< p >< ? php _e ( 'Howdy! We’re about to begin the process to import all of your Movable Type entries into WordPress. To begin, select a file to upload and click Import.' ); ?> </p>
2005-11-15 21:07:56 -05:00
< ? php wp_import_upload_form ( add_query_arg ( 'step' , 1 ) ); ?>
2005-12-02 17:37:02 -05:00
< p >< ? php _e ( 'The importer is smart enough not to import duplicates, so you can run this multiple times without worry if—for whatever reason—it doesn\'t finish. If you get an <strong>out of memory</strong> error try splitting up the import file into pieces.' ); ?> </p>
2005-08-21 03:03:23 -04:00
< ? php
$this -> footer ();
2005-09-14 01:17:20 -04:00
}
function users_form ( $n ) {
global $wpdb , $testing ;
$users = $wpdb -> get_results ( " SELECT * FROM $wpdb->users ORDER BY ID " );
?> <select name="userselect[<?php echo $n; ?>]">
< option value = " #NONE# " >- Select -</ option >
< ? php
foreach ( $users as $user ) {
echo '<option value="' . $user -> user_login . '">' . $user -> user_login . '</option>' ;
}
?>
</ select >
< ? php
}
//function to check the authorname and do the mapping
function checkauthor ( $author ) {
global $wpdb ;
//mtnames is an array with the names in the mt import file
2005-09-24 14:07:46 -04:00
$pass = 'changeme' ;
2005-09-14 01:17:20 -04:00
if ( ! ( in_array ( $author , $this -> mtnames ))) { //a new mt author name is found
++ $this -> j ;
$this -> mtnames [ $this -> j ] = $author ; //add that new mt author name to an array
2005-09-24 14:07:46 -04:00
$user_id = username_exists ( $this -> newauthornames [ $j ]); //check if the new author name defined by the user is a pre-existing wp user
2005-09-14 01:17:20 -04:00
if ( ! $user_id ) { //banging my head against the desk now.
if ( $newauthornames [ $this -> j ] == 'left_blank' ) { //check if the user does not want to change the authorname
2005-09-24 14:07:46 -04:00
$user_id = wp_create_user ( $author , $pass );
2005-09-14 01:17:20 -04:00
$this -> newauthornames [ $this -> j ] = $author ; //now we have a name, in the place of left_blank.
} else {
2005-09-24 14:07:46 -04:00
$user_id = wp_create_user ( $this -> newauthornames [ $this -> j ], $pass );
2005-09-14 01:17:20 -04:00
}
} else {
return $user_id ; // return pre-existing wp username if it exists
}
} else {
$key = array_search ( $author , $this -> mtnames ); //find the array key for $author in the $mtnames array
2005-09-24 14:07:46 -04:00
$user_id = username_exists ( $this -> newauthornames [ $key ]); //use that key to get the value of the author's name from $newauthornames
2005-09-14 01:17:20 -04:00
}
return $user_id ;
}
2005-08-21 03:03:23 -04:00
function get_entries () {
set_magic_quotes_runtime ( 0 );
2005-11-15 21:07:56 -05:00
$importdata = file ( $this -> file ); // Read the file into an array
2005-08-21 03:03:23 -04:00
$importdata = implode ( '' , $importdata ); // squish it
$importdata = preg_replace ( " /( \r \n | \n | \r )/ " , " \n " , $importdata );
$importdata = preg_replace ( " / \n -------- \n / " , " --MT-ENTRY-- \n " , $importdata );
$this -> posts = explode ( " --MT-ENTRY-- " , $importdata );
}
2005-09-14 01:17:20 -04:00
function get_mt_authors () {
$temp = array ();
$i = - 1 ;
foreach ( $this -> posts as $post ) {
if ( '' != trim ( $post )) {
++ $i ;
preg_match ( " |AUTHOR:(.*)| " , $post , $thematch );
$thematch = trim ( $thematch [ 1 ]);
array_push ( $temp , " $thematch " ); //store the extracted author names in a temporary array
}
}
//we need to find unique values of author names, while preserving the order, so this function emulates the unique_value(); php function, without the sorting.
$authors [ 0 ] = array_shift ( $temp );
$y = count ( $temp ) + 1 ;
for ( $x = 1 ; $x < $y ; $x ++ ) {
$next = array_shift ( $temp );
if ( ! ( in_array ( $next , $authors )))
array_push ( $authors , " $next " );
}
return $authors ;
}
function get_authors_from_post () {
$formnames = array ();
$selectnames = array ();
foreach ( $_POST [ 'user' ] as $key => $line ) {
$newname = trim ( stripslashes ( $line ));
if ( $newname == '' )
$newname = 'left_blank' ; //passing author names from step 1 to step 2 is accomplished by using POST. left_blank denotes an empty entry in the form.
array_push ( $formnames , " $newname " );
} // $formnames is the array with the form entered names
foreach ( $_POST [ 'userselect' ] as $user => $key ) {
$selected = trim ( stripslashes ( $key ));
array_push ( $selectnames , " $selected " );
}
$count = count ( $formnames );
for ( $i = 0 ; $i < $count ; $i ++ ) {
if ( $selectnames [ $i ] != '#NONE#' ) { //if no name was selected from the select menu, use the name entered in the form
array_push ( $this -> newauthornames , " $selectnames[$i] " );
} else {
array_push ( $this -> newauthornames , " $formnames[$i] " );
}
}
}
function mt_authors_form () {
?>
< p >< ? php _e ( 'To make it easier for you to edit and save the imported posts and drafts, you may want to change the name of the author of the posts. For example, you may want to import all the entries as <code>admin</code>s entries.' ); ?> </p>
< p >< ? php _e ( 'Below, you can see the names of the authors of the MovableType posts in <i>italics</i>. For each of these names, you can either pick an author in your WordPress installation from the menu, or enter a name for the author in the textbox.' ); ?> </p>
< p >< ? php _e ( 'If a new user is created by WordPress, the password will be set, by default, to "changeme". Quite suggestive, eh? ;)' ); ?> </p>
< ? php
$authors = $this -> get_mt_authors ();
echo '<ol id="authors">' ;
2005-11-15 21:07:56 -05:00
echo '<form action="?import=mt&step=2&id=' . $this -> id . '" method="post">' ;
2005-09-14 01:17:20 -04:00
$j = - 1 ;
foreach ( $authors as $author ) {
++ $j ;
echo '<li><i>' . $author . '</i><br />' . '<input type="text" value="' . $author . '" name="' . 'user[]' . '" maxlength="30">' ;
$this -> users_form ( $j );
echo '</li>' ;
}
echo '<input type="submit" value="Submit">' . '<br/>' ;
echo '</form>' ;
echo '</ol>' ;
flush ();
}
function select_authors () {
2005-11-15 21:07:56 -05:00
$file = wp_import_handle_upload ();
if ( isset ( $file [ 'error' ]) ) {
echo $file [ 'error' ];
return ;
}
$this -> file = $file [ 'file' ];
$this -> id = $file [ 'id' ];
2005-09-14 01:17:20 -04:00
$this -> get_entries ();
$this -> mt_authors_form ();
}
function process_posts () {
$i = - 1 ;
echo " <ol> " ;
foreach ( $posts as $post ) {
if ( '' != trim ( $post )) {
++ $i ;
unset ( $post_categories );
2005-12-02 17:37:02 -05:00
echo '<li>' . __ ( 'Processing post...' );
2005-09-14 01:17:20 -04:00
// Take the pings out first
preg_match ( " |(----- \n \n PING:.*)|s " , $post , $pings );
$post = preg_replace ( " |(----- \n \n PING:.*)|s " , '' , $post );
// Then take the comments out
preg_match ( " |(----- \n COMMENT:.*)|s " , $post , $comments );
$post = preg_replace ( " |(----- \n COMMENT:.*)|s " , '' , $post );
// We ignore the keywords
$post = preg_replace ( " |(----- \n KEYWORDS:.*)|s " , '' , $post );
// We want the excerpt
preg_match ( " |----- \n EXCERPT:(.*)|s " , $post , $excerpt );
$excerpt = $wpdb -> escape ( trim ( $excerpt [ 1 ]));
$post = preg_replace ( " |(----- \n EXCERPT:.*)|s " , '' , $post );
// We're going to put extended body into main body with a more tag
preg_match ( " |----- \n EXTENDED BODY:(.*)|s " , $post , $extended );
$extended = trim ( $extended [ 1 ]);
if ( '' != $extended )
$extended = " \n <!--more--> \n $extended " ;
$post = preg_replace ( " |(----- \n EXTENDED BODY:.*)|s " , '' , $post );
// Now for the main body
preg_match ( " |----- \n BODY:(.*)|s " , $post , $body );
$body = trim ( $body [ 1 ]);
$post_content = $wpdb -> escape ( $body . $extended );
$post = preg_replace ( " |(----- \n BODY:.*)|s " , '' , $post );
// Grab the metadata from what's left
$metadata = explode ( " \n " , $post );
foreach ( $metadata as $line ) {
preg_match ( " /^(.*?):(.*)/ " , $line , $token );
$key = trim ( $token [ 1 ]);
$value = trim ( $token [ 2 ]);
// Now we decide what it is and what to do with it
switch ( $key ) {
case '' :
break ;
case 'AUTHOR' :
$post_author = $value ;
break ;
case 'TITLE' :
$post_title = $wpdb -> escape ( $value );
echo '<i>' . stripslashes ( $post_title ) . '</i>... ' ;
break ;
case 'STATUS' :
// "publish" and "draft" enumeration items match up; no change required
$post_status = $value ;
if ( empty ( $post_status ))
$post_status = 'publish' ;
break ;
case 'ALLOW COMMENTS' :
$post_allow_comments = $value ;
if ( $post_allow_comments == 1 ) {
$comment_status = 'open' ;
} else {
$comment_status = 'closed' ;
}
break ;
case 'CONVERT BREAKS' :
$post_convert_breaks = $value ;
break ;
case 'ALLOW PINGS' :
$post_allow_pings = trim ( $meta [ 2 ][ 0 ]);
if ( $post_allow_pings == 1 ) {
$post_allow_pings = 'open' ;
} else {
$post_allow_pings = 'closed' ;
}
break ;
case 'PRIMARY CATEGORY' :
$post_categories [] = $wpdb -> escape ( $value );
break ;
case 'CATEGORY' :
$post_categories [] = $wpdb -> escape ( $value );
break ;
case 'DATE' :
$post_modified = strtotime ( $value );
$post_modified = date ( 'Y-m-d H:i:s' , $post_modified );
$post_modified_gmt = get_gmt_from_date ( " $post_modified " );
break ;
default :
// echo "\n$key: $value";
break ;
} // end switch
} // End foreach
// Let's check to see if it's in already
2005-09-24 14:07:46 -04:00
if ( $post_id = posts_exists ( $post_title , '' , $post_date )) {
2005-12-02 17:37:02 -05:00
_e ( 'Post already imported.' );
2005-09-14 01:17:20 -04:00
} else {
$post_author = checkauthor ( $post_author ); //just so that if a post already exists, new users are not created by checkauthor
$postdata = compact ( 'post_author' , 'post_date' , 'post_date_gmt' , 'post_content' , 'post_title' , 'post_excerpt' , 'post_status' , 'comment_status' , 'ping_status' , 'post_modified' , 'post_modified_gmt' );
$post_id = wp_insert_post ( $postdata );
// Add categories.
if ( 0 != count ( $post_categories )) {
wp_create_categories ( $post_categories );
}
2005-12-02 17:37:02 -05:00
_e ( ' Post imported successfully...' );
2005-09-14 01:17:20 -04:00
}
2005-09-24 14:07:46 -04:00
$comment_post_ID = $post_id ;
2005-09-14 01:17:20 -04:00
// Now for comments
$comments = explode ( " ----- \n COMMENT: " , $comments [ 0 ]);
foreach ( $comments as $comment ) {
if ( '' != trim ( $comment )) {
// Author
preg_match ( " |AUTHOR:(.*)| " , $comment , $comment_author );
$comment_author = $wpdb -> escape ( trim ( $comment_author [ 1 ]));
$comment = preg_replace ( '|(\n?AUTHOR:.*)|' , '' , $comment );
2005-09-24 14:07:46 -04:00
preg_match ( " |EMAIL:(.*)| " , $comment , $comment_author_email );
$comment_author_email = $wpdb -> escape ( trim ( $comment_author_email [ 1 ]));
2005-09-14 01:17:20 -04:00
$comment = preg_replace ( '|(\n?EMAIL:.*)|' , '' , $comment );
2005-09-24 14:07:46 -04:00
preg_match ( " |IP:(.*)| " , $comment , $comment_author_IP );
$comment_author_IP = trim ( $comment_author_IP [ 1 ]);
2005-09-14 01:17:20 -04:00
$comment = preg_replace ( '|(\n?IP:.*)|' , '' , $comment );
2005-09-24 14:07:46 -04:00
preg_match ( " |URL:(.*)| " , $comment , $comment_author_url );
$comment_author_url = $wpdb -> escape ( trim ( $comment_author_url [ 1 ]));
2005-09-14 01:17:20 -04:00
$comment = preg_replace ( '|(\n?URL:.*)|' , '' , $comment );
preg_match ( " |DATE:(.*)| " , $comment , $comment_date );
$comment_date = trim ( $comment_date [ 1 ]);
$comment_date = date ( 'Y-m-d H:i:s' , strtotime ( $comment_date ));
$comment = preg_replace ( '|(\n?DATE:.*)|' , '' , $comment );
$comment_content = $wpdb -> escape ( trim ( $comment ));
$comment_content = str_replace ( '-----' , '' , $comment_content );
// Check if it's already there
2005-09-24 14:07:46 -04:00
if ( ! comment_exists ( $comment_author , $comment_date )) {
$commentdata = compact ( 'comment_post_ID' , 'comment_author' , 'comment_author_url' , 'comment_author_email' , 'comment_author_IP' , 'comment_date' , 'comment_content' );
$commentdata = wp_filter_comment ( $commentdata );
wp_insert_comment ( $commentdata );
2005-09-14 01:17:20 -04:00
echo " Comment added. " ;
}
}
}
// Finally the pings
// fix the double newline on the first one
$pings [ 0 ] = str_replace ( " ----- \n \n " , " ----- \n " , $pings [ 0 ]);
$pings = explode ( " ----- \n PING: " , $pings [ 0 ]);
foreach ( $pings as $ping ) {
if ( '' != trim ( $ping )) {
// 'Author'
preg_match ( " |BLOG NAME:(.*)| " , $ping , $comment_author );
$comment_author = $wpdb -> escape ( trim ( $comment_author [ 1 ]));
$ping = preg_replace ( '|(\n?BLOG NAME:.*)|' , '' , $ping );
2005-09-24 14:07:46 -04:00
preg_match ( " |IP:(.*)| " , $ping , $comment_author_IP );
$comment_author_IP = trim ( $comment_author_IP [ 1 ]);
2005-09-14 01:17:20 -04:00
$ping = preg_replace ( '|(\n?IP:.*)|' , '' , $ping );
2005-09-24 14:07:46 -04:00
preg_match ( " |URL:(.*)| " , $ping , $comment_author_url );
$comment_author_url = $wpdb -> escape ( trim ( $comment_author_url [ 1 ]));
2005-09-14 01:17:20 -04:00
$ping = preg_replace ( '|(\n?URL:.*)|' , '' , $ping );
preg_match ( " |DATE:(.*)| " , $ping , $comment_date );
$comment_date = trim ( $comment_date [ 1 ]);
$comment_date = date ( 'Y-m-d H:i:s' , strtotime ( $comment_date ));
$ping = preg_replace ( '|(\n?DATE:.*)|' , '' , $ping );
preg_match ( " |TITLE:(.*)| " , $ping , $ping_title );
$ping_title = $wpdb -> escape ( trim ( $ping_title [ 1 ]));
$ping = preg_replace ( '|(\n?TITLE:.*)|' , '' , $ping );
$comment_content = $wpdb -> escape ( trim ( $ping ));
$comment_content = str_replace ( '-----' , '' , $comment_content );
$comment_content = " <strong> $ping_title </strong> \n \n $comment_content " ;
2005-09-24 14:07:46 -04:00
$comment_type = 'trackback' ;
2005-09-14 01:17:20 -04:00
// Check if it's already there
2005-09-24 14:07:46 -04:00
if ( ! comment_exists ( $comment_author , $comment_date )) {
$commentdata = compact ( 'comment_post_ID' , 'comment_author' , 'comment_author_url' , 'comment_author_email' , 'comment_author_IP' , 'comment_date' , 'comment_content' , 'comment_type' );
$commentdata = wp_filter_comment ( $commentdata );
wp_insert_comment ( $commentdata );
2005-12-02 17:37:02 -05:00
_e ( 'Comment added.' );
2005-09-14 01:17:20 -04:00
}
}
}
echo " </li> " ;
}
flush ();
}
echo '</ol>' ;
2005-11-23 05:02:23 -05:00
wp_import_cleanup ( $this -> id );
2005-09-14 01:17:20 -04:00
echo '<h3>' . sprintf ( __ ( 'All done. <a href="%s">Have fun!</a>' ), get_option ( 'home' )) . '</h3>' ;
}
2005-08-21 03:03:23 -04:00
function import () {
2005-11-23 05:02:23 -05:00
$this -> id = ( int ) $_GET [ 'id' ];
$this -> file = get_attached_file ( $this -> id );
2005-09-14 01:17:20 -04:00
$this -> get_authors_from_post ();
2005-09-13 20:03:02 -04:00
$this -> get_entries ();
2005-09-14 01:17:20 -04:00
$this -> process_posts ();
2005-08-21 03:03:23 -04:00
}
2005-09-14 01:17:20 -04:00
2005-08-21 03:03:23 -04:00
function dispatch () {
2005-09-14 01:17:20 -04:00
if ( empty ( $_GET [ 'step' ]))
2005-08-21 03:03:23 -04:00
$step = 0 ;
else
$step = ( int ) $_GET [ 'step' ];
2005-09-14 01:17:20 -04:00
2005-08-21 03:03:23 -04:00
switch ( $step ) {
2005-09-14 01:17:20 -04:00
case 0 :
2005-08-21 03:03:23 -04:00
$this -> greet ();
break ;
2005-09-14 01:17:20 -04:00
case 1 :
$this -> select_authors ();
2005-08-21 03:03:23 -04:00
break ;
2005-11-15 21:07:56 -05:00
case 2 :
2005-11-23 05:02:23 -05:00
$this -> import ();
2005-11-15 21:07:56 -05:00
break ;
2005-08-21 03:03:23 -04:00
}
}
2005-09-14 01:17:20 -04:00
2005-08-21 03:03:23 -04:00
function MT_Import () {
// Nothing.
}
}
$mt_import = new MT_Import ();
2005-11-17 20:36:20 -05:00
//register_importer('mt', 'Movable Type', 'Import posts and comments from your Movable Type blog', array ($mt_import, 'dispatch'));
2005-12-02 17:37:02 -05:00
?>