git-svn-id: https://192.168.0.254/svn/Proyectos.EstudioJuridicoAlmagro_Web/trunk@3 c22fe52d-42d7-ba4f-95f7-33effcf65713
288 lines
10 KiB
PHP
288 lines
10 KiB
PHP
<?php
|
|
/**
|
|
* WordPress eXtended RSS file parser implementations
|
|
*
|
|
* @package WordPress
|
|
* @subpackage Importer
|
|
*/
|
|
|
|
function wpv_get_export_data($file) {
|
|
$replaced_contents = file_get_contents($file);
|
|
return str_replace('{WPV:SAMPLES_URI}', WPV_THEME_URI . 'samples/', $replaced_contents);
|
|
}
|
|
|
|
/**
|
|
* WordPress Importer class for managing parsing of WXR files.
|
|
*/
|
|
class WPV_WXR_Parser {
|
|
function parse( $file ) {
|
|
// use regular expressions if nothing else available or this is bad XML
|
|
$parser = new WPV_WXR_Parser_Regex;
|
|
return $parser->parse( $file );
|
|
}
|
|
}
|
|
|
|
/**
|
|
* WXR Parser that uses regular expressions. Fallback for installs without an XML parser.
|
|
*/
|
|
class WPV_WXR_Parser_Regex {
|
|
var $authors = array();
|
|
var $posts = array();
|
|
var $categories = array();
|
|
var $tags = array();
|
|
var $terms = array();
|
|
var $base_url = '';
|
|
|
|
function WXR_Parser_Regex() {
|
|
$this->__construct();
|
|
}
|
|
|
|
function __construct() {
|
|
$this->has_gzip = is_callable( 'gzopen' );
|
|
}
|
|
|
|
function parse( $file ) {
|
|
$wxr_version = $in_post = $frontpage = false;
|
|
|
|
$fp = $this->fopen( $file, 'r' );
|
|
if ( $fp ) {
|
|
while ( ! $this->feof( $fp ) ) {
|
|
$importline = rtrim( $this->fgets( $fp ) );
|
|
|
|
$importline = str_replace('{WPV:SAMPLES_URI}', WPV_THEME_URI . 'samples/', $importline);
|
|
|
|
if ( ! $wxr_version && preg_match( '|<wp:wxr_version>(\d+\.\d+)</wp:wxr_version>|', $importline, $version ) )
|
|
$wxr_version = $version[1];
|
|
|
|
if ( ! $frontpage) {
|
|
preg_match( "|<wpv:frontpage.*?>(\d*?)</wpv:frontpage>|is", $importline, $frontpage );
|
|
|
|
if ( isset( $frontpage[1] ) ) {
|
|
$frontpage = $frontpage[1];
|
|
}
|
|
}
|
|
|
|
if ( false !== strpos( $importline, '<wp:base_site_url>' ) ) {
|
|
preg_match( '|<wp:base_site_url>(.*?)</wp:base_site_url>|is', $importline, $url );
|
|
$this->base_url = $url[1];
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '<wp:category>' ) ) {
|
|
preg_match( '|<wp:category>(.*?)</wp:category>|is', $importline, $category );
|
|
$this->categories[] = $this->process_category( $category[1] );
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '<wp:tag>' ) ) {
|
|
preg_match( '|<wp:tag>(.*?)</wp:tag>|is', $importline, $tag );
|
|
$this->tags[] = $this->process_tag( $tag[1] );
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '<wp:term>' ) ) {
|
|
preg_match( '|<wp:term>(.*?)</wp:term>|is', $importline, $term );
|
|
$this->terms[] = $this->process_term( $term[1] );
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '<wp:author>' ) ) {
|
|
preg_match( '|<wp:author>(.*?)</wp:author>|is', $importline, $author );
|
|
$a = $this->process_author( $author[1] );
|
|
$this->authors[$a['author_login']] = $a;
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '<item>' ) ) {
|
|
$post = '';
|
|
$in_post = true;
|
|
continue;
|
|
}
|
|
if ( false !== strpos( $importline, '</item>' ) ) {
|
|
$in_post = false;
|
|
$this->posts[] = $this->process_post( $post );
|
|
continue;
|
|
}
|
|
if ( $in_post ) {
|
|
$post .= $importline . "\n";
|
|
}
|
|
}
|
|
|
|
$this->fclose($fp);
|
|
}
|
|
|
|
if ( ! $wxr_version )
|
|
return new WP_Error( 'WXR_parse_error', __( 'This does not appear to be a WXR file, missing/invalid WXR version number', 'wordpress-importer' ) );
|
|
|
|
return array(
|
|
'authors' => $this->authors,
|
|
'posts' => $this->posts,
|
|
'categories' => $this->categories,
|
|
'tags' => $this->tags,
|
|
'terms' => $this->terms,
|
|
'base_url' => $this->base_url,
|
|
'version' => $wxr_version,
|
|
'frontpage' => $frontpage,
|
|
);
|
|
}
|
|
|
|
function get_tag( $string, $tag ) {
|
|
global $wpdb;
|
|
preg_match( "|<$tag.*?>(.*?)</$tag>|is", $string, $return );
|
|
if ( isset( $return[1] ) ) {
|
|
$return = preg_replace( '|^<!\[CDATA\[(.*)\]\]>$|s', '$1', $return[1] );
|
|
$return = $wpdb->escape( trim( $return ) );
|
|
} else {
|
|
$return = '';
|
|
}
|
|
return $return;
|
|
}
|
|
|
|
function process_category( $c ) {
|
|
return array(
|
|
'term_id' => $this->get_tag( $c, 'wp:term_id' ),
|
|
'cat_name' => $this->get_tag( $c, 'wp:cat_name' ),
|
|
'category_nicename' => $this->get_tag( $c, 'wp:category_nicename' ),
|
|
'category_parent' => $this->get_tag( $c, 'wp:category_parent' ),
|
|
'category_description' => $this->get_tag( $c, 'wp:category_description' ),
|
|
);
|
|
}
|
|
|
|
function process_tag( $t ) {
|
|
return array(
|
|
'term_id' => $this->get_tag( $t, 'wp:term_id' ),
|
|
'tag_name' => $this->get_tag( $t, 'wp:tag_name' ),
|
|
'tag_slug' => $this->get_tag( $t, 'wp:tag_slug' ),
|
|
'tag_description' => $this->get_tag( $t, 'wp:tag_description' ),
|
|
);
|
|
}
|
|
|
|
function process_term( $t ) {
|
|
return array(
|
|
'term_id' => $this->get_tag( $t, 'wp:term_id' ),
|
|
'term_taxonomy' => $this->get_tag( $t, 'wp:term_taxonomy' ),
|
|
'slug' => $this->get_tag( $t, 'wp:term_slug' ),
|
|
'term_parent' => $this->get_tag( $t, 'wp:term_parent' ),
|
|
'term_name' => $this->get_tag( $t, 'wp:term_name' ),
|
|
'term_description' => $this->get_tag( $t, 'wp:term_description' ),
|
|
);
|
|
}
|
|
|
|
function process_author( $a ) {
|
|
return array(
|
|
'author_id' => $this->get_tag( $a, 'wp:author_id' ),
|
|
'author_login' => $this->get_tag( $a, 'wp:author_login' ),
|
|
'author_email' => $this->get_tag( $a, 'wp:author_email' ),
|
|
'author_display_name' => $this->get_tag( $a, 'wp:author_display_name' ),
|
|
'author_first_name' => $this->get_tag( $a, 'wp:author_first_name' ),
|
|
'author_last_name' => $this->get_tag( $a, 'wp:author_last_name' ),
|
|
);
|
|
}
|
|
|
|
function process_post( $post ) {
|
|
$post_id = $this->get_tag( $post, 'wp:post_id' );
|
|
$post_title = $this->get_tag( $post, 'title' );
|
|
$post_date = $this->get_tag( $post, 'wp:post_date' );
|
|
$post_date_gmt = $this->get_tag( $post, 'wp:post_date_gmt' );
|
|
$comment_status = $this->get_tag( $post, 'wp:comment_status' );
|
|
$ping_status = $this->get_tag( $post, 'wp:ping_status' );
|
|
$status = $this->get_tag( $post, 'wp:status' );
|
|
$post_name = $this->get_tag( $post, 'wp:post_name' );
|
|
$post_parent = $this->get_tag( $post, 'wp:post_parent' );
|
|
$menu_order = $this->get_tag( $post, 'wp:menu_order' );
|
|
$post_type = $this->get_tag( $post, 'wp:post_type' );
|
|
$post_password = $this->get_tag( $post, 'wp:post_password' );
|
|
$is_sticky = $this->get_tag( $post, 'wp:is_sticky' );
|
|
$guid = $this->get_tag( $post, 'guid' );
|
|
$post_author = $this->get_tag( $post, 'dc:creator' );
|
|
|
|
$post_excerpt = $this->get_tag( $post, 'excerpt:encoded' );
|
|
$post_excerpt = preg_replace_callback( '|<(/?[A-Z]+)|', array( &$this, '_normalize_tag' ), $post_excerpt );
|
|
$post_excerpt = str_replace( '<br>', '<br />', $post_excerpt );
|
|
$post_excerpt = str_replace( '<hr>', '<hr />', $post_excerpt );
|
|
|
|
$post_content = $this->get_tag( $post, 'content:encoded' );
|
|
$post_content = preg_replace_callback( '|<(/?[A-Z]+)|', array( &$this, '_normalize_tag' ), $post_content );
|
|
$post_content = str_replace( '<br>', '<br />', $post_content );
|
|
$post_content = str_replace( '<hr>', '<hr />', $post_content );
|
|
|
|
$postdata = compact( 'post_id', 'post_author', 'post_date', 'post_date_gmt', 'post_content', 'post_excerpt',
|
|
'post_title', 'status', 'post_name', 'comment_status', 'ping_status', 'guid', 'post_parent',
|
|
'menu_order', 'post_type', 'post_password', 'is_sticky'
|
|
);
|
|
|
|
$attachment_url = $this->get_tag( $post, 'wp:attachment_url' );
|
|
if ( $attachment_url )
|
|
$postdata['attachment_url'] = $attachment_url;
|
|
|
|
preg_match_all( '|<category domain="([^"]+?)" nicename="([^"]+?)">(.+?)</category>|is', $post, $terms, PREG_SET_ORDER );
|
|
foreach ( $terms as $t ) {
|
|
$post_terms[] = array(
|
|
'slug' => $t[2],
|
|
'domain' => $t[1],
|
|
'name' => str_replace( array( '<![CDATA[', ']]>' ), '', $t[3] ),
|
|
);
|
|
}
|
|
if ( ! empty( $post_terms ) ) $postdata['terms'] = $post_terms;
|
|
|
|
preg_match_all( '|<wp:comment>(.+?)</wp:comment>|is', $post, $comments );
|
|
$comments = $comments[1];
|
|
if ( $comments ) {
|
|
foreach ( $comments as $comment ) {
|
|
$post_comments[] = array(
|
|
'comment_id' => $this->get_tag( $comment, 'wp:comment_id' ),
|
|
'comment_author' => $this->get_tag( $comment, 'wp:comment_author' ),
|
|
'comment_author_email' => $this->get_tag( $comment, 'wp:comment_author_email' ),
|
|
'comment_author_IP' => $this->get_tag( $comment, 'wp:comment_author_IP' ),
|
|
'comment_author_url' => $this->get_tag( $comment, 'wp:comment_author_url' ),
|
|
'comment_date' => $this->get_tag( $comment, 'wp:comment_date' ),
|
|
'comment_date_gmt' => $this->get_tag( $comment, 'wp:comment_date_gmt' ),
|
|
'comment_content' => $this->get_tag( $comment, 'wp:comment_content' ),
|
|
'comment_approved' => $this->get_tag( $comment, 'wp:comment_approved' ),
|
|
'comment_type' => $this->get_tag( $comment, 'wp:comment_type' ),
|
|
'comment_parent' => $this->get_tag( $comment, 'wp:comment_parent' ),
|
|
'comment_user_id' => $this->get_tag( $comment, 'wp:comment_user_id' ),
|
|
);
|
|
}
|
|
}
|
|
if ( ! empty( $post_comments ) ) $postdata['comments'] = $post_comments;
|
|
|
|
preg_match_all( '|<wp:postmeta>(.+?)</wp:postmeta>|is', $post, $postmeta );
|
|
$postmeta = $postmeta[1];
|
|
if ( $postmeta ) {
|
|
foreach ( $postmeta as $p ) {
|
|
$post_postmeta[] = array(
|
|
'key' => $this->get_tag( $p, 'wp:meta_key' ),
|
|
'value' => $this->get_tag( $p, 'wp:meta_value' ),
|
|
);
|
|
}
|
|
}
|
|
if ( ! empty( $post_postmeta ) ) $postdata['postmeta'] = $post_postmeta;
|
|
|
|
return $postdata;
|
|
}
|
|
|
|
function _normalize_tag( $matches ) {
|
|
return '<' . strtolower( $matches[1] );
|
|
}
|
|
|
|
function fopen( $filename, $mode = 'r' ) {
|
|
if ( $this->has_gzip )
|
|
return gzopen( $filename, $mode );
|
|
return fopen( $filename, $mode );
|
|
}
|
|
|
|
function feof( $fp ) {
|
|
if ( $this->has_gzip )
|
|
return gzeof( $fp );
|
|
return feof( $fp );
|
|
}
|
|
|
|
function fgets( $fp, $len = 8192 ) {
|
|
if ( $this->has_gzip )
|
|
return gzgets( $fp, $len );
|
|
return fgets( $fp, $len );
|
|
}
|
|
|
|
function fclose( $fp ) {
|
|
if ( $this->has_gzip )
|
|
return gzclose( $fp );
|
|
return fclose( $fp );
|
|
}
|
|
}
|