[44] | 1 | <?php
|
---|
| 2 | class SyndicatedPost {
|
---|
// The feed item this post is built from, as returned by the
// 'syndicated_item' filter (NULL if a filter rejected the item).
var $item = null;

// The link object passed to the constructor; it supplies the feed
// settings, the parsed feed and the syndicated_status() defaults.
var $link = null;
// The parsed feed, copied from $link->magpie by the constructor.
var $feed = null;
// The per-feed settings, copied from $link->settings by the constructor.
var $feedmeta = null;

// The post data assembled from the item, keyed by WordPress post field
// name; set to NULL when the item has been filtered out.
var $post = array ();

// Cached result of freshness(): 2 = new, 1 = updated, 0 = unchanged.
var $_freshness = null;
// Cached ID of this post's row in the WordPress posts table.
var $_wp_id = null;
|
---|
| 13 |
|
---|
/**
 * SyndicatedPost::SyndicatedPost() -- translates one feed item into the
 * array of WordPress post data kept in $this->post.
 *
 * The item is first passed through the 'syndicated_item' filter. If a
 * filter returns NULL, $this->post is set to NULL and nothing else is
 * computed (see SyndicatedPost::filtered()).
 *
 * @param array $item The feed item to be syndicated
 * @param object $link The feed that the item came from. The constructor
 *	reads $link->settings and $link->magpie, and calls
 *	$link->syndicated_status() for the default post/comment/ping status.
 */
function SyndicatedPost ($item, $link) {
	$this->link = $link;
	$feedmeta = $link->settings;
	$feed = $link->magpie;

	# This is ugly. I'd like to use apply_filters()'s
	# alleged support for a variable argument count, but this seems
	# to have been broken in WordPress 1.5. It'll be fixed somehow
	# in WP 1.5.1, but I'm aiming at WP 1.5 compatibility across
	# the board here.
	#
	# Cf.: <http://mosquito.wordpress.org/view.php?id=901>
	global $fwp_channel, $fwp_feedmeta;
	$fwp_channel = $feed; $fwp_feedmeta = $feedmeta;

	$this->feed = $feed;
	$this->feedmeta = $feedmeta;

	$this->item = $item;
	$this->item = apply_filters('syndicated_item', $this->item, $this);

	# Filters can halt further processing by returning NULL
	if (is_null($this->item)) :
		$this->post = NULL;
	else :
		# Note that nothing is run through $wpdb->escape() here.
		# That's deliberate. The escaping is done at the point
		# of insertion, not here, to avoid double-escaping and
		# to avoid screwing with syndicated_post filters

		$this->post['post_title'] = apply_filters('syndicated_item_title', $this->item['title'], $this);

		// This just gives us an alphanumeric representation of
		// the author. We will look up (or create) the numeric
		// ID for the author in SyndicatedPost::add()
		$this->post['named']['author'] = apply_filters('syndicated_item_author', $this->author(), $this);

		# Identify content and sanitize it.
		# ---------------------------------
		if (isset($this->item['atom_content'])) :
			$content = $this->item['atom_content'];
		elseif (isset($this->item['xhtml']['body'])) :
			$content = $this->item['xhtml']['body'];
		elseif (isset($this->item['xhtml']['div'])) :
			$content = $this->item['xhtml']['div'];
		elseif (isset($this->item['content']['encoded']) and $this->item['content']['encoded']):
			$content = $this->item['content']['encoded'];
		else:
			// Last resort. An item with no description at all yields
			// NULL content rather than an undefined-index notice.
			$content = (isset($this->item['description']) ? $this->item['description'] : NULL);
		endif;
		$this->post['post_content'] = apply_filters('syndicated_item_content', $content, $this);

		# Identify and sanitize excerpt
		$excerpt = NULL;
		if ( isset($this->item['description']) and $this->item['description'] ) :
			$excerpt = $this->item['description'];
		elseif ( isset($content) and $content ) :
			$excerpt = strip_tags($content);
			if (strlen($excerpt) > 255) :
				$excerpt = substr($excerpt,0,252).'...';
			endif;
		endif;
		$excerpt = apply_filters('syndicated_item_excerpt', $excerpt, $this);

		if (!is_null($excerpt)):
			$this->post['post_excerpt'] = $excerpt;
		endif;

		// This is unnecessary if we use wp_insert_post
		if (!$this->use_api('wp_insert_post')) :
			$this->post['post_name'] = sanitize_title($this->post['post_title']);
		endif;

		$this->post['epoch']['issued'] = apply_filters('syndicated_item_published', $this->published(), $this);
		$this->post['epoch']['created'] = apply_filters('syndicated_item_created', $this->created(), $this);
		$this->post['epoch']['modified'] = apply_filters('syndicated_item_updated', $this->updated(), $this);

		// Convert the blog's GMT offset (in hours) to seconds. Multiply
		// before casting to int: the offset may be fractional (e.g. 5.5),
		// and casting first would silently drop the half hour.
		$offset = (int) round(((float) get_option('gmt_offset')) * 60 * 60);
		$this->post['post_date'] = gmdate('Y-m-d H:i:s', $this->published() + $offset);
		$this->post['post_modified'] = gmdate('Y-m-d H:i:s', $this->updated() + $offset);
		$this->post['post_date_gmt'] = gmdate('Y-m-d H:i:s', $this->published());
		$this->post['post_modified_gmt'] = gmdate('Y-m-d H:i:s', $this->updated());

		// Use feed-level preferences or the global default.
		$this->post['post_status'] = $this->link->syndicated_status('post', 'publish');
		$this->post['comment_status'] = $this->link->syndicated_status('comment', 'closed');
		$this->post['ping_status'] = $this->link->syndicated_status('ping', 'closed');

		// Unique ID (hopefully a unique tag: URI); failing that, the permalink
		$this->post['guid'] = apply_filters('syndicated_item_guid', $this->guid(), $this);

		// User-supplied custom settings to apply to each post. Do first so that FWP-generated custom settings will overwrite if necessary; thus preventing any munging
		$default_custom_settings = get_option('feedwordpress_custom_settings');
		if ($default_custom_settings) :
			$default_custom_settings = unserialize($default_custom_settings);
		endif;
		if (!is_array($default_custom_settings)) :
			$default_custom_settings = array();
		endif;

		$custom_settings = (isset($this->link->settings['postmeta']) ? $this->link->settings['postmeta'] : null);
		if ($custom_settings) :
			$custom_settings = unserialize($custom_settings);
		endif;
		if (!is_array($custom_settings)) :
			$custom_settings = array();
		endif;
		$this->post['meta'] = array_merge($default_custom_settings, $custom_settings);

		// RSS 2.0 / Atom 1.0 enclosure support
		if ( isset($this->item['enclosure#']) ) :
			for ($i = 1; $i <= $this->item['enclosure#']; $i++) :
				// Same key scheme as the category loop below: the first
				// element has no suffix, later ones are suffixed with
				// "#" and their 1-based position.
				$eid = (($i > 1) ? "#{$i}" : "");
				$this->post['meta']['enclosure'][] =
					apply_filters('syndicated_item_enclosure_url', $this->item["enclosure{$eid}@url"], $this)."\n".
					apply_filters('syndicated_item_enclosure_length', $this->item["enclosure{$eid}@length"], $this)."\n".
					apply_filters('syndicated_item_enclosure_type', $this->item["enclosure{$eid}@type"], $this);
			endfor;
		endif;

		// In case you want to point back to the blog this was syndicated from
		if (isset($this->feed->channel['title'])) :
			$this->post['meta']['syndication_source'] = apply_filters('syndicated_item_source_title', $this->feed->channel['title'], $this);
		endif;

		if (isset($this->feed->channel['link'])) :
			$this->post['meta']['syndication_source_uri'] = apply_filters('syndicated_item_source_link', $this->feed->channel['link'], $this);
		endif;

		// Make use of atom:source data, if present in an aggregated feed
		if (isset($this->item['source_title'])) :
			$this->post['meta']['syndication_source_original'] = $this->item['source_title'];
		endif;

		if (isset($this->item['source_link'])) :
			$this->post['meta']['syndication_source_uri_original'] = $this->item['source_link'];
		endif;

		if (isset($this->item['source_id'])) :
			$this->post['meta']['syndication_source_id_original'] = $this->item['source_id'];
		endif;

		// Store information on human-readable and machine-readable comment URIs
		if (isset($this->item['comments'])) :
			$this->post['meta']['rss:comments'] = apply_filters('syndicated_item_comments', $this->item['comments']);
		endif;
		if (isset($this->item['wfw']['commentrss'])) :
			$this->post['meta']['wfw:commentRSS'] = apply_filters('syndicated_item_commentrss', $this->item['wfw']['commentrss']);
		endif;

		// Store information to identify the feed that this came from
		$this->post['meta']['syndication_feed'] = $this->feedmeta['link/uri'];
		$this->post['meta']['syndication_feed_id'] = $this->feedmeta['link/id'];

		if (isset($this->item['source_link_self'])) :
			$this->post['meta']['syndication_feed_original'] = $this->item['source_link_self'];
		endif;

		// In case you want to know the external permalink...
		$this->post['meta']['syndication_permalink'] = apply_filters('syndicated_item_link', $this->item['link']);

		// Store a hash of the post content for checking whether something needs to be updated
		$this->post['meta']['syndication_item_hash'] = $this->update_hash();

		// Feed-by-feed options for author and category creation
		$this->post['named']['unfamiliar']['author'] = (isset($this->feedmeta['unfamiliar author']) ? $this->feedmeta['unfamiliar author'] : null);
		$this->post['named']['unfamiliar']['category'] = (isset($this->feedmeta['unfamiliar category']) ? $this->feedmeta['unfamiliar category'] : null);

		// Categories: start with default categories, if any
		$fc = get_option("feedwordpress_syndication_cats");
		if ($fc) :
			$this->post['named']['preset/category'] = explode("\n", $fc);
		else :
			$this->post['named']['preset/category'] = array();
		endif;

		if (isset($this->feedmeta['cats']) and is_array($this->feedmeta['cats'])) :
			$this->post['named']['preset/category'] = array_merge($this->post['named']['preset/category'], $this->feedmeta['cats']);
		endif;

		// Now add categories from the post, if we have 'em
		$this->post['named']['category'] = array();
		if ( isset($this->item['category#']) ) :
			for ($i = 1; $i <= $this->item['category#']; $i++) :
				$cat_idx = (($i > 1) ? "#{$i}" : "");
				$cat = $this->item["category{$cat_idx}"];

				if ( isset($this->feedmeta['cat_split']) and strlen($this->feedmeta['cat_split']) > 0) :
					// The feed's cat_split setting is used as a regular
					// expression, delimited by BEL characters (\007).
					$pcre = "\007".$this->feedmeta['cat_split']."\007";
					$this->post['named']['category'] = array_merge($this->post['named']['category'], preg_split($pcre, $cat, -1 /*=no limit*/, PREG_SPLIT_NO_EMPTY));
				else :
					$this->post['named']['category'][] = $cat;
				endif;
			endfor;
		endif;
		$this->post['named']['category'] = apply_filters('syndicated_item_categories', $this->post['named']['category'], $this);

		// Tags: start with default tags, if any
		$ft = get_option("feedwordpress_syndication_tags");
		if ($ft) :
			$this->post['tags_input'] = explode(FEEDWORDPRESS_CAT_SEPARATOR, $ft);
		else :
			$this->post['tags_input'] = array();
		endif;

		if (isset($this->feedmeta['tags']) and is_array($this->feedmeta['tags'])) :
			$this->post['tags_input'] = array_merge($this->post['tags_input'], $this->feedmeta['tags']);
		endif;

	endif;
} // SyndicatedPost::SyndicatedPost()
|
---|
| 228 |
|
---|
// SyndicatedPost::filtered: tells whether this item has been dropped,
// i.e. whether the post data in $this->post has been replaced by NULL.
function filtered () {
	return ($this->post === NULL);
}
|
---|
| 232 |
|
---|
/**
 * SyndicatedPost::freshness() -- determines whether this item is new to
 * the WordPress database, an update of a stored post, or unchanged.
 *
 * The stored post is looked up by guid. It counts as updated when the
 * item's update timestamp is later than the stored post_modified_gmt, or
 * when the stored 'syndication_item_hash' differs from the current
 * update hash. The result is cached in $this->_freshness, and the ID of
 * the stored post (if any) is recorded in $this->_wp_id.
 *
 * @return int 2 = new content, 1 = updated content, 0 = unchanged
 */
function freshness () {
	global $wpdb;

	if ($this->filtered()) : // This should never happen.
		FeedWordPress::critical_bug('SyndicatedPost', $this, __LINE__);
	endif;

	if (is_null($this->_freshness)) :
		$guid = $wpdb->escape($this->guid());

		$result = $wpdb->get_row("
		SELECT id, guid, post_modified_gmt
		FROM $wpdb->posts WHERE guid='$guid'
		");

		if (!$result) :
			$this->_freshness = 2; // New content
		else:
			$stored_update_hashes = get_post_custom_values('syndication_item_hash', $result->id);

			// A post without a stored hash does not give us an array
			// here, so make sure of that before counting: count() on a
			// non-array is a warning in PHP 7.2+ and an error in PHP 8.
			if (is_array($stored_update_hashes) and count($stored_update_hashes) > 0) :
				$stored_update_hash = $stored_update_hashes[0];
				$update_hash_changed = ($stored_update_hash != $this->update_hash());
			else :
				$update_hash_changed = false;
			endif;

			// Turn the stored "Y-m-d H:i:s" GMT timestamp into a Unix epoch
			preg_match('/([0-9]+)-([0-9]+)-([0-9]+) ([0-9]+):([0-9]+):([0-9]+)/', $result->post_modified_gmt, $backref);

			$last_rev_ts = gmmktime($backref[4], $backref[5], $backref[6], $backref[2], $backref[3], $backref[1]);
			$updated_ts = $this->updated(/*fallback=*/ true, /*default=*/ NULL);
			$updated = ((
				!is_null($updated_ts)
				and ($updated_ts > $last_rev_ts)
			) or $update_hash_changed);

			// Either way, we now know which stored post this item maps to
			$this->_wp_id = $result->id;
			if ($updated) :
				$this->_freshness = 1; // Updated content
			else :
				$this->_freshness = 0; // Same old, same old
			endif;
		endif;
	endif;
	return $this->_freshness;
}
|
---|
| 279 |
|
---|
// SyndicatedPost::wp_id: returns the ID of this post in the WordPress
// database, as recorded in $this->_wp_id. If neither the ID nor the
// freshness has been determined yet, freshness() is run first, since it
// records the ID of a matching stored post as a side effect.
function wp_id () {
	// This should never happen.
	if ($this->filtered()) {
		FeedWordPress::critical_bug('SyndicatedPost', $this, __LINE__);
	}

	$not_looked_up_yet = (is_null($this->_wp_id) and is_null($this->_freshness));
	if ($not_looked_up_yet) {
		$this->freshness(); // sets WP DB id in the process
	}

	return $this->_wp_id;
}
|
---|
| 290 |
|
---|
// SyndicatedPost::store: writes this item to the WordPress database if
// it is new or updated. Author and category names are resolved to
// numeric IDs first; if either lookup yields NULL, the post is dropped.
// The finished post data is passed through the 'syndicated_post' filter,
// which may also drop it by returning NULL.
//
// Returns 'new' if a post was inserted, 'updated' if a stored post was
// updated, and false if nothing was stored.
function store () {
	// This should never happen.
	if ($this->filtered()) {
		FeedWordPress::critical_bug('SyndicatedPost', $this, __LINE__);
	}

	$freshness = $this->freshness();

	if ($freshness > 0) {
		# -- Look up, or create, numeric ID for author
		$unfamiliar_author = FeedWordPress::on_unfamiliar('author', $this->post['named']['unfamiliar']['author']);
		$this->post['post_author'] = $this->author_id($unfamiliar_author);

		if (is_null($this->post['post_author'])) {
			$this->post = NULL;
		}
	}

	if (!$this->filtered() and $freshness > 0) {
		# -- Look up, or create, numeric ID for categories
		list($cat_ids, $tag_names) = $this->category_ids(
			$this->post['named']['category'],
			FeedWordPress::on_unfamiliar('category', $this->post['named']['unfamiliar']['category']),
			/*tags_too=*/ true
		);

		$this->post['post_category'] = $cat_ids;
		$this->post['tags_input'] = array_merge($this->post['tags_input'], $tag_names);

		if (is_null($this->post['post_category'])) {
			// filter mode on, no matching categories; drop the post
			$this->post = NULL;
		} else {
			// filter mode off or at least one match; now add on the feed and global presets
			$preset_ids = $this->category_ids($this->post['named']['preset/category'], 'default');
			$this->post['post_category'] = array_merge($this->post['post_category'], $preset_ids);

			if (count($this->post['post_category']) < 1) {
				// Default to category 1 ("Uncategorized" / "General") if nothing else
				$this->post['post_category'][] = 1;
			}
		}
	}

	if (!$this->filtered() and $freshness > 0) {
		// The names have been resolved to IDs; filters get the final data
		unset($this->post['named']);
		$this->post = apply_filters('syndicated_post', $this->post, $this);
	}

	if (!$this->filtered() and $freshness == 2) {
		// The item has not yet been added. So let's add it.
		$this->insert_new();
		$this->add_rss_meta();
		do_action('post_syndicated_item', $this->wp_id());

		return 'new';
	}

	if (!$this->filtered() and $freshness == 1) {
		// The item is already stored, but has changed. Update it.
		$this->post['ID'] = $this->wp_id();
		$this->update_existing();
		$this->add_rss_meta();
		do_action('update_syndicated_item', $this->wp_id());

		return 'updated';
	}

	return false;
} // function SyndicatedPost::store ()
|
---|
| 365 |
|
---|
// SyndicatedPost::insert_new: stores this item as a new post and records
// the new post's ID in $this->_wp_id. Goes through wp_insert_post() when
// use_api() allows it; otherwise the row is written with direct SQL.
function insert_new () {
	global $wpdb;

	$dbpost = $this->normalize_post(/*new=*/ true);
	if (is_null($dbpost)) {
		return;
	}

	$caller = array(__CLASS__, __FUNCTION__);

	if ($this->use_api('wp_insert_post')) {
		// Tell WP 2.1 and 2.2 not to process for pingbacks
		$dbpost['post_pingback'] = false;

		// Kludge #1: WordPress 2.6 munges the authorship meta-data of
		// revisions, so we hook in to repair it.
		add_action('_wp_put_post_revision', array($this, 'fix_revision_meta'));

		// Kludge #2: keep the kses filters from stripping the content
		// of posts when there is no logged in user who has the
		// `unfiltered_html` capability.
		add_filter('content_save_pre', array($this, 'avoid_kses_munge'), 11);

		$this->_wp_id = wp_insert_post($dbpost);

		// Turn off kludges #1 and #2
		remove_action('_wp_put_post_revision', array($this, 'fix_revision_meta'));
		remove_filter('content_save_pre', array($this, 'avoid_kses_munge'), 11);

		$this->validate_post_id($dbpost, $caller);

		// Unfortunately, as of WordPress 2.3, wp_insert_post()
		// *still* offers no way to use a guid of your choice,
		// and munges your post modified timestamp, too.
		$wpdb->query("
		UPDATE $wpdb->posts
		SET
			guid='{$dbpost['guid']}',
			post_modified='{$dbpost['post_modified']}',
			post_modified_gmt='{$dbpost['post_modified_gmt']}'
		WHERE ID='{$this->_wp_id}'
		");

		return;
	}

	# Going through wp_insert_post() is the right way to do this. But,
	# alas, in earlier versions of WordPress, wp_insert_post has
	# too much behavior (mainly related to pings) that can't
	# be overridden. In WordPress 1.5, it's enough of a
	# resource hog to make PHP segfault after inserting
	# 50-100 posts. This can get pretty annoying, especially
	# if you are trying to update your feeds for the first
	# time.

	// The excerpt is optional, so its clause is only added when set
	$excerpt_sql = "";
	if (isset($dbpost['post_excerpt'])) {
		$excerpt_sql = "post_excerpt = '{$dbpost['post_excerpt']}',";
	}

	$wpdb->query("
	INSERT INTO $wpdb->posts
	SET
		guid = '{$dbpost['guid']}',
		post_author = '{$dbpost['post_author']}',
		post_date = '{$dbpost['post_date']}',
		post_date_gmt = '{$dbpost['post_date_gmt']}',
		post_content = '{$dbpost['post_content']}',{$excerpt_sql}
		post_title = '{$dbpost['post_title']}',
		post_name = '{$dbpost['post_name']}',
		post_modified = '{$dbpost['post_modified']}',
		post_modified_gmt = '{$dbpost['post_modified_gmt']}',
		comment_status = '{$dbpost['comment_status']}',
		ping_status = '{$dbpost['ping_status']}',
		post_status = '{$dbpost['post_status']}'
	");
	$this->_wp_id = $wpdb->insert_id;

	$this->validate_post_id($dbpost, $caller);

	// WordPress 1.5.x - 2.0.x
	wp_set_post_cats('1', $this->wp_id(), $this->post['post_category']);

	// Since we are not going through official channels, we need to
	// manually tell WordPress that we've published a new post.
	// We need to make sure to do this in order for FeedWordPress
	// to play well with the staticize-reloaded plugin (something
	// that a large aggregator website is going to *want* to be
	// able to use).
	do_action('publish_post', $this->_wp_id);
} /* SyndicatedPost::insert_new() */
|
---|
| 445 |
|
---|
// SyndicatedPost::update_existing: overwrites the stored copy of this
// item with its current contents. Goes through wp_insert_post() when
// use_api() allows it; otherwise the row is updated with direct SQL and
// the categories are reset by hand.
function update_existing () {
	global $wpdb;

	// wp_insert_post() does not escape the data for us
	$dbpost = $this->normalize_post(/*new=*/ false);
	if (!is_null($dbpost)) :
		if ($this->use_api('wp_insert_post')) :
			$dbpost['post_pingback'] = false; // Tell WP 2.1 and 2.2 not to process for pingbacks

			// Kludge #1: WordPress 2.6 munges the authorship meta-data
			// of revisions, so we hook in to repair it.
			add_action('_wp_put_post_revision', array($this, 'fix_revision_meta'));

			// Kludge #2: prevent kses filters from stripping the
			// content of posts when updating without a logged in
			// user who has `unfiltered_html` capability.
			add_filter('content_save_pre', array($this, 'avoid_kses_munge'), 11);

			// Don't munge status fields that the user may have reset manually
			if (function_exists('get_post_field')) :
				$doNotMunge = array('post_status', 'comment_status', 'ping_status');
				foreach ($doNotMunge as $field) :
					$dbpost[$field] = get_post_field($field, $this->wp_id());
				endforeach;
			endif;

			$this->_wp_id = wp_insert_post($dbpost);

			// Turn off kludges #1 and #2
			remove_action('_wp_put_post_revision', array($this, 'fix_revision_meta'));
			remove_filter('content_save_pre', array($this, 'avoid_kses_munge'), 11);

			$this->validate_post_id($dbpost, array(__CLASS__, __FUNCTION__));

			// Unfortunately, as of WordPress 2.3, wp_insert_post()
			// munges your post modified timestamp.
			$result = $wpdb->query("
			UPDATE $wpdb->posts
			SET
				post_modified='{$dbpost['post_modified']}',
				post_modified_gmt='{$dbpost['post_modified_gmt']}'
			WHERE ID='{$this->_wp_id}'
			");
		else :

			$result = $wpdb->query("
			UPDATE $wpdb->posts
			SET
				post_author = '{$dbpost['post_author']}',
				post_content = '{$dbpost['post_content']}',"
				.(isset($dbpost['post_excerpt']) ? "post_excerpt = '{$dbpost['post_excerpt']}'," : "")."
				post_title = '{$dbpost['post_title']}',
				post_name = '{$dbpost['post_name']}',
				post_modified = '{$dbpost['post_modified']}',
				post_modified_gmt = '{$dbpost['post_modified_gmt']}'
			WHERE guid='{$dbpost['guid']}'
			");

			// WordPress 2.1.x and up
			if (function_exists('wp_set_post_categories')) :
				wp_set_post_categories($this->wp_id(), $this->post['post_category']);
			// WordPress 1.5.x - 2.0.x
			elseif (function_exists('wp_set_post_cats')) :
				wp_set_post_cats('1', $this->wp_id(), $this->post['post_category']);
			// This should never happen.
			else :
				// N.B.: the magic constant is __FUNCTION__, with trailing
				// underscores; a bare __FUNCTION is an undefined constant.
				FeedWordPress::critical_bug(__CLASS__.'::'.__FUNCTION__.'(): no post categorizing function', array("dbpost" => $dbpost, "this" => $this), __LINE__);
			endif;

			// Since we are not going through official channels, we need to
			// manually tell WordPress that we've edited a post.
			// We need to make sure to do this in order for FeedWordPress
			// to play well with the staticize-reloaded plugin (something
			// that a large aggregator website is going to *want* to be
			// able to use).
			do_action('edit_post', $this->post['ID']);
		endif;
	endif;
} /* SyndicatedPost::update_existing() */
|
---|
| 524 |
|
---|
/**
 * SyndicatedPost::normalize_post() -- prepares a copy of $this->post for
 * storage. Every top-level string value is run through $wpdb->escape();
 * other values are copied as they are. A post with a blank title is
 * given a title made up of the name of its source and its publication
 * date in blog-local time.
 *
 * @param bool $new If true, this post is to be inserted anew. If false, it is an update of an existing post. (Currently not used.)
 * @return array A normalized representation of the post ready to be inserted into the database or sent to the WordPress API functions
 */
function normalize_post ($new = true) {
	global $wpdb;

	$out = array();

	// wp_insert_post() does not do this for us, and the direct SQL
	// queries interpolate these values into quoted strings
	foreach ($this->post as $key => $value) :
		if (is_string($value)) :
			$out[$key] = $wpdb->escape($value);
		else :
			$out[$key] = $value;
		endif;
	endforeach;

	// FIXME: Option for filtering out empty posts (i.e., posts whose
	// title, content and excerpt are all blank)

	if (!isset($out['post_title']) or strlen($out['post_title'])==0) :
		$source = (isset($this->post['meta']['syndication_source']) ? $this->post['meta']['syndication_source'] : '');

		// Multiply before casting to int: the GMT offset may be
		// fractional (e.g. 5.5 hours)
		$offset = (int) round(((float) get_option('gmt_offset')) * 60 * 60);

		// The source name comes straight off the feed, so the title
		// we make from it needs escaping like every other string field
		$out['post_title'] = $wpdb->escape(
			$source
			.' '.gmdate('Y-m-d H:i:s', $this->published() + $offset)
		);
		// FIXME: Option for what to fill a blank title with...
	endif;

	return $out;
}
|
---|
| 558 |
|
---|
/**
 * SyndicatedPost::validate_post_id() -- sanity check on $this->_wp_id
 * after an insert or update. Reports a critical bug if the ID is not
 * numeric or is zero.
 *
 * @param array $dbpost An array representing the post we attempted to insert or update
 * @param mixed $ns A string or array representing the namespace (class, method) whence this method was called.
 */
function validate_post_id ($dbpost, $ns) {
	// array('Class', 'method') becomes 'Class::method'
	$ns = (is_array($ns) ? implode('::', $ns) : (string) $ns);

	$has_valid_id = (is_numeric($this->_wp_id) and ($this->_wp_id != 0));

	// This should never happen.
	if (!$has_valid_id) {
		$dump = array(
			"\$this->_wp_id" => $this->_wp_id,
			"\$dbpost" => $dbpost,
			"\$this" => $this
		);
		FeedWordPress::critical_bug(/*name=*/ $ns.'::_wp_id', /*var =*/ $dump, /*line # =*/ __LINE__);
	}
} /* SyndicatedPost::validate_post_id() */
|
---|
| 582 |
|
---|
/**
 * SyndicatedPost::fix_revision_meta() - Fixes the way WP 2.6+ handles
 * meta-data (authorship, etc.) when storing revisions of an updated
 * syndicated post.
 *
 * A plugin that uses wp_insert_post() has no way to set certain
 * meta-data (such as the author) for the old revision that gets stored
 * when a post is updated. Instead, WordPress uses its defaults (= the
 * currently active user ID if the process is running with a user logged
 * in, or = #0 if there is no user logged in). This results in bogus
 * authorship data for revisions that are syndicated from off the feed,
 * unless we use a kludge like this to end-run the munging of meta-data
 * by _wp_put_post_revision.
 *
 * Hooked to the '_wp_put_post_revision' action for the duration of the
 * wp_insert_post() call in insert_new() and update_existing().
 *
 * @param int $revision_id The revision ID to fix up meta-data
 */
function fix_revision_meta ($revision_id) {
	global $wpdb;

	// Both values are interpolated into SQL, so force them to be integers
	$post_author = (int) $this->post['post_author'];
	$revision_id = (int) $revision_id;

	$wpdb->query("
	UPDATE $wpdb->posts
	SET post_author={$post_author}
	WHERE post_type = 'revision' AND ID='$revision_id'
	");
} /* SyndicatedPost::fix_revision_meta () */
|
---|
| 612 |
|
---|
/**
 * SyndicatedPost::avoid_kses_munge() -- undoes whatever earlier
 * 'content_save_pre' filters did to the content of a syndicated post.
 *
 * When FeedWordPress runs an automatic update, wp_insert_post() is
 * called under the credentials of whoever happens to be viewing the
 * blog -- usually no user at all. If current_user_can('unfiltered_html')
 * is false, WordPress passes the post content through a kses function
 * that strips out lots of HTML tags -- notably <object> and some others.
 * That breaks (for example) feeds that contain YouTube videos, and it
 * makes automatic updates behave differently from updates started by a
 * logged-in admin from the WordPress Dashboard, which don't get run
 * through the kses function. To avoid the whole mess, this filter
 * ignores what it is handed and puts back the contents of the
 * `post_content` field, escaped for storage.
 *
 * @param string $content The content of the post, after other filters have gotten to it
 * @return string The original content of the post, before other filters had a chance to munge it.
 */
function avoid_kses_munge ($content) {
	global $wpdb;

	$unfiltered_content = $this->post['post_content'];
	return $wpdb->escape($unfiltered_content);
}
|
---|
| 637 |
|
---|
// SyndicatedPost::add_rss_meta: writes the custom fields listed in
// $post['meta'] to the postmeta table for this post. Each key of
// $post['meta'] becomes a meta_key; its value may be a single value or
// an array of values, each stored as its own row. This is where
// anything a template might want to know about the post's original
// source, beyond the standard WP data (author, title, timestamp,
// categories, guid), gets stored. It is also the hook into WordPress's
// support for enclosures.
function add_rss_meta () {
	global $wpdb;

	// Nothing to do unless the post carries an array of meta-data.
	if ( !is_array($this->post) or !isset($this->post['meta']) or !is_array($this->post['meta']) ) {
		return;
	}

	$post_id = $this->wp_id();

	// Aggregated posts should NOT send out pingbacks. WordPress 2.1-2.2
	// claim to honor $post_pingback but do not, so remove the marker
	// row ourselves.
	$wpdb->query("
	DELETE FROM $wpdb->postmeta
	WHERE post_id='$post_id' AND meta_key='_pingme'
	");

	foreach ( $this->post['meta'] as $meta_key => $meta_values ) {
		$meta_key = $wpdb->escape($meta_key);

		// On an update, wipe the previous rows for this key first so
		// that values are not duplicated.
		$wpdb->query("
		DELETE FROM $wpdb->postmeta
		WHERE post_id='$post_id' AND meta_key='$meta_key'
		");

		// Accept either a single value or a list of values.
		if (!is_array($meta_values)) {
			$meta_values = array($meta_values);
		}

		foreach ( $meta_values as $meta_value ) {
			$meta_value = $wpdb->escape($meta_value);
			$wpdb->query("
			INSERT INTO $wpdb->postmeta
			SET
			post_id='$post_id',
			meta_key='$meta_key',
			meta_value='$meta_value'
			");
		}
	}
} /* SyndicatedPost::add_rss_meta () */
|
---|
| 687 |
|
---|
// SyndicatedPost::author_id (): get the ID for an author name from
// the feed. Create the author if necessary.
//
// Lookup order: (1) a per-feed author mapping rule stored in
// $this->link->settings['map authors']['name'], (2) an existing user
// matched by login, e-mail, nicename or an "a.k.a." alias in the
// description, (3) whatever $unfamiliar_author asks for:
//   'create'  - insert a new user with wp_insert_user()
//   numeric   - use that user ID, provided get_userdata() finds it
//   'default' - use user ID 1
//   otherwise - leave the ID as NULL
//
// Returns the resulting ID (NULL if the author was filtered out or no
// fallback applied). A truthy ID is also remembered in the feed's
// author mapping so the next lookup is a direct hit.
function author_id ($unfamiliar_author = 'create') {
	global $wpdb;

	$a = $this->author();
	$author = $a['name'];
	// author() only sets 'email' when the item or channel supplies one,
	// so guard the read instead of triggering an undefined-index notice.
	$email = (isset($a['email']) ? $a['email'] : NULL);
	$url = $a['uri'];

	$match_author_by_email = !('yes' == get_option("feedwordpress_do_not_match_author_by_email"));
	if ($match_author_by_email and !FeedWordPress::is_null_email($email)) :
		$test_email = $email;
	else :
		$test_email = NULL;
	endif;

	// Never can be too careful...
	$login = sanitize_user($author, /*strict=*/ true);
	$login = apply_filters('pre_user_login', $login);

	$nice_author = sanitize_title($author);
	$nice_author = apply_filters('pre_user_nicename', $nice_author);

	// Everything below is interpolated into SQL, so escape it here.
	// $reg_author is additionally regex-quoted for use inside RLIKE.
	$reg_author = $wpdb->escape(preg_quote($author));
	$author = $wpdb->escape($author);
	$email = $wpdb->escape($email);
	$test_email = $wpdb->escape($test_email);
	$url = $wpdb->escape($url);

	// Check for an existing author rule....
	if (isset($this->link->settings['map authors']['name'][strtolower(trim($author))])) :
		$author_rule = $this->link->settings['map authors']['name'][strtolower(trim($author))];
	else :
		$author_rule = NULL;
	endif;

	// User name is mapped to a particular author. If that author ID exists, use it.
	if (is_numeric($author_rule) and get_userdata((int) $author_rule)) :
		$id = (int) $author_rule;

	// User name is filtered out
	elseif ('filter' == $author_rule) :
		$id = NULL;

	else :
		// Check the database for an existing author record that might fit

		#-- WordPress 2.0+
		if (fwp_test_wp_version(FWP_SCHEMA_HAS_USERMETA)) :

			// First try the user core data table.
			$id = $wpdb->get_var(
			"SELECT ID FROM $wpdb->users
			WHERE
				TRIM(LCASE(user_login)) = TRIM(LCASE('$login'))
				OR (
					LENGTH(TRIM(LCASE(user_email))) > 0
					AND TRIM(LCASE(user_email)) = TRIM(LCASE('$test_email'))
				)
				OR TRIM(LCASE(user_nicename)) = TRIM(LCASE('$nice_author'))
			");

			// If that fails, look for aliases in the user meta data table
			if (is_null($id)) :
				$id = $wpdb->get_var(
				"SELECT user_id FROM $wpdb->usermeta
				WHERE
					(meta_key = 'description' AND TRIM(LCASE(meta_value)) = TRIM(LCASE('$author')))
					OR (
						meta_key = 'description'
						AND TRIM(LCASE(meta_value))
						RLIKE CONCAT(
							'(^|\\n)a\\.?k\\.?a\\.?( |\\t)*:?( |\\t)*',
							TRIM(LCASE('$reg_author')),
							'( |\\t|\\r)*(\\n|\$)'
						)
					)
				");
			endif;

		#-- WordPress 1.5.x
		else :
			$id = $wpdb->get_var(
			"SELECT ID from $wpdb->users
			WHERE
				TRIM(LCASE(user_login)) = TRIM(LCASE('$login')) OR
				(
					LENGTH(TRIM(LCASE(user_email))) > 0
					AND TRIM(LCASE(user_email)) = TRIM(LCASE('$test_email'))
				) OR
				TRIM(LCASE(user_firstname)) = TRIM(LCASE('$author')) OR
				TRIM(LCASE(user_nickname)) = TRIM(LCASE('$author')) OR
				TRIM(LCASE(user_nicename)) = TRIM(LCASE('$nice_author')) OR
				TRIM(LCASE(user_description)) = TRIM(LCASE('$author')) OR
				(
					LOWER(user_description)
					RLIKE CONCAT(
						'(^|\\n)a\\.?k\\.?a\\.?( |\\t)*:?( |\\t)*',
						LCASE('$reg_author'),
						'( |\\t|\\r)*(\\n|\$)'
					)
				)
			");

		endif;

		// ... if you don't find one, then do what you need to do
		if (is_null($id)) :
			if ($unfamiliar_author === 'create') :
				$userdata = array();

				#-- user table data
				$userdata['ID'] = NULL; // new user
				$userdata['user_login'] = $login;
				$userdata['user_nicename'] = $nice_author;
				$userdata['user_pass'] = substr(md5(uniqid(microtime())), 0, 6); // just something random to lock it up
				$userdata['user_email'] = $email;
				$userdata['user_url'] = $url;
				$userdata['display_name'] = $author;

				$id = wp_insert_user($userdata);
			elseif (is_numeric($unfamiliar_author) and get_userdata((int) $unfamiliar_author)) :
				$id = (int) $unfamiliar_author;
			elseif ($unfamiliar_author === 'default') :
				$id = 1;
			endif;
		endif;
	endif;

	// Remember the match so this author resolves directly next time.
	if ($id) :
		$this->link->settings['map authors']['name'][strtolower(trim($author))] = $id;
	endif;
	return $id;
} // function SyndicatedPost::author_id ()
|
---|
| 823 |
|
---|
// SyndicatedPost::category_ids (): look up (and create) category ids
// from a list of categories.
//
// $cats is a list of category names. An entry of the form "{#123}" is
// taken as a direct reference to category ID 123 and is kept only if
// that category exists. Any other non-empty name is matched against
// existing categories by name or by an "a.k.a." alias in the
// description.
//
// $unfamiliar_category says what to do with a name that matches nothing:
//   'create' - create the category and use its new ID
//   'tag'    - (WordPress 2.3+ branch only) collect the name as a tag
//   'filter' - if NO category at all was matched, return NULL for the
//              ID list, which signals the caller to drop the post
//   otherwise - ignore the name
//
// Returns the array of category IDs (or NULL, see 'filter'). If
// $tags_too is true, returns array($cat_ids, $tags) instead.
function category_ids ($cats, $unfamiliar_category = 'create', $tags_too = false) {
	global $wpdb;

	// We need to normalize whitespace because (1) trailing
	// whitespace can cause PHP and MySQL not to see eye to eye on
	// VARCHAR comparisons for some versions of MySQL (cf.
	// <http://dev.mysql.com/doc/mysql/en/char.html>), and (2)
	// because I doubt most people want to make a semantic
	// distinction between 'Computers' and 'Computers '
	$cats = array_map('trim', $cats);

	$tags = array();

	$cat_ids = array ();
	foreach ($cats as $cat_name) :
		if (preg_match('/^{#([0-9]+)}$/', $cat_name, $backref)) :
			// Direct reference to a category by numeric ID.
			$cat_id = (int) $backref[1];
			if (function_exists('is_term') and is_term($cat_id, 'category')) :
				$cat_ids[] = $cat_id;
			elseif (get_category($cat_id)) :
				$cat_ids[] = $cat_id;
			endif;
		elseif (strlen($cat_name) > 0) :
			$esc = $wpdb->escape($cat_name);
			// Regex-quoted as well, for use inside RLIKE patterns.
			$resc = $wpdb->escape(preg_quote($cat_name));

			// WordPress 2.3+
			if (function_exists('is_term')) :
				$cat_id = is_term($cat_name, 'category');
				if ($cat_id) :
					$cat_ids[] = $cat_id['term_id'];
				// There must be a better way to do this...
				elseif ($results = $wpdb->get_results(
					"SELECT term_id
					FROM $wpdb->term_taxonomy
					WHERE
						LOWER(description) RLIKE
						CONCAT('(^|\\n)a\\.?k\\.?a\\.?( |\\t)*:?( |\\t)*', LOWER('{$resc}'), '( |\\t|\\r)*(\\n|\$)')"
				)) :
					foreach ($results AS $term) :
						$cat_ids[] = (int) $term->term_id;
					endforeach;
				// Strict comparison, like the 'create' checks: a loose
				// == would also match true (and 0 before PHP 8).
				elseif ('tag'===$unfamiliar_category) :
					$tags[] = $cat_name;
				elseif ('create'===$unfamiliar_category) :
					$term = wp_insert_term($cat_name, 'category');
					if (is_wp_error($term)) :
						FeedWordPress::noncritical_bug('term insertion problem', array('cat_name' => $cat_name, 'term' => $term, 'this' => $this), __LINE__);
					else :
						$cat_ids[] = $term['term_id'];
					endif;
				endif;

			// WordPress 1.5.x - 2.2.x
			else :
				$results = $wpdb->get_results(
				"SELECT cat_ID
				FROM $wpdb->categories
				WHERE
					(LOWER(cat_name) = LOWER('$esc'))
					OR (LOWER(category_description)
					RLIKE CONCAT('(^|\\n)a\\.?k\\.?a\\.?( |\\t)*:?( |\\t)*', LOWER('{$resc}'), '( |\\t|\\r)*(\\n|\$)'))
				");
				if ($results) :
					foreach ($results as $term) :
						$cat_ids[] = (int) $term->cat_ID;
					endforeach;
				elseif ('create'===$unfamiliar_category) :
					if (function_exists('wp_insert_category')) :
						$cat_id = wp_insert_category(array('cat_name' => $cat_name));
					// And into the database we go.
					else :
						$nice_kitty = sanitize_title($cat_name);
						$wpdb->query(sprintf("
							INSERT INTO $wpdb->categories
							SET
							cat_name='%s',
							category_nicename='%s'
							", $wpdb->escape($cat_name), $nice_kitty
						));
						$cat_id = $wpdb->insert_id;
					endif;
					$cat_ids[] = $cat_id;
				endif;
			endif;
		endif;
	endforeach;

	if ((count($cat_ids) == 0) and ($unfamiliar_category === 'filter')) :
		$cat_ids = NULL; // Drop the post
	else :
		$cat_ids = array_unique($cat_ids);
	endif;

	if ($tags_too) : $ret = array($cat_ids, $tags);
	else : $ret = $cat_ids;
	endif;

	return $ret;
} // function SyndicatedPost::category_ids ()
|
---|
| 925 |
|
---|
// SyndicatedPost::use_api (): report whether the running WordPress is
// new enough for FeedWordPress to rely on a given API feature. The
// check compares the global $wp_db_version against a schema constant.
//
// $tag names the feature: 'wp_insert_post' or 'post_status_pending'.
// Returns true or false for a known tag, and NULL for an unknown one.
function use_api ($tag) {
	global $wp_db_version;

	// Start from a defined value so that an unrecognized $tag does not
	// leave $ret undefined at the return below.
	$ret = null;

	switch ($tag) :
	case 'wp_insert_post':
		// Before 2.2, wp_insert_post does too much of the wrong stuff to use it
		// In 1.5 it was such a resource hog it would make PHP segfault on big updates
		$ret = (isset($wp_db_version) and $wp_db_version > FWP_SCHEMA_21);
		break;
	case 'post_status_pending':
		$ret = (isset($wp_db_version) and $wp_db_version > FWP_SCHEMA_23);
		break;
	endswitch;
	return $ret;
} // function SyndicatedPost::use_api ()
|
---|
| 940 |
|
---|
| 941 | #### EXTRACT DATA FROM FEED ITEM ####
|
---|
| 942 |
|
---|
// SyndicatedPost::created (): the item's creation time as parsed by
// parse_w3cdtf(), or NULL if the item carries no creation date. The
// first of these elements that is present wins: dc:created,
// dcterms:created, then a bare <created>.
function created () {
	if (isset($this->item['dc']['created'])) {
		return @parse_w3cdtf($this->item['dc']['created']);
	}

	if (isset($this->item['dcterms']['created'])) {
		return @parse_w3cdtf($this->item['dcterms']['created']);
	}

	if (isset($this->item['created'])) { // Atom 0.3
		return @parse_w3cdtf($this->item['created']);
	}

	return null;
}
|
---|
// SyndicatedPost::published (): the item's publication time.
//
// $fallback: if true and the item has no publication date, try the
//   last-updated date (via updated()) instead.
// $default: value to return when no date can be found at all. The
//   sentinel -1 means "use the current time".
//
// Returns the timestamp produced by parse_w3cdtf() / strtotime() for
// the first date element found, or the default described above.
function published ($fallback = true, $default = -1) {
	$epoch = null;

	# Feeds express the publication date in many different ways.
	# Figure out whether we have a date in <dc:date>, <issued>,
	# <pubDate>, etc., and get it into Unix epoch format for
	# reformatting. If we can't find anything, we'll use the
	# last-updated time.
	if (isset($this->item['dc']['date'])): // Dublin Core
		$epoch = @parse_w3cdtf($this->item['dc']['date']);
	elseif (isset($this->item['dcterms']['issued'])) : // Dublin Core extensions
		$epoch = @parse_w3cdtf($this->item['dcterms']['issued']);
	elseif (isset($this->item['published'])) : // Atom 1.0
		$epoch = @parse_w3cdtf($this->item['published']);
	elseif (isset($this->item['issued'])): // Atom 0.3
		$epoch = @parse_w3cdtf($this->item['issued']);
	elseif (isset($this->item['pubdate'])): // RSS 2.0
		$epoch = strtotime($this->item['pubdate']);
	elseif ($fallback) : // Fall back to <updated> / <modified> if present
		// Pass fallback=false so the two methods cannot call each
		// other forever; hand our default through so it is honored.
		$epoch = $this->updated(/*fallback=*/ false, /*default=*/ $default);
	endif;

	# If everything failed, then default to the current time
	# (or to the caller-supplied default).
	if (is_null($epoch)) :
		if (-1 == $default) :
			$epoch = time();
		else :
			$epoch = $default;
		endif;
	endif;

	return $epoch;
}
|
---|
// SyndicatedPost::updated (): the time the item was last modified.
//
// $fallback: if true and the item has no modification date, ask
//   published() for the publication date instead.
// $default: value to return when no date can be found at all. The
//   sentinel -1 means "use the current time".
function updated ($fallback = true, $default = -1) {
	$epoch = null;

	// Only dcterms and Atom offer a dependable way to say when
	// something was last *modified*; check those first.
	if (isset($this->item['dc']['modified'])) { // Not really correct
		$epoch = @parse_w3cdtf($this->item['dc']['modified']);
	} elseif (isset($this->item['dcterms']['modified'])) { // Dublin Core extensions
		$epoch = @parse_w3cdtf($this->item['dcterms']['modified']);
	} elseif (isset($this->item['modified'])) { // Atom 0.3
		$epoch = @parse_w3cdtf($this->item['modified']);
	} elseif (isset($this->item['updated'])) { // Atom 1.0
		$epoch = @parse_w3cdtf($this->item['updated']);
	} elseif ($fallback) { // Fall back to issued / dc:date
		$epoch = $this->published(/*fallback=*/ false, /*default=*/ $default);
	}

	if (!is_null($epoch)) {
		return $epoch;
	}

	// Nothing usable was found: current time, or the caller's default.
	return (-1 == $default) ? time() : $default;
}
|
---|
| 1015 |
|
---|
// SyndicatedPost::update_hash (): an MD5 fingerprint of the serialized
// feed item.
function update_hash () {
	$serialized_item = serialize($this->item);
	return md5($serialized_item);
}
|
---|
| 1019 |
|
---|
// SyndicatedPost::guid (): a unique identifier for the item. Uses the
// identifier supplied by the feed when there is one; otherwise builds a
// substitute from the feed's host name plus either the item's creation
// date or a hash of its link and title.
function guid () {
	if (isset($this->item['id'])) { // Atom 0.3 / 1.0
		return $this->item['id'];
	}
	if (isset($this->item['atom']['id'])) { // Namespaced Atom
		return $this->item['atom']['id'];
	}
	if (isset($this->item['guid'])) { // RSS 2.0
		return $this->item['guid'];
	}
	if (isset($this->item['dc']['identifier'])) { // yeah, right
		return $this->item['dc']['identifier'];
	}

	// The feed gave us no unique identifier, so cobble together a
	// tag: URI that might work. Its base is the host name of the
	// feed source ...
	$bits = parse_url($this->feedmeta['link/uri']);
	$guid = 'tag:'.$bits['host'];

	// ... followed by the date of creation, if we have one. (Then
	// again, a feed producer conscientious enough to supply creation
	// dates probably supplies unique identifiers too.)
	$created = $this->created();
	if (!is_null($created)) {
		$guid .= '://post.'.date('YmdHis', $created);
	} else {
		// Otherwise hash the item's link *and* title together.
		// Titles are often not unique, and sometimes links are not
		// either (e.g. Bitch (S)HITLIST, Mozilla Dot Org news, some
		// podcasts), but two different items rarely share both.
		$guid .= '://'.md5($this->item['link'].'/'.$this->item['title']);
	}

	return $guid;
}
|
---|
| 1059 |
|
---|
// SyndicatedPost::author (): collect what the feed says about the
// item's author.
//
// Returns an array with:
//   'name'  - always set; taken from the item, then the channel, and
//             finally the channel title as a last resort
//   'email' - set only when the item or channel supplies one (or when
//             parse_email_with_realname() extracts one)
//   'uri'   - always set; the item's author URL, else the channel's
//             author URL, else the channel's link
function author () {
	$author = array ();

	if (isset($this->item['author_name'])):
		$author['name'] = $this->item['author_name'];
	elseif (isset($this->item['dc']['creator'])):
		$author['name'] = $this->item['dc']['creator'];
	elseif (isset($this->item['dc']['contributor'])):
		$author['name'] = $this->item['dc']['contributor'];
	elseif (isset($this->feed->channel['dc']['creator'])) :
		$author['name'] = $this->feed->channel['dc']['creator'];
	elseif (isset($this->feed->channel['dc']['contributor'])) :
		$author['name'] = $this->feed->channel['dc']['contributor'];
	elseif (isset($this->feed->channel['author_name'])) :
		$author['name'] = $this->feed->channel['author_name'];
	elseif ($this->feed->is_rss() and isset($this->item['author'])) :
		// The author element in RSS is allegedly an
		// e-mail address, but lots of people don't use
		// it that way. So let's make of it what we can.
		$author = parse_email_with_realname($this->item['author']);

		if (!isset($author['name'])) :
			if (isset($author['email'])) :
				$author['name'] = $author['email'];
			else :
				$author['name'] = $this->feed->channel['title'];
			endif;
		endif;
	else :
		$author['name'] = $this->feed->channel['title'];
	endif;

	if (isset($this->item['author_email'])):
		$author['email'] = $this->item['author_email'];
	elseif (isset($this->feed->channel['author_email'])) :
		$author['email'] = $this->feed->channel['author_email'];
	endif;

	if (isset($this->item['author_url'])):
		$author['uri'] = $this->item['author_url'];
	elseif (isset($this->feed->channel['author_url'])) :
		// Use the channel-level URL that was just tested; the
		// item-level one is known to be unset in this branch.
		$author['uri'] = $this->feed->channel['author_url'];
	else:
		$author['uri'] = $this->feed->channel['link'];
	endif;

	return $author;
} // SyndicatedPost::author()
|
---|
| 1108 |
|
---|
// (tag, attribute) pairs naming HTML attributes that hold a URI.
// resolve_relative_uris() walks this list and builds one regular
// expression per pair to find values that need resolving.
var $uri_attrs = array (
	array('a', 'href'),
	array('applet', 'codebase'),
	array('area', 'href'),
	array('blockquote', 'cite'),
	array('body', 'background'),
	array('del', 'cite'),
	array('form', 'action'),
	array('frame', 'longdesc'),
	array('frame', 'src'),
	array('iframe', 'longdesc'),
	array('iframe', 'src'),
	array('head', 'profile'),
	array('img', 'longdesc'),
	array('img', 'src'),
	array('img', 'usemap'),
	array('input', 'src'),
	array('input', 'usemap'),
	array('ins', 'cite'),
	array('link', 'href'),
	array('object', 'classid'),
	array('object', 'codebase'),
	array('object', 'data'),
	array('object', 'usemap'),
	array('q', 'cite'),
	array('script', 'src')
); /* var SyndicatedPost::$uri_attrs */
|
---|
| 1136 |
|
---|
// Base URI used when resolving relative URIs. resolve_relative_uris()
// sets it from the item's link; resolve_single_relative_uri() reads it.
var $_base = null;
|
---|
| 1138 |
|
---|
// SyndicatedPost::resolve_single_relative_uri (): preg_replace_callback
// handler used by resolve_relative_uris(). Takes the match array for
// one attribute, resolves the attribute's value against $this->_base,
// and returns the matched text with the resolved URI in its place.
function resolve_single_relative_uri ($refs) {
	$match = FeedWordPressHTML::attributeMatch($refs);
	$resolved = Relative_URI::resolve($match['value'], $this->_base);

	return $match['prefix'] . $resolved . $match['suffix'];
} /* function SyndicatedPost::resolve_single_relative_uri() */
|
---|
| 1144 |
|
---|
// SyndicatedPost::resolve_relative_uris (): rewrite relative URIs found
// in $content, using the link of the item held by $obj as the base.
//
// The MagpieRSS upgrade has some `xml:base` support baked in, but
// relative URIs still turn up in production RSS 2.0 feeds and other
// feeds with no good `xml:base` support. This pass catches whatever
// is left over and resolves it as well as it can.
//
// Returns the rewritten content.
function resolve_relative_uris ($content, $obj) {
	// Reset the base for resolving relative URIs
	$obj->_base = $obj->item['link'];

	$resolver = array(&$obj, 'resolve_single_relative_uri');

	// One regex pass per (tag, attribute) pair known to carry a URI.
	foreach ($obj->uri_attrs as $pair) {
		list($tag, $attr) = $pair;
		$content = preg_replace_callback(
			FeedWordPressHTML::attributeRegex($tag, $attr),
			$resolver,
			$content
		);
	}

	return $content;
} /* function SyndicatedPost::resolve_relative_uris () */
|
---|
| 1166 |
|
---|
// (tag pattern, attribute pattern) pairs naming attributes that
// sanitize_content() removes from syndicated content. Both parts are
// handed to FeedWordPressHTML::attributeRegex(). Only `target` is
// active; the `style` and `on*` entries are commented out.
var $strip_attrs = array (
	array('[a-z]+', 'target'),
	// array('[a-z]+', 'style'),
	// array('[a-z]+', 'on[a-z]+'),
);
|
---|
| 1172 |
|
---|
// SyndicatedPost::strip_attribute_from_tag (): preg_replace_callback
// handler used by sanitize_content(). Returns the matched tag text
// with the attribute cut out, i.e. the part before the attribute
// joined to the part after it.
function strip_attribute_from_tag ($refs) {
	$match = FeedWordPressHTML::attributeMatch($refs);
	$before = $match['before_attribute'];
	$after = $match['after_attribute'];

	return $before.$after;
}
|
---|
| 1177 |
|
---|
// SyndicatedPost::sanitize_content (): remove from $content every
// attribute listed in $obj->strip_attrs and return the result.
//
// This is a stopgap; the original author intended to replace it with
// lib_filter.
function sanitize_content ($content, $obj) {
	$stripper = array(&$obj, 'strip_attribute_from_tag');

	foreach ($obj->strip_attrs as $pair) {
		list($tag, $attr) = $pair;
		$content = preg_replace_callback(
			FeedWordPressHTML::attributeRegex($tag, $attr),
			$stripper,
			$content
		);
	}

	return $content;
}
|
---|
| 1193 | } // class SyndicatedPost
|
---|
| 1194 |
|
---|