[ XREF Home ] [ Index ]

PHP Cross Reference of WordPress Trunk

Provided by Yoast

title

Body

[close]

/wp-includes/ -> canonical.php (source)

   1  <?php
   2  /**
   3   * Canonical API to handle WordPress Redirecting
   4   *
   5   * Based on "Permalink Redirect" from Scott Yang and "Enforce www. Preference"
   6   * by Mark Jaquith
   7   *
   8   * @package WordPress
   9   * @since 2.3.0
  10   */
  11  
  /**
   * Redirects incoming links to the proper URL based on the site url.
   *
   * Search engines consider www.somedomain.com and somedomain.com to be two
   * different URLs when they both go to the same location. This SEO enhancement
   * prevents penalty for duplicate content by redirecting all incoming links to
   * one or the other.
   *
   * Prevents redirection for feeds, trackbacks, searches, comment popup, and
   * admin URLs. Does not redirect on IIS, page/post previews, and on form data.
   *
   * Will also attempt to find the correct link when a user enters a URL that does
   * not exist based on exact WordPress query. Will instead try to parse the URL
   * or query in an attempt to figure the correct page to go to.
   *
   * @since 2.3.0
   * @uses $wp_rewrite
   * @uses $is_IIS
   * @uses $wp_query
   * @uses $wpdb
   *
   * @param string $requested_url Optional. The URL that was requested, used to
   *        figure if redirect is needed. When omitted it is built from the
   *        current scheme, HTTP_HOST and REQUEST_URI.
   * @param bool $do_redirect Optional. Redirect to the new URL.
   * @return null|false|string Null, if the request type is never redirected or
   *        the requested URL cannot be parsed. False, if no redirect is needed
   *        (or, with $do_redirect, if the target would itself be redirected
   *        again). The canonical URL string, if $do_redirect is false and a
   *        redirect is needed. With $do_redirect true and a redirect issued,
   *        the script exits after sending a 301.
   */
  function redirect_canonical( $requested_url = null, $do_redirect = true ) {
      global $wp_rewrite, $is_IIS, $wp_query, $wpdb;

      // Request types that must never be canonicalised.
      if ( is_trackback() || is_search() || is_comments_popup() || is_admin() || !empty($_POST) || is_preview() || is_robots() || $is_IIS )
          return;

      if ( !$requested_url ) {
          // build the URL in the address bar
          $requested_url  = is_ssl() ? 'https://' : 'http://';
          $requested_url .= $_SERVER['HTTP_HOST'];
          $requested_url .= $_SERVER['REQUEST_URI'];
      }

      $original = @parse_url($requested_url);
      if ( false === $original )
          return;

      // Some PHP setups turn requests for / into /index.php in REQUEST_URI
      // See: http://trac.wordpress.org/ticket/5017
      // See: http://trac.wordpress.org/ticket/7173
      // Disabled, for now:
      // $original['path'] = preg_replace('|/index\.php$|', '/', $original['path']);

      // $redirect holds the parts of the URL being built; $redirect_url stays
      // false until one of the checks below produces a full target URL.
      $redirect = $original;
      $redirect_url = false;

      // Notice fixing
      if ( !isset($redirect['path']) )
          $redirect['path'] = '';
      if ( !isset($redirect['query']) )
          $redirect['query'] = '';

      // A singular query by ?p= that found no posts: look the row up directly
      // so a revision ID can be mapped to its parent post.
      if ( is_singular() && 1 > $wp_query->post_count && ($id = get_query_var('p')) ) {

          $vars = $wpdb->get_results( $wpdb->prepare("SELECT post_type, post_parent FROM $wpdb->posts WHERE ID = %d", $id) );

          if ( isset($vars[0]) && $vars = $vars[0] ) {
              if ( 'revision' == $vars->post_type && $vars->post_parent > 0 )
                  $id = $vars->post_parent;

              if ( $redirect_url = get_permalink($id) )
                  $redirect['query'] = remove_query_arg(array('p', 'page_id', 'attachment_id', 'post_type'), $redirect['query']);
          }
      }

      // These tests give us a WP-generated permalink
      if ( is_404() ) {

          // Redirect ?page_id=, ?p=, ?attachment_id= to their respective URLs
          $id = max( get_query_var('p'), get_query_var('page_id'), get_query_var('attachment_id') );
          if ( $id && $redirect_post = get_post($id) ) {
              $post_type_obj = get_post_type_object($redirect_post->post_type);
              // No object comes back for a post type that is not registered;
              // treat that the same as a non-public type instead of reading a
              // property off a non-object.
              if ( $post_type_obj && $post_type_obj->public ) {
                  $redirect_url = get_permalink($redirect_post);
                  $redirect['query'] = remove_query_arg(array('p', 'page_id', 'attachment_id', 'post_type'), $redirect['query']);
              }
          }

          if ( ! $redirect_url )
              $redirect_url = redirect_guess_404_permalink();

      } elseif ( is_object($wp_rewrite) && $wp_rewrite->using_permalinks() ) {
          // rewriting of old ?p=X, ?m=2004, ?m=200401, ?m=20040101
          if ( is_attachment() && !empty($_GET['attachment_id']) && ! $redirect_url ) {
              if ( $redirect_url = get_attachment_link(get_query_var('attachment_id')) )
                  $redirect['query'] = remove_query_arg('attachment_id', $redirect['query']);
          } elseif ( is_single() && !empty($_GET['p']) && ! $redirect_url ) {
              if ( $redirect_url = get_permalink(get_query_var('p')) )
                  $redirect['query'] = remove_query_arg(array('p', 'post_type'), $redirect['query']);
          } elseif ( is_single() && !empty($_GET['name'])  && ! $redirect_url ) {
              if ( $redirect_url = get_permalink( $wp_query->get_queried_object_id() ) )
                  $redirect['query'] = remove_query_arg('name', $redirect['query']);
          } elseif ( is_page() && !empty($_GET['page_id']) && ! $redirect_url ) {
              if ( $redirect_url = get_permalink(get_query_var('page_id')) )
                  $redirect['query'] = remove_query_arg('page_id', $redirect['query']);
          } elseif ( is_page() && !is_feed() && isset($wp_query->queried_object) && 'page' == get_option('show_on_front') && $wp_query->queried_object->ID == get_option('page_on_front')  && ! $redirect_url ) {
              // The static front page is always served from the home URL.
              $redirect_url = home_url('/');
          } elseif ( is_home() && !empty($_GET['page_id']) && 'page' == get_option('show_on_front') && get_query_var('page_id') == get_option('page_for_posts')  && ! $redirect_url ) {
              if ( $redirect_url = get_permalink(get_option('page_for_posts')) )
                  $redirect['query'] = remove_query_arg('page_id', $redirect['query']);
          } elseif ( !empty($_GET['m']) && ( is_year() || is_month() || is_day() ) ) {
              // The length of ?m= decides which kind of date archive it names.
              $m = get_query_var('m');
              switch ( strlen($m) ) {
                  case 4: // Yearly
                      $redirect_url = get_year_link($m);
                      break;
                  case 6: // Monthly
                      $redirect_url = get_month_link( substr($m, 0, 4), substr($m, 4, 2) );
                      break;
                  case 8: // Daily
                      $redirect_url = get_day_link(substr($m, 0, 4), substr($m, 4, 2), substr($m, 6, 2));
                      break;
              }
              if ( $redirect_url )
                  $redirect['query'] = remove_query_arg('m', $redirect['query']);
          // now moving on to non ?m=X year/month/day links
          } elseif ( is_day() && get_query_var('year') && get_query_var('monthnum') && !empty($_GET['day']) ) {
              if ( $redirect_url = get_day_link(get_query_var('year'), get_query_var('monthnum'), get_query_var('day')) )
                  $redirect['query'] = remove_query_arg(array('year', 'monthnum', 'day'), $redirect['query']);
          } elseif ( is_month() && get_query_var('year') && !empty($_GET['monthnum']) ) {
              if ( $redirect_url = get_month_link(get_query_var('year'), get_query_var('monthnum')) )
                  $redirect['query'] = remove_query_arg(array('year', 'monthnum'), $redirect['query']);
          } elseif ( is_year() && !empty($_GET['year']) ) {
              if ( $redirect_url = get_year_link(get_query_var('year')) )
                  $redirect['query'] = remove_query_arg('year', $redirect['query']);
          } elseif ( is_author() && !empty($_GET['author']) && preg_match( '|^[0-9]+$|', $_GET['author'] ) ) {
              // Only redirect a numeric ?author= when that user has at least
              // one published post.
              $author = get_userdata(get_query_var('author'));
              if ( ( false !== $author ) && $wpdb->get_var( $wpdb->prepare( "SELECT ID FROM $wpdb->posts WHERE $wpdb->posts.post_author = %d AND $wpdb->posts.post_status = 'publish' LIMIT 1", $author->ID ) ) ) {
                  if ( $redirect_url = get_author_posts_url($author->ID, $author->user_nicename) )
                      $redirect['query'] = remove_query_arg('author', $redirect['query']);
              }
          } elseif ( is_category() || is_tag() || is_tax() ) { // Terms (Tags/categories)

              // Count the terms across all tax queries; only a single-term
              // request has one canonical term URL.
              $term_count = 0;
              foreach ( $wp_query->tax_query->queries as $tax_query )
                  $term_count += count( $tax_query['terms'] );

              $obj = $wp_query->get_queried_object();
              if ( $term_count <= 1 && !empty($obj->term_id) && ( $tax_url = get_term_link((int)$obj->term_id, $obj->taxonomy) ) && !is_wp_error($tax_url) ) {
                  if ( !empty($redirect['query']) ) {
                      // Strip taxonomy query vars off the url.
                      $qv_remove = array( 'term', 'taxonomy');
                      if ( is_category() ) {
                          $qv_remove[] = 'category_name';
                          $qv_remove[] = 'cat';
                      } elseif ( is_tag() ) {
                          $qv_remove[] = 'tag';
                          $qv_remove[] = 'tag_id';
                      } else { // Custom taxonomies will have a custom query var, remove those too:
                          $tax_obj = get_taxonomy( $obj->taxonomy );
                          if ( false !== $tax_obj->query_var )
                              $qv_remove[] = $tax_obj->query_var;
                      }

                      // Names of query vars present in the parsed query but not in $_GET.
                      $rewrite_vars = array_diff( array_keys($wp_query->query), array_keys($_GET) );

                      if ( !array_diff($rewrite_vars, array_keys($_GET))  ) { // Check to see if all the Query vars are coming from the rewrite, none are set via $_GET
                          $redirect['query'] = remove_query_arg($qv_remove, $redirect['query']); //Remove all of the per-tax qv's

                          // Create the destination url for this taxonomy
                          $tax_url = parse_url($tax_url);
                          if ( ! empty($tax_url['query']) ) { // Taxonomy accessible via ?taxonomy=..&term=.. or any custom qv..
                              parse_str($tax_url['query'], $query_vars);
                              $redirect['query'] = add_query_arg($query_vars, $redirect['query']);
                          } else { // Taxonomy is accessible via a "pretty-URL"
                              $redirect['path'] = $tax_url['path'];
                          }

                      } else { // Some query vars are set via $_GET. Unset those from $_GET that exist via the rewrite
                          // NOTE(review): $rewrite_vars is a list of names, so this
                          // key lookup by name looks like it never matches - confirm
                          // the intended check before changing it.
                          foreach ( $qv_remove as $_qv ) {
                              if ( isset($rewrite_vars[$_qv]) )
                                  $redirect['query'] = remove_query_arg($_qv, $redirect['query']);
                          }
                      }
                  }

              }
          } elseif ( is_single() && strpos($wp_rewrite->permalink_structure, '%category%') !== false ) {
              // With %category% in the permalink structure, redirect when the
              // category in the URL is unknown or is not one of the post's own.
              $category = get_category_by_path(get_query_var('category_name'));
              $post_terms = wp_get_object_terms($wp_query->get_queried_object_id(), 'category', array('fields' => 'tt_ids'));
              if ( (!$category || is_wp_error($category)) || ( !is_wp_error($post_terms) && !empty($post_terms) && !in_array($category->term_taxonomy_id, $post_terms) ) )
                  $redirect_url = get_permalink($wp_query->get_queried_object_id());
          }

          // Post Paging
          if ( is_singular() && get_query_var('page') && $redirect_url ) {
              $redirect_url = trailingslashit( $redirect_url ) . user_trailingslashit( get_query_var( 'page' ), 'single_paged' );
              $redirect['query'] = remove_query_arg( 'page', $redirect['query'] );
          }

          // paging and feeds
          if ( get_query_var('paged') || is_feed() || get_query_var('cpage') ) {
              // Keep stripping until no paging, feed or comment-page suffix is
              // left; they can be stacked on one path.
              while ( preg_match( "#/$wp_rewrite->pagination_base/?[0-9]+?(/+)?$#", $redirect['path'] ) || preg_match( '#/(comments/?)?(feed|rss|rdf|atom|rss2)(/+)?$#', $redirect['path'] ) || preg_match( '#/comment-page-[0-9]+(/+)?$#', $redirect['path'] ) ) {
                  // Strip off paging and feed
                  $redirect['path'] = preg_replace("#/$wp_rewrite->pagination_base/?[0-9]+?(/+)?$#", '/', $redirect['path']); // strip off any existing paging
                  $redirect['path'] = preg_replace('#/(comments/?)?(feed|rss2?|rdf|atom)(/+|$)#', '/', $redirect['path']); // strip off feed endings
                  $redirect['path'] = preg_replace('#/comment-page-[0-9]+?(/+)?$#', '/', $redirect['path']); // strip off any existing comment paging
              }

              // $addl_path collects the canonical feed / paging / comment-page
              // suffix that is appended to the stripped path below.
              $addl_path = '';
              if ( is_feed() && in_array( get_query_var('feed'), $wp_rewrite->feeds ) ) {
                  $addl_path = !empty( $addl_path ) ? trailingslashit($addl_path) : '';
                  if ( get_query_var( 'withcomments' ) )
                      $addl_path .= 'comments/';
                  $addl_path .= user_trailingslashit( 'feed/' . ( ( get_default_feed() ==  get_query_var('feed') || 'feed' == get_query_var('feed') ) ? '' : get_query_var('feed') ), 'feed' );
                  $redirect['query'] = remove_query_arg( 'feed', $redirect['query'] );
              }

              if ( get_query_var('paged') > 0 ) {
                  $paged = get_query_var('paged');
                  $redirect['query'] = remove_query_arg( 'paged', $redirect['query'] );
                  if ( !is_feed() ) {
                      if ( $paged > 1 && !is_single() ) {
                          $addl_path = ( !empty( $addl_path ) ? trailingslashit($addl_path) : '' ) . user_trailingslashit("$wp_rewrite->pagination_base/$paged", 'paged');
                      } elseif ( !is_single() ) {
                          $addl_path = !empty( $addl_path ) ? trailingslashit($addl_path) : '';
                      }
                  } elseif ( $paged > 1 ) {
                      // Feeds keep their page number as a query argument.
                      $redirect['query'] = add_query_arg( 'paged', $paged, $redirect['query'] );
                  }
              }

              if ( get_option('page_comments') && ( ( 'newest' == get_option('default_comments_page') && get_query_var('cpage') > 0 ) || ( 'newest' != get_option('default_comments_page') && get_query_var('cpage') > 1 ) ) ) {
                  $addl_path = ( !empty( $addl_path ) ? trailingslashit($addl_path) : '' ) . user_trailingslashit( 'comment-page-' . get_query_var('cpage'), 'commentpaged' );
                  $redirect['query'] = remove_query_arg( 'cpage', $redirect['query'] );
              }

              $redirect['path'] = user_trailingslashit( preg_replace('|/index.php/?$|', '/', $redirect['path']) ); // strip off trailing /index.php/
              if ( !empty( $addl_path ) && $wp_rewrite->using_index_permalinks() && strpos($redirect['path'], '/index.php/') === false )
                  $redirect['path'] = trailingslashit($redirect['path']) . 'index.php/';
              if ( !empty( $addl_path ) )
                  $redirect['path'] = trailingslashit($redirect['path']) . $addl_path;
              $redirect_url = $redirect['scheme'] . '://' . $redirect['host'] . $redirect['path'];
          }
      }

      // tack on any additional query vars
      $redirect['query'] = preg_replace( '#^\??&*?#', '', $redirect['query'] );
      if ( $redirect_url && !empty($redirect['query']) ) {
          parse_str( $redirect['query'], $_parsed_query );
          $redirect = @parse_url($redirect_url);

          // Drop a leftover 'name' argument when the target URL has a query
          // string of its own that does not carry 'name'.
          if ( ! empty( $_parsed_query['name'] ) && ! empty( $redirect['query'] ) ) {
              parse_str( $redirect['query'], $_parsed_redirect_query );

              if ( empty( $_parsed_redirect_query['name'] ) )
                  unset( $_parsed_query['name'] );
          }

          $redirect_url = add_query_arg( $_parsed_query, $redirect_url );
      }

      if ( $redirect_url )
          $redirect = @parse_url($redirect_url);

      // Notice fixing, again: $redirect may just have been rebuilt from a URL
      // that has no path or query component.
      if ( !isset($redirect['path']) )
          $redirect['path'] = '';
      if ( !isset($redirect['query']) )
          $redirect['query'] = '';

      // www.example.com vs example.com
      $user_home = @parse_url(home_url());
      if ( !empty($user_home['host']) )
          $redirect['host'] = $user_home['host'];
      if ( empty($user_home['path']) )
          $user_home['path'] = '/';

      // Handle ports
      if ( !empty($user_home['port']) )
          $redirect['port'] = $user_home['port'];
      else
          unset($redirect['port']);

      // trailing /index.php
      $redirect['path'] = preg_replace('|/index.php/*?$|', '/', $redirect['path']);

      // Remove trailing spaces from the path
      $redirect['path'] = preg_replace( '#(%20| )+$#', '', $redirect['path'] );

      if ( !empty( $redirect['query'] ) ) {
          // Remove trailing spaces from certain terminating query string args
          $redirect['query'] = preg_replace( '#((p|page_id|cat|tag)=[^&]*?)(%20| )+$#', '$1', $redirect['query'] );

          // Clean up empty query strings
          $redirect['query'] = trim(preg_replace( '#(^|&)(p|page_id|cat|tag)=?(&|$)#', '&', $redirect['query']), '&');

          // Remove redundant leading ampersands
          $redirect['query'] = preg_replace( '#^\??&*?#', '', $redirect['query'] );
      }

      // strip /index.php/ when we're not using PATHINFO permalinks
      // (guarded like the other $wp_rewrite uses in this function, so a missing
      // rewrite object does not cause a fatal error here)
      if ( !is_object($wp_rewrite) || !$wp_rewrite->using_index_permalinks() )
          $redirect['path'] = str_replace('/index.php/', '/', $redirect['path']);

      // trailing slashes
      if ( is_object($wp_rewrite) && $wp_rewrite->using_permalinks() && !is_404() && (!is_front_page() || ( is_front_page() && (get_query_var('paged') > 1) ) ) ) {
          // Find the request type so user_trailingslashit() can be told what
          // kind of URL it is formatting.
          $user_ts_type = '';
          if ( get_query_var('paged') > 0 ) {
              $user_ts_type = 'paged';
          } else {
              foreach ( array('single', 'category', 'page', 'day', 'month', 'year', 'home') as $type ) {
                  $func = 'is_' . $type;
                  if ( call_user_func($func) ) {
                      $user_ts_type = $type;
                      break;
                  }
              }
          }
          $redirect['path'] = user_trailingslashit($redirect['path'], $user_ts_type);
      } elseif ( is_front_page() ) {
          $redirect['path'] = trailingslashit($redirect['path']);
      }

      // Strip multiple slashes out of the URL
      if ( false !== strpos($redirect['path'], '//') )
          $redirect['path'] = preg_replace('|/+|', '/', $redirect['path']);

      // Always trailing slash the Front Page URL
      if ( trailingslashit( $redirect['path'] ) == trailingslashit( $user_home['path'] ) )
          $redirect['path'] = trailingslashit($redirect['path']);

      // Ignore differences in host capitalization, as this can lead to infinite redirects
      // Only redirect no-www <=> yes-www
      if ( strtolower($original['host']) == strtolower($redirect['host']) ||
          ( strtolower($original['host']) != 'www.' . strtolower($redirect['host']) && 'www.' . strtolower($original['host']) != strtolower($redirect['host']) ) )
          $redirect['host'] = $original['host'];

      // Compare host, path and (when present) port and query of the requested
      // URL against the canonical parts; any difference means a redirect.
      $compare_original = array($original['host'], $original['path']);

      if ( !empty( $original['port'] ) )
          $compare_original[] = $original['port'];

      if ( !empty( $original['query'] ) )
          $compare_original[] = $original['query'];

      $compare_redirect = array($redirect['host'], $redirect['path']);

      if ( !empty( $redirect['port'] ) )
          $compare_redirect[] = $redirect['port'];

      if ( !empty( $redirect['query'] ) )
          $compare_redirect[] = $redirect['query'];

      if ( $compare_original !== $compare_redirect ) {
          $redirect_url = $redirect['scheme'] . '://' . $redirect['host'];
          if ( !empty($redirect['port']) )
              $redirect_url .= ':' . $redirect['port'];
          $redirect_url .= $redirect['path'];
          if ( !empty($redirect['query']) )
              $redirect_url .= '?' . $redirect['query'];
      }

      if ( !$redirect_url || $redirect_url == $requested_url )
          return false;

      // Hex encoded octets are case-insensitive.
      if ( false !== strpos($requested_url, '%') ) {
          if ( !function_exists('lowercase_octets') ) {
              function lowercase_octets($matches) {
                  return strtolower( $matches[0] );
              }
          }
          $requested_url = preg_replace_callback('|%[a-fA-F0-9][a-fA-F0-9]|', 'lowercase_octets', $requested_url);
      }

      // Note that you can use the "redirect_canonical" filter to cancel a canonical redirect for whatever reason by returning FALSE
      $redirect_url = apply_filters('redirect_canonical', $redirect_url, $requested_url);

      if ( !$redirect_url || $redirect_url == $requested_url ) // yes, again -- in case the filter aborted the request
          return false;

      if ( $do_redirect ) {
          // protect against chained redirects
          if ( !redirect_canonical($redirect_url, false) ) {
              wp_redirect($redirect_url, 301);
              exit();
          } else {
              // Debug
              // die("1: $redirect_url<br />2: " . redirect_canonical( $redirect_url, false ) );
              return false;
          }
      } else {
          return $redirect_url;
      }
  }
 397  
 /**
  * Attempts to guess correct post based on query vars.
  *
  * Looks for a published post whose slug starts with the 'name' query var.
  * The 'post_type', 'year', 'monthnum' and 'day' query vars narrow the search
  * when they are set. Without an explicit 'post_type', only public post types
  * are considered, so the guess never lands on a non-public row of the posts
  * table.
  *
  * @since 2.3.0
  * @uses $wpdb
  *
  * @return bool|string Returns False, if it can't find post, returns correct
  *        location on success.
  */
 function redirect_guess_404_permalink() {
     global $wpdb;

     // Without a slug there is nothing to guess from.
     if ( !get_query_var('name') )
         return false;

     // Prefix match: the requested name followed by anything.
     $where = $wpdb->prepare("post_name LIKE %s", like_escape( get_query_var('name') ) . '%');

     // if any of post_type, year, monthnum, or day are set, use them to refine the query
     if ( get_query_var('post_type') )
         $where .= $wpdb->prepare(" AND post_type = %s", get_query_var('post_type'));
     else
         $where .= " AND post_type IN ('" . implode( "', '", get_post_types( array( 'public' => true ) ) ) . "')";
     if ( get_query_var('year') )
         $where .= $wpdb->prepare(" AND YEAR(post_date) = %d", get_query_var('year'));
     if ( get_query_var('monthnum') )
         $where .= $wpdb->prepare(" AND MONTH(post_date) = %d", get_query_var('monthnum'));
     if ( get_query_var('day') )
         $where .= $wpdb->prepare(" AND DAYOFMONTH(post_date) = %d", get_query_var('day'));

     $post_id = $wpdb->get_var("SELECT ID FROM $wpdb->posts WHERE $where AND post_status = 'publish'");
     if ( !$post_id )
         return false;
     return get_permalink($post_id);
 }
 430  
 // Hook redirect_canonical() onto the 'template_redirect' action.
 add_action('template_redirect', 'redirect_canonical');
 432  
 433  ?>


Generated: Wed Jun 1 08:30:02 2011 Cross-referenced by PHPXref 0.7
Provided by Yoast and awesome WordPress Hosting