php实现专业获取网站SEO信息类实例

前端之家收集整理的这篇文章主要介绍了php实现专业获取网站SEO信息类实例前端之家小编觉得挺不错的,现在分享给大家,也给大家做个参考。

本文实例讲述了PHP实现专业获取网站seo信息类。分享给大家供大家参考。具体如下:

这个SEO类的功能包括: - 检查指定的网站响应 - 获取从该网站主页的语言和其他Meta标签数据的 - 获取网站的导入链接,从Alexa的流量排名 - 获取网站的导入链接,由谷歌索引的网页数量 - 获取网站的信任,从WOT排名。 - 获取,因为它是第一个注册的网站域名年龄 - 获取的Twitter网站页面数量 - 获取的Facebook链接的网站页面 - 获取网站谷歌网页速度等级 - 获取网站的谷歌网页排名

PHP;"> PHP /** * * SEO report for different metrics * * @category SEO * @author Chema * @copyright (c) 2009-2012 Open Classifieds Team * @license GPL v3 * Based on SEO report script http://www.PHPeasycode.com && PHP class SEOstats * */ class SEOreport{ /** * * check if a url is online/alive * @param string $url * @return bool */ public static function is_alive($url) { $ch = curl_init(); curl_setopt($ch,CURLOPT_URL,$url); curl_setopt($ch,CURLOPT_BINARYTRANSFER,1); curl_setopt($ch,CURLOPT_HEADERFUNCTION,'curlHeaderCallback'); curl_setopt($ch,CURLOPT_FAILONERROR,1); curl_exec ($ch); $int_return_code = curl_getinfo($ch,CURLINFO_HTTP_CODE); curl_close ($ch); if ($int_return_code != 200 && $int_return_code != 302 && $int_return_code != 304) { return FALSE; } else return TRUE; } /** * HTTP GET request with curl. * * @param string $url String,containing the URL to curl. * @return string Returns string,containing the curl result. * */ protected static function get_html($url) { $ch = curl_init($url); curl_setopt($ch,CURLOPT_RETURNTRANSFER,CURLOPT_CONNECTTIMEOUT,5); curl_setopt($ch,CURLOPT_FOLLOWLOCATION,CURLOPT_MAXREDIRS,2); if(strtolower(parse_url($url,PHP_URL_SCHEME)) == 'https') { curl_setopt($ch,CURLOPT_SSL_VERIFYPEER,1); curl_setopt($ch,CURLOPT_SSL_VERIFYHOST,1); } $str = curl_exec($ch); curl_close($ch); return ($str)?$str:FALSE; } /** * * get the domain from any URL * @param string $url */ public static function domain_name($url) { $nowww = ereg_replace('www\.','',$url); $domain = parse_url($nowww); if(!empty($domain["host"])) return $domain["host"]; else return $domain["path"]; } /** * * get the Metas from a url and the language of the site * @param string $url * @return array */ public static function Meta_info($url) { //doesn't work at mediatemple /*$html = new DOMDocument(); if(!$html->loadHtmlFile($url)) return FALSE;*/ if (!$html_content = self::get_html($url)) return FALSE; $html = new DOMDocument(); $html->loadHtml($html_content);
$xpath = new DOMXPath( $html );
$url_info = array();
$langs = $xpath->query( '//html' );
foreach ($langs as $lang)
{
  $url_info['language'] = $lang->getAttribute('lang');
}
$<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>s = $xpath->query( '//<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>' );
foreach ($<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>s as $<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>)
{
  if ($<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>->getAttribute('name'))
  {
    $url_info[$<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>->getAttribute('name')] = $<a href="/tag/Meta/" target="_blank" class="keywords">Meta</a>->getAttribute('content');
  }
}
return $url_info;

}
/**

  • Alexa rank
  • @param string $url
  • @return integer
    /
    public static function alexa_rank($url)
    {
    $domain = self::domain_name($url);
    $request = "http://data.alexa.com/data?cli=10&amp;dat=s&amp;url=" . $domain;
    $data = self::get_html($request);
    preg_match('/<POPULARITY URL="(.
    ?)" TEXT="([\d]+)"\/>/si',$data,$p);
    return ($l[2]) ? $l[2] : NULL;
    }
    /**
  • Alexa inbounds link
  • @param string $url
  • @return integer
    */
    public static function alexa_links($url)
    {
    $domain = self::domain_name($url);
    $request = "http://data.alexa.com/data?cli=10&amp;dat=s&amp;url=" . $domain;
    $data = self::get_html($request);
    preg_match('/<LINKSIN NUM="([\d]+)"\/>/si',$l);
    return ($l[1]) ? $l[1] : NULL;
    }
    /**
  • Returns total amount of results for any Google search,* requesting the deprecated Websearch API.
  • @param string $query String,containing the search query.
  • @return integer Returns a total count.
    */
    public static function google_pages($url)
    {
    //$query = self::domain_name($url);
    $url = 'http://ajax.googleapis.com/ajax/services/search/web?v=1.0&rsz=1&q='.$url;
    $str = self::get_html($url);
    $data = json_decode($str);
    return (!isset($data->responseData->cursor->estimatedResultCount))
    ? '0'
    : intval($data->responseData->cursor->estimatedResultCount);
    }
    /**
  • gets the inbounds links from a site
  • @param string $url
  • @param integer
    */
    public static function google_links($url)
    {
    $request = "http://www.google.com/search?q=" . urlencode("link:" . $url) . "&hl=en";
    $data = self::get_html($request);
    preg_match('/
    (About )?([\d,]+) result/si',$l);
    return ($l[2]) ? $l[2] : NULL;
    }
    /**
  • web of trust rating
  • @param string $url
  • @reutn integer
    */
    public static function WOT_rating($url)
    {
    $domain = self::domain_name($url);
    $request = "http://api.mywot.com/0.4/public_query2?target=" . $domain;
    $data = self::get_html($request);
    preg_match_all('/<application name="(\d+)" r="(\d+)" c="(\d+)"\/>/si',$regs);
    $trustworthiness = ($regs[2][0]) ? $regs[2][0] : NULL;
    return (is_numeric($trustworthiness))? $trustworthiness:NULL;
    }

/**

  • how old is the domain?
  • @param string $domain
  • @return integer unixtime
    */
    public static function domain_age($domain)
    {
    $request = "http://reports.internic.net/cgi/whois?whois_nic=" . $domain . "&type=domain";
    $data = self::get_html($request);
    preg_match('/Creation Date: ([a-z0-9-]+)/si',$p);
    return (!$p[1])?FALSE:strtotime($p[1]);
    }
    /**
  • counts how many tweets about the url
  • @param string $url
  • @return integer
    */
    public static function tweet_count($url)
    {
    $url = urlencode($url);
    $twitterEndpoint = "http://urls.api.twitter.com/1/urls/count.json?url=%s";
    $fileData = file_get_contents(sprintf($twitterEndpoint,$url));
    $json = json_decode($fileData,true);
    unset($fileData); // free memory
    return (is_numeric($json['count']))? $json['count']:NULL;
    }
    /**
  • Returns the total amount of Facebook Shares for a single page
  • @link https://graph.facebook.com/
  • @param string The URL to check.
  • @return integer Returns the total amount of Facebook
    */
    public static function facebook_shares($q)
    {
    //Execution and result of Json
    $str = self::get_html('http://graph.facebook.com/?id='.urlencode($q));
    $data = json_decode($str);
    //Return only number of facebook shares
    $r = $data->shares;
    return ($r != NULL) ? $r : intval('0');
    }
    /**
  • get the pagespeed rank over 100
  • @param string $url
  • @return integer
    */
    public static function page_speed($url)
    {
    $url = 'https://developers.google.com/_apps/pagespeed/run_pagespeed?url='.$url.'&format=json';
    $str = self::get_html($url);
    $data = json_decode($str);
    return intval($data->results->score);
    }
    /**
  • get google page rank
  • @param string $url
  • @return integer
    */
    public static function page_rank($url)
    {
    $query = "http://toolbarqueries.google.com/tbr?client=navclient-auto&ch=".self::CheckHash(self::HashURL($url)). "&features=Rank&q=info:".$url."&num=100&filter=0";
    $data = self::get_html($query);//die(printr($data));
    $pos = strpos($data,"Rank
    ");
    if($pos === false)
    {
    return NULL;
    }
    else
    {
    $pagerank = substr($data,$pos + 9);
    return $pagerank;
    }
    }
    // functions for google pagerank
    /**
  • To calculate PR functions
    /
    public static function StrToNum($Str,$Check,$Magic)
    {
    $Int32Unit = 4294967296; // 2^32
    $length = strlen($Str);
    for ($i = 0; $i < $length; $i++) {
    $Check
    = $Magic;
    //If the float is beyond the boundaries of integer (usually +/- 2.15e+9 = 2^31),// the result of converting to integer is undefined
    // refer to http://www.php.net/manual/en/language.types.integer.php
    if ($Check >= $Int32Unit) {
    $Check = ($Check - $Int32Unit * (int) ($Check / $Int32Unit));
    //if the check less than -2^31
    $Check = ($Check < -2147483648) ? ($Check + $Int32Unit) : $Check;
    }
    $Check += ord($Str{$i});
    }
    return $Check;
    }
    /**
  • Genearate a hash for a url
    */
    public static function HashURL($String)
    {
    $Check1 = self::StrToNum($String,0x1505,0x21);
    $Check2 = self::StrToNum($String,0x1003F);
    $Check1 >>= 2;
    $Check1 = (($Check1 >> 4) & 0x3FFFFC0 ) | ($Check1 & 0x3F);
    $Check1 = (($Check1 >> 4) & 0x3FFC00 ) | ($Check1 & 0x3FF);
    $Check1 = (($Check1 >> 4) & 0x3C000 ) | ($Check1 & 0x3FFF);
    $T1 = (((($Check1 & 0x3C0) << 4) | ($Check1 & 0x3C)) <<2 ) | ($Check2 & 0xF0F );
    $T2 = (((($Check1 & 0xFFFFC000) << 4) | ($Check1 & 0x3C00)) << 0xA) | ($Check2 & 0xF0F0000 );
    return ($T1 | $T2);
    }
    /**
  • genearate a checksum for the hash string
    */
    public static function CheckHash($Hashnum)
    {
    $CheckByte = 0;
    $Flag = 0;
    $HashStr = sprintf('%u',$Hashnum) ;
    $length = strlen($HashStr);
    for ($i = $length - 1; $i >= 0; $i --) {
    $Re = $HashStr{$i};
    if (1 === ($Flag % 2)) {
    $Re += $Re;
    $Re = (int)($Re / 10) + ($Re % 10);
    }
    $CheckByte += $Re;
    $Flag ++;
    }
    $CheckByte %= 10;
    if (0 !== $CheckByte) {
    $CheckByte = 10 - $CheckByte;
    if (1 === ($Flag % 2) ) {
    if (1 === ($CheckByte % 2)) {
    $CheckByte += 9;
    }
    $CheckByte >>= 1;
    }
    }
    return '7'.$CheckByte.$HashStr;
    }
    }

使用范例

PHP;"> PHP include 'SEOreport.PHP'; ini_set('max_execution_time',180); $url = (isset($_GET['url']))?$_GET['url']:'http://PHPclasses.org'; $Meta_tags = SEOreport::Meta_info($url); //die(var_dump($Meta_tags)); //first check if site online if ($Meta_tags!==FALSE) { $stats = array(); $stats['Meta'] = $Meta_tags; $stats['alexa']['rank'] = SEOreport::alexa_rank($url); $stats['alexa']['links'] = SEOreport::alexa_links($url); $stats['domain']['WOT_rating'] = SEOreport::WOT_rating($url); $stats['domain']['domain_age'] = SEOreport::domain_age($url); $stats['social']['twitter'] = SEOreport::tweet_count($url); $stats['social']['facebook'] = SEOreport::facebook_shares($url); $stats['google']['page_rank'] = SEOreport::page_rank($url); $stats['google']['page_speed'] = SEOreport::page_speed($url); $stats['google']['pages'] = SEOreport::google_pages($url); $stats['google']['links'] = SEOreport::google_links($url); var_dump($stats); } else 'Site not online. '.$url;

希望本文所述对大家的PHP程序设计有所帮助。

猜你在找的PHP相关文章