• 欢迎访问开心洋葱网站,在线教程,推荐使用最新版火狐浏览器和Chrome浏览器访问本网站,欢迎加入开心洋葱 QQ群
  • 为方便开心洋葱网用户,开心洋葱官网已经开启复制功能!
  • 欢迎访问开心洋葱网站,手机也能访问哦~欢迎加入开心洋葱多维思维学习平台 QQ群
  • 如果您觉得本站非常有看点,那么赶紧使用Ctrl+D 收藏开心洋葱吧~~~~~~~~~~~~~!
  • 由于近期流量激增,小站的ECS没能经得起亲们的访问。本站依然没有盈利,如果各位看官觉得文章不错,还请给小站打个赏~~~~~~~~~~~~~!

专业获取网站SEO信息的php类 seoreport.php

PHP 水墨上仙 1842次浏览

这个seo类的功能包括:
– 检查指定网站是否能够正常响应
– 获取网站主页的语言及其他 meta 标签数据
– 从 Alexa 获取网站的流量排名和导入链接数
– 获取网站在谷歌的导入链接数和被索引的网页数量
– 从 WOT 获取网站的信任评级
– 获取域名年龄(自域名首次注册之日算起)
– 获取 Twitter 上提及该网站页面的推文数量
– 获取该网站页面在 Facebook 上的分享数
– 获取网站的谷歌网页速度(PageSpeed)评分
– 获取网站的谷歌网页排名(PageRank)

<?php
/**
 * 
 * SEO report for different metrics
 * 
 * @category   SEO
 * @author     Chema <chema@garridodiaz.com>
 * @copyright  (c) 2009-2012 Open Classifieds Team
 * @license    GPL v3
 * Based on  seo report script http://www.phpeasycode.com && PHP class SEOstats
 *
 */
class seoreport{

    // NOTE(review): every metric below depends on a third-party HTTP endpoint.
    // Several of these services may have changed or been retired; verify each
    // endpoint before relying on its result. All lookups fail soft (NULL/0/FALSE).

    /** Seconds allowed for establishing a connection. */
    const CONNECT_TIMEOUT = 5;

    /** Seconds allowed for a whole HTTP transfer. */
    const TIMEOUT = 15;

    /**
     * 
     * check if a url is online/alive
     * 
     * Issues a GET request (redirects are not followed) and treats the HTTP
     * status codes 200, 302 and 304 as "alive". Any other status, including
     * the status 0 reported after a transport failure, means "not alive".
     * 
     * @param string $url
     * @return bool
     */
    public static function is_alive($url)
    {
        $ch = curl_init();
        if ($ch === FALSE)
        {
            return FALSE;
        }

        curl_setopt($ch, CURLOPT_URL, $url);
        // Capture the body instead of letting curl echo it into the caller's output.
        curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
        curl_setopt($ch, CURLOPT_FAILONERROR, 1);
        // Bound the probe so an unresponsive host cannot hang the request.
        curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, self::CONNECT_TIMEOUT);
        curl_setopt($ch, CURLOPT_TIMEOUT, self::TIMEOUT);
        curl_exec($ch);
        $int_return_code = (int) curl_getinfo($ch, CURLINFO_HTTP_CODE);
        curl_close($ch);

        return in_array($int_return_code, array(200, 302, 304), TRUE);
    }
    
    /**
     * HTTP GET request with curl.
     * 
     * Follows at most 2 redirects and verifies TLS certificates and host names.
     *
     * @param     string      $url        String, containing the URL to curl.
     * @return    string|bool             Returns the response body, or FALSE when
     *                                    the request failed or the body is empty.
     *
     */
    protected static function get_html($url)
    {
        $ch = curl_init($url);
        if ($ch === FALSE)
        {
            return FALSE;
        }

        curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
        curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, self::CONNECT_TIMEOUT);
        curl_setopt($ch, CURLOPT_TIMEOUT, self::TIMEOUT);
        curl_setopt($ch, CURLOPT_FOLLOWLOCATION, 1);
        curl_setopt($ch, CURLOPT_MAXREDIRS, 2);
        // Set unconditionally: an http:// URL may redirect to https://.
        // VERIFYHOST must be 2; the value 1 does not perform host verification.
        curl_setopt($ch, CURLOPT_SSL_VERIFYPEER, 1);
        curl_setopt($ch, CURLOPT_SSL_VERIFYHOST, 2);
        $str = curl_exec($ch);
        curl_close($ch);

        return ($str === FALSE || $str === '') ? FALSE : $str;
    }

    /**
     * HTTP GET a URL and decode the response as a JSON object.
     *
     * @param     string      $url        URL to request.
     * @return    object|null             Decoded object, or NULL when the request
     *                                    failed or the body is not a JSON object.
     */
    private static function get_json($url)
    {
        $body = self::get_html($url);
        if ($body === FALSE)
        {
            return NULL;
        }

        $decoded = json_decode($body);
        return is_object($decoded) ? $decoded : NULL;
    }

    /**
     * Return one capture group of the first regex match in a response body.
     *
     * @param     string        $pattern    PCRE pattern.
     * @param     string|bool   $subject    Response body, or FALSE from get_html().
     * @param     integer       $group      Index of the capture group wanted.
     * @return    string|null               Captured text, or NULL when the subject
     *                                      is unusable or the group did not match.
     */
    private static function match_group($pattern, $subject, $group)
    {
        if (!is_string($subject) || $subject === '')
        {
            return NULL;
        }

        if (preg_match($pattern, $subject, $found) && isset($found[$group]) && $found[$group] !== '')
        {
            return $found[$group];
        }

        return NULL;
    }

    /**
     * 
     * get the domain from any URL
     * 
     * A leading "www." is removed from the host. Input without a scheme
     * ("www.example.com/page") is supported: the part before the first slash
     * is taken as the host.
     * 
     * @param string $url
     * @return string host name without leading "www.", '' when it cannot be determined
     */
    public static function domain_name($url)
    {
        $parts = parse_url(trim((string) $url));
        if (!is_array($parts))
        {
            return '';
        }

        if (!empty($parts['host']))
        {
            $host = $parts['host'];
        }
        elseif (isset($parts['path']))
        {
            // Without a scheme parse_url() reports "example.com/page" entirely
            // as the path, so keep only what precedes the first slash.
            $segments = explode('/', $parts['path'], 2);
            $host = $segments[0];
        }
        else
        {
            $host = '';
        }

        // Strip "www." only as a host prefix, never in the middle of a name or path.
        return preg_replace('/^www\./i', '', $host);
    }
    
    /**
     * 
     * get the metas from a url and the language of the site
     * 
     * @param string $url
     * @return array|bool map of meta name => content, plus a 'language' key taken
     *                    from the lang attribute of <html>; FALSE when the page
     *                    could not be fetched
     */
    public static function meta_info($url)
    {
        if (!$html_content = self::get_html($url))
        {
            return FALSE;
        }

        // Real-world markup is rarely valid; collect libxml errors internally
        // instead of emitting one PHP warning per problem, then restore the setting.
        $previous = libxml_use_internal_errors(TRUE);
        $html = new DOMDocument();
        $html->loadHTML($html_content);
        libxml_clear_errors();
        libxml_use_internal_errors($previous);

        $xpath = new DOMXPath($html);

        $url_info = array();

        $langs = $xpath->query('//html');
        foreach ($langs as $lang)
        {
            $url_info['language'] = $lang->getAttribute('lang');
        }

        $metas = $xpath->query('//meta');
        foreach ($metas as $meta)
        {
            // Only named metas are reported (http-equiv / property metas are skipped).
            if ($meta->getAttribute('name'))
            {
                $url_info[$meta->getAttribute('name')] = $meta->getAttribute('content');
            }
        }

        return $url_info;
    }

    /**
     * Fetch the Alexa data document for the domain of a URL.
     *
     * @param string $url
     * @return string|bool response body, FALSE on failure
     */
    private static function alexa_data($url)
    {
        $domain = self::domain_name($url);
        return self::get_html("http://data.alexa.com/data?cli=10&dat=s&url=" . urlencode($domain));
    }
    
    /**
     * 
     * Alexa rank
     * @param string $url
     * @return string|null rank as a numeric string, NULL when not available
     */
    public static function alexa_rank($url) 
    {
        // Group 2 is the TEXT attribute, i.e. the rank itself.
        return self::match_group('/<POPULARITY URL="(.*?)" TEXT="([\d]+)"\/>/si', self::alexa_data($url), 2);
    }
    
    /**
     * 
     * Alexa inbounds link
     * @param string $url
     * @return string|null link count as a numeric string, NULL when not available
     */
    public static function alexa_links($url) 
    {
        return self::match_group('/<LINKSIN NUM="([\d]+)"\/>/si', self::alexa_data($url), 1);
    }

    /**
     * Returns total amount of results for any Google search,
     * requesting the deprecated Websearch API.
     *
     * @param        string        $url        String, containing the search query.
     * @return       integer                   Returns a total count, 0 when unknown.
     */
    public static function google_pages($url)
    {
        $data = self::get_json('http://ajax.useso.com/ajax/services/search/web?v=1.0&rsz=1&q=' . urlencode($url));

        return isset($data->responseData->cursor->estimatedResultCount)
                ? intval($data->responseData->cursor->estimatedResultCount)
                : 0;
    }
    
    /**
     * 
     * gets the inbounds links from a site
     * @param string $url
     * @return string|null result count as printed by Google (may contain commas),
     *                     NULL when not available
     */
    public static function google_links($url) 
    {
        $request = "http://www.google.com/search?q=" . urlencode("link:" . $url) . "&hl=en";

        return self::match_group('/<div id=resultStats>(About )?([\d,]+) result/si', self::get_html($request), 2);
    }

    /**
     * 
     * web of trust rating
     * @param string $url
     * @return string|null the "r" attribute of the first <application> element
     *                     in the response, NULL when not available
     */
    public static function WOT_rating($url) 
    {
        $domain  = self::domain_name($url);
        $request = "http://api.mywot.com/0.4/public_query2?target=" . urlencode($domain);

        return self::match_group('/<application name="(\d+)" r="(\d+)" c="(\d+)"\/>/si', self::get_html($request), 2);
    }
    
    
    /**
     * 
     * how old is the domain?
     * 
     * @param string $domain domain name; a full URL is also accepted and is
     *                       reduced to its domain first
     * @return integer|bool unixtime of the "Creation Date" in the whois answer,
     *                      FALSE when it is missing or cannot be parsed
     */
    public static function domain_age($domain) 
    {
        $domain  = self::domain_name($domain);
        $request = "http://reports.internic.net/cgi/whois?whois_nic=" . urlencode($domain) . "&type=domain";
        $created = self::match_group('/Creation Date: ([a-z0-9-]+)/si', self::get_html($request), 1);

        return ($created === NULL) ? FALSE : strtotime($created);
    }

    /**
     * 
     * counts how many tweets about the url
     * @param string $url
     * @return integer|null NULL when the count is not available
     */
    public static function tweet_count($url)
    {
        // Uses the shared curl helper (timeouts, no dependency on allow_url_fopen).
        $json = self::get_json(sprintf("http://urls.api.twitter.com/1/urls/count.json?url=%s", urlencode($url)));

        return (isset($json->count) && is_numeric($json->count)) ? $json->count : NULL;
    }
    
    /**
     * Returns the total amount of Facebook Shares for a single page
     *
     * @link          https://graph.facebook.com/
     * @param         string     $q    The URL to check.
     * @return        integer    Returns the total amount of Facebook shares,
     *                           0 when the response carries no "shares" field.
     */
    public static function facebook_shares($q)
    {
        $data = self::get_json('http://graph.facebook.com/?id=' . urlencode($q));

        return isset($data->shares) ? $data->shares : 0;
    }
    
    /**
     * 
     * get the pagespeed rank over 100
     * @param string $url
     * @return integer score, 0 when not available
     */
    public static function page_speed($url)
    {
        $data = self::get_json('https://developers.google.com/_apps/pagespeed/run_pagespeed?url=' . urlencode($url) . '&format=json');

        return isset($data->results->score) ? intval($data->results->score) : 0;
    }
    
    /**
     * 
     * get google page rank
     * @param string $url
     * @return integer|null NULL when the response carries no rank
     */
    public static function page_rank($url) 
    {
        $query = "http://toolbarqueries.google.com/tbr?client=navclient-auto&ch=" . self::CheckHash(self::HashURL($url))
               . "&features=Rank&q=" . urlencode("info:" . $url) . "&num=100&filter=0";
        $data  = self::get_html($query);
        if ($data === FALSE)
        {
            return NULL;
        }

        $pos = strpos($data, "Rank_");
        if ($pos === FALSE)
        {
            return NULL;
        }

        // Skip "Rank_" plus the four following characters; the rest of the body
        // is the rank. Trim the trailing line break before converting.
        $pagerank = trim(substr($data, $pos + 9));
        return is_numeric($pagerank) ? (int) $pagerank : NULL;
    }
    
    // functions for google pagerank
    
    /**
     * To calculate PR functions
     * 
     * Folds a string into a number: for every byte, multiply the running value
     * by $Magic, reduce it below 2^32 when it reached that bound, then add the
     * byte value.
     * 
     * @param string  $Str   input string
     * @param integer $Check initial value
     * @param integer $Magic multiplier
     * @return integer|float the folded value
     */
    public static function StrToNum($Str, $Check, $Magic)
    {
        $Int32Unit = 4294967296;  // 2^32
     
        $length = strlen($Str);
        for ($i = 0; $i < $length; $i++) {
            $Check *= $Magic;
            //If the float is beyond the boundaries of integer (usually +/- 2.15e+9 = 2^31),
            //  the result of converting to integer is undefined
            //  refer to http://www.php.net/manual/en/language.types.integer.php
            if ($Check >= $Int32Unit) {
                $Check = ($Check - $Int32Unit * (int) ($Check / $Int32Unit));
                //if the check less than -2^31
                $Check = ($Check < -2147483648) ? ($Check + $Int32Unit) : $Check;
            }
            // Square brackets: the {} string-offset syntax no longer parses on PHP 8.
            $Check += ord($Str[$i]);
        }
        return $Check;
    }
     
    /**
      * Generate a hash for a url
      * 
      * @param string $String the URL
      * @return integer the hash, built from two StrToNum() passes
      */
    public static function HashURL($String)
    {
        $Check1 = self::StrToNum($String, 0x1505, 0x21);
        $Check2 = self::StrToNum($String, 0, 0x1003F);
     
        $Check1 >>= 2;
        $Check1 = (($Check1 >> 4) & 0x3FFFFC0 ) | ($Check1 & 0x3F);
        $Check1 = (($Check1 >> 4) & 0x3FFC00 ) | ($Check1 & 0x3FF);
        $Check1 = (($Check1 >> 4) & 0x3C000 ) | ($Check1 & 0x3FFF);
     
        $T1 = (((($Check1 & 0x3C0) << 4) | ($Check1 & 0x3C)) <<2 ) | ($Check2 & 0xF0F );
        $T2 = (((($Check1 & 0xFFFFC000) << 4) | ($Check1 & 0x3C00)) << 0xA) | ($Check2 & 0xF0F0000 );
     
        return ($T1 | $T2);
    }
       
    /**
      * generate a checksum for the hash string
      * 
      * @param integer $Hashnum hash as returned by HashURL()
      * @return string '7', followed by the check digit, followed by the hash
      *                printed as an unsigned decimal
      */
    public static function CheckHash($Hashnum)
    {
        $CheckByte = 0;
        $Flag = 0;
     
        $HashStr = sprintf('%u', $Hashnum) ;
        $length = strlen($HashStr);
     
        // Walk the digits right to left; every second digit is doubled and its
        // own digits summed before it is added to the running total.
        for ($i = $length - 1;  $i >= 0;  $i --) {
            $Re = (int) $HashStr[$i];
            if (1 === ($Flag % 2)) {
                $Re += $Re;
                $Re = (int)($Re / 10) + ($Re % 10);
            }
            $CheckByte += $Re;
            $Flag ++;
        }
     
        $CheckByte %= 10;
        if (0 !== $CheckByte) {
            $CheckByte = 10 - $CheckByte;
            // $Flag now equals the digit count; odd lengths get an extra adjustment.
            if (1 === ($Flag % 2) ) {
                if (1 === ($CheckByte % 2)) {
                    $CheckByte += 9;
                }
                $CheckByte >>= 1;
            }
        }
     
        return '7'.$CheckByte.$HashStr;
    }
}

使用范例

<?php
// Usage example: builds an SEO report for the URL given in ?url=
// (defaults to http://phpclasses.org) and dumps it.
include 'seoreport.php';
ini_set('max_execution_time', 180);

// The report contains text scraped from the remote site and the user-supplied
// URL; serve it as plain text so none of it is interpreted as HTML.
if (!headers_sent())
{
    header('Content-Type: text/plain; charset=utf-8');
}
 
    $url = (isset($_GET['url']) && is_string($_GET['url']))?$_GET['url']:'http://phpclasses.org';

    // NOTE(review): $url is user input that this server will fetch. Only the
    // scheme is restricted here; if this is exposed publicly, also restrict
    // the hosts that may be requested (internal addresses etc.).
    $scheme = parse_url($url, PHP_URL_SCHEME);
    if (is_string($scheme) && !in_array(strtolower($scheme), array('http', 'https'), TRUE))
    {
        exit('Unsupported URL scheme.');
    }

    $meta_tags = seoreport::meta_info($url);
            
    //first check if site online
    if ($meta_tags!==FALSE)
    {
        $stats = array();
    
        $stats['meta']                  = $meta_tags;
        $stats['alexa']['rank']         = seoreport::alexa_rank($url);
        $stats['alexa']['links']         = seoreport::alexa_links($url);
        $stats['domain']['WOT_rating']     = seoreport::WOT_rating($url);    
        // domain_age() expects a domain name, not a full URL.
        $stats['domain']['domain_age']     = seoreport::domain_age(seoreport::domain_name($url));    
        $stats['social']['twitter']     = seoreport::tweet_count($url);    
        $stats['social']['facebook']     = seoreport::facebook_shares($url);    
        $stats['google']['page_rank']     = seoreport::page_rank($url);
        $stats['google']['page_speed']     = seoreport::page_speed($url);
        $stats['google']['pages']         = seoreport::google_pages($url);
        $stats['google']['links']         = seoreport::google_links($url);
        var_dump($stats);
    }
    else
    {
        // The original had a bare string expression here, which printed nothing.
        echo 'Site not online. '.$url;
    }


开心洋葱 , 版权所有丨如未注明 , 均为原创丨未经授权请勿修改 , 转载请注明专业获取网站SEO信息的php类 seoreport.php
喜欢 (0)
加载中……