• 技术文章 >后端开发 >php教程

    php实现专业获取网站SEO信息类实例,seo实例_PHP教程

    2016-07-13 09:58:09原创1634

    php实现专业获取网站SEO信息类实例,seo实例


    本文实例讲述了php实现专业获取网站SEO信息类。分享给大家供大家参考。具体如下:

    这个seo类的功能包括:
    - 检查指定网站是否在线(能否正常响应)
    - 获取网站首页的语言及其他 meta 标签数据
    - 从 Alexa 获取网站的流量排名和导入链接数
    - 从谷歌获取网站的导入链接数和被索引的网页数量
    - 从 WOT 获取网站的信任评级
    - 获取域名年龄(自域名首次注册之日算起)
    - 获取提及该网站页面的 Twitter 推文数量
    - 获取该网站页面的 Facebook 分享数
    - 获取网站的谷歌 PageSpeed(网页速度)评分
    - 获取网站的谷歌 PageRank(网页排名)

    <?php
    /**
     *
     * SEO report for different metrics
     *
     * @category SEO
     * @author Chema 
     * @copyright (c) 2009-2012 Open Classifieds Team
     * @license GPL v3
     * Based on seo report script http://www.phpeasycode.com && PHP class SEOstats
     *
     */
    class seoreport
    {
        /**
         * Check whether a URL is online/alive.
         *
         * Issues a GET request and treats the HTTP status codes 200, 302 and 304
         * as "alive"; any other code (including 0 when the transfer fails) is not.
         *
         * @param string $url
         * @return bool
         */
        public static function is_alive($url)
        {
            $ch = curl_init();
            curl_setopt($ch, CURLOPT_URL, $url);
            // Capture the body instead of letting curl print it to the output.
            curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
            curl_setopt($ch, CURLOPT_FAILONERROR, 1);
            // Same connect timeout as get_html() so a dead host cannot stall the report.
            curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 5);
            curl_exec($ch);
            $code = (int) curl_getinfo($ch, CURLINFO_HTTP_CODE);
            curl_close($ch);

            return in_array($code, array(200, 302, 304), true);
        }

        /**
         * HTTP GET request with curl.
         *
         * Follows at most two redirects and gives up connecting after 5 seconds.
         * For https URLs the peer certificate and host name are verified.
         *
         * @param string $url String, containing the URL to curl.
         * @return string|false The response body, or FALSE when the request
         *                      failed or the body is empty.
         */
        protected static function get_html($url)
        {
            $ch = curl_init($url);
            curl_setopt($ch, CURLOPT_RETURNTRANSFER, 1);
            curl_setopt($ch, CURLOPT_CONNECTTIMEOUT, 5);
            curl_setopt($ch, CURLOPT_FOLLOWLOCATION, 1);
            curl_setopt($ch, CURLOPT_MAXREDIRS, 2);
            if (strtolower((string) parse_url($url, PHP_URL_SCHEME)) == 'https') {
                curl_setopt($ch, CURLOPT_SSL_VERIFYPEER, 1);
                // 2 = the certificate must match the host name; the value 1 is
                // no longer accepted by current libcurl.
                curl_setopt($ch, CURLOPT_SSL_VERIFYHOST, 2);
            }
            $str = curl_exec($ch);
            curl_close($ch);

            return ($str === false || $str === '') ? false : $str;
        }

        /**
         * Get the domain (host without a leading "www.") from any URL.
         *
         * Input without a scheme ("www.example.com/page") is accepted too; only
         * the host part is returned.
         *
         * @param string $url
         * @return string The host name, or an empty string when none can be parsed.
         */
        public static function domain_name($url)
        {
            $url = trim((string) $url);
            // parse_url() only reports a host when a scheme (or a leading "//")
            // is present, so supply one for bare domains.
            if (!preg_match('#^[a-z][a-z0-9+.-]*://#i', $url) && strpos($url, '//') !== 0) {
                $url = 'http://' . $url;
            }
            $host = parse_url($url, PHP_URL_HOST);
            if (!is_string($host) || $host === '') {
                return '';
            }

            // Strip "www." only at the start of the host, never inside it.
            return preg_replace('/^www\./i', '', $host);
        }

        /**
         * Get the metas from a url and the language of the site.
         *
         * @param string $url
         * @return array|false Map of meta name => content plus a 'language' entry
         *                     taken from the <html lang> attribute, or FALSE when
         *                     the page could not be fetched or parsed.
         */
        public static function meta_info($url)
        {
            $html_content = self::get_html($url);
            if (!$html_content) {
                return false;
            }

            // Real pages are rarely valid markup: collect libxml errors internally
            // instead of emitting one warning per parse problem.
            $previous = libxml_use_internal_errors(true);
            $html = new DOMDocument();
            $loaded = $html->loadHTML($html_content);
            libxml_clear_errors();
            libxml_use_internal_errors($previous);
            if (!$loaded) {
                return false;
            }

            $xpath = new DOMXPath($html);
            $url_info = array();

            foreach ($xpath->query('//html') as $lang) {
                $url_info['language'] = $lang->getAttribute('lang');
            }

            foreach ($xpath->query('//meta') as $meta) {
                $name = $meta->getAttribute('name');
                // Metas without a name (charset, http-equiv, property) are skipped.
                if ($name) {
                    $url_info[$name] = $meta->getAttribute('content');
                }
            }

            return $url_info;
        }

        /**
         * Fetch the Alexa data document for the domain of a URL.
         *
         * @param string $url
         * @return string Response body, empty string when the request failed.
         */
        private static function alexa_data($url)
        {
            $request = 'http://data.alexa.com/data?cli=10&dat=s&url=' . urlencode(self::domain_name($url));

            return (string) self::get_html($request);
        }

        /**
         * Alexa rank.
         *
         * NOTE(review): the pattern in the published listing was empty; this one
         * is reconstructed for a <POPULARITY ... TEXT="n"/> element - confirm it
         * against a live response.
         *
         * @param string $url
         * @return string|null Numeric string, NULL when no rank was found.
         */
        public static function alexa_rank($url)
        {
            if (preg_match('/<POPULARITY\b[^>]*\bTEXT="(\d+)"/si', self::alexa_data($url), $p)) {
                return $p[1];
            }

            return null;
        }

        /**
         * Alexa inbound links.
         *
         * NOTE(review): the pattern in the published listing was empty; this one
         * is reconstructed for a <LINKSIN NUM="n"/> element - confirm it against
         * a live response.
         *
         * @param string $url
         * @return string|null Numeric string, NULL when no count was found.
         */
        public static function alexa_links($url)
        {
            if (preg_match('/<LINKSIN\b[^>]*\bNUM="(\d+)"/si', self::alexa_data($url), $l)) {
                return $l[1];
            }

            return null;
        }

        /**
         * Returns total amount of results for any Google search,
         * requesting the deprecated Websearch API.
         *
         * @param string $url String, containing the search query.
         * @return integer Estimated result count, 0 when none is reported.
         */
        public static function google_pages($url)
        {
            $request = 'http://ajax.googleapis.com/ajax/services/search/web?v=1.0&rsz=1&q=' . urlencode($url);
            $data = json_decode((string) self::get_html($request));

            return isset($data->responseData->cursor->estimatedResultCount)
                ? intval($data->responseData->cursor->estimatedResultCount)
                : 0;
        }

        /**
         * Gets the inbound links of a site from a Google "link:" search.
         *
         * NOTE(review): the pattern in the published listing was broken across
         * lines; the result-stats anchor used here is an assumption about the
         * result page markup - confirm it against a live response.
         *
         * @param string $url
         * @return string|null The count as printed (may contain thousands
         *                     separators), NULL when it was not found.
         */
        public static function google_links($url)
        {
            $request = 'http://www.google.com/search?q=' . urlencode('link:' . $url) . '&hl=en';
            $data = (string) self::get_html($request);
            $pattern = '/<div\b[^>]*\bid="?result-?stats"?[^>]*>\s*(?:About )?([\d,]+) result/si';

            return preg_match($pattern, $data, $l) ? $l[1] : null;
        }

        /**
         * Web of trust rating.
         *
         * NOTE(review): the pattern in the published listing was empty; this one
         * reads the r="n" attribute of the first <application> element - confirm
         * it against a live response.
         *
         * @param string $url
         * @return string|null Numeric string, NULL when no rating was found.
         */
        public static function WOT_rating($url)
        {
            $request = 'http://api.mywot.com/0.4/public_query2?target=' . urlencode(self::domain_name($url));
            $data = (string) self::get_html($request);

            return preg_match('/<application\b[^>]*\br="(\d+)"/si', $data, $regs) ? $regs[1] : null;
        }

        /**
         * How old is the domain?
         *
         * @param string $domain Domain name; a full URL is reduced to its domain.
         * @return integer|false Unix time of the "Creation Date" in the whois
         *                       report, FALSE when it is missing or unparsable.
         */
        public static function domain_age($domain)
        {
            $request = 'http://reports.internic.net/cgi/whois?whois_nic='
                . urlencode(self::domain_name($domain)) . '&type=domain';
            $data = (string) self::get_html($request);

            if (!preg_match('/Creation Date: ([a-z0-9-]+)/si', $data, $p)) {
                return false;
            }

            return strtotime($p[1]);
        }

        /**
         * Counts how many tweets mention the url.
         *
         * @param string $url
         * @return integer|string|null The count as decoded from JSON, NULL when
         *                             the response carries no numeric count.
         */
        public static function tweet_count($url)
        {
            $twitterEndpoint = 'http://urls.api.twitter.com/1/urls/count.json?url=%s';
            // Goes through get_html() like every other request in this class.
            $json = json_decode((string) self::get_html(sprintf($twitterEndpoint, urlencode($url))), true);

            if (is_array($json) && isset($json['count']) && is_numeric($json['count'])) {
                return $json['count'];
            }

            return null;
        }

        /**
         * Returns the total amount of Facebook Shares for a single page.
         *
         * @link https://graph.facebook.com/
         * @param string $q The URL to check.
         * @return integer Number of shares, 0 when the response has none.
         */
        public static function facebook_shares($q)
        {
            $data = json_decode((string) self::get_html('http://graph.facebook.com/?id=' . urlencode($q)));

            return isset($data->shares) ? intval($data->shares) : 0;
        }

        /**
         * Get the pagespeed rank over 100.
         *
         * @param string $url
         * @return integer Score, 0 when the response has none.
         */
        public static function page_speed($url)
        {
            $request = 'https://developers.google.com/_apps/pagespeed/run_pagespeed?url='
                . urlencode($url) . '&format=json';
            $data = json_decode((string) self::get_html($request));

            return isset($data->results->score) ? intval($data->results->score) : 0;
        }

        /**
         * Get google page rank.
         *
         * @param string $url
         * @return string|null Text following the 9-character "Rank_..." prefix
         *                     of the response (trimmed), NULL when absent.
         */
        public static function page_rank($url)
        {
            $query = 'http://toolbarqueries.google.com/tbr?client=navclient-auto&ch='
                . self::CheckHash(self::HashURL($url))
                . '&features=Rank&q=info:' . urlencode($url) . '&num=100&filter=0';
            $data = (string) self::get_html($query);

            $pos = strpos($data, 'Rank_');
            if ($pos === false) {
                return null;
            }

            // Skip the 9-character prefix and drop the trailing line break.
            return trim(substr($data, $pos + 9));
        }

        // functions for google pagerank

        /**
         * Fold a string into a number: for every byte multiply the running value
         * by $Magic, wrap it at 2^32 and add the byte value.
         *
         * @param string  $Str
         * @param integer $Check Start value.
         * @param integer $Magic Multiplier.
         * @return integer|float
         */
        public static function StrToNum($Str, $Check, $Magic)
        {
            $Int32Unit = 4294967296; // 2^32
            $length = strlen($Str);
            for ($i = 0; $i < $length; $i++) {
                $Check *= $Magic;
                // If the float is beyond the boundaries of integer (usually +/- 2.15e+9 = 2^31),
                // the result of converting to integer is undefined
                // refer to http://www.php.net/manual/en/language.types.integer.php
                if ($Check >= $Int32Unit) {
                    $Check = ($Check - $Int32Unit * (int) ($Check / $Int32Unit));
                    // if the check less than -2^31
                    $Check = ($Check < -2147483648) ? ($Check + $Int32Unit) : $Check;
                }
                // Square-bracket offset: the {} form no longer parses on PHP 8.
                $Check += ord($Str[$i]);
            }

            return $Check;
        }

        /**
         * Generate a hash for a url.
         *
         * @param string $String
         * @return integer
         */
        public static function HashURL($String)
        {
            $Check1 = self::StrToNum($String, 0x1505, 0x21);
            $Check2 = self::StrToNum($String, 0, 0x1003F);

            $Check1 >>= 2;
            $Check1 = (($Check1 >> 4) & 0x3FFFFC0) | ($Check1 & 0x3F);
            $Check1 = (($Check1 >> 4) & 0x3FFC00) | ($Check1 & 0x3FF);
            $Check1 = (($Check1 >> 4) & 0x3C000) | ($Check1 & 0x3FFF);

            $T1 = (((($Check1 & 0x3C0) << 4) | ($Check1 & 0x3C)) << 2) | ($Check2 & 0xF0F);
            $T2 = (((($Check1 & 0xFFFFC000) << 4) | ($Check1 & 0x3C00)) << 0xA) | ($Check2 & 0xF0F0000);

            return ($T1 | $T2);
        }

        /**
         * Generate a checksum for the hash string.
         *
         * Walks the decimal digits from right to left, doubling every second
         * digit (summing the digits of the doubled value), and derives a check
         * digit from the total.
         *
         * @param integer $Hashnum
         * @return string '7', the check digit and the unsigned decimal hash.
         */
        public static function CheckHash($Hashnum)
        {
            $CheckByte = 0;
            $Flag = 0;
            $HashStr = sprintf('%u', $Hashnum);
            $length = strlen($HashStr);

            for ($i = $length - 1; $i >= 0; $i--) {
                $Re = (int) $HashStr[$i];
                if (1 === ($Flag % 2)) {
                    $Re += $Re;
                    $Re = (int) ($Re / 10) + ($Re % 10);
                }
                $CheckByte += $Re;
                $Flag++;
            }

            $CheckByte %= 10;
            if (0 !== $CheckByte) {
                $CheckByte = 10 - $CheckByte;
                if (1 === ($Flag % 2)) {
                    if (1 === ($CheckByte % 2)) {
                        $CheckByte += 9;
                    }
                    $CheckByte >>= 1;
                }
            }

            return '7' . $CheckByte . $HashStr;
        }
    }

    使用范例

    <?php
    // Usage example: collect every metric the class offers for one URL and dump it.
    include 'seoreport.php';
    // The report performs many remote requests one after another, so allow 180 seconds.
    ini_set('max_execution_time', 180);

    // URL to analyse: ?url=... from the query string, otherwise a demo site.
    $url = (isset($_GET['url']) && is_string($_GET['url'])) ? trim($_GET['url']) : 'http://phpclasses.org';

    // Bare domains are accepted; give them a scheme so they can be validated below.
    if (strpos($url, '://') === false) {
        $url = 'http://' . $url;
    }

    // The value is user input that is handed to curl: only fetch http(s) URLs.
    $scheme = strtolower((string) parse_url($url, PHP_URL_SCHEME));
    $meta_tags = ($scheme === 'http' || $scheme === 'https') ? seoreport::meta_info($url) : FALSE;

    // meta_info() returns FALSE when the page cannot be fetched, which doubles
    // as the "is the site online" check.
    if ($meta_tags !== FALSE)
    {
        $stats = array();
        $stats['meta'] = $meta_tags;
        $stats['alexa']['rank'] = seoreport::alexa_rank($url);
        $stats['alexa']['links'] = seoreport::alexa_links($url);
        $stats['domain']['WOT_rating'] = seoreport::WOT_rating($url);
        // domain_age() is documented to take a domain, not a full URL.
        $stats['domain']['domain_age'] = seoreport::domain_age(seoreport::domain_name($url));
        $stats['social']['twitter'] = seoreport::tweet_count($url);
        $stats['social']['facebook'] = seoreport::facebook_shares($url);
        $stats['google']['page_rank'] = seoreport::page_rank($url);
        $stats['google']['page_speed'] = seoreport::page_speed($url);
        $stats['google']['pages'] = seoreport::google_pages($url);
        $stats['google']['links'] = seoreport::google_links($url);
        var_dump($stats);
    }
    else
    {
        // Escape the URL: it comes straight from the query string.
        echo 'Site not online. ' . htmlspecialchars($url, ENT_QUOTES, 'UTF-8');
    }

    希望本文所述对大家的php程序设计有所帮助。

    www.bkjia.comtruehttp://www.bkjia.com/PHPjc/978379.htmlTechArticlephp实现专业获取网站SEO信息类实例,seo实例 本文实例讲述了php实现专业获取网站SEO信息类。分享给大家供大家参考。具体如下: 这个seo类...

    声明:本文内容由网友自发贡献,版权归原作者所有,本站不承担相应法律责任。如您发现有涉嫌抄袭侵权的内容,请联系admin@php.cn核实处理。
    专题推荐:php 网站 SEO 转行
    上一篇:php使用post数组的键值创建同名变量并赋值的方法_PHP教程 下一篇:php中实现获取随机数组列表的自定义函数,php数组_PHP教程
    20期PHP线上班

    相关文章推荐

    • 【活动】充值PHP中文网VIP即送云服务器• php-fpm配置详解_php实例• 用PHP+MySQL搭建聊天室功能实例代码_php实例• php和数据库结合的一个简单的web实例 代码分析 (php初学者)_php实例• 想下载个论坛,哪种好?该如何解决• PHP 读取大文件时,怎样得到以回车换行的一行数据。该怎么解决
    1/1

    PHP中文网