最近对 Google 的 PageRank 比较感兴趣，一直想知道如何不用 Google Toolbar 来获取 PR 值。用嗅探工具获得 Google Toolbar 发出请求的 URL 为：http://toolbarqueries.google.com//search?client=navclient-auto&ch=64170410360&ie=utf-8&oe=utf-8&features=rank:fvn&q=info:http%3a//www.ugia.cn ，其中的关键部分为 ch=64170410360，即 checksum，不知道这个是用什么算法得出来的。
苦苦搜索之后,找到如下代码:
转自: http://meese.ath.cx/google via 思路(http://silu.spirezone.com)
<?php
/**
this code is released unto the public domain
*/
//header("content-type: text/plain; charset=utf-8");
// Default value of googlech()'s $init parameter, i.e. the starting value of
// its third accumulator ($c). Why this particular number is used is not
// documented in this file.
define('google_magic', 0xe6359a60);
/**
 * Unsigned (zero-fill) right shift of a 32-bit word.
 *
 * PHP's >> is an arithmetic shift that copies the sign bit into the vacated
 * positions, and on 64-bit builds an int is wider than 32 bits. This helper
 * treats $a as a 32-bit word and always shifts zeros in from the left.
 *
 * @param int $a Value to shift; only its low 32 bits are used.
 * @param int $b Number of bit positions to shift right (0 returns the word unchanged).
 * @return int The shifted word; on 64-bit builds always within 0 .. 0xFFFFFFFF.
 */
function zerofill($a, $b)
{
    $b = (int) $b;

    // On 64-bit builds drop everything above bit 31 so that negative or
    // over-wide inputs behave like a 32-bit word. On 32-bit builds every
    // int already is a 32-bit word, so nothing needs to be removed.
    if (PHP_INT_SIZE > 4) {
        $a &= 0xFFFFFFFF;
    }

    if ($b === 0) {
        // Shifting by zero would otherwise require a shift by -1 below.
        return $a;
    }

    // Arithmetic shift first, then clear the top $b bits of the 32-bit word;
    // that removes any copies of the sign bit a 32-bit build shifted in.
    return ($a >> $b) & (0x7FFFFFFF >> ($b - 1));
}
/**
 * Mixes three 32-bit words with a fixed sequence of subtract / xor / shift steps.
 *
 * All arithmetic is carried out modulo 2^32. The previous version relied on
 * the platform integer being exactly 32 bits wide, which does not hold on
 * 64-bit PHP builds; each step is therefore reduced to 32 bits explicitly.
 *
 * NOTE(review): the step sequence looks like the mix() of Bob Jenkins'
 * lookup2 hash - confirm against the reference if exact compatibility matters.
 *
 * @param int $a First word (only the low 32 bits are used).
 * @param int $b Second word (only the low 32 bits are used).
 * @param int $c Third word (only the low 32 bits are used).
 * @return array The mixed words as array($a, $b, $c).
 */
function mix($a,$b,$c) {
    // 64-bit builds: keep the low 32 bits. 32-bit builds: ints are already
    // 32 bits wide, so an all-ones mask leaves them untouched.
    $mask = PHP_INT_SIZE > 4 ? 0xFFFFFFFF : -1;

    // Normalise the inputs so zerofill() always receives a 32-bit word.
    $a &= $mask; $b &= $mask; $c &= $mask;

    $a = ($a - $b - $c) & $mask; $a ^= zerofill($c, 13);
    $b = ($b - $c - $a) & $mask; $b ^= ($a << 8) & $mask;
    $c = ($c - $a - $b) & $mask; $c ^= zerofill($b, 13);
    $a = ($a - $b - $c) & $mask; $a ^= zerofill($c, 12);
    $b = ($b - $c - $a) & $mask; $b ^= ($a << 16) & $mask;
    $c = ($c - $a - $b) & $mask; $c ^= zerofill($b, 5);
    $a = ($a - $b - $c) & $mask; $a ^= zerofill($c, 3);
    $b = ($b - $c - $a) & $mask; $b ^= ($a << 10) & $mask;
    $c = ($c - $a - $b) & $mask; $c ^= zerofill($b, 15);

    return array($a, $b, $c);
}
/**
 * Computes the checksum value that the script sends as the "ch" query parameter.
 *
 * The input is consumed in groups of 12 values: each group is packed
 * little-endian into three 32-bit words that are added to the accumulators
 * and then passed through mix(). The remaining 0-11 values and the total
 * length are folded in before a final mix().
 *
 * @param array    $url    Zero-indexed list of integer byte values (as produced by strord()).
 * @param int|null $length Number of leading elements of $url to hash; defaults to count($url).
 * @param int      $init   Starting value of the third accumulator.
 * @return int The third word of the final mix(), reduced to 32 bits on 64-bit builds.
 */
function googlech($url, $length=null, $init=google_magic) {
    if (is_null($length)) {
        $length = count($url);
    }

    // 64-bit builds: keep the low 32 bits. 32-bit builds: ints are already
    // 32 bits wide, so an all-ones mask leaves them untouched.
    $mask = PHP_INT_SIZE > 4 ? 0xFFFFFFFF : -1;

    $a = $b = 0x9e3779b9;
    $c = $init;
    $k = 0;
    $len = $length;

    // Full 12-value groups.
    while ($len >= 12) {
        $a = ($a + $url[$k+0] + ($url[$k+1]<<8) + ($url[$k+2]<<16)  + ($url[$k+3]<<24))  & $mask;
        $b = ($b + $url[$k+4] + ($url[$k+5]<<8) + ($url[$k+6]<<16)  + ($url[$k+7]<<24))  & $mask;
        $c = ($c + $url[$k+8] + ($url[$k+9]<<8) + ($url[$k+10]<<16) + ($url[$k+11]<<24)) & $mask;
        $mix = mix($a, $b, $c);
        $a = $mix[0]; $b = $mix[1]; $c = $mix[2];
        $k += 12;
        $len -= 12;
    }

    // The low byte of $c carries the total length, so the tail values
    // destined for $c start at bit 8.
    $c += $length;
    switch ($len) /* all the case statements fall through */
    {
        case 11: $c += ($url[$k+10]<<24);
        case 10: $c += ($url[$k+9]<<16);
        case 9 : $c += ($url[$k+8]<<8);
        /* the first byte of c is reserved for the length */
        case 8 : $b += ($url[$k+7]<<24);
        case 7 : $b += ($url[$k+6]<<16);
        case 6 : $b += ($url[$k+5]<<8);
        case 5 : $b += ($url[$k+4]);
        case 4 : $a += ($url[$k+3]<<24);
        case 3 : $a += ($url[$k+2]<<16);
        case 2 : $a += ($url[$k+1]<<8);
        case 1 : $a += ($url[$k+0]);
        /* case 0: nothing left to add */
    }

    $mix = mix($a & $mask, $b & $mask, $c & $mask);

    /*-------------------------------------------- report the result */
    return $mix[2] & $mask;
}
/**
 * Converts a string into an array of integers, one per byte, each holding
 * the numeric value of that byte as returned by ord().
 *
 * @param string $string Input string.
 * @return array Zero-indexed list of byte values; an empty array for an empty string.
 */
function strord($string) {
    // Start from an empty array so an empty string yields array() instead of
    // an undefined variable.
    $result = array();
    $length = strlen($string);
    for ($i = 0; $i < $length; $i++) {
        // Square-bracket offsets: the {$i} form was removed in PHP 8.
        $result[$i] = ord($string[$i]);
    }
    return $result;
}
// http://www.example.com/ - checksum: 6540747202

// The page to look up arrives in the "url" query parameter. PHP variable
// names are case-sensitive, so the superglobal must be spelled $_GET.
if (!isset($_GET['url']) || !is_string($_GET['url']) || $_GET['url'] === '') {
    exit('missing "url" query parameter');
}

// The checksum is computed over the raw (not URL-encoded) "info:<url>" string.
$url = 'info:'.$_GET['url'];
// %u prints the value as an unsigned number, so a checksum with the top bit
// set on a 32-bit build does not show up as a negative number in the URL.
$ch = sprintf('%u', googlech(strord($url)));

// The query itself carries the URL-encoded form.
$url = 'info:'.urlencode($_GET['url']);

// The request URL must be one unbroken line; a line break inside the string
// literal would become part of the URL.
$response = file_get_contents("http://www.google.com/search?client=navclient-auto&ch=6$ch&ie=utf-8&oe=utf-8&features=rank&q=$url");
if ($response !== false) {
    echo $response;
}

/* use curl send the user angent
$curl = curl_init("http://www.google.com/search?client=navclient-auto&ch=6$ch&ie=utf-8&oe=utf-8&features=rank&q=$url");
curl_setopt ($curl, CURLOPT_USERAGENT, "mozilla/4.0 (compatible; googletoolbar 2.0.110-big; windows 2000 5.0)");
curl_exec($curl);
*/
?>
</></>
新闻热点
疑难解答