zl程序教程

您现在的位置是:首页 >  后端

当前栏目

PHP屏蔽蜘蛛访问代码及常用搜索引擎的HTTP_USER_AGENT

PHPHTTP代码 访问 常用 user 搜索引擎 屏蔽
2023-06-13 09:14:47 时间

PHP屏蔽蜘蛛访问代码

常用搜索引擎名与HTTP_USER_AGENT对应值

百度：baiduspider

谷歌：googlebot

搜狗：sogou

腾讯SOSO：sosospider

雅虎：slurp

有道：youdaobot

Bing：bingbot

MSN：msnbot

Alexa：ia_archiver

/**
 * Tell whether the current request was sent by a known search-engine crawler.
 *
 * Reads $_SERVER["HTTP_USER_AGENT"] and performs a case-insensitive substring
 * match against a short list of crawler keywords.
 *
 * @return bool true when the User-Agent contains one of the keywords,
 *              false otherwise (including when no User-Agent header was sent).
 */
function is_crawler() {
    // The User-Agent header is optional; without it there is nothing to match.
    if (!isset($_SERVER["HTTP_USER_AGENT"])) {
        return false;
    }
    $userAgent = strtolower($_SERVER["HTTP_USER_AGENT"]);

    // Keywords are stored in lower case so they can be compared directly
    // against the lower-cased User-Agent.
    $spiders = array(
        "googlebot",   // Google crawler
        "baiduspider", // Baidu crawler
        "slurp",       // Yahoo crawler (sent as "Yahoo! Slurp", so match the bare token)
        "yodaobot",    // Youdao crawler (older spelling)
        "youdaobot",   // Youdao crawler
        "msnbot",      // MSN / legacy Bing crawler
        "bingbot",     // Bing crawler
        // add more crawler keywords here
    );

    foreach ($spiders as $spider) {
        if (strpos($userAgent, $spider) !== false) {
            return true;
        }
    }
    return false;
}

下面的php代码附带了更多的蜘蛛标识

/**
 * Tell whether the current request was sent by a crawler, using an extended
 * keyword list.
 *
 * Reads $_SERVER["HTTP_USER_AGENT"] and performs a case-insensitive substring
 * match against every entry of the list below. The function produces no
 * output of its own.
 *
 * @return bool true when the User-Agent contains one of the keywords,
 *              false when it matches none or when the header is missing/empty.
 */
function isCrawler() {
    // The User-Agent header is optional; treat a missing header like an empty one.
    $agent = isset($_SERVER["HTTP_USER_AGENT"]) ? strtolower($_SERVER["HTTP_USER_AGENT"]) : "";
    if (empty($agent)) {
        return false;
    }

    // Entries are lower-cased before comparison, so their case here is cosmetic.
    // NOTE(review): several entries ("Java(Oftenspambot)", "Alexa(IAArchiver)",
    // "Thewebarchive(IAArchiver)", "Perltool", "WGettools", "Fishsearch", ...)
    // look like descriptive labels whose spacing may have been lost; they are
    // kept verbatim because the intended tokens cannot be confirmed from here.
    // NOTE(review): short entries such as "Ask" and "legs" are very broad
    // substrings — confirm they do not match regular browsers in your traffic.
    $spiderSite = array(
        "TencentTraveler",
        "Baiduspider",      // without a trailing "+", so "Baiduspider/2.0" matches too
        "BaiduGame",
        "Googlebot",
        "msnbot",
        "Sosospider",       // without a trailing "+", same reason as Baiduspider
        "Sogou web spider", // the real token contains spaces
        "ia_archiver",
        "Yahoo! Slurp",     // the real token contains a space after "!"
        "YoudaoBot",
        "YahooSlurp",
        "Java(Oftenspambot)",
        "Voila",
        "Yandexbot",
        "BSpider",
        "twiceler",
        "SogouSpider",
        "SpeedySpider",
        "GoogleAdSense",
        "Heritrix",
        "Python-urllib",
        "Alexa(IAArchiver)",
        "Ask",
        "Exabot",
        "Custo",
        "OutfoxBot/YodaoBot",
        "yacy",
        "SurveyBot",
        "legs",
        "lwp-trivial",
        "Nutch",
        "StackRambler",
        "Thewebarchive(IAArchiver)",
        "Perltool",
        "MJ12bot",
        "Netcraft",
        "MSIECrawler",
        "WGettools",
        "larbin",
        "Fishsearch",
    );

    foreach ($spiderSite as $val) {
        if (strpos($agent, strtolower($val)) !== false) {
            return true;
        }
    }

    // No keyword matched: answer with an explicit boolean rather than
    // falling off the end of the function.
    return false;
}
// Demo: print one of two greetings depending on whether isCrawler()
// reports the current visitor as a crawler.
echo isCrawler() ? "你好蜘蛛精!" : "你不是蜘蛛精啊!";

使用PHP实现蜘蛛访问日志统计

// Spider access log: identify the crawler behind the current request from its
// User-Agent and append one tab-separated line (time, client IP, bot label,
// requested URL) to bot.txt.

// The User-Agent header is optional; an empty string simply matches nothing.
$useragent = isset($_SERVER["HTTP_USER_AGENT"]) ? strtolower($_SERVER["HTTP_USER_AGENT"]) : "";

// Lower-case signature => label written to the log. The first match wins, so
// a more specific signature must come before any shorter one it contains
// ("msnbot" before "msn"), and the generic "bot" catch-all stays last.
$botSignatures = array(
    "googlebot"            => "Google",
    "mediapartners-google" => "GoogleAdsense",
    "baiduspider"          => "Baidu",
    "sogou spider"         => "Sogou",
    "sogou web"            => "Sogouweb",
    "sosospider"           => "SOSO",
    "360spider"            => "360Spider",
    "yahoo"                => "Yahoo",
    "msnbot"               => "msnbot",
    "msn"                  => "MSN",
    "sohu"                 => "Sohu",
    "yodaobot"             => "Yodao",
    "youdaobot"            => "Yodao",
    "twiceler"             => "Twiceler",
    "ia_archiver"          => "Alexa_",
    "ia archiver"          => "Alexa",
    "slurp"                => "雅虎",
    "bot"                  => "其它蜘蛛",
);

foreach ($botSignatures as $signature => $label) {
    if (strpos($useragent, $signature) !== false) {
        $bot = $label;
        break;
    }
}

if (isset($bot)) {
    // Logging is best-effort: if the file cannot be opened, skip the write
    // instead of calling fwrite()/fclose() on false.
    $fp = @fopen("bot.txt", "a");
    if ($fp !== false) {
        fwrite($fp, date("Y-m-d H:i:s") . "\t" . $_SERVER["REMOTE_ADDR"] . "\t" . $bot . "\t" . "http://" . $_SERVER["SERVER_NAME"] . $_SERVER["REQUEST_URI"] . "\r\n");
        fclose($fp);
    }
}