php记录搜索引擎蜘蛛抓取页面代码
<?php
/**
 * Search-engine crawler hit logger.
 *
 * When the current request comes from a recognised crawler (see
 * get_naps_bot()), the matching row of the `bot` table in the `spider`
 * database is updated: `botcount` is incremented, `botlast` is set to NOW()
 * and `botlasturl` is set to the URL string built below.
 *
 * Written to run on PHP 5.x as well as 7/8: no short array syntax, no `??`.
 */
error_reporting(E_ALL & ~E_NOTICE);

/**
 * Identify a known crawler from the request's User-Agent header.
 *
 * Matching is a case-insensitive substring test; the first signature that
 * matches (in the order listed) wins.
 *
 * @return string|false Canonical bot name, or false when the header is
 *                      missing/empty or matches no known signature.
 */
function get_naps_bot()
{
    // The header is optional; reading it unguarded raises a warning on PHP 8.
    $useragent = isset($_SERVER['HTTP_USER_AGENT'])
        ? strtolower($_SERVER['HTTP_USER_AGENT'])
        : '';

    if ($useragent === '') {
        return false;
    }

    // Lower-case signature => name stored in bot.botname. Order is significant.
    $signatures = array(
        'googlebot'   => 'Googlebot',
        'msnbot'      => 'MSNbot',
        'slurp'       => 'Yahoobot',
        'baiduspider' => 'Baiduspider',
        'sohu-search' => 'Sohubot',
        'lycos'       => 'Lycos',
        'robozilla'   => 'Robozilla',
        // The original author's own test entry (their browser was IE 6.0).
        'msie 6.0'    => 'MSIE 6.0',
    );

    foreach ($signatures as $needle => $botname) {
        if (strpos($useragent, $needle) !== false) {
            return $botname;
        }
    }

    return false;
}

/**
 * Record one crawler hit in the `bot` table.
 *
 * Terminates the script with die() when the database cannot be reached or
 * selected. A failure of the UPDATE itself is ignored, as before.
 *
 * @param string $botname Value matched against bot.botname.
 * @param string $url     Raw (unescaped) URL stored in bot.botlasturl.
 * @return void
 */
function tlc_record_bot_visit($botname, $url)
{
    // PHP 8.1+ makes mysqli throw by default; failures are handled by hand here.
    mysqli_report(MYSQLI_REPORT_OFF);

    // "@" only hides the PHP warning; the failure is reported via die() below.
    $link = @mysqli_connect('localhost', 'root');
    if (!$link) {
        die('不能链接数据库教程' . mysqli_connect_error());
    }

    if (!mysqli_select_db($link, 'spider')) {
        $error = mysqli_error($link);
        mysqli_close($link);
        die('不能选择数据库' . $error);
    }

    // Bound parameters keep header-derived text out of the SQL string.
    $stmt = mysqli_prepare(
        $link,
        'UPDATE bot SET botcount = botcount + 1, botlast = NOW(), botlasturl = ? WHERE botname = ?'
    );
    if ($stmt) {
        mysqli_stmt_bind_param($stmt, 'ss', $url, $botname);
        mysqli_stmt_execute($stmt);
        mysqli_stmt_close($stmt);
    }

    // Close only a connection that was actually opened.
    mysqli_close($link);
}

// URL string stored for the hit. It is no longer addslashes()-escaped because
// it is bound as a statement parameter; the stored value is unchanged.
// NOTE(review): this concatenates the Referer header with PHP_SELF; the name
// "thispage" suggests HTTP_HOST may have been intended - confirm before changing.
$tlc_thispage = (isset($_SERVER['HTTP_REFERER']) ? $_SERVER['HTTP_REFERER'] : '')
    . (isset($_SERVER['PHP_SELF']) ? $_SERVER['PHP_SELF'] : '');

// Add the crawl record for recognised spiders only.
$searchbot = get_naps_bot();
if ($searchbot) {
    tlc_record_bot_visit($searchbot, $tlc_thispage);
}
?>
</body>
</html>
本文地址:http://www.phprm.com/code/c1b56f30c9559d2a4cae080cac79e0b2.html
转载随意,但请附上文章地址:-)