Searchactivity > Searchbot.php

Questions? Need Help? Want to share? » PHP Forum
Script Name:
Searchactivity

Download:
searchactivity.zip

Category:
Search Engines

Archive Content:

Searchactivity

Searchactivity > INSTALLATION GUIDE

Searchbot.php:


<?
$path 
=  __FILE__;
$path preg_replace"'\\\searchbot\.php'",  "",  $path);
$path preg_replace"'/searchbot\.php'",  "",  $path);

include(
$path."/searchbot_config.php");
$agent $_SERVER['HTTP_USER_AGENT'];
/*This Recognizes:
Ask Jeeves
Atomz
BlackWidow
BoxSeaBot
bSpider (Japenese indexing)
ChristCrawler (Christian Indexing) - christcentral.com
Combine - www.ub2.lu.se
CoolBot (German Search Engine) - suchmaschine21.de
Cruiser - krstarica.com
Deep Index
Desert Realm - SciFi - www.desertrealm.com
Digger - Diggit Search Engine - www.diggit.com
Digital Integrity Robot - www.digital-integrity.com/robotinfo.html
DNAbot - xx.dnainc.co.jp - Japenese
ExactSeek.com
Fido - planetsearch.com
FreeCrawl - Used for EuroSeek - freeside.net
geckobot - http://www.geckobot.com/
Google - www.google.com
Green Research,  Inc. - SPAMbot
Gulliver - nothernlight.com
InfoSeek - infoseek.com
Inktomi
IsraeliSearch - www.idc.ac.il/Sandbag/
Lycos - lycos.cs.cmu.edu
Mac Finder - SPAM bot
Marvin - infoseek.de
MSNbot
Muncher - www.goodlookingcooking.co.uk - SearchBot seeking out cooking pages.
NDSpider - www.nationaldirectory.com
NetScoop - www-a2k.is.tokushima-u.ac.jp/search
NetSearch - netsearch.org
PSBot - picsearch.com
Rambler - rambler.ru; Russian search site
River Valley - SPAM bot
Scooter - AltaVistas Indexing Agent - www.altavista.com
Seeker - Lookseek.com
SmartSpider - Knowledgebase Spider - www.engsoftware.com/robots.htm
SpeedySpider - EntireWeb.com
SpiderMan - Yahoo
Tarantula - www.nathan.de
Inktomi - HotBot - www.inktomi.com
Wanderer -     www.mit.edu/people/mkgray/net - MIT's bot to measure the growth of the web.
WebZinger - www.imaginon.com
Yahoo - Yahoo.com
Yellowpet - Yellowpet.com
*/
$arr = array("ask jeeves",  "atomz",  "blackwidow",  "bot",  "boxseabot",  "bspider",  "christcrawler",  "combine",  "coolbot",  "cruiser",  "desertrealm",  "deepindex",  "digger",  "diibot",  "dnabot",  "exactseek",  "fast-webcrawler",  "fido",  "freecrawl",  "geckobot",  "green research",  "googlebot",  "gulliver",  "turnitinbot",  "ia_archiver",  "infoseek",  "inktomisearch",  "israelisearch",  "lycos",  "mac finder",  "marvin",  "msnbot",  "muncher",  "ndspider",  "netscoop",  "netsearch",  "psbot",  "rambler.ru",  "river valley",  "robot",  "scooter",  "seeker",  "slurp",  "smartspider",  "speedy",  "spiderman",  "tarantula",  "wanderer",  "wz101",  "yahoo",  "yellowpet");
foreach (
$arr as $bot) {
    if (
eregi($bot,  $agent)) {
        
$bot_here "1";
        
$bot_name ucwords("$bot");
    }
}
if (
$bot_here == "1") {
  
$credit "<a href=\"http://jonathan.charpie.com/scripts.php?dir=342727009JCSALT-12\">SearchBot detection by: Jonathan Charpie - 342727009JCSALT-05</a>; Keep track of your <a href=\"http://www.collectandtrack.com/?dir=342727009JCSALT-12\">Pez Collection</a> here!   <a href=\"http://host.charpie.com/?dir=342727009JCSALT-all\"> Compare All Hosting Plans</a> |     <a href=\"http://host.charpie.com/asp_hosting.php?dir=342727009JCSALT-all\">ASP Hosting</a> | <a href=\"http://host.charpie.com/cheap_domain_hosting.php?dir=342727009JCSALT-all\">Cheap Domain Hosting</a> | <a href=\"http://host.charpie.com/cheap_internet_hosting.php?dir=342727009JCSALT-all\">Cheap Internet Hosting</a> | <a href=\"http://host.charpie.com/company_web_site_hosting.php?dir=342727009JCSALT-all\">Company Web Site Hosting</a> | <a href=\"http://host.charpie.com/index.php?dir=342727009JCSALT-all\">Compare All Hosting Plans</a> | <a href=\"http://host.charpie.com/domain_name_hosting.php?dir=342727009JCSALT-all\">Domain Name Hosting</a> | <a href=\"http://host.charpie.com/domain_registration_hosting.php?dir=342727009JCSALT-all\">Domain Registration Hosting</a> | <a href=\"http://host.charpie.com/ecommerce_web_hosting.php?dir=342727009JCSALT-all\">Ecommerce Web Hosting</a> | <a href=\"http://host.charpie.com/email_domain_hosting.php?dir=342727009JCSALT-all\">Email Domain Hosting</a> | <a href=\"http://host.charpie.com/free_domain_hosting.php?dir=342727009JCSALT-all\">Free Domain Hosting</a> | <a href=\"http://host.charpie.com/hosting_domain.php?dir=342727009JCSALT-all\">Hosting a Domain</a> | <a href=\"http://host.charpie.com/linux_hosting.php?dir=342727009JCSALT-all\">Linux Hosting</a> | <a href=\"http://host.charpie.com/multiple_domain_hosting.php?dir=342727009JCSALT-all\">Multiple Domain Hosting</a> | <a href=\"http://host.charpie.com/multiple_domain_web_hosting.php?dir=342727009JCSALT-all\">Multiple Domain Web Hosting</a> | <a href=\"http://host.charpie.com/php_hosting.php?dir=342727009JCSALT-all\">PHP Hosting</a> | <a href=\"http://host.charpie.com/unlimited_domain_hosting.php?dir=342727009JCSALT-all\">Unlimited Domain Hosting</a> | <a href=\"http://host.charpie.com/unlimited_space_domain_hosting.php?dir=342727009JCSALT-all\">Unlimited Space Domain Hosting</a> | <a href=\"http://host.charpie.com/virtual_domain_hosting.php?dir=342727009JCSALT-all\">Virtual Domain Hosting</a> | <a href=\"http://host.charpie.com/web_hosting_company.php?dir=342727009JCSALT-all\">Web Hosting Company</a> | <a href=\"http://host.charpie.com/web_hosting_provider.php?dir=342727009JCSALT-all\">Web Hosting Provider</a>
</p>"
;
  if(
$_SERVER['QUERY_STRING'] != ""){
      
$u $_SERVER['SERVER_NAME'].$_SERVER['PHP_SELF'].'?'.$_SERVER['QUERY_STRING'];
  } 
  else{
      
$u $_SERVER['SERVER_NAME'].$_SERVER['PHP_SELF'];
  } 
  
 echo 
$credit;
 
$delete = array("http://",  "www.");
 
$u str_replace($delete,  "",  $u);
 
$prefix "http://";
 
$url $prefix.$u;
 
$today date("l,  M j\<\s\u\p\>S\<\/\s\u\p\> Y - g:i a"); 
 
$hostname gethostbyaddr($_SERVER['REMOTE_ADDR']);
 
  if(
$logit){
      
$agent ucwords(substr($agent,  0,  strpos($agent,  '(')));
      
$write "<FONT COLOR=\"#AA0000\">$today</FONT><br><I>Bot:</I> "$agent." (<font color=\"#008080\"><small>".$hostname."</small></font>)";
      
$write .= "<br><I>Crawled:</I> <small><A HREF=\"$url\">$url</A></small><br><br>\r\n";
      
$fd fopen ($path."/".$logfile,  "a");
      
$write stripslashes($write);        
      
fwrite ($fd,  $write);      
  }
  if (
$agent != '') {
         
$mail_subject "$agent - $bot_name - Detected";
  } else if (
$agent == '') {
          
$mail_subject "$bot_name - Detected";
  }
  if(
$emailit){
        
$message "Date: $today\n\n$agent (".$hostname.")\n";
        
$message .= "Crawled: $url\n\n\nRegards\nSearchBot Activity Robot";
        
$headers "From: SearchBot Activity <$youremail>\r\nReply-To: $youremail\r\n";
        
mail($youremail,  $mail_subject,  $message,  $headers); 
  }

?>


Other Search Engines Scripts:

WebMaster Resources Home

©RingsWorld.com