]> git.nbdom.net Git - nb.git/commitdiff
lib/php/db/table.php
authorNicolas Boisselier <nicolas.boisselier@gmail.com>
Thu, 7 Dec 2017 03:35:16 +0000 (03:35 +0000)
committerNicolas Boisselier <nicolas.boisselier@gmail.com>
Thu, 7 Dec 2017 03:35:16 +0000 (03:35 +0000)
lib/php/db/table.php
share/db/nb.db
share/db/update.sh
share/db/useragent.csv [new file with mode: 0644]
share/db/useragent.sql

index 7a79d85df48170d47e2f285cfd911e9a2acac9dd..72c4f19081fe6cdc2d3c4efbcb6ea2d350aaad7e 100644 (file)
@@ -1765,7 +1765,8 @@ Class Table extends nb {
       return null;
     }
 
-    $sql = 'DELETE FROM ' . $this->sql_name() . $where;
+               # NB 07.12.17: Add LIMIT 1. If a table has no primary key, we want to delete only one record
+    $sql = 'DELETE FROM ' . $this->sql_name() . $where . " LIMIT 1";
     $info['sql'] = $sql;
 
     if (self::p('debug')) {
index c354813c888ec783c5f7332d696707b66c6de4e8..502b190f31037ba372da7383bf9c6f143f2aeffd 100644 (file)
Binary files a/share/db/nb.db and b/share/db/nb.db differ
index e83cb31e8b2e43364ad8798731729288b387a3ab..4509c9613a86cd01995f435de6f0a7c6f4075d8d 100755 (executable)
@@ -5,7 +5,7 @@
 #
 #
 set +e
-DIR=$(dirname "$0")
+cd $(dirname "$0")
 tmp=`mktemp -d`
 
 csv2table() {
@@ -43,14 +43,14 @@ EOF
 
 data_src() {
 
-       $DIR/port > "$TMP/port.csv"
+       ./port > "$TMP/port.csv"
   csv2table port "$TMP/port.csv"
 
 }
 
 (
 
-cat "$DIR/*.sql"
+cat "*.sql"
 cat << EOF
 PRAGMA foreign_keys=OFF;
 .separator \t
@@ -65,7 +65,7 @@ COMMIT;
 VACUUM;
 EOF
 
-) | sqlite3 "$DIR/nb.db"
+) | sqlite3 "nb.db"
 
 rm -rf "$TMP"
 
diff --git a/share/db/useragent.csv b/share/db/useragent.csv
new file mode 100644 (file)
index 0000000..6aa9f83
--- /dev/null
@@ -0,0 +1,2459 @@
+id_a_f_3       !Susie (http://www.sync2it.com/susie)   Sync2It bookmark management & clustering engine C R             http://www.sync2it.com  
+id_a_f_6       <a href='http://www.unchaos.com/'> UnChaos </a> From Chaos To Order Hybrid Web Search Engine.(vadim_gonchar@unchaos.com)        UnCHAOS search robot    R       Site is dead    http://www.unchaos.com/ 
+id_a_f_7       <a href='http://www.unchaos.com/'> UnChaos Bot Hybrid Web Search Engine. </a> (vadim_gonchar@unchaos.com)       UnCHAOS search robot    R       Site is dead    http://www.unchaos.com/ 
+id_a_f_8       <b> UnChaosBot From Chaos To Order UnChaos Hybrid Web Search Engine at www.unchaos.com </b> (info@unchaos.com)  UnCHAOS search robot    R       Site is dead    http://www.unchaos.com/ 
+id_a_f_9       <http://www.sygol.com/> http://www.sygol.com    Sygol Search (Italy) robot      R       s.also SygolBot http://www.sygol.com/   
+id_a_f_4       ( Robots.txt Validator http://www.searchengineworld.com/cgi-bin/robotcheck.cgi )        SearchEngineWorld's robots.txt validator        C       Services is no more available   http://www.searchengineworld.com/cgi-bin/robotcheck.cgi 
+id_a_f_171105_1        (DreamPassport/3.0; isao/MyDiGiRabi)    DreamCast DreamPassport browser B               http://www.dricas.com/dp/       
+id_a_f_290606_1        (Privoxy/1.0)   Privoxy web proxy       P       s.also Privoxy/3.0 (Anonymous)  http://www.privoxy.org/ 
+id_a_f_230507_1        */Nutch-0.9-dev Unknown Yahoo robot     R       123.113.184.2xx http://www.yahoo.com    
+id_a_f_5       +SitiDi.net/SitiDiBot/1.0 (+Have Good Day)      SitiDi.net search (Germany) robot       R               http://www.sitidi.net/  
+id_a_f_1       -DIE-KRAEHE- META-SEARCH-ENGINE/1.1 http://www.die-kraehe.de    Die Kraehe Meta-Search-Engine (Germany) link checking   R               http://www.die-kraehe.de        
+id_a_f_060206_1        123spider-Bot (Version: 1.02, powered by www.123spider.de       123spider.de (Germany) web directory link checking      C               http://www.123spider.de/        
+id_a_f_180806_1        192.comAgent    192.com - UK web directory      R       217.160.75.2xx  http://www.192.com/     
+id_a_f_060606_1        1st ZipCommander (Net) - http://www.zipcommander.com/   1st ZipCommander Net - IE based browser B               http://www.zipcommander.com/    
+id_a_f_10      2Bone_LinkChecker/1.0 libwww-perl/5.64  2Bone online link checker       C               http://www.2bone.com/links/linkchecker.shtml    
+id_a_f_11      4anything.com LinkChecker v2.0  4Anything robot R               http://www.4anything.com        
+id_a_f_110207_1        8484 Boston Project v 1.0       Unknown guestbook spamming or harvesting tool from diff. IPs    S       s. various honey pot sites      http://www.projecthoneypot.org/bsh_X19tb2RlPWdsb2JhbCZfX2J5PWMmY3RyeT11cyZ1YWc9ODQ4NCtCb3N0b24rUHJvamVjdCt2KzEuMA..     
+id_a_f_2       :robot/1.0 (linux) ( admin e-mail: undefined http://www.neofonie.de/loesungen/search/robot.html )       neofonie search robot Germany   R               http://www.neofonie.de/loesungen/search/        
+id_a_f_12      A-Online Search A-Online.at robot - now Jet2Web Search  R               http://www.jet2web.net/portal   
+id_a_f_090707_1        A1 Keyword Research/1.0.2 (+http://www.micro-sys.dk/products/keyword-research/) miggibot/2007.03.27     A1 Keyword Research - search engine and keyword optimization software   C               http://www.micro-sys.dk/products/keyword-research/      
+id_a_f_100906_1        A1 Sitemap Generator/1.0 (+http://www.micro-sys.dk/products/sitemap-generator/) miggibot/2006.01.24     MiggiBot website crawler engine - A1 Sitemap Generator  R               http://www.micro-sys.dk/products/sitemap-generator/     http://www.micro-sys.dk/developer/miggibot/
+id_a_f_250408_2        aardvark-crawler        Aardvark web crawler for Sun's Blog recommendations     R       192.9.71.7x     http://blogs.sun.com/plamere/   
+id_a_f_13      AbachoBOT       Abacho / Crawler.de robot       R               http://www.abacho.com   
+id_a_f_14      AbachoBOT (Mozilla compatible)  Abacho / Crawler.de robot       R               http://www.abacho.com   
+id_a_f_15      ABCdatos BotLink/5.xx.xxx#BBL   ABCdatos - Castilian program & tutorial directory       R               http://www.abcdatos.com 
+id_a_f_16      Aberja Checkomat        Aberja Hybridsuchmaschine (Germany) link checking       R               http://www.aberja.de    
+id_a_f_17      abot/0.1 (abot; http://www.abot.com; abot@abot.com)     Nameprotect copyright search robot (24.177.134.x)       R       s. also - np/0.1_(np;_http://www.nameprotect.com... - aipbot/1.0 (aipbot; http://www.aipbot.com...      http://www.nameprotect.com/     
+id_a_f_18      About/0.1libwww-perl/5.47       About robot     R               http://www.about.com    
+id_a_f_051206_3        Accelatech RSSCrawler/0.4       Accela Technology RSS feed crawler      R       125.100.242.2xx http://www.accelatech.com/      
+id_a_f_19      accoona Accoona Search robot    R       65.17.255.xx    http://www.accoona.com  
+id_a_f_20      Accoona-AI-Agent/1.1.1 (crawler at accoona dot com)     Accoona Search robot    R       65.17.255.xx    http://www.accoona.com  
+id_a_f_140906_3        Accoona-AI-Agent/1.1.2 (aicrawler at accoonabot dot com)        Accoona Search robot    R       65.17.255.xx    http://www.accoona.com  
+id_a_f_21      Ace Explorer    Ace Explorer - IE based browser B               http://www.aceexplorer.com      
+id_a_f_280806_1        Ack (http://www.ackerm.com/)    Ackerm search robot     R       64.74.153.xx    http://www.ackerm.com/  
+id_a_f_22      AcoiRobot       Acoi picture finder robot       R               http://monetdb.cwi.nl/acoi/projects.html        
+id_a_f_23      Acoon Robot v1.50.001   Acoon.de search (Germany) robot R       80.237.153.10x  http://www.acoon.de     
+id_a_f_24      Acoon Robot v1.52 (http://www.acoon.de) Acoon.de search (Germany) robot R       80.237.153.10x  http://www.acoon.de     
+id_a_f_100508_1        Acoon-Robot 4.0.x.[xx] (http://www.acoon.de)    Acoon.de search (Germany) robot R       80.237.209.xx   http://www.acoon.de     
+id_a_f_010108_1        Acoon-Robot v3.xx (http://www.acoon.de and http://www.acoon.com)        Acoon.de search (Germany) robot R       80.237.153.10x  http://www.acoon.de     
+id_a_f_110507_1        Acorn/Nutch-0.9 (Non-Profit Search Engine; acorn.isara.org; acorn at isara dot org)     Acorn Search Project    R       124.157.145.1xx http://acorn.no-ip.org/ 
+id_a_f_25      ActiveBookmark 1.x      LibMaster.com Active Bookmark HTML page creator C B             http://www.libmaster.com/software.php   
+id_a_f_060806_2        Activeworlds    Activeworlds 3D homepage browser        B               http://www.activeworlds.com     
+id_a_f_26      ActiveWorlds/3.xx (xxx) Activeworlds 3D homepage browser        B               http://www.activeworlds.com     
+id_a_f_27      Ad Muncher v4.xx.x      Ad Muncher - banner killer      P               http://www.admuncher.com/       
+id_a_f_28      Ad Muncher v4x Build xxxxx      Ad Muncher - banner killer      P               http://www.admuncher.com/       
+id_a_f_061006_1        Adaxas Spider (http://www.adaxas.net/)  website directory adaxas link checking  C       85.10.199.xx    http://www.adaxas.net/  
+id_a_f_29      Advanced Browser (http://www.avantbrowser.com)  Avant Browser - IE based browser        B               http://www.avantbrowser.com     
+id_a_f_30      AESOP_com_SpiderMan     Aesop robot     R               http://www.aesop.com    
+id_a_f_31      agadine/1.x.x (+http://www.agada.de)    Agada search (Germany) robot    R       s. also Mozilla/4.0 (agadine3.0)        http://www.agada.de     
+id_a_f_32      Agent-SharewarePlazaFileCheckBot/2.0+(+http://www.SharewarePlaza.com)   SharewarePlaza link checking    R               http://www.sharewareplaza.com   
+id_a_f_33      AgentName/0.1 libwww-perl/5.48  Linkomatic submission verifier  R               http://www.linkomatic.com/      
+id_a_f_34      AIBOT/2.1 By +(www.21seek.com A Real artificial intelligence search engine China)       21seek.com (China) robot (218.17.90.xxx)        R               http://www.21seek.com   
+id_a_f_130807_1        AideRSS/1.0 (aiderss.com)       AideRss - Postrank RSS and Blog filtering       C       72.44.35.2xx    http://www.aiderss.com/ 
+id_a_f_35      aipbot/1.0 (aipbot; http://www.aipbot.com; aipbot@aipbot.com)   Nameprotect copyright search robot (24.177.134.x)       R       s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...    http://www.nameprotect.com/     
+id_a_f_36      aipbot/2-beta (aipbot dev; http://aipbot.com; aipbot@aipbot.com)        Nameprotect copyright search robot (24.177.134.x)       R       s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...    http://www.nameprotect.com/     
+id_a_f_291108_1        Akregator/1.2.9; librss/remnants        Akregator news feed reader for KDE      B               http://akregator.kde.org/       
+id_a_f_37      Aladin/3.324    Aladin robot    R               http://www.aladin.de    
+id_a_f_180408_1        Alcatel-BG3/1.0 UP.Browser/5.0.3.1.2    Phone.com UP.Browser for mobiles on Alcatel cellphone   B               http://www.openwave.com 
+id_a_f_38      Aleksika Spider/1.0 (+http://www.aleksika.com/) Aleksika Danmark - Search engine optimization spider    R               http://www.aleksika.com 
+id_a_f_291108_2        AlertInfo 2.0 (Powered by Newsbrain)    Alertinfo - French version of Feedreader 3.xx   B               http://www.feedreader.com/      http://www.geste.fr/alertinfo/home.html
+id_a_f_39      AlkalineBOT/1.3 Vestris robot   R               http://alkaline.vestris.com/    
+id_a_f_40      AlkalineBOT/1.4 (1.4.0326.0 RTM)        Vestris robot   R               http://alkaline.vestris.com/    
+id_a_f_41      Allesklar/0.1 libwww-perl/5.46  Allesklar.de robot      R               http://www.allesklar.de 
+id_a_f_42      Alligator 1.31 (www.nearsoftware.com)   Alligator download manager      D               http://www.nearsoftware.com     
+id_a_f_011108_1        Allrati/1.1 (+) Unknown robot from Allrati.com  R       67.205.96.xxx/67.205.104.xx     http://www.allrati.com/ 
+id_a_f_43      AltaVista Intranet V2.0 AVS EVAL search@freeit.com      Altavista robot R               http://www.altavista.com        
+id_a_f_44      AltaVista Intranet V2.0 Compaq Altavista Eval sveand@altavista.net      Altavista robot R               http://www.altavista.com        
+id_a_f_45      AltaVista Intranet V2.0 evreka.com crawler@evreka.com   Altavista robot R               http://www.altavista.com        
+id_a_f_46      AltaVista V2.0B crawler@evreka.com      Altavista robot R               http://www.altavista.com        
+id_a_f_280209_1        amaya/x.xx libwww/x.x.x Amaya - W3C's Editor/Browser    B               http://www.w3.org/Amaya/        
+id_a_f_47      AmfibiBOT       Amfibi Search robot     R       64.111.217.9x   http://www.amfibi.com/  
+id_a_f_48      Amfibibot/0.06 (Amfibi Web Search; http://www.amfibi.com; agent@amfibi.com)     Amfibi Search robot     R       64.111.217.9x   http://www.amfibi.com/  
+id_a_f_141105_2        Amfibibot/0.07 (Amfibi Robot; http://www.amfibi.com; agent@amfibi.com)  Amfibi Search robot     R       64.111.217.9x   http://www.amfibi.com/  
+id_a_f_49      amibot  amibot - Amidalla search engine robot (62.241.33.xx)    R       s. also libwww-perl/5.65        http://www.amidalla.com/        
+id_a_f_50      Amiga-AWeb/3.4.167SE    AWeb Amiga browser      B               http://www.amitrix.com/aweb.html        
+id_a_f_51      AmigaVoyager/3.4.4 (MorphOS/PPC native) Voyager - Amiga browser B               http://www.vapor.com/voyager/   
+id_a_f_091205_1        AmiTCP Miami (AmigaOS 2.04)     Amiga Miami TCP Stack                   http://home.ptd.net/~strdustr/amirc/Netware.html        
+id_a_f_210608_1        Amoi 8512/R21.0 NF-Browser/3.3  NF embedded browser on Amois Skypephone B               http://3skypephone.com/ 
+id_a_f_190206_3        amzn_assoc      Amazon.com robot for checking their affiliate sites     C       s. also aranhabot               
+id_a_f_52      AnnoMille spider 0.1 alpha - http://www.annomille.it    Annomille Italian historical oriented robot     R               http://www.annomille.it 
+id_a_f_53      annotate_google; http://ponderer.org/download/annotate_google.user.js   annotate Google - Firefox extension for annotating Google search results        B               http://ponderer.org/annotate_google     
+id_a_f_54      Anonymized by ProxyOS: http://www.megaproxy.com Megaproxy user  P               http://www.megaproxy.com        
+id_a_f_55      Anonymizer/1.1  faked user agent                                
+id_a_f_56      AnswerBus (http://www.answerbus.com/)   AnswerBus natural language search using COLLATE technology      R               http://www.answerbus.com        http://collate.dfki.de/kurzdarstellung.html
+id_a_f_57      AnswerChase PROve x.0   AnswerChase search tool                 http://www.answerchase.com      
+id_a_f_58      AnswerChase x.0 AnswerChase search tool                 http://www.answerchase.com      
+id_a_f_59      ANTFresco/x.xx  ANT Fresco Browser      B       s. also Mozilla/x.xx (compatible; ANTFresco....)        http://www.antlimited.com/products/fresco.htm   
+id_a_f_60      antibot-V1.1.5/i586-linux-2.2   Antibot (discontinued) robot    R               http://www.antidot.net  
+id_a_f_61      AnzwersCrawl/2.0 (anzwerscrawl@anzwers.com.au;Engine)   Anzwers (Yahoo) Australia robot R               http://au.anzwers.yahoo.com/    
+id_a_f_030206_1        Apexoo Spider 1.x       Apexoo Search spider    R       216.240.143.xx  http://www.apexoo.com/  
+id_a_f_62      Aplix HTTP/1.0.1        JavaOS app. for SEGA Saturn Internet and Sanyo Internet-TV      B                       
+id_a_f_63      Aplix_SANYO_browser/1.x (Japanese)      JavaOS app. for Sanyo Internet-TV       B                       
+id_a_f_64      Aplix_SEGASATURN_browser/1.x (Japanese) JavaOS app. for SEGA Saturn Internet    B                       
+id_a_f_65      Aport   Aport robot     R               http://www.aport.ru     
+id_a_f_66      appie 1.1 (www.walhello.com)    Walhello Internet Search robot  R               http://www.walhello.com 
+id_a_f_140608_1        Apple iPhone v1.1.4 CoreMedia v1.0.0.4A102      CoreMedia player on Apple iPhone        B               http://www.apple.com/iphone/    
+id_a_f_070209_1        Apple-PubSub/65.1.1     PubSub - Mac OS X utility for managing RSS/Atom subscriptions via the PubSub framework  B               http://developer.apple.com/documentation/Darwin/Reference/ManPages/man1/pubsub.1.html   
+id_a_f_120707_1        ArabyBot (compatible; Mozilla/5.0; GoogleBot; FAST Crawler 6.4; http://www.araby.com;)  Araby search - Arabia   R       209.85.31.2xx   http://www.araby.com/   
+id_a_f_260608_1        ArachBot        Covac Arachnid Web Crawler      R       s.also Covac TexAs Arachbot     http://www.covac-software.com/  
+id_a_f_67      Arachnoidea (arachnoidea@euroseek.com)  Euroseek spider R               http://www.euroseek.com 
+id_a_f_190206_2        aranhabot       Amazon.com robot for checking their affiliate sites     C       s. also amzn_assoc              
+id_a_f_68      ArchitextSpider Excite spider   R               http://www.excite.com   
+id_a_f_69      archive.org_bot Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R       s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...  http://www.archive.org/ 
+id_a_f_70      Argus/1.1 (Nutch; http://www.simpy.com/bot.html; feedback at simpy dot com)     Simpy Bookmarklet crawler (69.55.233.xx)        C       s. also Simpy   http://www.simpy.com/   
+id_a_f_031205_1        Arikus_Spider   Arikus inContext search engine software R               http://www.arikus.com/inContext-enterprise.html 
+id_a_f_210208_1        Arquivo-web-crawler (compatible; heritrix/1.12.1 +http://arquivo-web.fccn.pt)   Tomba project: the Portuguese web archive       R       193.136.192.xx  http://arquivo-web.fccn.pt/     http://arquivo-web.fccn.pt/crawler?set_language=en
+id_a_f_251007_1        ASAHA Search Engine Turkey V.001 (http://www.asaha.com/)        Asaha search robot (Turkey)     R       62.68.194.2xx   http://www.asaha.com/   
+id_a_f_71      Asahina-Antenna/1.x     ASAHINA Antenna information detecting agent     R               http://masshy.fastwave.gr.jp/hina/release/      
+id_a_f_72      Asahina-Antenna/1.x (libhina.pl/x.x ; libtime.pl/x.x)   ASAHINA Antenna information detecting agent     R               http://masshy.fastwave.gr.jp/hina/release/      
+id_a_f_73      ask.24x.info    Ask 24x Info robot      R               http://ask.24x.info/    
+id_a_f_74      AskAboutOil/0.06-rcp (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@askaboutoil.com)        Ask About Oil - Petroleum related search (24.227.212.xxx) using Nutch   R               http://askaboutoil.com/search.jsp       http://www.nutch.org
+id_a_f_120806_1        asked/Nutch-0.8 (web crawler; http://asked.jp; epicurus at gmail dot com)       askEd! / Inferret search (Japan) robot using Nutch      R       131.112.125.1xx http://asked.jp/        
+id_a_f_75      ASPSeek/1.2.5   ASPSeek search engine software -Yahoo-Inc. / Telecom Canada robot       R               http://www.aspseek.org  
+id_a_f_76      ASPseek/1.2.9d  Swsoft.net robot using Aspseek  R               http://www.aspseek.com  
+id_a_f_77      ASPSeek/1.2.x   ASPSeek search engine software  R               http://www.aspseek.org  
+id_a_f_78      ASPSeek/1.2.xa  ASPSeek search engine software  R               http://www.aspseek.org  
+id_a_f_79      ASPseek/1.2.xx  ASPSeek search engine software  R               http://www.aspseek.org  
+id_a_f_80      ASPSeek/1.2.xxpre       ASPSeek search engine software  R               http://www.aspseek.org  
+id_a_f_81      ASSORT/0.10     Associative Sort robot  R       site is down    http://pcmath126.unice.fr/assort-robot.html     
+id_a_f_82      asterias/2.0    Singingfish media spider (64.12.186.2xx) via AOL search R       s. also Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler ...      http://search.singingfish.com/sfw/home.jsp      
+id_a_f_83      AtlocalBot/1.1 +(http://www.atlocal.com/local-web-site-owner.html)      Atlocal local business search robot     R               http://www.atlocal.com/ 
+id_a_f_041207_2        Atomic_Email_Hunter/4.0 Atomic Email Hunter email extracing and harvesting      S                       
+id_a_f_84      Atomz/1.0       Atomz robot     R               http://www.atomz.com    
+id_a_f_85      atSpider/1.0    atSpider (ceased) email harvester / spambot     S                       
+id_a_f_060707_1        Attentio/Nutch-0.9-dev (Attentio's beta blog crawler; www.attentio.com; info@attentio.com)      Attentio social media monitoring and analysing  R       85.88.35.xx     http://www.attentio.com/        
+id_a_f_231105_2        AU-MIC/2.0 MMP/2.0      Samsung SPH-A660 phone with Sprint software     B               http://www1.sprintpcs.com/explore/showcase/Showcase.jsp?scTopic=pcsVision       
+id_a_f_240208_1        AUDIOVOX-SMT5600        Audiovox SMT5600 (AT&T) Smartphone mobile phone browser B               http://www.audiovox.com/        http://www.audiovox.com/manuals/owners/SMT%205600%20QSG%209-7%20FINAL.pdf
+id_a_f_86      augurfind       Augurnet Swiss (was www.augurnet.ch) search robot       R                       
+id_a_f_87      augurnfind V-1.x        Augurnet Swiss (was www.augurnet.ch) search robot       R                       
+id_a_f_88      autoemailspider Auto Email Pro Email harvester  S       was http://autoemailspider.com - site is dead           
+id_a_f_89      autohttp        Linkscan tool from Elsop        C       s. Linkscan/x ? http://www.elsop.com/linkscan/  
+id_a_f_050208_1        autowebdir 1.1 (www.autowebdir.com)     Autowebdir - The Automatically Generated Web Directory  R       84.104.43.x     http://www.autowebdir.com/      
+id_a_f_90      AV Fetch 1.0    Altavista robot ??      R               http://www.altavista.com/       
+id_a_f_91      Avant Browser (http://www.avantbrowser.com)     Avant Browser - IE based browser        B               http://www.avantbrowser.com     
+id_a_f_92      AVSearch-1.0(peter.turney@nrc.ca)       National Research Council Canada robot  R               http://www.nrc-cnrc.gc.ca/main_e.html   
+id_a_f_93      AVSearch-2.0-fusionIdx-14-CompetitorWebSites    Unknown robot from 205.203.108.xx (telerate.com)                                
+id_a_f_94      AVSearch-3.0(AltaVista/AVC)     Altavista robot R               http://www.altavista.com/       
+id_a_f_95      AWeb    AWeb Amiga browser      B               http://aweb.sunsite.dk/ 
+id_a_f_96      axadine/ (Axadine Crawler; http://www.axada.de/; )      Axada search Germany robot      R               http://www.axada.de     
+id_a_f_97      AxmoRobot - Crawling your site for better indexing on www.axmo.com search engine.       Axmo search robot       R               http://www.axmo.com     
+id_a_f_250306_1        Azureus 2.x.x.x Azureus Java BitTorrent Client  D               http://azureus.sourceforge.net/ 
+id_a_f_131208_1        BabalooSpider/1.3 (BabalooSpider; http://www.babaloo.si; spider@babaloo.si)     Babaloo search robot (Slovenia) R       84.255.237.2xx  http://www.babaloo.si/  
+id_a_f_98      BaboomBot/1.x.x (+http://www.baboom.us) BaBoom Web Portal (ODP) robot (66.98.254.xx)    R               http://www.baboom.us    
+id_a_f_050406_1        BackStreet Browser 3.x  BackStreet Browser - Offline browser / website downloader       D               http://www.spadixbd.com/backstreet/     
+id_a_f_140508_1        BaiduImagespider+(+http://www.baidu.jp/search/s308.html)        Baidu search (Japan) image crawler      R       119.63.193.94.[x]xx     http://www.baidu.jp/    
+id_a_f_99      BaiDuSpider     Baidu spidering engine - used by diff. IPs      R               http://www.baidu.com    
+id_a_f_080608_1        Baiduspider+(+http://help.baidu.jp/system/05.html)      Baidu spidering engine - used by diff. IPs      R               http://www.baidu.com    
+id_a_f_100     Baiduspider+(+http://www.baidu.com/search/spider.htm)   Baidu spidering engine - used by diff. IPs      R               http://www.baidu.com    
+id_a_f_080407_1        Baiduspider+(+http://www.baidu.com/search/spider_jp.html)       Baidu search (Japan) crawler    R       119.63.193.[x]xx        http://www.baidu.jp     
+id_a_f_031107_1        Balihoo/Nutch-1.0-dev (Crawler for Balihoo.com search engine - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com) Balihoo - Vertical search engine crawler (beta) R               http://www.balihoo.com/ http://www.balihoo.com/pdfs/BalihooFactSheet.pdf
+id_a_f_101     BanBots/1.2 (spider@banbots.com)        Project BanBots Perl script robot       C       s. also Mozilla/5.0 (compatible; BanBots/2.0b.. http://www.banbots.com/ 
+id_a_f_140506_3        Barca/2.0.xxxx  Barca Pro email & PIM software  B               http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54 
+id_a_f_120206_2        BarcaPro/1.4.xxxx       Barca Pro email & PIM software  B               http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54 
+id_a_f_102     BarraHomeCrawler (albertof@barrahome.org)       Barrahome crawler       R       64.246.56.xx    http://www.barrahome.org        
+id_a_f_011006_1        bCentral Billing Post-Process   Unknown user agent from Microsoft               204.71.191.1xx          
+id_a_f_103     bdcindexer_2.6.2 (research@bdc) Business.com robot      R       208.144.233.xxx http://www.business.com 
+id_a_f_104     BDFetch Brandimensions Brand Protection robot   R               http://www.brandimensions.com/  
+id_a_f_105     BDNcentral Crawler v2.3 [en] (http://www.bdncentral.com/robot.html) (X11; I; Linux 2.0.44 i686) Bdncentral Sitesearch robot     R               http://www.bdncentral.com       
+id_a_f_111205_3        BeamMachine/0.5 (dead link remover of www.beammachine.net)      beammachine web directory (Germany) link checking       R C             http://www.beammachine.net/de/  
+id_a_f_106     beautybot/1.0 (+http://www.uchoose.de/crawler/beautybot/)       Beauty robot for Cosmoty - German beauty and wellness search    R               http://www.cosmoty.de   http://www.uchoose.de/Projekte/Lifestyle/beauty/
+id_a_f_230406_1        BebopBot/2.5.1 ( crawler http://www.apassion4jazz.net/bebopbot.html )   A Passion for Jazz music related search robot   R       68.6.204.2xx    http://www.apassion4jazz.net/   
+id_a_f_107     BeebwareDirectory/v0.01 LinkcheckerBeepware (site is down) web directory link checking  C               http://directory.beebware.co.uk 
+id_a_f_108     Big Brother (http://pauillac.inria.fr/~fpottier/)       Big Brother link checking tool  C               http://pauillac.inria.fr        
+id_a_f_130606_1        Big Fish v1.0   GoonGee.com link popularity checking    C       216.89.111.x    http://www.goongee.com/big-fish/        
+id_a_f_109     BigBrother/1.6e BB4 network monitoring  C               http://www.bb4.com      
+id_a_f_110     BigCliqueBOT/1.03-dev (bigclicbot; http://www.bigclique.com; bot@bigclique.com) BigClique Search robot  R               http://www.bigclique.com        
+id_a_f_080206_4        BIGLOTRON (Beta 2;GNU/Linux)    Biglotron search (France) robot R               http://www.biglotron.com/       
+id_a_f_171106_2        Bigsearch.ca/Nutch-x.x-dev (Bigsearch.ca Internet Spider; http://www.bigsearch.ca/; info@enhancededge.com)      Bigsearch.ca search robot       R       72.0.207.1xx    http://www.bigsearch.ca/        
+id_a_f_111     Bilbo/2.3b-UNIX Bilbo - web frontend for the Nessus Security Scanner    C               http://home.broadpark.no/%7Etnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html  
+id_a_f_170806_1        BilgiBetaBot/0.8-dev (bilgi.com (Beta) ; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)        Bilgi.com (Beta) search robot - Turkey  R       212.156.230.2xx http://www.bilgi.com/   
+id_a_f_080607_1        BilgiBot/1.0(beta) (http://www.bilgi.com/; bilgi at bilgi dot com)      Bilgi.com (Beta) search robot - Turkey  R       212.156.230.2xx http://www.bilgi.com/   
+id_a_f_112     billbot wjj@cs.cmu.edu  Carnegie Mellon School robot/link checking ?    C               http://www.cs.cmu.edu   
+id_a_f_050206_3        Bitacle bot/1.1 Bitacle Blog Search Archive robot       R               http://bitacle.org/     
+id_a_f_050206_2        Bitacle Robot (V:1.0;) (http://www.bitacle.com) Bitacle Blog Search Archive robot       R               http://bitacle.org/     
+id_a_f_113     Biyubi/x.x (Sistema Fenix; G11; Familia Toledo; es-mx)  Biyubi Navigator - Mexican browser for Fenix OS B               http://www.biyubi.com   
+id_a_f_114     BlackBerry7520/4.0.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/5.0.3.3 UP.Link/5.1.2.12 (Google WAP Proxy/1.0) Blackberry Wireless Internet browser via Google WAP Proxy       B P             http://www.blackberry.com/products/service/web.shtml    http://www.openwave.com
+id_a_f_115     BlackWidow      FS Consulting (was www.fsconsult.net) Black Widow web crawler   R                       
+id_a_f_010306_1        BlackWidow      BlackWidow web site scanner / downloading tool  D               http://www.softbytelabs.com/BlackWidow  
+id_a_f_116     Blaiz-Bee/1.0 (+http://www.blaiz.net)   Blaiz Enterprises RawGrunt search       R       203.87.123.1xx  http://www.rawgrunt.com/        http://www.blaiz.net
+id_a_f_160307_1        Blaiz-Bee/2.00.8222 (BE Internet Search Engine http://www.rawgrunt.com) Blaiz Enterprises RawGrunt search       R       203.87.123.1xx  http://www.rawgrunt.com/        http://www.blaiz.net
+id_a_f_240706_1        Blaiz-Bee/2.00.xxxx (+http://www.blaiz.net)     Blaiz Enterprises RawGrunt search       R       203.87.123.1xx  http://www.rawgrunt.com/        http://www.blaiz.net
+id_a_f_117     BlitzBOT@tricus.net     Blitzsuche Germany robot        R               http://blitzsuche.rp-online.de/ 
+id_a_f_118     BlitzBOT@tricus.net (Mozilla compatible)        Blitzsuche Germany robot        R               http://blitzsuche.rp-online.de/ 
+id_a_f_090307_1        BlockNote.Net   BlockNote web page editor       B               http://blocknote.net/   
+id_a_f_119     BlogBot/1.x     blogdex robot from MIT.edu      R               http://blogdex.media.mit.edu/   
+id_a_f_071206_1        BlogBridge 2.13 (http://www.blogbridge.com/)    BlogBridge RSS reader   B               http://www.blogbridge.com/      
+id_a_f_120     Bloglines Title Fetch/1.0 (http://www.bloglines.com)    Bloglines article search        R       65.214.44.xx    http://www.bloglines.com        
+id_a_f_250907_1        Bloglines-Images/0.1 (http://www.bloglines.com) Bloglines graphics crawler      R       65.214.44.xx    http://www.bloglines.com        
+id_a_f_011108_2        Bloglines/3.1 (http://www.bloglines.com)        Bloglines news crawler  R       65.214.44.xx    http://www.bloglines.com        
+id_a_f_071206_2        BlogMap (http://www.feedmap.net)        FeedMap / BlogMap geo coding service    C               http://www.feedmap.net/BlogMap/ 
+id_a_f_121     Blogpulse (info@blogpulse.com)  Intelliseek's BlogPulse blog search     R       64.158.138.xx   http://www.blogpulse.com        
+id_a_f_050208_2        BlogPulseLive (support@blogpulse.com)   Intelliseek's BlogPulse blog search     R       64.158.138.xx   http://www.blogpulse.com        
+id_a_f_161206_2        BlogSearch/1.x +http://www.icerocket.com/       IceRocket Web search robot      R       s. also BlogzIce ...    http://www.icerocket.com        
+id_a_f_020707_1        blogsearchbot-pumpkin-3 Art of Computing blog search project    R       88.198.44.2xx   http://artofcomputing.net/blog/?p=4     
+id_a_f_241205_1        BlogsNowBot, V 2.01 (+http://www.blogsnow.com/) BlogsNow realtime link tracker robot    R               http://www.blogsnow.com/        
+id_a_f_261107_1        BlogVibeBot-v1.1 (spider@blogvibe.nl)   BlogVipe news and Blog crawler (Netherlands)    R       212.61.21.xx    http://www.blogvibe.nl  
+id_a_f_122     blogWatcher_Spider/0.1 (http://www.lr.pi.titech.ac.jp/blogWatcher/)     blogWatcher robot from Okumura Group Tokyo (131.112.182.xxx)    R               http://www.lr.pi.titech.ac.jp   
+id_a_f_123     BlogzIce/1.0 (+http://icerocket.com; rhodes@icerocket.com)      IceRocket Web search robot      R       s. also BlogSearch ...  http://www.icerocket.com        
+id_a_f_124     BlogzIce/1.0 +http://www.icerocket.com/ IceRocket Web search robot      R       s. also BlogSearch ...  http://www.icerocket.com        
+id_a_f_310108_1        BloobyBot       Blooby search (beta) robot      R       206.166.206.18x http://www.blooby.com/  
+id_a_f_270507_1        Bloodhound/Nutch-0.9 (Testing Crawler for Research - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com)   Balihoo - Search Engine for Advertising Media   R       204.228.230.xx  http://balihoo.com/     
+id_a_f_125     bluefish 0.6 HTML editor        Bluefish HTML-editor for Linux  B               http://bluefish.openoffice.nl/  
+id_a_f_126     BMCLIENT        Part of ButtMan remote access tool              seems to be a Trojan - see link http://www.glocksoft.com/trojan_list/ButtMan.htm        
+id_a_f_120506_1        BMLAUNCHER      Bookmark Express bookmark manager       C       Website is dead - was:  http://www.bookmarkexpress.com/ 
+id_a_f_127     Bobby/4.0.x RPT-HTTPClient/0.3-3E       Bobby web accessibility desktop testing tool    C               http://bobby.watchfire.com/bobby/html/en/index.jsp      
+id_a_f_128     boitho.com-dc/0.xx (http://www.boitho.com/dcbot.html)   Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx   R               http://www.boitho.com   
+id_a_f_129     boitho.com-robot/1.x    Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx   R               http://www.boitho.com   
+id_a_f_130     boitho.com-robot/1.x (http://www.boitho.com/bot.html)   Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx   R               http://www.boitho.com   
+id_a_f_060806_1        Bookdog/x.x     Bookdog - Mac bookmark manager  C               http://www.sheepsystems.com/bookdog/    
+id_a_f_131     Bookmark Buddy bookmark checker (http://www.bookmarkbuddy.net/) Bookmark Buddy - favorite bookmark manager      C               http://www.bookmarkbuddy.net    
+id_a_f_132     Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/]       Favourites managing program     C               http://www.bookmark.ne.jp       
+id_a_f_230807_1        Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/] (Version 2.0beta)     Favourites managing program     C               http://www.bookmark.ne.jp       
+id_a_f_300408_1        BookmarkBase(2/;http://bookmarkbase.com)        Bookmark Base bookmark manager  C               http://www.bookmarkbase.com/    
+id_a_f_133     Bot mailto:craftbot@yahoo.com   cybercity.fr user robot / faked user agent ?                            
+id_a_f_160308_1        BPImageWalker/2.0 (www.bdbrandprotect.com)      BD-Brandprotect copyright infringement crawler  R       72.14.164.1xx   http://www.bdbrandprotect.com/  http://www.bdbrandprotect.com/solutions_5.html
+id_a_f_134     BravoBrian bstop.bravobrian.it  BravoBrian bSTOP parental control       P R     s. also BStop   http://bstop.bravobrian.it/     
+id_a_f_135     BravoBrian SpiderEngine MarcoPolo       Robot for BravoBrian bSTOP      R       s. also BStop   http://bstop.bravobrian.it/     
+id_a_f_220508_1        BrightCrawler (http://www.brightcloud.com/brightcrawler.asp)    BrightCloud web filtering for classifying websites      P R             http://www.brightcloud.com/brightcrawler.asp    
+id_a_f_136     BruinBot (+http://webarchive.cs.ucla.edu/bruinbot.html) Webarchive Project Bruinbot crawler     R               http://webarchive.cs.ucla.edu   
+id_a_f_137     BSDSeek/1.0     Inktomi (Hotbot-Lycos NBCi) robot       R               http://www.inktomi.com/ 
+id_a_f_138     BStop.BravoBrian.it Agent Detector      BravoBrian bSTOP parental control       P R     s. also BravoBrian ..   http://bstop.bravobrian.it/     
+id_a_f_139     BTbot/0.x (+http://www.btbot.com/btbot.html)    BitTorrent Search Engine btbot robot    R               http://www.btbot.com    
+id_a_f_300408_2        BTWebClient/180B(9704)  µTorrent BitTorrent Client     D               http://www.utorrent.com/        
+id_a_f_080407_2        BuildCMS crawler (http://www.buildcms.com/crawler)      BuildCMS crawler - market monitoring project of BuildCMS        R       194.24.253.xx   http://www.buildcms.com/index.php       http://www.buildcms.com/about_us/crawler
+id_a_f_051206_4        Bulkfeeds/r1752 (http://bulkfeeds.net/) Bulkfeeds: RSS directory link checking  C       202.181.96.2xx  http://bulkfeeds.net/   
+id_a_f_140     BullsEye        BullsEye/Intelliseek robot      R               http://www.intelliseek.com/be/bullseye.htm      
+id_a_f_141     bumblebee@relevare.com  Relevare Portal software robot  R               http://www.relevare.com 
+id_a_f_142     BunnySlippers   Microsoft server information robot (see link)   C               http://www.webmasterworld.com/forum11/841.htm   
+id_a_f_070606_1        BurstFindCrawler/1.1 (crawler.burstfind.com; http://crawler.burstfind.com; crawler@burstfind.com)       BurstFind search crawler (64.34.172.xx) R               http://www.burstfind.com/       
+id_a_f_143     Buscaplus Robi/1.0 (http://www.buscaplus.com/robi/)     Buscaplus (Spain) robot R               http://www.buscaplus.com        
+id_a_f_050807_2        BW-C-2.0        Logitech Desktop Managers (LDM) Backweb (BW) update check       D               http://www.logitech.com/index.cfm/494/3041&cl=de,de     
+id_a_f_140508_2        bwh3_user_agent Basic Web Hacking 3 fake user-agent from Hellbound Hackers challenges   S               http://www.hellboundhackers.org/forum/_basic_web_hacking_3-7-6960_0.html        http://vuau.wordpress.com/2008/03/12/hbh-basic-web-3-switch-user-agent/
+id_a_f_140508_3        Cabot/Nutch-0.9 (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)   Amfibi Search robot     R       64.111.217.9x   http://www.amfibi.com/  
+id_a_f_280508_1        Cabot/Nutch-1.0-dev (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)       Amfibi Search robot     R       64.111.217.9x   http://www.amfibi.com/  
+id_a_f_140506_4        CamelHttpStream/1.0     Evolution integrated mail solution Camel TCP stream class                       http://www.gnome.org/projects/evolution/        http://go-evolution.org/Camel.Stream
+id_a_f_144     Cancer Information and Support International;   Some user agent                         
+id_a_f_110206_1        carleson/1.0    Cosmix project crawler (204.14.48.x / 38.113.234.xxx)   R       s. also - voyager/1.x - cfetch/1.       http://www.cosmixcorp.com/      
+id_a_f_145     Carnegie_Mellon_University_Research_WebBOT-->PLEASE READ-->http://www.andrew.cmu.edu/~brgordon/webbot/index.html http://www.andrew.cmu.edu/~brgordon/webbot/index.html  Carnegie Mellon University WebBOT       R               http://www.andrew.cmu.edu       
+id_a_f_146     Carnegie_Mellon_University_WebCrawler http://www.andrew.cmu.edu/~brgordon/webbot/index.html     Carnegie Mellon University WebBOT       R               http://www.andrew.cmu.edu       
+id_a_f_170206_1        Catall Spider   Catall.de search & web directory (Germany)      R               http://www.catall.de/   
+id_a_f_130807_3        CazoodleBot/CazoodleBot-0.1 (CazoodleBot Crawler; http://www.cazoodle.com/cazoodlebot; cazoodlebot@cazoodle.com)        UIUCs Cazoodle search based on MetaQuerier      R       72.36.94.1xx    http://www.cazoodle.com/        http://metaquerier.cs.uiuc.edu/
+id_a_f_290308_1        CCBot/1.0 (+http://www.commoncrawl.org/bot.html)        CommonCrawl Foundation search crawler   R       38.103.63.1[6-8]        http://www.commoncrawl.org/faq.htm      
+id_a_f_147     ccubee/x.x      Empyreum Ccubee (Czech) search engine solution  R               http://empyreum.com/technologies/ccubee 
+id_a_f_010108_2        CDR/1.7.1 Simulator/0.7(+http://timewe.net) Profile/MIDP-1.0 Configuration/CLDC-1.0     Timewe mobile browser (WAP) simulator (Japan)   B       61.142.xx.x[xx] http://timewe.net/      
+id_a_f_291105_6        CE-Preload      Cisco Content Engine    P               http://www.cisco.com/en/US/products/hw/contnetw/index.html      
+id_a_f_100408_4        CentiverseBot   Nordic semantic search engine   C       87.72.214.9x    http://www.centiverse-project.net/post/Educating-the-bots.aspx  
+id_a_f_180408_2        CentiverseBot - investigator    Nordic semantic search engine   C       87.72.214.9x    http://www.centiverse-project.net/post/Educating-the-bots.aspx  
+id_a_f_180408_3        CentiverseBot/3.0 (http://www.centiverse-project.net)   Nordic semantic search engine   C       87.72.214.9x    http://www.centiverse-project.net/post/Educating-the-bots.aspx  
+id_a_f_148     Ceramic Tile Installation Guide (http://www.floorstransformed.com)      Floortransformed.com robot (link ckecking ??)   R               http://www.floorstransformed.com        
+id_a_f_131208_2        CERN-LineMode/2.15      CERN Line Mode Browser  B               http://www.w3.org/LineMode/     
+id_a_f_149     cfetch/1.0      Cosmix project crawler (204.14.48.x / 38.113.234.xxx)   R       s. also - voyager/1.x - carleson/1.x    http://www.cosmixcorp.com       
+id_a_f_150     CFNetwork/x.x   MaxOS X CoreFoundation CFNetwork API                    http://www.cocoadev.com/index.pl?CFNetwork      
+id_a_f_151     cg-eye interactive      cg-eye CGI checker      C               http://www.htmlhelp.com 
+id_a_f_152     Charon/1.x (Amiga)      Charon Amiga download manager   D               http://tesla.rcub.bg.ac.yu/%7Eantony/Charon/    
+id_a_f_131208_3        Chat Catcher/1.0        Chat Catcher blog monitoring robot      C       69.80.208.2xx   http://chatcatcher.com/cc/      
+id_a_f_153     Checkbot/1.xx LWP/5.xx  Checkbot link validation        C               http://degraaff.org/checkbot/   
+id_a_f_154     CheckLinks/1.x.x        Checklinks - Perl link checker  C               http://www.jmarshall.com        
+id_a_f_155     CheckUrl        NTL user agent                  http://www.ntl.com      
+id_a_f_156     CheckWeb        CheckWeb link validation        C               http://p.duby.free.fr/chkweb.htm        
+id_a_f_030206_2        Chilkat/1.0.0 (+http://www.chilkatsoft.com/ChilkatHttpUA.asp)   Chilkat HTTP component user-agent                       http://www.chilkatsoft.com/HttpDotNet.asp       
+id_a_f_230506_1        China Local Browse 2.6  Unknown spam bot from telekom.com.my (218.111.83.xxx)   S       see link:       http://linuxreviews.org/webdesign/602_Apache_Webalizer/ 
+id_a_f_170408_2        Chitika ContentHit 1.0  Chitika Inc. Blog advertising   C       67.15.219.[x]x  http://chitika.com/     
+id_a_f_157     ChristCRAWLER 2.0       Christcentral.com Christcrawler (was www.christcrawler.com)     R       - s. also Mozilla/4.0 (compatible; ChristCrawler..)             
+id_a_f_010607_2        CHttpClient by Open Text Corporation    CHttpClient - C++ class using WinInet                   http://www.codeproject.com/library/lyoulhttpclient.asp  
+id_a_f_158     CipinetBot (http://www.cipinet.com/bot.html)    CipinetBot -Cipinet Search Engine Web Crawler   R               http://www.cipinet.com  
+id_a_f_130108_1        Cityreview Robot (+http://www.cityreview.org/crawler/)  Cityreview regional search (Germany) link checking      C       88.198.212.5x   http://www.cityreview.de/       http://www.cityreview.org/crawler/
+id_a_f_159     CJ Spider/      Commision Junction link checking spider C               http://www.cj.com/      
+id_a_f_050606_1        CJB.NET Proxy   CJB Net anonymous socks proxy service (216.194.70.x)    P               http://proxy.cjb.net/   
+id_a_f_160     ClariaBot/1.0   Claria (ex Gator) SearchScout robot (64.152.73.xx)      R       s. also Diamond http://www.searchscout.com      
+id_a_f_161     Claymont.com    Claymont Search robot   R               http://www.claymont.com 
+id_a_f_100307_1        CloakDetect/0.9 (+http://fulltext.seznam.cz/)   Seznam Search (Czech Republic) robot    R       212.80.76.xx    http://www.seznam.cz/   
+id_a_f_162     Clushbot/2.x (+http://www.clush.com/bot.html)   Clush clustered search robot    R               http://www.clush.com    
+id_a_f_163     Clushbot/3.x-BinaryFury (+http://www.clush.com/bot.html)        Clush clustered search robot    R               http://www.clush.com    
+id_a_f_164     Clushbot/3.xx-Ajax (+http://www.clush.com/bot.html)     Clush clustered search robot    R               http://www.clush.com    
+id_a_f_165     Clushbot/3.xx-Hector (+http://www.clush.com/bot.html)   Clush clustered search robot    R               http://www.clush.com    
+id_a_f_166     Clushbot/3.xx-Peleus (+http://www.clush.com/bot.html)   Clush clustered search robot    R               http://www.clush.com    
+id_a_f_070506_1        COAST WebMaster Pro/4.x.x.xx (Windows NT)       COAST Webmaster - Web management and maintenance software       C               http://www.extablish.com/cwm.htm        
+id_a_f_150306_1        CoBITSProbe     Proposed Content-Based Image Tracking System (CoBITS) P2P crawler       R C             http://www.iis.sinica.edu.tw/~hungchi/CBIT/     
+id_a_f_167     Cocoal.icio.us/1.0 (v36) (Mac OS X; http://www.scifihifi.com/cocoalicious)      Cocoa del.icio.us (social bookmarks manager) client for Mac OS X        C               http://www.scifihifi.com        
+id_a_f_070209_2        Cogentbot/1.X (+http://www.cogentsoftwaresolutions.com/bot.html)        Cogent Search Bot from Cogent Software Solutions for unknown purposes   R       72.81.252.9x    http://www.cogentsoftwaresolutions.com/bot.html 
+id_a_f_168     ColdFusion      Cold Fusion server used by various IPs i.e.: - NetWORLD web catalogue link checking     P C             http://www.networld.com http://www.macromedia.com/software/coldfusion/
+id_a_f_169     ColdFusion (BookmarkTracker.com)        Cold Fusion server used by Bookmark Tracker - online favourites managment       C               http://www.bookmarktracker.com  http://www.macromedia.com/software/coldfusion/
+id_a_f_170     collage.cgi/1.xx        WebCollage Syndicator graphics crawler/collector        R D             http://www.webcollage.com       
+id_a_f_171     combine/0.0     Combine harvesting & indexing robot     R       130.235.4.xx    http://combine.it.lth.se/       
+id_a_f_080406_1        Combine/2.0 http://combine.it.lth.se/   Combine harvesting & indexing robot     R       130.235.4.xx    http://combine.it.lth.se/       
+id_a_f_160807_1        Combine/3 http://combine.it.lth.se/     Combine harvesting & indexing robot     R       130.235.4.xx    http://combine.it.lth.se/       
+id_a_f_172     Combine/x.0     Combine harvesting & indexing robot     R       130.235.4.xx    http://combine.it.lth.se/       
+id_a_f_280606_3        cometrics-bot, http://www.cometrics.de  cometrics Web Content Mining solution - Germany R               http://www.cometrics.de/        
+id_a_f_173     Commerce Browser Center Wildsoft Germany (closed) Internet client system user-agent (was www.oskarweb.de)       B                       
+id_a_f_240107_1        complex_network_group/Nutch-0.9-dev (discovering the structure of the world-wide-web; http://cantor.ee.ucla.edu/~networks/crawl; nimakhaj@gmail.com)    UCLA Complex Networks Groups Complex Network Analysis   C       216.182.233.1xx http://cantor.ee.ucla.edu/~networks/    
+id_a_f_174     Computer_and_Automation_Research_Institute_Crawler crawler@ilab.sztaki.hu       Hungarian Academy of Sciences data mining search        R               http://www.ilab.sztaki.hu/websearch/    
+id_a_f_010406_2        Comrite/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)   ComRite Chinese Search Engine for Oversea Web Sites (69.248.26.xx)      R       powered by Nutch        http://www.comrite.com/ http://meidong.comrite.com/
+id_a_f_175     Contact unknown                         
+id_a_f_200307_1        ContactBot/0.2  Probably E-Mail harvesting robot - same as LMQueueBot   S       64.124.152.xx           
+id_a_f_291105_7        ContentSmartz   ContentSmartz e-mail harvesting tools   S                       
+id_a_f_176     contype Internet Explorer versions 4.x and 5 plugin content     B       NOT Contype mime type managment Perl script     http://support.microsoft.com/default.aspx?scid=kb;en-us;293792  
+id_a_f_177     Convera Internet Spider V6.x    Converas RetrievalWare Internet Spider (63.241.61.x)    R       s. also - infoConveraCrawler... - CrawlConvera ...      http://www.convera.com  
+id_a_f_178     ConveraCrawler/0.2      Converas RetrievalWare Internet Spider (63.241.61.x)    R       s. also - infoConveraCrawler... - CrawlConvera ...      http://www.convera.com  
+id_a_f_051205_1        ConveraCrawler/0.9d (+http://www.authoritativeweb.com/crawl)    Converas RetrievalWare Internet Spider (63.241.61.x)    R       s. also - infoConveraCrawler... - CrawlConvera ...      http://www.convera.com/ 
+id_a_f_179     ConveraMultiMediaCrawler/0.1 (+http://www.authoritativeweb.com/crawl)   Converas RetrievalWare Internet Spider (63.241.61.x)    R       s. also - infoConveraCrawler... - CrawlConvera ...      http://www.convera.com  
+id_a_f_180     CoolBot Suchmaschine21 (Germany) robot  R               http://www.suchmaschine21.de/   
+id_a_f_030110_2        Cooliris/1.5 CFNetwork/459 Darwin/10.0.0d3      Cooliris photo and video browser        B               http://www.cooliris.com/        
+id_a_f_040406_1        CoralWebPrx/0.1.1x (See http://coralcdn.org/)   Coral Content Distribution Network      P C             http://coralcdn.org/    
+id_a_f_181     cosmos/0.8_(robot@xyleme.com)   Xyleme SA France robot  R               http://www.xyleme.com/en/index.jsp      
+id_a_f_182     cosmos/0.9_(robot@xyleme.com)   Xyleme SA France robot  R               http://www.xyleme.com/en/index.jsp      
+id_a_f_040607_1        CoteoNutchCrawler/Nutch-0.9 (info [at] coteo [dot] com) Coteo.com - local French directory link checking        C               http://www.coteo.com/   
+id_a_f_030206_3        CougarSearch/0.x (+http://www.cougarsearch.com/faq.shtml)       Cougarsearch.com robot  R               http://www.cougarsearch.com/    
+id_a_f_280408_2        Covac TexAs Arachbot    Covac Arachnid Web Crawler      R       s.also ArachBot http://www.covac-software.com/  
+id_a_f_211208_1        CoverScout%203/3.0.1 CFNetwork/339.5 Darwin/9.5.0 (i386) (iMac5,1)      CoverScout for iTunes - CD cover search tool    B               http://www.equinux.com/de/products/coverscout/index.html        
+id_a_f_183     Cowbot-0.1 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)     Naver Japan / Korea robot       R       s. also Python-urllib/1.15 - nabot - NaverBot & dloader http://www.naver.co.jp  
+id_a_f_184     Cowbot-0.1.x (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)   Naver Japan / Korea robot       R       s. also Python-urllib/1.15 - nabot - NaverBot & dloader http://www.naver.co.jp  
+id_a_f_185     CrawlConvera0.1 (CrawlConvera@yahoo.com)        Converas RetrievalWare Internet Spider  R       s. also - Convera Internet Spider .. - infoConveraCrawler...    http://www.convera.com  
+id_a_f_186     Crawler unknown robot via Level3.net                            
+id_a_f_187     Crawler (cometsearch@cometsystems.com)  Cometsystems Comet Search robot via Findwhat (now Miva) R               http://www.cometsystems.com     http://www.miva.com/
+id_a_f_188     Crawler admin@crawler.de        Crawler.de / Abacho robot       R               http://www.crawler.de   http://www.abacho.de/
+id_a_f_189     Crawler V 0.2.x admin@crawler.de        Crawler.de / Abacho robot       R               http://www.crawler.de   http://www.abacho.de/
+id_a_f_190     crawler@alexa.com       Alexa crawler   R               http://www.alexa.com    
+id_a_f_191     CrawlerBoy Pinpoint.com Pinpoint WAP search robot       R               http://www.pinpoint.com 
+id_a_f_130506_1        Crawllybot/0.1 (Crawllybot; +http://www.crawlly.com; crawler@crawlly.com)       Crawlly Beta search - Germany (72.232.194.2xx)  R       powered by Nutch        http://www.crawlly.com/ 
+id_a_f_192     CreativeCommons/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)      Creatice Commons using Nutch open source robot  R               http://www.nutch.org    
+id_a_f_030110_3        Cricket-A100/1.0 UP.Browser/6.3.0.7 (GUI) MMP/2.0       Cricket A100 cell phone browser B               http://www.mycricket.com/cell-phones/details/Cricket-A100       
+id_a_f_193     CrocCrawler vx.3 [en] (http://www.croccrawler.com) (X11; I; Linux 2.0.44 i686)  Croccrawler robot       R               http://www.croccrawler.com      
+id_a_f_090306_2        csci_b659/0.13  Web mining project from CSCI 659 (computer science course) at Indiana Univerity R               http://informatics.indiana.edu/fil/Class/b659/  
+id_a_f_180906_1        CSE HTML Validator Professional (http://www.htmlvalidator.com/) CSE HTML Validator for Windows  C               http://www.htmlvalidator.com/   
+id_a_f_194     Cuam Ver0.050bx Cuam - IE based browser B       site is dead    http://cuam.virtualave.net      
+id_a_f_195     Cuasarbot/0.9b http://www.cuasar.com/spider_beta/       Cuasar (Spain) music / ringtone search spider   R               http://www.cuasar.com   
+id_a_f_196     curl/7.10.x (i386-redhat-linux-gnu) libcurl/7.10.x OpenSSL/0.9.7a ipv6 zlib/1.1.4       Curl file transferring tool     D               http://curl.haxx.se/    
+id_a_f_197     curl/7.7.x (i386--freebsd4.3) libcurl 7.7.x (SSL 0.9.6) (ipv6 enabled)  Curl file transferring tool     D               http://curl.haxx.se/    
+id_a_f_198     curl/7.8 (i686-pc-linux-gnu) libcurl 7.8 (OpenSSL 0.9.6)        Curl file transferring tool     D               http://curl.haxx.se/    
+id_a_f_199     curl/7.9.x (win32) libcurl 7.9.x        Curl file transferring tool     D               http://curl.haxx.se/    
+id_a_f_200     CurryGuide SiteScan 1.1 CurryGuide UK link check robot  R               http://uk.curryguide.com/       
+id_a_f_201     Custo x.x (www.netwu.com)       Custo web site spidering tool (link checking)   C       s. also - - Mozilla/5.0 (compatible; Custo 3... http://www.netwu.com    
+id_a_f_202     Custom Spider www.bisnisseek.com /1.0   Bisnisseek (was www.bisnisseek.com) robot       R                       
+id_a_f_203     Cyberdog/2.0 (Macintosh; 68k)   Cyberdog Mac Browser (was www.cyberdog.org)     B                       
+id_a_f_260608_2        CyberPatrol SiteCat Webbot (http://www.cyberpatrol.com/cyberpatrolcrawler.asp)  CyberPatrol LLC robot for web filtering software        R       38.103.17.16x   http://www.cyberpatrol.com/cyberpatrolcrawler.asp       
+id_a_f_204     CyberSpyder Link Test/2.1.12 (admin@mspennyworth.com)   CyberSpyder Link Test software  C               http://www.cyberspyder.com/cslnkts1.html        
+id_a_f_205     CydralSpider/1.x (Cydral Web Image Search; http://www.cydral.com)       Cydral image & site search spider       R               http://www.cydral.com   
+id_a_f_060508_1        CydralSpider/3.0 (Cydral Image Search; http://www.cydral.com)   Cydral image & site search spider       R               http://www.cydral.com   
+id_a_f_206     DA 3.5 (www.lidan.com)  Downloadaccelerator download manager    D               http://www.downloadaccelerator.com      
+id_a_f_207     DA 4.0  Downloadaccelerator download manager    D               http://www.downloadaccelerator.com      
+id_a_f_208     DA 4.0 (www.downloadaccelerator.com)    Downloadaccelerator download manager    D               http://www.downloadaccelerator.com      
+id_a_f_209     DA 5.0  Downloadaccelerator download manager    D               http://www.downloadaccelerator.com      
+id_a_f_210     DA 7.0  Downloadaccelerator download manager    D               http://www.downloadaccelerator.com      
+id_a_f_070209_3        DAP x.x Download Accelerator Plus download manager      D               http://www.speedbit.com/        
+id_a_f_211     Dart Communications PowerTCP    PowerTCP ActiveX control tool                   http://www.dart.com     
+id_a_f_212     DataCha0s/2.0   Unknown bot from Kornet Korea (218.149.129.xxx) scans for Perl Awstats  S                       
+id_a_f_101106_1        DataCha0s/2.0   Unknown UA looking for Awstats Perl components  S       from various IPs                
+id_a_f_213     DataFountains/DMOZ Downloader   INFOMINE/iVia Scholary Internet Resource Collections robot      R       138.23.85.xx    http://infomine.ucr.edu/        http://ivia.ucr.edu/useragents.shtml
+id_a_f_040307_1        DataFountains/Dmoz Downloader (http://ivia.ucr.edu/useragents.shtml)    INFOMINE/iVia Scholary Internet Resource Collections robot      R       138.23.85.xx    http://infomine.ucr.edu/        http://ivia.ucr.edu/useragents.shtml
+id_a_f_110307_1        DataFountains/DMOZ Feature Vector Corpus Creator (http://ivia.ucr.edu/useragents.shtml) INFOMINE/iVia Scholary Internet Resource Collections robot      R       138.23.85.xx    http://infomine.ucr.edu/        http://ivia.ucr.edu/useragents.shtml
+id_a_f_050907_1        DataparkSearch/4.47 (+http://dataparksearch.org/bot)    DataparkSearch open source search engine        R               http://www.dataparksearch.org   
+id_a_f_214     DataparkSearch/4.xx (http://www.dataparksearch.org/)    DataparkSearch open source search engine        R               http://www.dataparksearch.org   
+id_a_f_080206_1        DataSpear/1.0 (Spider; http://www.dataspear.com/spider.html; spider@dataspear.com)      DataSpear Directory robot (24.109.29.xx)        R               http://www.dataspear.com/       
+id_a_f_215     DataSpearSpiderBot/0.2 (DataSpear Spider Bot; http://dssb.dataspear.com/bot.html; dssb@dataspear.com)   DataSpear Directory robot (24.109.29.xx)        R               http://www.dataspear.com/       
+id_a_f_161105_1        DatenBot( http://www.sicher-durchs-netz.de/bot.html)    Sicher-durchs-Netz German security related search (62.75.220.xxx)       R               http://www.sicher-durchs-netz.de/suche  
+id_a_f_216     DaviesBot/1.7 (www.wholeweb.net)        Wholeweb robot  R       site is closed  http://www.wholeweb.net 
+id_a_f_217     daypopbot/0.x   Daypop blog - weblog - online mag search spider R               http://www.daypop.com/info/about.htm    
+id_a_f_218     dbDig(http://www.prairielandconsulting.com)     dbDig search engine     R               http://www.prairielandconsulting.com    
+id_a_f_219     DBrowse 1.4b    Some site scanning tool via diff. IPs i.e.: - wanweb.net (208.6.163.xxx) - cox.net (68.4.xxx.xxx)       S       UA sometimes - DSurf15a 01 - DBrowse 1.4d               
+id_a_f_220     DBrowse 1.4d    Some site scanning tool via diff. IPs i.e.: - pacbell.net (67.112.xxx.xxx)      S       see also DSurf15a 01 - DBrowse 1.4b             
+id_a_f_221     DC-Sakura/x.xx  DC-Sakura download manager      D               http://www.dc-sakura.com/       
+id_a_f_222     dCSbot/1.1      unknown divine/Openmarket.com robot     R               http://www.openmarket.com/      
+id_a_f_223     DDD     some (website) downloading tool D                       
+id_a_f_224     dds explorer v1.0 beta  Unknown user agent                              
+id_a_f_225     de.searchengine.comBot 1.2 (http://de.searchengine.com/spider)  Searchengine.com (Germany) submission checking / robot (84.73.57.xx)    R               http://de.searchengine.com      
+id_a_f_226     DeadLinkCheck/0.4.0 libwww-perl/5.xx    DLC Perl HTTP link checking     C               http://dlc.sourceforge.net/     
+id_a_f_111206_3        Deep Link Calculator v1.0       Sootle Web Directory deep link checker  C       216.89.111.x    http://directory.sootle.com/deep-links/ 
+id_a_f_227     deepak-USC/ISI  deepak-USC/ISI robot from USC/Information Science Institute     R               http://www.isi.edu/%7Eravichan/deepak-usc-isi.html      http://www.isi.edu/
+id_a_f_228     DeepIndex       Deepindex robot R               http://www.deepindex.net/utilisateurs.php?referral=deepindex    
+id_a_f_229     DeepIndex ( http://www.zetbot.com )     Zetbot search Belgium (213.41.128.xx) using Deepindex robot     R               http://www.zetbot.com/  http://www.deepindex.net/utilisateurs.php?referral=deepindex
+id_a_f_230     DeepIndex (www.en.deepindex.com)        Deepindex robot R               http://www.deepindex.net/utilisateurs.php?referral=deepindex    
+id_a_f_231     DeepIndexer.ca  Deepindex robot (via Paragon.net Canada)        R               http://www.deepindex.net/utilisateurs.php?referral=deepindex    
+id_a_f_011006_2        del.icio.us-thumbnails/1.0 Mozilla/5.0 (compatible; Konqueror/3.4; FreeBSD) KHTML/3.4.2 (like Gecko)    del.icio.us picture robot for thumbnail preview via Yahoo       D       66.94.237.1xx   http://del.icio.us/     
+id_a_f_250106_1        DeleGate/9.0.5-fix1     DeleGate application level gateway / proxy server       P               http://www.delegate.org/delegate/       
+id_a_f_232     Demo Bot DOT 16b        Some site scanning tool from 217.34.59.xxx (btopenworld.com)    S                       
+id_a_f_233     Demo Bot Z 16b  Some site scanning tool from 68.154.96.xx (bellsouth.net)       S       appears also as - MFC Foundation Class Library - Full Web Bot 0516B             
+id_a_f_234     Denmex websearch (http://search.denmex.com)     Denmex Websearch robot/link checking    R               http://search.denmex.com        
+id_a_f_235     Der große BilderSauger 2.00u   DataBecker Bilder Sauger (discontinued) web graphics downloader D               http://www.databecker.de        
+id_a_f_230206_1        dev-spider2.searchpsider.com/1.3b       Searchspider.com robot (72.245.225.xxx) R               http://www.searchspider.com/    
+id_a_f_236     DevComponents.com HtmlDocument Object   DevComponents HTMLDocument Class Library for Visual Studio.net                  http://www.devcomponents.com    
+id_a_f_237     DiaGem/1.1 (http://www.skyrocket.gr.jp/diagem.html)     DiaGem Japan web crawler        R       (site is offline)       http://www.skyrocket.gr.jp      
+id_a_f_238     Diamond/x.0     Claria (ex Gator) SearchScout robot (64.152.73.xx)      R       s. also Claria  http://www.searchscout.com      
+id_a_f_239     DiamondBot      Claria (ex Gator) SearchScout robot (64.152.73.xx)      R       s. also Claria  http://www.searchscout.com      
+id_a_f_240     Digger/1.0 JDK/1.3.0rc3 Diggit! robot   R               http://www.diggit.com   
+id_a_f_241     DigOut4U        OpenPortal4U robot      R               http://www.arisem.com   
+id_a_f_242     DIIbot/1.2      Findsame.com (site is offline) / Digital-Integrity robot        R               http://www.digital-integrity.com/       
+id_a_f_100206_1        Dillo/0.8.5-i18n-misc   Dillo Web Browser       B               http://www.dillo.org/   
+id_a_f_243     Dillo/0.x.x     Dillo Web Browser       B               http://www.dillo.org/   
+id_a_f_100109_1        disastrous/1.0.5 (running with Python 2.5.1; http://www.bortzmeyer.org/disastrous.html; archangel77@del.icio.us)        disastrous - a del.icio.us link checker based on Python C               http://www.bortzmeyer.org/disastrous.html       
+id_a_f_140306_1        DISCo Pump x.x  DISCo Pump offline browser / website ripper     D       No active homepage      http://www.arssoft.com/ http://www.filetransit.com/view.php?id=3870
+id_a_f_300907_1        disco/Nutch-0.9 (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)        Unkown robot from Discovery Engine Corp.        R       208.96.54.xx    http://www.discoveryengine.com/ 
+id_a_f_300907_2        disco/Nutch-1.0-dev (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)    Unkown robot from Discovery Engine Corp.        R       208.96.54.xx    http://www.discoveryengine.com/ 
+id_a_f_244     DittoSpyder     Ditto picture search robot      R               http://www.ditto.com    
+id_a_f_245     dlman   some download agent     D       Wildsoft Surfer         
+id_a_f_246     dloader(NaverRobot)/1.0 Naver Japan / Korea robot       R       s. also Python-urllib/1.15 - nabot - NaverBot & Cowbot  http://www.naver.co.jp  
+id_a_f_100408_1        DNSRight.com WebBot Link Ckeck Tool. Report abuse to: dnsr@dnsright.com DNS Right - Online DNS tools    C       203.161.71.17x  http://www.dnsright.com/        
+id_a_f_247     DoCoMo/1.0/Nxxxi/c10    NTT DoCoMo (Japan) robot        R               http://www.nttdocomo.co.jp/     
+id_a_f_248     DoCoMo/1.0/Nxxxi/c10/TB NTT DoCoMo (Japan) robot        R               http://www.nttdocomo.co.jp/     
+id_a_f_249     DoCoMo/1.0/P502i/c10 (Google CHTML Proxy/1.0)   Google (216.239.39.x) proxy server      P                       
+id_a_f_250     DoCoMo/2.0 P900iV(c100;TB;W24H11)       NTT DoCoMo (Japan) robot        R               http://www.nttdocomo.co.jp/     
+id_a_f_141205_1        DoCoMo/2.0 SH901iS(c100;TB;W24H12),gzip(gfe) (via translate.google.com) NTT DoCoMo (Japan) proxy server (210.136.161.1xx)       P               http://www.nttdocomo.co.jp/     
+id_a_f_081207_1        DoCoMo/2.0 SH902i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)   Yahoo Search Japan robot (203.216.197.xxx)      R       s. also Y!J-SRD/1.0     http://www.yahoo.co.jp/ 
+id_a_f_271006_3        DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)   Yahoo Search Japan robot (203.216.197.xxx)      R       s. also Y!J-SRD/1.0     http://www.yahoo.co.jp/ 
+id_a_f_251     DocZilla/1.0 (Windows; U; WinNT4.0; en-US; rv:1.0.0) Gecko/20020804     DocZilla - Mozilla-based SGML/XML/HTML- browser B               http://www.doczilla.com 
+id_a_f_210607_1        dodgebot/experimental   unknown robot from AGMLAB Information Technologies (Information retrieval system ?)     R       212.174.130.1xx http://www.agmlab.com/agmlab_eng.html   
+id_a_f_180606_1        DonutP; Windows98SE     Donut P - Japanese IE based browser     B               http://donutp.com/      
+id_a_f_250907_2        Doubanbot/1.0 (bot@douban.com http://www.douban.com)    Unknown robot from douban search (China) - maybe image crawling         59.151.41.xx    http://www.douban.com/  
+id_a_f_252     Download Demon/3.x.x.x  Download Demon/Netzip download manager  D               http://www.netzip.com   
+id_a_f_191105_4        Download Druid 2.x      Download Druid IE plugin download manager       D               http://www.xemico.com/druid/index.html  
+id_a_f_253     Download Express 1.0    Download Express download manager       D               http://www.metaproducts.com     
+id_a_f_254     Download Master Download Master download manager        D               http://www.westbyte.com/dm/index.phtml  
+id_a_f_191105_5        Download Ninja 3.0      Download Ninja download manager (Japan) D               http://www.h-fd.org/mkro/mt/archives/2002/09/download_ninja_1.html      
+id_a_f_255     Download Wonder Download Wonder download manager        D               http://www.forty.com    
+id_a_f_256     Download-Tipp Linkcheck (http://download-tipp.de/)      Download-Tipp Germany link checking     R               http://download-tipp.de/        
+id_a_f_257     Download.exe(1.1) (+http://www.sql-und-xml.de/freeware-tools/)  download.exe .NET based downloading tool        D               http://www.sql-und-xml.de/freeware-tools/       
+id_a_f_300907_3        DownloadDirect.1.0      Download Direct download manager        D               http://senbit.com/      
+id_a_f_258     Dr.Web (R) online scanner: http://online.drweb.com/     Dr.WEB online virus scanner                     http://online.drweb.com 
+id_a_f_259     Dragonfly File Reader   Dragonfly CMS - Open Source content management system   B               http://www.cpgnuke.com  
+id_a_f_260     Drecombot/1.0 (http://career.drecom.jp/bot.html)        Drecom Japan (210.233.67.xxx) - Blog search ??  R               http://www.drecom.co.jp 
+id_a_f_3090906_1       Drupal (+http://drupal.org/)    Drupal - open source content management platform        C               http://drupal.org/      
+id_a_f_261     DSurf15a 01     Some site scanning tool via diff. IPs i.e.: - cox.net (68.5.xxx.xxx) - pacbell.net (64.16x.xxx.xxx)     S       DBrowse 1.4d            
+id_a_f_262     DSurf15a 71     Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)    S       TRPMFHXE                
+id_a_f_263     DSurf15a 81     Some site scanning tool via diff. IPs i.e.: - verizon.net (4.47.xxx.xxx)        S       WFRIKXVNFL              
+id_a_f_264     DSurf15a VA     Some site scanning tool via diff. IPs i.e.: - eastlink.ca (24.222.xxx.xxx) - cogeco.net (216.221.8x.xxx)        S                       
+id_a_f_020506_2        DTAAgent        DTAAgent Java object for data collecting        R D             http://www.ibr.cs.tu-bs.de/courses/ss00/sep-vs/gruppe1/jdoc/DTA/agent/DTAAgent.html     
+id_a_f_265     dtSearchSpider  dt Search Spider software       R               http://www.dtsearch.com/spider.html     
+id_a_f_266     Dual Proxy      Fourelle Venturi proxy server   P               http://www.fourelle.com/news/articles/148457.htm        
+id_a_f_290308_2        DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)      Duck Duck Go search crawler     R       72.94.249.34    http://duckduckgo.com/  http://duckduckgo.com/duckduckbot.html
+id_a_f_267     Dumbot(version 0.1 beta - dumbfind.com) DumbFind.com robot      R               http://www.dumbfind.com 
+id_a_f_268     Dumbot(version 0.1 beta - http://www.dumbfind.com/dumbot.html)  DumbFind.com robot      R               http://www.dumbfind.com 
+id_a_f_269     Dumbot(version 0.1 beta)        DumbFind.com robot      R               http://www.dumbfind.com 
+id_a_f_270     e-sense 1.0 ea(www.vigiltech.com/esensedisclaim.html)   Vigiltech e-Sense user research robot (website is offline)      R                       
+id_a_f_271     e-SocietyRobot(http://www.yama.info.waseda.ac.jp/~yamana/es/)   e-Society Project (Japan) crawler (133.9.238.xx)        R               http://www.yama.info.waseda.ac.jp       
+id_a_f_280108_1        eApolloBot/2.0 (compatible; heritrix/2.0.0-SNAPSHOT-20071024.170148 +http://www.eapollo-opto.com)       Global Opto's eApollo Flash based search engine - Taiwan        R               http://www.eapollo.com/eaSE.jsp?language=eng    http://www.global-opto.com/
+id_a_f_272     EARTHCOM.info/1.x [www.earthcom.info]   Earthcom (Czech Republic) search robot (194.108.39.xx)  R       s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ... http://www.earthcom.info        
+id_a_f_273     EARTHCOM.info/1.xbeta [www.earthcom.info]       Earthcom (Czech Republic) search robot (194.108.39.xx)  R       s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ... http://www.earthcom.info        
+id_a_f_274     EasyDL/3.xx     Keywen Encyclopedia Bot R               http://keywen.com/Encyclopedia/Bot/     
+id_a_f_275     EasyDL/3.xx http://keywen.com/Encyclopedia/Bot  Keywen Encyclopedia Bot R               http://keywen.com/Encyclopedia/Bot/     
+id_a_f_276     EBrowse 1.4b    Some site scanning tool via diff. IPs i.e.: - swbell.net (65.66.xxx.xxx)        S                       
+id_a_f_277     eCatch/3.0      eCatch (now Wysigot) offline browser    B D             http://www.ecatch.com   
+id_a_f_278     EchO!/2.0       Echo.fr robot   R               http://echo.fr/ 
+id_a_f_279     Educate Search VxB      Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)    S       s. also DSurf - 66.118.1xx.xxx (sagonet.com) - see also Full Web Bot - Industry Program 1.0.5           
+id_a_f_280     egothor/3.0a (+http://www.xdefine.org/robot.html)       Xdefine text search engine robot - based on Egothor open source crawler R               http://www.xdefine.com/ http://www.egothor.org/
+id_a_f_281     EgotoBot/4.8 (+http://www.egoto.com/about.htm)  Egoto Search robot      R               http://www.egoto.com    
+id_a_f_211105_1        ejupiter.com    eJupiter searcg robot (206.191.49.xx)   R               http://search.ejupiter.com/     
+id_a_f_282     EldoS TimelyWeb/3.x     TimelyWeb web page monitoring tool      C       s. also TimelyWeb/...   http://www.eldos.org/timelyweb/timelyweb.html   
+id_a_f_283     elfbot/1.0 (+http://www.uchoose.de/crawler/elfbot/)     Elftales crawler for uChoose theme based search (Germany)       R               http://www.uchoose.de   
+id_a_f_300707_1        ELI/20070402:2.0 (DAUM RSS Robot, Daum Communications Corp.; +http://ws.daum.net/aboutkr.html)  DAUMOA - RSS search robot of Daum       R       211.115.109.1xx http://ws.daum.net/abouten.html 
+id_a_f_284     ELinks (0.x.x; Linux 2.4.20 i586; 132x60)       ELinks text mode browser        B               http://elinks.or.cz/    
+id_a_f_285     ELinks/0.x.x (textmode; NetBSD 1.6.2 sparc; 132x43)     ELinks text mode browser        B               http://elinks.or.cz/    
+id_a_f_286     EmailSiphon     Sonic E-mail collector  S               http://www.americaint.com/superstore/elist.html 
+id_a_f_220508_2        EmailSpider     EmailSpider E-mail harvesting software  S               http://www.emailspider.net/index.php?kat=11     
+id_a_f_287     EmailWolf 1.00  Trellian EMailWolf E-mail collector     S               http://www.trellian.com 
+id_a_f_288     EmeraldShield.com WebBot        EmeraldShield spam and web filtration services  P R             http://www.emeraldshield.com    
+id_a_f_289     EmeraldShield.com WebBot (http://www.emeraldshield.com/webbot.aspx)     EmeraldShield spam and web filtration services  P R             http://www.emeraldshield.com    
+id_a_f_070606_2        EMPAS_ROBOT     Empas search Korea robot (220.95.22x.xxx)       R               http://www.empas.com/   
+id_a_f_280208_1        EnaBot/1.x (http://www.enaball.com/crawler.html)        Enabot - Enaball semantic search project crawler        R               http://www.enaball.com/crawler.html     
+id_a_f_110506_4        endo/1.0 (Mac OS X; ppc i386; http://kula.jp/endo)      endo - Mac news site and blog aggregator        B               http://kula.jp/software/endo/   
+id_a_f_290     Enfish Tracker  Enfish Personal search tool     R               http://www.enfish.com   
+id_a_f_291     Enterprise_Search/1.0   Enterprise Search engine software (64.202.165.xxx)      R       s. also - ES.NET_Crawler - InnerpriseBot        http://www.innerprise.net       
+id_a_f_292     Enterprise_Search/1.0.xxx       Enterprise Search engine software (64.202.165.xxx)      R       s. also - ES.NET_Crawler - InnerpriseBot        http://www.innerprise.net       
+id_a_f_293     Enterprise_Search/1.00.xxx;MSSQL (http://www.innerprise.net/es-spider.asp)      Enterprise Search engine software (64.202.165.xxx)      R       s. also - ES.NET_Crawler - InnerpriseBot        http://www.innerprise.net       
+id_a_f_230706_1        envolk/1.7 (+http://www.envolk.com/envolkspiderinfo.php)        Envolk Web Search robot R       70.169.191.x    http://www.envolk.com/  
+id_a_f_294     envolk[ITS]spider/1.6(+http://www.envolk.com/envolkspider.html) Envolk Web Search robot R       70.169.191.x    http://www.envolk.com/  
+id_a_f_295     EroCrawler      EroCrawler adult search robot   R               http://www.erocrawler.com       
+id_a_f_296     ES.NET_Crawler/2.0 (http://search.innerprise.net/)      Enterprise Search engine software (64.202.165.xxx)      R       s. also - Enterprise_Search - InnerpriseBot     http://search.innerprise.net    
+id_a_f_297     eseek-larbin_2.6.2 (crawler@exactseek.com)      ExactSEEK (Jayde Online) robot  R       see also ExactSeek Crawler / eseek-larbin / exactseek.com       http://www.exactseek.com        
+id_a_f_298     ESISmartSpider  ESI Smart-Spider toolkit        R               http://www.smart-spider.com/    
+id_a_f_299     eStyleSearch 4 (compatible; MSIE 6.0; Windows NT 5.0)   e-Style ISP search (Russia) robot (217.174.103.xxx)     R               http://www.e-styleisp.ru/       
+id_a_f_300     ESurf15a 15     Some site scanning tool via diff. IPs   S       s. also DSurf - PBrowse ...             
+id_a_f_301     EuripBot/0.x (+http://www.eurip.com) GetFile    Eurip.com - European Internet Portal robot      R               http://www.eurip.com    
+id_a_f_302     EuripBot/0.x (+http://www.eurip.com) GetRobots  Eurip.com - European Internet Portal robot      R               http://www.eurip.com    
+id_a_f_303     EuripBot/0.x (+http://www.eurip.com) PreCheck   Eurip.com - European Internet Portal robot      R               http://www.eurip.com    
+id_a_f_220508_3        Eurobot/1.0 (http://www.ayell.eu)       Ayell Euronet business directory robot  R               http://www.ayell.eu/    
+id_a_f_030206_4        EvaalSE - bot@evaal.com Evaal Search Engine robot       R       based on Nutch  http://www.evaal.com/   http://search.evaal.com/en/about.html
+id_a_f_304     eventax/1.3 (eventax; http://www.eventax.de/; info@eventax.de)  Eventax event search (Germany)  R               http://www.eventax.de   
+id_a_f_291205_1        Everest-Vulcan Inc./0.1 (R&D project; host=e-1-24; http://everest.vulcan.com/crawlerhelp)       Vulcan Inc. Everest crawler (in development)    R               http://www.vulcan.com/  
+id_a_f_305     Everest-Vulcan Inc./0.1 (R&D project; http://everest.vulcan.com/crawlerhelp)    Vulcan Inc. Everest crawler (in development)    R               http://www.vulcan.com/  
+id_a_f_050406_2        Exabot-Images/1.0       Exalead Websearch image crawler (193.47.80.xx)  R       Exabot-Images only requests robots.txt - image crawling under UA NG/4.0.1229    http://www.exalead.com/search   
+id_a_f_211206_1        Exabot-Test/1.0 Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_a_f_190106_1        Exabot/2.0      Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_a_f_211206_2        Exabot/3.0      Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_a_f_306     ExactSearch     eXact Search Bar for IE B               http://www.exactsearchbar.com/exact04   
+id_a_f_307     ExactSeek Crawler/0.1   ExactSEEK (Jayde Online) robot  R       see also eseek-larbin / exactseek.com   http://www.exactseek.com        
+id_a_f_308     exactseek-crawler-2.63 (crawler@exactseek.com)  ExactSEEK (Jayde Online) robot  R       see also eseek-larbin / exactseek.com   http://www.exactseek.com        
+id_a_f_309     exactseek-pagereaper-2.63 (crawler@exactseek.com)       ExactSEEK (Jayde Online) robot  R       see also eseek-larbin / exactseek.com   http://www.exactseek.com        
+id_a_f_050606_2        exactseek.com   ExactSEEK (Jayde Online) robot (69.9.181.1xx)   R       see also eseek-larbin   http://www.exactseek.com        
+id_a_f_310     Exalead NG/MimeLive Client (convert/http/0.120) Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and NG/1.0  http://www.exabot.com   
+id_a_f_311     Excalibur Internet Spider V6.5.4        Excalibur (now Convera) spider software R               http://www.excalib.com  
+id_a_f_191206_1        Execrawl/1.0 (Execrawl; http://www.execrawl.com/; bot@execrawl.com)     Execrawl software search using nutch    R       72.36.179.1xx   http://www.execrawl.com/        
+id_a_f_060608_1        exooba crawler/exooba crawler (crawler for exooba.com; http://www.exooba.com/; info at exooba dot com)  exooba crawler for exooba search pre-alpha development  R       216.195.184.xx  http://www.exooba.com/  
+id_a_f_060608_2        exooba/exooba crawler (exooba; exooba)  exooba crawler for exooba search pre-alpha development  R       216.195.184.xx  http://www.exooba.com/  
+id_a_f_312     ExperimentalHenrytheMiragoRobot Mirago UK Robot R               http://www.mirago.co.uk 
+id_a_f_313     Expired Domain Sleuth   Expired Domain Sleuth domain name tool  R C             http://expireddomainsleuth.com/ 
+id_a_f_314     Express WebPictures (www.express-soft.com)      Express Web Pictures image browser      B D             http://www.express-soft.com/    
+id_a_f_315     ExtractorPro    Extractor Pro e-mail collector  S               http://www.extractorpro.com     
+id_a_f_170106_1        Extreme Picture Finder  Exisoftware image grabber and downloading tool  D               http://www.exisoftware.com/picture_finder/      
+id_a_f_316     EyeCatcher (Download-tipp.de)/1.0       Download-Tipp Germany robot     R               http://download-tipp.de 
+id_a_f_091006_1        Factbot 1.09 (see http://www.factbites.com/webmasters.php)      Factbites search robot  R       70.86.159.1xx   http://www.factbites.com/       
+id_a_f_220906_1        factbot : http://www.factbites.com/robots       Factbites search robot  R       70.86.159.1xx   http://www.factbites.com/       
+id_a_f_221006_1        FaEdit/2.0.x    FaEdit Professional - Japanese bookmark manager C               https://sw.vector.co.jp/swreg/step1.reserve?srno=SR040433&site=y        
+id_a_f_317     FairAd Client   FairAd user     P               http://www.fairad.de    
+id_a_f_051206_1        FANGCrawl/0.01  Safe-t.net web filtering service        P       63.167.160.1xx  http://www.safe-t.net/  
+id_a_f_210206_1        FARK.com link verifier  Drew Curtis' FARK.com link checking     C               http://www.fark.com/    
+id_a_f_318     Fast Crawler Gold Edition       Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_319     FAST Enterprise Crawler 6 (Experimental)        Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_040206_1        FAST Enterprise Crawler 6 / Scirus scirus-crawler@fast.no; http://www.scirus.com/srsapp/contactus/      Fast Enterprise Crawler (66.151.181.xx) for Scirus scienctific information search       R               http://www.scirus.com/srsapp/   http://www.alltheweb.com
+id_a_f_320     FAST Enterprise Crawler 6 used by Cobra Development (admin@fastsearch.com)      Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_070507_1        FAST Enterprise Crawler 6 used by Comperio AS (sts@comperio.no) Comperio Web Miner based on Fast ESP    R               http://www.comperio.no/index.php?option=com_content&task=blogcategory&id=7&Itemid=27    
+id_a_f_321     FAST Enterprise Crawler 6 used by FAST (FAST)   Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_161106_1        FAST Enterprise Crawler 6 used by Pages Jaunes (pvincent@pagesjaunes.fr)        Pages Jaunes business search (France) robot using Fast Enterprise Crawler       R       193.252.242.xx  http://www.pagesjaunes.fr/      
+id_a_f_322     FAST Enterprise Crawler 6 used by Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au)  Fast/Alltheweb crawler for Sensis.com.au Australian search (66.151.181.xx)      R               http://www.sensis.com.au/       http://www.alltheweb.com
+id_a_f_251007_2        FAST Enterprise Crawler 6 used by Singapore Press Holdings (crawler@sphsearch.sg)       SPH Search - Singapore related search using Fast crawler        R       202.176.220.xx  http://www.sphsearch.sg/        
+id_a_f_280606_2        FAST Enterprise Crawler 6 used by WWU (wardi@uni-muenster.de)   FAST Enterprise Crawler used by WWU (University of Muenster - Germany)  C       128.176.188.2xx http://www.uni-muenster.de/en/index.html        http://www.alltheweb.com
+id_a_f_323     FAST Enterprise Crawler/6 (www.fastsearch.com)  Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_324     FAST Enterprise Crawler/6.4 (helpdesk at fast.no)       Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_325     FAST FirstPage retriever (compatible; MSIE 5.5; Mozilla/4.0)    Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_326     FAST MetaWeb Crawler (helpdesk at fastsearch dot com)   Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_327     Fast PartnerSite Crawler        Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_328     FAST-WebCrawler/2.2.10 (Multimedia Search) (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)    Fast/Alltheweb multimedia crawler       R       see also Yahoo-MMCrawler/3.x    http://www.alltheweb.com        
+id_a_f_329     FAST-WebCrawler/2.2.6 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html) Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_330     FAST-WebCrawler/2.2.7 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no       Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_331     FAST-WebCrawler/2.2.8 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no       Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_332     FAST-WebCrawler/3.2 test        Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_333     FAST-WebCrawler/3.3 (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)        Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_334     FAST-WebCrawler/3.4/Nirvana (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)        Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_335     FAST-WebCrawler/3.4/PartnerSite (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)    Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_336     FAST-WebCrawler/3.5 (atw-crawler at fast dot no; http://fast.no/support.php?c=faqs/crawler)     Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_337     FAST-WebCrawler/3.6 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)    Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_338     FAST-WebCrawler/3.6/FirstPage (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)      Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_339     FAST-WebCrawler/3.7 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)    Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_340     FAST-WebCrawler/3.7/FirstPage (atw-crawler at fast dot no;http://fast.no/support/crawler.asp)   Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_341     FAST-WebCrawler/3.8 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)    Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_342     FAST-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)      Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_a_f_343     FAST-WebCrawler/3.x Multimedia  Fast/Alltheweb multimedia crawler       R       see also Yahoo-MMCrawler/3.x    http://www.alltheweb.com        
+id_a_f_344     FAST-WebCrawler/3.x Multimedia (mm dash crawler at fast dot no) Fast/Alltheweb multimedia crawler       R       see also Yahoo-MMCrawler/3.x    http://www.alltheweb.com        
+id_a_f_121205_2        fastbot crawler beta 2.0 (+http://www.fastbot.de)       Fastbot search Germany crawler (80.252.104.1xx) R               http://www.fastbot.de/  
+id_a_f_345     FastBug http://www.ay-up.com    Ay-Up geo sync search robot     R               http://www.ay-up.com    
+id_a_f_346     FastCrawler 3.0.1 (crawler@1klik.dk)    Fast/Alltheweb crawler (66.151.181.xx)  R               http://www.alltheweb.com        
+id_a_f_347     FastSearch Web Crawler for Verizon SuperPages (kevin.watters@fastsearch.com)    Fast/Alltheweb crawler used by SuperPages.com   R               http://www.superpages.com       http://www.alltheweb.com
+id_a_f_170408_3        Favcollector/2.0 (info@favcollector.com http://www.favcollector.com/)   Favcollector Favicon collecting robot   R       66.207.217.13x  http://www.favcollector.com/    
+id_a_f_161006_1        FavIconizer     FavIconizer - IE favorites icons refreshing tool        D               http://www.codeproject.com/tools/faviconizer.asp        
+id_a_f_151206_1        favo.eu crawler/0.6 (http://www.favo.eu)        favo.eu (Germany) search robot  R       84.19.186.1xx   http://www.favo.eu/     
+id_a_f_348     FavOrg  ZD's FavOrg favourites managing program C               http://www.pcmag.com/article2/0,4149,108438,00.asp      
+id_a_f_260108_1        Favorites Checking (http://campulka.net)        Campulka.net Favorites checking tool    C               http://campulka.net/?dir=Utility        
+id_a_f_349     Favorites Sweeper v.2.03        Favorites Sweeper bookmark checker      C               http://www.manitoolssoftware.cjb.net    
+id_a_f_350     Faxobot/1.0     FaXo Search robot (69.152.89.xx)        R               http://www.faxo.com     
+id_a_f_351     FDM 1.x Free Download Manager (FDM) download accelerator        D               http://www.freedownloadmanager.org      
+id_a_f_180207_1        FDM 2.x Free Download Manager (FDM) download accelerator        D               http://www.freedownloadmanager.org      
+id_a_f_352     Feed Seeker Bot (RSS Feed Seeker http://www.MyNewFavoriteThing.com/fsb.php)     RSS Feed Seeker bot (68.225.95.2xx)     R               http://www.MyNewFavoriteThing.com       
+id_a_f_241206_1        Feed24.com      Feed24 news feed and blog search        R       194.105.139.2xx http://www.feed24.com/  
+id_a_f_050306_1        Feed::Find/0.0x Feed::Find - Syndication feed (RSS/Atom) auto-discovery D               http://search.cpan.org/~btrott/Feed-Find-0.06/lib/Feed/Find.pm  
+id_a_f_250707_1        Feedable/0.1 (compatible; MSIE 6.0; Windows NT 5.1)     Feedable beta web based RSS service     B       64.27.19.25x    http://reader.feedable.com/     
+id_a_f_230406_2        FeedChecker/0.01        Unknown robot from the University of Tokyo (157.82.157.xx)      R       reads robots.txt        http://www.u-tokyo.ac.jp/index_e.html   
+id_a_f_140608_2        FeedDemon/2.7 (http://www.newsgator.com/; Microsoft Windows XP) FeedDemon RSS reader    B               http://www.newsgator.com/individuals/feeddemon/ 
+id_a_f_160308_2        Feedfetcher-Google-iGoogleGadgets; (+http://www.google.com/feedfetcher.html)    Google news feed feetcher for iGoogle gadgets   C       72.14.[1-2]xx.[X]xx     http://www.google.com/feedfetcher.html  
+id_a_f_010906_1        Feedfetcher-Google; (+http://www.google.com/feedfetcher.html)   Google Feedfetcher - RSS and Atom feed crawler  R       72.14.199.x[xx] http://www.google.com/feedfetcher.html  
+id_a_f_010307_1        FeedForAll rss2html.php v2      FeedForAll RSS feed robot       C       216.92.192.1xx  http://www.feedforall.com/      
+id_a_f_010308_1        FeedHub FeedDiscovery/1.0 (http://www.feedhub.com)      FeedHub news feed personalization engine powered by mSpoke      R       216.134.194.xx  http://www.feedhub.com/ http://www.mspoke.com/
+id_a_f_060608_3        FeedHub MetaDataFetcher/1.0 (http://www.feedhub.com)    FeedHub news feed personalization engine powered by mSpoke      R       216.134.194.xx  http://www.feedhub.com/ http://www.mspoke.com/
+id_a_f_260608_3        Feedjit Favicon Crawler 1.0     Feedjit news feed service favicon crawler       R       69.46.36.x      http://feedjit.com/     
+id_a_f_150108_1        Feedreader 3.xx (Powered by Newsbrain)  Newsbrain Feedreader3   B               http://www.feedreader.com/      
+id_a_f_281106_3        Feedshow/x.0 (http://www.feedshow.com; 1 subscriber)    FeedShow online RSS feed reader B               http://www.feedshow.com/        
+id_a_f_051206_2        FeedshowOnline (http://www.feedshow.com)        FeedShow online RSS feed reader B               http://www.feedshow.com/        
+id_a_f_040207_1        FeedZcollector v1.x (Platinum) http://www.feeds4all.com/feedzcollector  FeedZcollector - Feed (RSS, ATOM and RDF) capturing software    B               http://www.feeds4all.com/feedzcollector/        
+id_a_f_353     Felix - Mixcat Crawler (+http://mixcat.com)     MixCat robot    R       s. also Morris  http://mixcat.com       
+id_a_f_354     fetch libfetch/2.0      FreeBSD download tool   D                       
+id_a_f_355     FFC Trap Door Spider    Frequent Finders spider via Sitefusion.com      R               http://www.frequentfinders.com  
+id_a_f_356     Filangy/0.01-beta (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)   Filangy search and bookmark service     R C             http://www.filangy.com  
+id_a_f_357     Filangy/1.0x (Filangy; http://www.filangy.com/filangyinfo.jsp?inc=robots.jsp; filangy-agent@filangy.com)        Filangy search and bookmark service     R C             http://www.filangy.com  
+id_a_f_358     Filangy/1.0x (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)        Filangy search and bookmark service     R C             http://www.filangy.com  
+id_a_f_359     fileboost.net/1.0 (+http://www.fileboost.net)   File Boost Network link checking        R C             http://www.fileboost.net        
+id_a_f_360     FileHound x.x   FileHound download manager      D               http://www.allabout.com 
+id_a_f_180208_1        Filtrbox/1.0    filtrbox media content (news) monitoring        R       72.47.203.8x    http://www.filtrbox.com/        
+id_a_f_361     FindAnISP.com_ISP_Finder_v99a   Find An ISP robot       R C     site is down    http://www.findanisp.com/       
+id_a_f_141205_2        Findexa Crawler (http://www.findexa.no/gulesider/article26548.ece)      Yelo.no business search (Norway) via Findexa    R               http://www.findexa.no/english/article27709.ece  
+id_a_f_362     findlinks/x.xxx (+http://wortschatz.uni-leipzig.de/findlinks/)  NextLinks - German vocabulary and hyperlink search      R               http://wortschatz.uni-leipzig.de/nextlinks/findlinks.html       
+id_a_f_363     FineBot Finesearch robot        R               http://www.finesearch.com       
+id_a_f_080306_1        Finjan-prefetch Finjan Vital Security Web Appliance security solution   P               http://www.finjan.com/  
+id_a_f_364     Firefly/1.0     Fireball.de robot       R               http://www.fireball.de  
+id_a_f_365     Firefly/1.0 (compatible; Mozilla 4.0; MSIE 5.5) Fireball.de robot       R               http://www.fireball.de  
+id_a_f_210906_1        Firefox (kastaneta03@hotmail.com)       Unknown robot from Czech Technical University Prague (147.32.141.xx)    R       reads robots.txt        http://www.cvut.cz/     
+id_a_f_190306_2        Firefox_1.0.6 (kasparek@naparek.cz)     Unknown robot from Czech Technical University Prague (147.32.141.xx)    R       reads robots.txt        http://www.cvut.cz/     
+id_a_f_366     FirstGov.gov Search - POC:firstgov.webmasters@gsa.gov   AT&T/Fast Search robot for FirstGov (U.S.Government) portal     R               http://www.firstgov.gov 
+id_a_f_367     firstsbot       Firstsfind Germany robot / link checking        R               http://www.firstsfind.de        
+id_a_f_020906_1        Flapbot/0.7.2 (Flaptor Crawler; http://www.flaptor.com; crawler at flaptor period com)  Flaptor information retrieval solutions robot   R               http://www.flaptor.com/index.htm        
+id_a_f_368     FlashGet        JetCar/FlashGet download manager        D               http://www.amazesoft.com        
+id_a_f_161205_1        FLATARTS_FAVICO FlatArts Favorites Icon Tool    C D             http://flatarts.jp/contents/software/information.php?name=rico  
+id_a_f_100308_1        Flexum spider   Flexum.ru search service        R       81.176.76.93    http://www.flexum.ru/   
+id_a_f_280508_2        Flexum/2.0      Flexum.ru search service        R       81.176.76.93    http://www.flexum.ru/   
+id_a_f_369     FlickBot 2.0 RPT-HTTPClient/0.3-3       DivX.com Movie Find robot       R               http://www.divx.com     
+id_a_f_370     flunky  Metacarta / Cogent robot        R               http://www.metacarta.com        
+id_a_f_371     fly/6.01 libwww/4.0D    unknown                         
+id_a_f_110107_1        flyindex.net 1.0/http://www.flyindex.net        FLY Index Metasearch link checking      C       62.141.52.2xx   http://www.flyindex.net/        
+id_a_f_021108_1        FnooleBot/2.5.2 (+http://www.fnoole.com/addurl.html)    Fnoole news crawler     R       209.205.65.9x   http://www.fnoole.com/  
+id_a_f_372     FocusedSampler/1.0      IBM's Almaden Research robot    R       s. also: - - WFARC      http://www.almaden.ibm.com      
+id_a_f_080108_1        Folkd.com Spider/0.1 beta 1 (www.folkd.com)     folkd.com social search robot   R       212.227.95.3x   http://www.folkd.com/   
+id_a_f_070209_4        FollowSite Bot ( http://www.followsite.com/bot.html )   FollowSite robot - website monitoring   C       77.232.77.13x   http://www.followsite.com/bot.html      
+id_a_f_140209_1        FollowSite.com ( http://www.followsite.com/b.html )     FollowSite robot - website monitoring   C       77.232.77.13x   http://www.followsite.com/bot.html      
+id_a_f_141105_1        Fooky.com/ScorpionBot/ScoutOut; http://www.fooky.com/scorpionbots       Fooky search Scorpionbots robot (65.12.170.xxx) R               http://www.fooky.com/   
+id_a_f_373     Francis/1.0 (francis@neomo.de http://www.neomo.de/)     Neomo Search (Germany) robot (85.10.197.1xx)    R               http://www.neomo.de     
+id_a_f_374     Franklin Locator 1.8    Some spam bot   S                       
+id_a_f_110506_1        free-downloads.net download-link validator /0.1 Free Downloads shareware directory link checking        C               http://www.free-downloads.net/  
+id_a_f_375     FreeFind.com-SiteSearchEngine/1.0 (http://freefind.com; spiderinfo@freefind.com)        FreeFind.com robot      R               http://freefind.com     
+id_a_f_221008_2        Frelicbot/1.0 +http://www.frelic.com/   Frelics backlink checking bot (beta)    C               http://www.frelic.com/  
+id_a_f_376     FreshDownload/x.xx      Fresh Download download manager D               http://www.freshdevices.com     
+id_a_f_230306_2        FreshNotes crawler< report problems to crawler-at-freshnotes-dot-com    FreshNotes - music related artist search (72.3.225.xx)  R               http://freshnotes.com/fn/       
+id_a_f_377     FSurf15a 01     Some site scanning tool via diff. IPs   S       s. also DSurf - PBrowse ...             
+id_a_f_070209_5        FTB-Bot http://www.findthebest.co.uk/   Find the Best search robot      R       83.105.71.16x   http://www.findthebest.co.uk/   
+id_a_f_378     Full Web Bot 0416B      Some site scanning tool from diff. IPs i.e.: - 66.28.240.xx (cogentco.com) - 68.5.174.xx (cox.net)      S                       
+id_a_f_379     Full Web Bot 0516B      Some site scanning tool i.e. from - 68.154.96.xx (bellsouth.net)        S       appears also as MFC Foundation Class Library & Demo Bot Z 16b - 66.118.1xx.xxx (sagonet.com) - s. also Educate Search VxB - Industry Program 1.0.5              
+id_a_f_380     Full Web Bot 2816B      Some site scanning tool from 66.255.6.xxx (uslec.com)   S                       
+id_a_f_190807_1        FuseBulb.Com    FuseBulb search R       208.109.126.1xx http://www.fusebulb.com/        
+id_a_f_381     FyberSpider (+http://www.fybersearch.com/fyberspider.php)       FyberSearch FyberSpider robot   R               http://www.fybersearch.com      
+id_g_m_382     Gagglebot       Some user from bbnplanet.net (4.63.218.2xx) using an Innerprise robot tool      R C ?           http://www.innerprise.net       
+id_g_m_383     GAIS Robot/1.0B2        Seed Search robot       R               http://www.seed.net.tw  
+id_g_m_384     Gaisbot/3.0 (indexer@gais.cs.ccu.edu.tw; http://gais.cs.ccu.edu.tw/robot.php)   Gaislab Taiwan robot    R       140.123.100.x   http://gais.cs.ccu.edu.tw       
+id_g_m_160706_1        Gaisbot/3.0+(robot06@gais.cs.ccu.edu.tw;+http://gais.cs.ccu.edu.tw/robot.php)   Gaislab Taiwan robot    R       140.123.100.x   http://gais.cs.ccu.edu.tw       
+id_g_m_385     GalaxyBot/1.0 (http://www.galaxy.com/galaxybot.html)    Galaxy robot (63.121.41.xxx)    R       s. also Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com....)  http://www.galaxy.com   
+id_g_m_130407_2        Gallent Search Spider v1.4 Robot 2 (http://robot.GallentSearch.com)     Gallent Search directory (UK)   R       88.208.223.xx   http://www.gallent.co.uk/       http://robot.gallentsearch.com/
+id_g_m_010107_1        gamekitbot/1.0 (+http://www.uchoose.de/crawler/gamekitbot/)     Gamekit game search engine - Germany    R       80.65.45.xx     http://www.gamekit.de/  
+id_g_m_386     Gamespy_Arcade  GameSpyHTTP/1.0 D       GameSpy Arcade download manager (FilePlanet)    http://www.gamespyarcade.com/features/  
+id_g_m_387     GammaSpider/1.0 GammaWare GammaSpider   R               http://www.gammasite.com        
+id_g_m_388     gazz/x.x (gazz@nttrd.com)       nttrd.com / Infobee.ne.jp robot R                       
+id_g_m_389     geckobot        Geckobot user robot             no active website       http://www.geckobot.com/        
+id_g_m_280406_1        Generic Mobile Phone (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)        Google Mobile Search crawler    R P     66.249.72.1xx   http://www.google.com/mobile/formats.html       
+id_g_m_390     generic_crawler/01.0217/        Unknown robot from Carnegie Mellon University (128.2.211.xxx)   R               http://www.cmu.edu      
+id_g_m_100109_2        GenesisBrowser (HTTP 1.1; 0.9; XP SP2; .NET CLR 2.0.50727)      Lunascape Genesis browser       B               http://www.lunascape.tv/        
+id_g_m_231205_1        genieBot (http://64.5.245.11/faq/faq.html)      GenieKnows.com search   R       s. also: - larbin_2.6.3 (wgao@genieknows.com)   http://www.genieknows.com/      
+id_g_m_391     geniebot wgao@genieknows.com    GenieKnows.com search   R       s. also: - larbin_2.6.3 (wgao@genieknows.com)   http://www.genieknows.com/      
+id_g_m_050606_3        GeoBot/1.0      Unknown robot from wavepath.com (65.254.33.1xx)         no active website               
+id_g_m_392     GeonaBot 1.x; http://www.geona.com/     Geona Search robot / link checking      R               http://www.geona.com    
+id_g_m_160206_3        geourl/2.0b2    GeoURL ICBM Address Server - a location-to-URL reverse directory        C               http://geourl.org/      
+id_g_m_160206_2        GeoURLBot 1.0 (http://geourl.org)       GeoURL ICBM Address Server - a location-to-URL reverse directory        C               http://geourl.org/      
+id_g_m_393     GetBot  Getbot web downloading tool / site grabber      D               http://www.getbot.com   
+id_g_m_394     GetRight/3.x.x  GetRight download manager       D               http://www.getright.com 
+id_g_m_395     GetRight/4.5xx  GetRight download manager       D               http://www.getright.com 
+id_g_m_396     GetRight/4.x    GetRight download manager       D               http://www.getright.com 
+id_g_m_397     GetRight/4.x[a-e]       GetRight download manager       D               http://www.getright.com 
+id_g_m_260807_1        GetRight/6.1 (Pro)      GetRight download manager       D               http://www.getright.com 
+id_g_m_398     GetRightPro/6.0beta2    GetRight download manager       D               http://www.getright.com 
+id_g_m_170706_3        GetWeb/0.1 libwww-perl/5.16     GetWeb - web page to email service      D       216.204.133.xxx http://www.healthnet.org/getweb.php     
+id_g_m_399     GhostRouteHunter/20021130 (https://www.sixxs.net/tools/grh/; info@sixxs.net)    Sixxs Ghost Route Hunter        C               http://www.sixxs.net/tools/grh/ 
+id_g_m_400     gigabaz/3.1x (baz@gigabaz.com; http://gigabaz.com/gigabaz/)     GigaBaz Brainbot (Germany) robot        R       s. also - MicroBaz      http://gigabaz.com      
+id_g_m_401     Gigabot/2.0 (gigablast.com)     Gigablast robot (64.62.168.xx)  R               http://www.gigablast.com        
+id_g_m_140106_1        Gigabot/2.0/gigablast.com/spider.html   Gigablast robot R       comes from 64.62.168.xx AND 66.154.102.xx       http://www.gigablast.com        
+id_g_m_170506_1        Gigabot/2.0; http://www.gigablast.com/spider.html       Gigablast robot R       comes from 64.62.168.xx AND 66.154.102.xx       http://www.gigablast.com        
+id_g_m_190507_1        Gigabot/2.0att  Gigablast robot R       66.231.188.1xx  http://www.gigablast.com        
+id_g_m_230508_1        Gigabot/3.0 (http://www.gigablast.com/spider.html)      Gigablast robot R       66.231.18x.[x]xx        http://www.gigablast.com        
+id_g_m_402     Gigabot/x.0     Gigablast robot (64.62.168.xx)  R               http://www.gigablast.com        
+id_g_m_403     GigabotSiteSearch/2.0 (sitesearch.gigablast.com)        Gigablast robot (64.62.168.xx)  R               http://www.gigablast.com        
+id_g_m_404     GNODSPIDER (www.gnod.net)       www.gnod.net spider     R               http://www.gnod.net     
+id_g_m_406     Go!Zilla 3.x (www.gozilla.com)  Go!Zilla download manager       D               http://www.gozilla.com  
+id_g_m_407     Go!Zilla/4.x.x.xx       Go!Zilla download manager       D               http://www.gozilla.com  
+id_g_m_405     Go-Ahead-Got-It/1.1     GotIt web accelerator (discontinued)    P D                     
+id_g_m_408     Goblin/0.9 (http://www.goguides.org/)   GoGuides.Org (195.226.137.xx) robot     R               http://www.goguides.org/goblin-info.html        
+id_g_m_409     Goblin/0.9.x (http://www.goguides.org/goblin-info.html) GoGuides.Org (195.226.137.xx) robot     R               http://www.goguides.org/goblin-info.html        
+id_g_m_410     GoForIt.com     GoForIt Search robot    R       208.109.236.xx  http://www.goforit.com  
+id_g_m_411     GOFORITBOT ( http://www.goforit.com/about/ )    GoForIt Search robot    R       208.109.236.xx  http://www.goforit.com  
+id_g_m_020306_1        GoGuides.Org Link Check GoGuides.org directory & search link checking   C               http://www.goguides.org/        
+id_g_m_230207_2        GoldenFeed Spider 1.0 (http://www.goldenfeed.com)       GoldenFeed.com - RSS search engine      C       74.52.41.1xx    http://www.goldenfeed.com/      
+id_g_m_412     Goldfire Server Invention Machines Goldfire Server      P               http://www.invention-machine.com/custsupport/GFR_install.cfm    
+id_g_m_041006_1        gonzo1[P] +http://www.suchen.de/popups/faq.jsp  suchen.de German local search robot     R       212.34.185.xx   http://www.suchen.de/   
+id_g_m_130108_2        gonzo2[P] +http://www.suchen.de/faq.html        suchen.de German local search robot     R       212.34.185.xx   http://www.suchen.de/   
+id_g_m_413     Goofer/0.2      Some private robot (Wanadoo.fr client)  R                       
+id_g_m_300606_1        Google Talk     Google instant messenger        B               http://www.google.com/talk/     
+id_g_m_414     googlebot (larbin2.6.0@unspecified.mail)        Packard Bell Net user robot (*not* Google)                              
+id_g_m_050106_1        Googlebot-Image/1.0     Google image crawler (66.249.72.xxx)    R               http://www.google.com   
+id_g_m_415     Googlebot-Image/1.0 ( http://www.googlebot.com/bot.html)        Google image crawler (66.249.72.xxx)    R               http://www.google.com   
+id_g_m_416     Googlebot/2.1 ( http://www.google.com/bot.html) Google robot 66.249.64.XXX      R       s. also: - Mozilla/4.0 (MobilePhone SCP ... - Mozilla/5.0 (compatible; Googlebot/2.1... http://www.google.com   
+id_g_m_417     Googlebot/2.1 ( http://www.googlebot.com/bot.html)      Google robot 66.249.64.XXX      R               http://www.google.com   
+id_g_m_418     Googlebot/Test ( http://www.googlebot.com/bot.html)     Google robot 66.249.64.XXX      R               http://www.google.com   
+id_g_m_280209_2        Gordon's Spider/Nutch-0.9 (http://www.sharethis.com; gordon@sharethis.com)      ShareThis social networking service via Amazon Web Services     C       174.129.242.x   http://sharethis.com/   http://www.amazonaws.com/
+id_g_m_419     GrapeFX/0.3 libwww/5.4.0        Grapeshot web search system API R               http://www.grapeshot.co.uk/html/Index.html      
+id_g_m_300907_4        great-plains-web-spider/flatlandbot (Flatland Industries Web Spider; http://www.flatlandindustries.com/flatlandbot.php; jason@flatlandindustries.com)   Flatland Industries vertical search solution    R       74.62.161.xx    http://www.flatlandindustries.com/      http://www.flatlandindustries.com/flatlandbot.php
+id_g_m_250707_2        GreatNews/1.0   GreatNews 1.0 Beta RSS reader   B               http://www.curiostudio.com/     
+id_g_m_170207_2        GreenBrowser    GreenBrowser - IE based browser (China) B               http://www.morequick.com/indexen.htm    
+id_g_m_100307_2        gridwell (http://search.gridwell.com)   search gridwell favicon display D       212.227.127.xx  http://search.gridwell.com/     
+id_g_m_420     GrigorBot 0.8 (http://www.grigor.biz/bot.html)  Grigor Search bot       R               http://www.grigor.biz   
+id_g_m_161206_1        Gromit/1.0      Australasian Legal Information Institute (AustLII) robot        R               http://www.austlii.edu.au/      http://www2.austlii.edu.au/~dan/gromit/
+id_g_m_421     grub crawler(http://www.grub.org)       Grub open source crawler        R               http://www.grub.org     
+id_g_m_422     grub-client     Grub open source crawler        R               http://www.grub.org     
+id_g_m_423     gsa-crawler (Enterprise; GID-01422; jplastiras@google.com)      Google Search Appliance robot (216.239.xx.xx)   R               http://www.google.com/enterprise/gsa/   
+id_g_m_424     gsa-crawler (Enterprise; GID-01742;gsatesting@rediffmail.com)   Google Search Appliance robot (216.239.xx.xx)   R               http://www.google.com/enterprise/gsa/   
+id_g_m_060506_1        gsa-crawler (Enterprise; GIX-02057; dm@enhesa.com)      Google Enterprise Search Appliance used by Enhesa (212.35.100.1xx)      R               http://www.enhesa.com/enhesa/en/default.asp     http://www.google.com/enterprise/gsa/
+id_g_m_311205_1        gsa-crawler (Enterprise; GIX-03519; cknuetter@stubhub.com)      Google Enterprise Search Appliance used by IBM (129.41.20.1xx)  R               http://www.google.com/enterprise/gsa/   
+id_g_m_425     gsa-crawler (Enterprise; GIX-0xxxx; enterprise-training@google.com)     Google Search Appliance robot (216.239.xx.xx)   R               http://www.google.com/enterprise/gsa/   
+id_g_m_081006_1        GSiteCrawler/v1.xx rev. xxx (http://gsitecrawler.com/)  GSiteCrawler - Google sitemap generator for Windows     C               http://gsitecrawler.com/        
+id_g_m_260207_1        Guestbook Auto Submitter        Guestbook spamming tool S                       
+id_g_m_426     Gulliver/1.3    Northernlight robot     R               http://www.northernlight.com    
+id_g_m_427     Gulper Web Bot 0.2.4 (www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)     Yuntis Collaborative Web Resource Categorization and Ranking Project robot      R               http://www.ecsl.cs.sunysb.edu/yuntis/   
+id_g_m_140907_1        Gungho/0.08004 (http://code.google.com/p/gungho-crawler/wiki/Index)     Gungho - Extensible web crawler written in Perl by Google Code  R               http://code.google.com/p/gungho-crawler/wiki/Index      
+id_g_m_211106_1        GurujiBot/1.0 (+http://www.guruji.com/WebmasterFAQ.html)        guruji : the Indian search engine robot R       209.128.80.1xx / 72.20.109.xx   http://www.guruji.com/  
+id_g_m_100508_2        GurujiImageBot/1.0 (+http://www.guruji.com/en/WebmasterFAQ.html)        guruji : the Indian search engine picture crawler       R       72.20.109.xx    http://www.guruji.com/  
+id_g_m_291108_3        Haier-T10C/1.0 iPanel/2.0 WAP2.0 (compatible; UP.Browser/6.2.2.4; UPG1; UP/4.0; Embedded)       Openwave Mobile Browser on Haier T10C mobile    B               http://www.openwave.com 
+id_g_m_171105_5        HappyFunBot/1.1 Happy Fun Search robot  R               http://www.happyfunsearch.com/bot.html  
+id_g_m_428     Harvest-NG/1.0.2        Harvest-NG web crawler used by search.yahoo.com R       see also Exalead NG and NG/1.0  http://search.yahoo.com 
+id_g_m_429     Haste/0.12 (HOME: http://haste.kytoon.com/)     Haste - web mapping and monitoring system       R C     site is closed  http://haste.kytoon.com 
+id_g_m_430     Hatena Antenna/0.4 (http://a.hatena.ne.jp/help#robot)   Hatena::Antenna Japan robot     R       221.186.146.xx  http://a.hatena.ne.jp   
+id_g_m_110606_2        Hatena Mobile Gateway/1.0       Hatena Japan proxy for handheld/mobile clients  P       221.186.146.xx  http://www.hatena.ne.jp/        
+id_g_m_431     Hatena Pagetitle Agent/1.0      Hatena Japan robot      R       221.186.146.xx  http://www.hatena.ne.jp 
+id_g_m_240207_1        Hatena RSS/0.3 (http://r.hatena.ne.jp)  Hatena Japan RSS feed robot     R       221.186.146.xx  http://www.hatena.ne.jp 
+id_g_m_110606_1        HatenaScreenshot/1.0 (checker)  Hatena::Diary (Japan) web page screenshot robot R D     221.186.146.xx  http://www.hatena.ne.jp/        
+id_g_m_120108_1        hbtronix.spider.2 -- http://hbtronix.de/spider.php      hbtronix.spider - Domain name spider (Germany)  R       89.110.157.*    http://hbtronix.de/spider.php   
+id_g_m_432     HeinrichderMiragoRobot  Mirago Germany robot    R               http://www.mirago.de/   
+id_g_m_433     HeinrichderMiragoRobot (http://www.miragorobot.com/scripts/deinfo.asp)  Mirago Germany robot    R               http://www.mirago.de/   
+id_g_m_434     Helix/1.x ( http://www.sitesearch.ca/helix/)    Helix - The SiteSearch (Canada) web crawler     R               http://www.sitesearch.ca        
+id_g_m_080206_3        HenriLeRobotMirago (http://www.miragorobot.com/scripts/frinfo.asp)      Mirago France robot     R               http://www.mirago.fr/   
+id_g_m_435     HenrytheMiragoRobot     Mirago search (UK) robot        R       217.154.245.2xx http://www.mirago.co.uk 
+id_g_m_060806_3        HenryTheMiragoRobot (http://www.miragorobot.com/scripts/mrinfo.asp)     Mirago search (UK) robot        R       217.154.245.2xx http://www.mirago.co.uk 
+id_g_m_436     hgrepurl/1.0    O'Reilly's Perl LWP example client program from Web Client Programming with Perl                                
+id_g_m_437     Hi! I'm CsCrawler my homepage: http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html RPT-HTTPClient/0.3-3        University of Kassel Germany CsCrawler using the HTTPClient library     R               http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html    http://www.innovation.ch/java/HTTPClient/
+id_g_m_438     HiDownload      HiDownload download manager     D               http://www.streamingstar.com/hidownload.htm     
+id_g_m_439     Hippias/0.9 Beta        Hippias robot   R       site is offline http://hippias.evansville.edu   
+id_g_m_440     HitList Pilot Hitlist web analytics solution    R               http://www.pilotsoftware.com/products_solutions/hitlist.html    
+id_g_m_441     Hitwise Spider v1.0 http://www.hitwise.com      Hitwise spider  R               http://www.hitwise.com  
+id_g_m_442     HLoader diff. IPs / unknown services            i.e.: - 204.95.207.xxx user agent ? - 66.27.113.xx link checking ?              
+id_g_m_040907_1        holmes/3.11 (http://morfeo.centrum.cz/bot)      Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx       R               http://morfeo.centrum.cz/       
+id_g_m_220906_2        holmes/3.9 (onet.pl)    Onet.pl (Poland) search robot   R       213.180.137.xx  http://szukaj.onet.pl/  
+id_g_m_181006_1        holmes/3.xx (OnetSzukaj/5.0; +http://szukaj.onet.pl)    Onet.pl (Poland) search robot   R       213.180.137.xx  http://szukaj.onet.pl/  
+id_g_m_443     holmes/x.x      Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx       R               http://morfeo.centrum.cz/       
+id_g_m_021108_2        HolmesBot (http://holmes.ge)    Holmes search robot (Georgia)   R       77.92.229.3x    http://holmes.ge/       
+id_g_m_444     HomePageSearch(hpsearch.uni-trier.de)   HomePageSearch robot    R               http://hpsearch.uni-trier.de/   
+id_g_m_445     Homerbot: www.homerweb.com      Homerweb search robot   R               http://www.homerweb.com 
+id_g_m_220606_1        Honda-Search/0.7.2 (Nutch; http://lucene.apache.org/nutch/bot.html; search@honda-search.com)    Honda-Search.com - Honda cars related search robot      R       69.16.227.1xx   http://www.honda-search.com/    
+id_g_m_090206_1        HooWWWer/2.1.3 (debugging run) (+http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info<at>hiit.fi)        HooWWer - Next Generation Information Retrieval robot   R               http://cosco.hiit.fi    
+id_g_m_446     HooWWWer/2.1.x ( http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info<at>hiit.fi)        HooWWer - Next Generation Information Retrieval robot (128.214.112.xx)  R               http://cosco.hiit.fi/   
+id_g_m_447     HotJava/1.0.1/JRE1.1.x  HotJava browser plus HTML Component 1.1.x       B                       
+id_g_m_448     Hotzonu/x.0     Hotzonu - Japanese BBS reader client    B               http://hotzonu.hp.infoseek.co.jp/       
+id_g_m_040507_1        HPL/Nutch-0.9 - Unknown robot from HP Labs      R       15.203.249.12x  http://hpl.hp.com/      
+id_g_m_449     htdig/3.1.6 (http://computerorgs.com)   COMPUTERorgs.com robot (205.134.190.xxx) using htdig    R               http://www.computerorgs.com/    http://www.htdig.org
+id_g_m_210106_1        htdig/3.1.6 (unconfigured@htdig.searchengine.maintainer)        htdig used by the Academie de Toulouse  R       reads robots.txt        http://www.ac-toulouse.fr/html/_.php    http://www.htdig.org
+id_g_m_450     htdig/3.1.x (root@localhost)    htdig search tool       R               http://www.htdig.org    
+id_g_m_451     Html Link Validator (www.lithopssoft.com)       Lithops Software link validation tool   C               http://www.lithopssoft.com      
+id_g_m_110506_3        HTML2JPG Blackbox, http://www.html2jpg.com      HTML2JPG webpage to image converter     D               http://www.html2jpg.com 
+id_g_m_452     HTML2JPG Enterprise     HTML2JPG webpage to image converter     D               http://www.html2jpg.com 
+id_g_m_101205_1        HTMLParser/1.x  HTML Parser Java library to parse HTML  D               http://sourceforge.net/projects/htmlparser      
+id_g_m_071006_1        HTTP Retriever  PHP HTTP client to access Web servers   D               http://code.blitzaffe.com/pages/home/   
+id_g_m_240306_1        http://Anonymouse.org/ (Unix)   Anonymous web proxy service     P               http://anonymouse.org/  
+id_g_m_453     http://Ask.24x.Info/ (http://narres.it/)        Ask 24x Info (Germany) DMOZ related robot       R               http://narres.it        
+id_g_m_070209_6        http://hilfe.acont.de/bot.html ACONTBOT ACONTBOT - Acont search Germany robot   R       82.149.246.2x   http://acont.de/        http://hilfe.acont.de/bot.htm
+id_g_m_230408_1        http://OzySoftware.com/Index.html       OzySoftware.com software directory link checking        C       202.173.141.x   http://ozysoftware.com/index.html       
+id_g_m_454     http://www.almaden.ibm.com/cs/crawler   IBM's Almaden Research robot    R       s. also: - FocusedSampler - WFARC       http://www.almaden.ibm.com      
+id_g_m_455     http://www.almaden.ibm.com/cs/crawler [rc1.wf.ibm.com]  IBM's Almaden Research robot    R               http://www.almaden.ibm.com      
+id_g_m_456     http://www.almaden.ibm.com/cs/crawler [wf216]   IBM's Almaden Research robot    R               http://www.almaden.ibm.com      
+id_g_m_271105_4        http://www.istarthere.com_spider@istarthere.com Istarthere.com search robot     R               http://www.istarthere.com/      
+id_g_m_070106_1        http://www.monogol.de   Monogol - German open source search engine project (195.226.167.1xx)    R               http://www.monogol.de/  
+id_g_m_060806_4        http://www.trendtech.dk/spider.asp)     TrendTech Search Engine (Denmark) robot R       87.104.18.xx    http://www.trendtech.dk/        
+id_g_m_290106_1        HTTP::Lite/2.x.x        HTTP::Lite - Standalone Perl module for retrieving HTTP documents       D               http://www.toybox.ca/http-lite/ 
+id_g_m_050108_1        HTTPEyes        HTTPEyes - Web proxy cache      P               http://bachue.com/httpeyes/     
+id_g_m_457     HTTPResume v. 1.x       HTTPResume Amiga download manager       D               http://tesla.rcub.bg.ac.yu/%7Eantony/HTTPResume/        
+id_g_m_031107_2        httpunit/1.5    HttpUnit - Java test code for emulating browser behaviour       B               http://httpunit.sourceforge.net/        
+id_g_m_090306_1        httpunit/1.x    HttpUnit - Java browser behavior simulation tool        B               http://httpunit.sourceforge.net/        
+id_g_m_010807_1        Hybrid/1.2 [en] (OS Independent)        Hybrid Share mono C#/Gtk# application for file sharing                  http://hybrid-share.sourceforge.net/index.php   
+id_g_m_300507_1        HyperEstraier/1.x.xx    Hyper Estraier full-text search system  D               http://hyperestraier.sourceforge.net/   
+id_g_m_170906_1        i1searchbot/2.0 (i1search web crawler; http://www.i1search.com; crawler@i1search.com)   i1search robot  R       65.111.164.1xx  http://www.i1search.com/        
+id_g_m_461     IAArchiver-1.0  Alexa / The Internet Archive (209.237.238.1xx)  R               http://www.alexa.com    
+id_g_m_091205_2        iaskspider      Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)              Not from iask.com.cn - s. also Mozilla/5.0 (compatible; iaskspider/1.0 ..               
+id_g_m_111106_1        iaskspider2 (iask@staff.sina.com.cn)    Iask search / Sina portal robot (China) R       202.106.184.xxx http://iask.com/        http://english.sina.com/index.html
+id_g_m_458     ia_archiver     Alexa / The Internet Archive (209.237.238.1xx)  R               http://www.alexa.com    
+id_g_m_459     ia_archiver-web.archive.org     Alexa / The Internet Archive (209.237.238.1xx)  R               http://www.alexa.com    
+id_g_m_460     ia_archiver/1.6 Alexa / The Internet Archive (209.237.238.1xx)  R               http://www.alexa.com    
+id_g_m_462     IBrowse/2.2 (AmigaOS 3.5)       IOSpirit iBrowse Amiga Browser  B       was Hisoft (http://www.hisoft.co.uk)    http://amiga.iospirit.de/       
+id_g_m_463     IBrowse/2.2 (Windows 3.1)       IOSpirit iBrowse Amiga Browser  B       was Hisoft (http://www.hisoft.co.uk)    http://amiga.iospirit.de/       
+id_g_m_464     iCab/2.5.2 (Macintosh; I; PPC)  iCab MAC Web browser    B               http://www.icab.de      
+id_g_m_110207_2        ICC-Crawler(Mozilla-compatible; http://kc.nict.go.jp/icc/crawl.html; icc-crawl(at)ml(dot)nict(dot)go(dot)jp)    Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)     R       202.180.34.1xx  http://kc.nict.go.jp/icc/crawl.html     
+id_g_m_250607_1        ICC-Crawler(Mozilla-compatible;http://kc.nict.go.jp/icc/crawl.html;icc-crawl-contact(at)ml(dot)nict(dot)go(dot)jp)      Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)     R       202.180.34.1xx  http://kc.nict.go.jp/icc/crawl.html     
+id_g_m_465     iCCrawler (http://www.iccenter.net)     ICJobs - Intelligence Competence Center (Germany) robot R       212.227.76.xx   http://www.iccenter.net 
+id_g_m_121006_1        ICCrawler - ICjobs (http://www.icjobs.de/bot.htm)       ICJobs - Intelligence Competence Center (Germany) robot R       212.227.76.xx   http://www.iccenter.net 
+id_g_m_466     ICE Browser/5.05 (Java 1.4.0; Windows 2000 5.0 x86)     ICE Java browser        B               http://www.ii.uib.no/~alexey/jb/        
+id_g_m_040206_2        ichiro/x.0 (http://help.goo.ne.jp/door/crawler.html)    Goo Japan / Inktomi robot (210.173.179.xx)      R       s. also moget / mogimogi        http://www.goo.ne.jp    
+id_g_m_468     ichiro/x.0 (ichiro@nttr.co.jp)  Goo Japan / Inktomi robot (210.173.179.xx)      R       s. also moget / mogimogi        http://www.goo.ne.jp    
+id_g_m_469     IconSurf/2.0 favicon finder (see http://iconsurf.com/robot.html)        Iconsurf.com - Visual Surf Engine / favicon finder      R               http://iconsurf.com     
+id_g_m_470     IconSurf/2.0 favicon monitor (see http://iconsurf.com/robot.html)       Iconsurf.com - Visual Surf Engine / favicon finder      R               http://iconsurf.com     
+id_g_m_471     ICOO Loader v.x.x.x     icooLoader download manager     D               http://www.icoonet.com  
+id_g_m_472     ICRA_label_spider/x.0   ICRA (Internet Content Rating Association) label spider R               http://www.icra.org     
+id_g_m_473     icsbot-0.1      ICS Robot Search Engine (International Christian school of Seoul)       R               http://icseoul.org/     
+id_g_m_260306_1        IDA     Internet Download Accelerator   D               http://www.westbyte.com/ida/    
+id_g_m_474     ideare - SignSite/1.x   Janas (Ideare.com / Tiscali.it) robot   R                       
+id_g_m_200806_1        iearthworm/1.0, iearthworm@yahoo.com.cn Unknown UA from Yahoo China             202.165.105.x           
+id_g_m_475     IEFav172Free    Some bookmark manager   C       possibly Visit URL ??   http://www.lodz.pdi.net/%7Eeristic/free/index.html      
+id_g_m_060608_4        iFeed.jp/2.0 (www.psychedelix.com/agents/agents.rss; 0 subscribers)     iFeed.jp - online rss aggregator (in development)       R       67.15.2[3-4][X].xxx     http://www.ifeed.jp/    
+id_g_m_281207_1        igdeSpyder (compatible; igde.ru; +http://igde.ru/doc/tech.html) Igde search (Russia) robot      R       87.118.118.12x  http://igde.ru/ 
+id_g_m_476     iGetter/1.x (Macintosh;G;PPC)   iGetter download manager        D               http://www.igetter.net  
+id_g_m_477     iGetter/2 (Macintosh; U; PPC Mac OS X; en)      iGetter download manager        D               http://www.igetter.net  
+id_g_m_120507_1        IIITBOT/1.1 (Indian Language Web Search Engine; http://webkhoj.iiit.net; pvvpr at iiit dot ac dot in)   Webkhoj - Indian language search engine R       196.12.53.xx    http://webkhoj.iiit.net/        
+id_g_m_040607_2        ilial/Nutch-0.9 (Ilial, Inc. is a Los Angeles based Internet startup company. For more information please visit http://www.ilial.com/crawler; http://www.ilial.com/crawler; crawl@ilial.com)    Ilial Knowledge Search robot    R       72.44.58.2xx    http://www.ilial.com/crawler/   
+id_g_m_290906_1        ilial/Nutch-0.9-dev     Unknown robot from UCLA using Nutch     R       164.67.195.xx   http://www.ucla.edu/    http://lucene.apache.org/nutch/
+id_g_m_270806_1        IlseBot/1.x     Ilse Netherlands robot (62.69.178.xx)   R       s. also INGRID/3.0 .. / Mozilla/3.0 (INGRID/3.0 ..      http://www.ilse.nl/     
+id_g_m_478     IlTrovatore-Setaccio ( http://www.iltrovatore.it)       Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_479     Iltrovatore-Setaccio/0.3-dev (Indexing; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)        Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_480     IlTrovatore-Setaccio/1.2 ( http://www.iltrovatore.it/aiuto/faq.html)    Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_481     Iltrovatore-Setaccio/1.2 (It-bot; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)      Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_482     iltrovatore-setaccio/1.2-dev (spidering; http://www.iltrovatore.it/aiuto/.....) Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_040506_1        IlTrovatore/1.2 (IlTrovatore; http://www.iltrovatore.it/bot.html; bot@iltrovatore.it)   Il Trovatore - Italian search engine robot      R       213.215.201.2xx http://www.iltrovatore.it       
+id_g_m_060107_2        ImageVisu/v4.x.x        ImageVisu image and graphics viewer - display files from the Web (HTTP and ECWP)        B               http://geovisu.free.fr/imagvisu/english/        
+id_g_m_080907_1        ImageWalker/2.0 (www.bdbrandprotect.com)        BD-Brandprotect copyright infringement crawler  R       72.14.164.1xx   http://www.bdbrandprotect.com/  http://www.bdbrandprotect.com/solutions_5.html
+id_g_m_110306_1        Incutio HttpClient v0.x HttpClient - a PHP Web Client Class                     http://scripts.incutio.com/httpclient/index.php 
+id_g_m_483     IncyWincy data gatherer(webmaster@loopimprovements.com  IncyWincy search engine using DMOZ Open Directory database      R               http://www.loopimprovements.com 
+id_g_m_484     IncyWincy page crawler(webmaster@loopimprovements.com   IncyWincy search engine using DMOZ Open Directory database      R               http://www.loopimprovements.com 
+id_g_m_485     IncyWincy(http://www.look.com)  Look.com robot using IncyWincy search engine    R               http://www.loopimprovements.com 
+id_g_m_486     IncyWincy(http://www.loopimprovements.com/robot.html)   IncyWincy search engine using DMOZ Open Directory database      R               http://www.loopimprovements.com 
+id_g_m_487     IncyWincy/2.1(loopimprovements.com/robot.html)  IncyWincy search engine using DMOZ Open Directory database      R               http://www.loopimprovements.com 
+id_g_m_488     IndexTheWeb.com Crawler7        Index the Web (69.57.134.xx) crawler    R               http://www.indextheweb.com/     
+id_g_m_489     Industry Program 1.0.x  Spam bot from diff. IPs S       see also Educate Search VxB - Full Web Bot              
+id_g_m_490     Inet library    Inet Library Resource Center robot      R               http://www.inetlibrary.com      
+id_g_m_491     InetURL/1.0     InetURL IVM (phone software) plugin for web server access ?                     http://www.nch.com.au/ivm/plugins.html  
+id_g_m_270607_1        info@pubblisito.com- (http://www.pubblisito.com) il Sud dei Motori di Ricerca   Pubblisito.com search - Italia  R       88.149.164.2xx  http://www.pubblisito.com/search/       
+id_g_m_211208_2        Infoaxe./Nutch-0.9      Infoaxe - search history and bookmark service   C       75.126.48.17x   http://www.infoaxe.com/ 
+id_g_m_492     infoConveraCrawler/0.8 ( http://www.authoritativeweb.com/crawl) Converas RetrievalWare Internet Spider (63.241.61.x)    R S ?   s.also - Convera... Maybe does guestbook / forum spamming s. here http://www.webmasterworld.com/forum11/2871.htm        http://www.convera.com/Products/        
+id_g_m_493     InfoFly/1.0 (http://www.versions-project.org/)  Versions-project.org Ingelin spider     R               http://www.versions-project.org/        
+id_g_m_494     InfoLink/1.x    InfoLink link checking tool     C               http://www.biggbyte.com/biggbyte3/index.html    
+id_g_m_495     INFOMINE/8.0 Adders     INFOMINE Scholary Internet Resource Collection crawler  R               http://infomine.ucr.edu 
+id_g_m_496     INFOMINE/8.0 RemoteServices     INFOMINE Scholary Internet Resource Collection crawler  R               http://infomine.ucr.edu 
+id_g_m_497     INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents)     INFOMINE Scholary Internet Resource Collection crawler  R               http://infomine.ucr.edu 
+id_g_m_498     InfoNaviRobot(F107)     164.71.1.1xx jp.co.fujitsu.t2 Robot     R                       
+id_g_m_499     InfoSeek Sidewinder/0.9 Infoseek robot  R               http://www.infoseek.com 
+id_g_m_500     InfoSeek Sidewinder/1.0A        Infoseek robot  R               http://www.infoseek.com 
+id_g_m_501     InfoSeek Sidewinder/1.1A        Infoseek robot  R               http://www.infoseek.com 
+id_g_m_502     Infoseek SideWinder/1.45 (Compatible; MSIE 10.0; UNIX)  Infoseek robot  R               http://www.infoseek.com 
+id_g_m_503     Infoseek SideWinder/2.0B (Linux 2.4 i686)       Infoseek Japan robot    R       210.148.160.1xx http://www.infoseek.com 
+id_g_m_504     INGRID/3.0 MT (webcrawler@NOSPAMexperimental.net; http://webmaster.ilse.nl/jsp/webmaster.jsp)   Ilse Netherlands robot (62.69.178.xx)   R       s.also - Mozilla/3.0 (INGRID/3.0 .. / IlseBot/1.0 ..    http://www.ilse.nl/     
+id_g_m_505     Inktomi Search  Inktomi (Hotbot-Lycos NBCi etc.) robot  R               http://www.inktomi.com/ 
+id_g_m_506     InnerpriseBot/1.0 (http://www.innerprise.com/)  Enterprise Search engine software (64.202.165.xxx)      R       s. also - Enterprise_Search - ES.NET_Crawler    http://www.innerprise.net       
+id_g_m_111205_4        Insitor.com search and find world wide! Insitor Search robot (80.67.20.1xx)     R       s. also Insitornaut     http://www.insitor.com/ 
+id_g_m_121205_3        Insitornaut     Insitor Search robot (80.67.20.1xx)     R       s. also Insitor.com     http://www.insitor.com/ 
+id_g_m_507     InstallShield DigitalWizard     download manager        D                       
+id_g_m_200308_1        integrity/1.6   Integrity - website broken link checker for MAC OSx     C               http://peacockmedia.co.uk/index.php/products/7-products/4-integrity     
+id_g_m_010907_1        Intelix/0.x (cs; http://www.microton.cz/intelix/; microton@@microton.cz)        Microton Intelix robot for Eurotran translation software ?      D               http://www.microton.cz/intelix/ 
+id_g_m_508     Interarchy/x.x.x (InterarchyCrawler)    Interarchy file transfer software - SFTP/FTP client for Mac OS X        D               http://www.interarchy.com       
+id_g_m_509     Internet Ninja x.0      Dream Train (Japan) Internet search robot       R               http://www.dti.ne.jp    
+id_g_m_510     InternetArchive/0.8-dev(Nutch;http://lucene.apache.org/nutch/bot.html;nutch-agent@lucene.apache Heritrix - The Internet Archive's open-source crawler based on Nutch (207.241.225.2xx)  R       s.also - archive.org_bot - Mozilla/5.0 (compatible;archive.org_bot/...  http://www.archive.org/ http://lucene.apache.org
+id_g_m_511     InternetLinkAgent/3.1   Internet Link Agent - link checking tool        C               http://www.osk.3web.ne.jp/~goronyan/winprg/sub.shtml    
+id_g_m_512     InternetSeer.com        Internetseer Web site monitoring / Claymont robot       R               http://www.internetseer.com     
+id_g_m_513     intraVnews/1.x  intraVNews - Feed reader & RSS aggregator for Outlook   B               http://www.intravnews.com       
+id_g_m_061208_1        IOI/2.0 (ISC Open Index crawler; http://index.isc.org/; bot@index.isc.org)      Internet Open Index crawler using Nutch R       149.20.54.1xx   http://index.isc.org/   http://www.nutch.org
+id_g_m_514     IP*Works! V5 HTTP/S Component - by /n software - www.nsoftware.com      IP*Works! HTTP Component                        http://www.nsoftware.com/products/controls/?ctl=HTTP    
+id_g_m_515     http://www.ip2location.com      IP2Location - Reverse lookup geographical data and ISP by IP    R C             http://www.ip2location.com      
+id_g_m_270106_1        IP2MapBot/1.1 <a href=http://www.ip2map.com>http://www.ip2map.com</a>   IP2Map - geographical IP mapping        R C             http://www.ip2map.com/  
+id_g_m_516     IPiumBot laurion(dot)com        Laurions Ipium robot    R               http://www.laurion.com  
+id_g_m_517     IpselonBot/0.xx-beta (Ipselon; http://www.ipselon.com; ipselonbot@ipselon.com)  Ipselon Web Search robot        R               http://www.ipselon.com  
+id_g_m_518     Iria/1.xxa      Iria download manager   D               http://www5.tok2.com/home/koteturamu/soft/iria.htm      
+id_g_m_519     IRLbot/1.0 ( http://irl.cs.tamu.edu/crawler)    IRL-crawler - Texas A&M University research project crawler     R       128.194.135.xx  http://irl.cs.tamu.edu  
+id_g_m_240308_4        IRLbot/3.0 (compatible; MSIE 6.0; http://irl.cs.tamu.edu/crawler/)      IRL-crawler - Texas A&M University research project crawler     R       128.194.135.xx  http://irl.cs.tamu.edu  
+id_g_m_520     IrssiUrlLog/0.2 url_log - Irssi Perl url grabber                        http://www.irssi.org/scripts/html/url_log.pl.html       
+id_g_m_521     Irvine/1.x.x    Irvine downloading tool D               http://hp.vector.co.jp/authors/VA024591/        
+id_g_m_140506_1        ISC Systems iRc Search 2.1      Unknown spambot / harvester from diff. IPs      S               http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1    
+id_g_m_030106_1        iSiloX/4.xx Windows/32  iSiloX document converter for iSilo reader      B               http://www.isilox.com/  
+id_g_m_522     isurf (tszhu@canada.com)        Unknown University of Alberta link-checking ?   C               http://www.ualberta.ca  
+id_g_m_150408_5        iTunes/x.x.x    iTunes UA name for access and decrypt the iTunes music store pages      B               http://www.apple.com/itunes/    
+id_g_m_523     IUPUI Research Bot v 1.9a       Some spam bot from 66.139.78.xx(x)      S                       
+id_g_m_280906_1        iVia Page Fetcher (http://ivia.ucr.edu/useragents.shtml)        iVia robot - Open source Internet portal & virtual library system software      D               http://ivia.ucr.edu/    
+id_g_m_524     iVia/4.0 CanonizeUrl (http://infomine.ucr.edu/iVia/useragents.shtml     iVia robot - Open source Internet portal & virtual library system software      D               http://ivia.ucr.edu/    
+id_g_m_180707_1        IWAgent/ 1.0 - www.brandprotect.com     BD BrandProtect - brand, company or trademarks online monitoring        R       72.14.164.1xx   http://www.brandprotect.com/    
+id_g_m_525     J-PHONE/3.0/J-SH07      Proxy message from jp-q.ne.jp   P                       
+id_g_m_526     Jabot/6.x (http://odin.ingrid.org/)     ODIN Directory Japan robot (163.138.95.xx)      R               http://www.ingrid.org   
+id_g_m_527     Jabot/7.x.x (http://odin.ingrid.org/)   ODIN Directory Japan robot (163.138.95.xx)      R               http://www.ingrid.org   
+id_g_m_528     Jack    German Domanova (offline since Feb.02) robot    R                       
+id_g_m_529     Jakarta Commons-HttpClient/2.0xxx       Jakarta Commons (Java based) HTTP client        B               http://jakarta.apache.org/commons/httpclient/   
+id_g_m_530     Jakarta Commons-HttpClient/3.0-rcx      Jakarta Commons (Java based) HTTP client        B               http://jakarta.apache.org/commons/httpclient/   
+id_g_m_240306_3        Jambot/0.1.x (Jambot; http://www.jambot.com/blog; crawler@jambot.com)   JamBot search robot (70.146.82.xx)      R               http://www.jambot.com/  
+id_g_m_130108_1        Jambot/0.2.1 (Jambot; http://www.jambot.com/blog/static.php?page=webmaster-robot; crawler@jambot.com)   JamBot search robot     R       70.146.82.xx    http://www.jambot.com/  
+id_g_m_531     Java 1.1        Java VM                 http://java.sun.com/    
+id_g_m_532     Java/1.4.1_01   Java VM R B D   used as robot from 194.203.40.xx        http://java.sun.com/    
+id_g_m_533     Java1.0.21.0    Java VM B               http://java.sun.com/    
+id_g_m_534     Java1.1.xx.x    Java VM                 http://java.sun.com/    
+id_g_m_535     Java1.3.0rc1    Java VM                 http://java.sun.com/    
+id_g_m_536     Java1.3.x       Java VM                 http://java.sun.com/    
+id_g_m_537     Java1.4.0       Java VM R B D   used by diff. IPs for various purposes i.e.: - Dortmund University Java based robot - Roadrunner.net (66.108.xxx.xxx) user robot in conjunction w. RPT-HTTPClient/0.3-3 http://java.sun.com/    http://www.informatik.uni-dortmund.DE
+id_g_m_538     Jayde Crawler. http://www.jayde.com     Jayde B2B Search robot (66.28.139.xx)   R               http://www.jayde.com    
+id_g_m_539     JBH Agent 2.0   some site downloading tool ? via 61.77.51.xxx   D                       
+id_g_m_540     jBrowser/J2ME Profile/MIDP-1.0 Configuration/CLDC-1.0 (Google WAP Proxy/1.0)    WAP 2.0 / jBrowser for handhelds        B               http://www.jataayusoft.com/DbWAPHH.htm  
+id_g_m_541     JCheckLinks/0.1 RPT-HTTPClient/0.3-1    JCheckLinks Java hyperlink validator    C               http://web.purplefrog.com/%7Ethoth/jchecklinks/ 
+id_g_m_542     JDK/1.1 Java Development Kit                    http://developers.sun.com/index.html    
+id_g_m_543     Jeode/1.x.x     Insignias Jeode (PDA) Java platform     B               http://www.insignia.com/content/products/jvmProducts.shtml      
+id_g_m_544     Jetbot/1.0      JetEye Search robot (64.62.142.xxx / 64.71.144.xxx)     R               http://www.jeteye.com   
+id_g_m_545     JetBrains Omea Reader 1.0.x (http://www.jetbrains.com/omea_reader/)     Omea RSS - Atom - newsgroups web page reader    B               http://www.jetbrains.com/omea_reader/   
+id_g_m_546     JetBrains Omea Reader 2.0 Release Candidate 1 (http://www.jetbrains.com/omea_reader/)   Omea RSS - Atom - newsgroups web page reader    B               http://www.jetbrains.com/omea_reader/   
+id_g_m_547     JetCar  JetCar / Flashget download manager      D               http://www.amazesoft.com        
+id_g_m_548     Jigsaw/2.2.x W3C_CSS_Validator_JFouffa/2.0      Jigsaw - W3C's CSS Validator Server     C               http://jigsaw.w3.org/css-validator/validator-uri.html   
+id_g_m_550     JoBo/1.x (http://www.matuschek.net/jobo.html)   Jobo website downloading program        D B             http://www.matuschek.net/software/jobo/index.html       
+id_g_m_549     JoBo/@JOBO_VERSION@(http://www.matuschek.net/jobo.html) Jobo website downloading program        D B             http://www.matuschek.net/software/jobo/index.html       
+id_g_m_551     JobSpider_BA/1.1        Finacialbot.com - German (213.61.218.xx) job search JobRoboter  R               http://www.finbot.com/jr1.html  
+id_g_m_552     JOC Web Spider  Jocsoft Web Spider - website downloading tool   D B             http://www.jocsoft.com/jws/index.htm    
+id_g_m_051206_5        JordoMedia/1.0 RSS File Reader (http://www.jordomedia.com)      Jordo Media RSS / Atom feed directory link checking     C       216.227.208.1xx http://www.jordomedia.com/      
+id_g_m_090206_2        Journster [alpha] (http://journster.com/)       Journster.com RSS/Atom aggregator       C               http://beta.journster.com/      
+id_g_m_090206_3        Journster.com RSS/Atom aggregator 0.5 (http://www.journster.com/bot.phtml)      Journster.com RSS/Atom aggregator       C               http://beta.journster.com/      
+id_g_m_553     JRTS Check Favorites Utility    Check Favorites bookmark checking       C               http://www.jrtwine.com/Products/CheckFavs/      
+id_g_m_554     JRTwine Software Check Favorites Utility        Check Favorites bookmark checking       C               http://www.jrtwine.com/Products/CheckFavs/      
+id_g_m_555     Jyxobot/x       Jyxo search (Czech Republic) robot (212.71.128.xx)      R               http://jyxo.cz/ 
+id_g_m_556     K-Meleon/0.6 (Windows; U; Windows NT 5.1; en-US; rv:0.9.5) Gecko/20011011       K-meleon browser - Windows 2000 B               http://kmeleon.sourceforge.net/ 
+id_g_m_557     k2spider        Verity K2 Spider ( Network search software)     R               http://www.verity.com/products/pdf/MK0368a_K2_Spider.pdf        
+id_g_m_010108_3        KAIST AITrc Crawler     Unknown robot from AITrc (Advanced Information Technology Research Center) - Korea      R       143.248.134.22x http://aitrc.kaist.ac.kr/english/       
+id_g_m_010506_1        KakleBot - www.kakle.com/0.1 (KakleBot - www.kakle.com; http:// www.kakle.com/bot.html; support@kakle.com)      Kakle ranked metasearch robot   R       216.139.221.1xx http://www.kakle.com/   
+id_g_m_250408_3        kalooga/kalooga-4.0-dev-datahouse (Kalooga; http://www.kalooga.com; info@kalooga.com)   Kalooga image crawler   R       195.210.57.1xx  http://www.kalooga.com/ 
+id_g_m_011108_3        kalooga/KaloogaBot (Kalooga; http://www.kalooga.com/info.html?page=crawler; crawler@kalooga.com)        Kalooga image crawler   R       195.210.57.1xx  http://www.kalooga.com/ 
+id_g_m_558     Kapere (http://www.kapere.com)  Kapere site grapper / web downloader    D               http://www.kapere.com   
+id_g_m_090807_1        Kazehakase/0.x.x.[x]    Kazehakase - Gecko based browser (Japan)        B               http://kazehakase.sourceforge.jp/       
+id_g_m_559     KDDI-SN22 UP.Browser/6.0.7 (GUI) MMP/1.1 (Google WAP Proxy/1.0) Openwave UP.Browser for mobiles via Google WAP Proxy (216.239.33.x)     P               http://www.openwave.com 
+id_g_m_561     Kenjin Spider   Kenjin Spider search agent      R               http://www.kenjin.ne.jp 
+id_g_m_562     Kevin http://dznet.com/kevin/   Dznet.com Kevin crawler (link checking ?) via 68.39.148.xx (nj.comcast.net)     R               http://www.dznet.com    
+id_g_m_563     Kevin http://websitealert.net/kevin/    Website AlertsKevin crawler (website monitoring) via 68.39.148.xx (nj.comcast.net)      R               http://www.websitealert.net     
+id_g_m_560     KE_1.0/2.0 libwww/5.2.8 Voila.fr robot  R               http://www.voila.fr     
+id_g_m_301105_5        KFSW-Bot (Version: 1.01 powered by KFSW www.kfsw.de)    Some Perl search script from KFSW (Germany)     R               http://www.kfsw.de/     
+id_g_m_100206_4        kinja-imagebot (http://www.kinja.com/)  kinja weblog search robot       R               http://www.kinja.com/   
+id_g_m_100206_3        kinjabot (http://www.kinja.com) kinja weblog search robot       R               http://www.kinja.com/   
+id_g_m_564     KIT-Fireball/2.0        Fireball search (Germany) robot R               http://www.fireball.de  
+id_g_m_565     KIT-Fireball/2.0 (compatible; Mozilla 4.0; MSIE 5.5)    Fireball search (Germany) robot R               http://www.fireball.de  
+id_g_m_566     Klondike/1.50 (WSP Win32) (Google WAP Proxy/1.0)        Klondike WAP Browser    B               http://www.apachesoftware.com   
+id_g_m_567     KnowItAll(knowitall@cs.washington.edu)  University of Washington KnowItAll - web information extraction R               http://www.cs.washington.edu    
+id_g_m_568     Knowledge.com/0.x       The knowledge.com (ODP) directory robot R               http://www.knowledge.com        
+id_g_m_569     Kontiki Client x.xx     Kontiki Client download manager D               http://www.kontiki.com/client/userhelp_f.shtml  
+id_g_m_280406_2        Krugle/Krugle,Nutch/0.8+ (Krugle web crawler; http://www.krugle.com/crawler/info.html; webcrawler@krugle.com)   Krugle source code search engine for developers (64.71.164.1xx) R       powered by Nutch        http://www.krugle.com/  
+id_g_m_180606_2        KSbot/1.0 (KnowledgeStorm crawler; http://www.knowledgestorm.com/resources/content/crawler/index.html; crawleradmin@knowledgestorm.com) KnowledgeStorm technology industry crawler for Findtech.com     R       12.129.110.xx   http://www.findtech.com/        http://www.knowledgestorm.com/resources/content/crawler/index.html
+id_g_m_570     kuloko-bot/0.x  Kuloko contextual search robot  R               http://www.kuloko.com/  
+id_g_m_571     kulokobot www.kuloko.com kuloko@backweave.com   Kuloko contextual search robot  R               http://www.kuloko.com   
+id_g_m_572     kulturarw3/0.1  National Library of Sweden Heritage Project robot       R               http://www.kb.se/ENG/kbstart.htm        
+id_g_m_301105_2        KummHttp/1.1 (compatible; KummClient; Linux rulez)      Link or server checking from Sanoma Budapest (195.70.35.xxx)    C R     Sanoma also runs some web-portals i.e. http://www.startlap.com/ http://sanomabp.hu/     
+id_g_m_280209_3        KWC-KX9/1109 UP.Browser/6.2.3.9.g.1.107 (GUI) MMP/2.0 UP.Link/6.3.0.0.0 UP.Browser for mobiles on Kyocera KWC-KX9 cellphone     B               http://www.openwave.com 
+id_g_m_211208_3        Labrador/0.2; http://ir.dcs.gla.ac.uk/labrador; craigm@dcs.gla.ac.uk    TREC Blog Track - Blog and news feed crawler    130.209.241.2xx http://ir.dcs.gla.ac.uk/wiki/TREC-Blog          
+id_g_m_573     Lachesis        Intels Lachesis web site response time monitoring tool  C               ftp://ftp.imag.fr/pub/labo-LSR/DRAKKAR/internet-performance/lachesis/   
+id_g_m_140406_1        lanshanbot/1.0  Unknown robot from Easten Network China (202.96.51.1xx)         reads robots.txt                
+id_g_m_021206_2        lanshanbot/1.0 (+http://search.msn.com/msnbot.htm)      Unknown robot from Easten Network China (202.96.51.1xx)         reads robots.txt                
+id_g_m_271105_1        LapozzBot/1.4 ( http://robot.lapozz.com)        Lapozz search (Hungary) robot (82.131.195.xx)   R               http://www.lapozz.com/  
+id_g_m_280508_3        LapozzBot/1.5 (+http://robot.lapozz.hu) Lapozz search (Hungary) robot (82.131.195.xx)   R               http://www.lapozz.com/  
+id_g_m_574     larbin (samualt9@bigfoot.com)   Larbin indexer used as Metacarta.com (66.28.xx.xxx) robot       R               http://www.metacarta.com/       http://larbin.sourceforge.net/index-eng.html
+id_g_m_592     LARBIN-EXPERIMENTAL (efp@gmx.net)       Unknown robot from 66.230.140.xx (argon.oxeo.com)       S       maybe an e-mail collector - see also Mozilla/4.0 efp@gmx.net            
+id_g_m_575     larbin_2.1.1 larbin2.1.1@somewhere.com  Larbin indexer used by Mitsubishi Electric Research Labs        R               http://www.merl.com     http://larbin.sourceforge.net/index-eng.html
+id_g_m_576     larbin_2.2.0 (crawl@compete.com)        Larbin indexer used as Compete.com crawler      R               http://www.compete.com  http://larbin.sourceforge.net/index-eng.html
+id_g_m_577     larbin_2.2.1_de_Viennot (Laurent.Viennot@inria.fr)      Larbin indexer used as Inria robot      R               http://www.inria.fr/index.en.html       http://larbin.sourceforge.net/index-eng.html
+id_g_m_578     larbin_2.2.2 (sugayama@lab7.kuis.kyoto-u.ac.jp) Larbin indexer used as Kyoto University robot   R               http://www.kyoto-u.ac.jp/       http://larbin.sourceforge.net/index-eng.html
+id_g_m_579     larbin_2.2.2_guillaume (guillaume@liafa.jussieu.fr)     Larbin indexer used as Inria robot      R               http://www.inria.fr/index.en.html       http://larbin.sourceforge.net/index-eng.html
+id_g_m_581     larbin_2.6.0 (larbin2.6.0@unspecified.mail)     Larbin indexer used by an unknown dsl.net client        R               http://larbin.sourceforge.net/index-eng.html    
+id_g_m_582     larbin_2.6.1 (larbin2.6.1@unspecified.mail)     Larbin indexer used by diff. IPs / services     R       ie.: -Central Host Inc. (client) robot ? - Colt Net France robot        http://www.centralhost.com      http://larbin.sourceforge.net/index-eng.html
+id_g_m_583     larbin_2.6.2 (hamasaki@grad.nii.ac.jp)  Larbin indexer used by National Institut of Informatics (NII/Japan)     R               http://www.nii.ac.jp    http://larbin.sourceforge.net/index-eng.html
+id_g_m_584     larbin_2.6.2 (larbin2.6.2@unspecified.mail)     Larbin indexer used by diff. IPs        R               http://larbin.sourceforge.net/index-eng.html    
+id_g_m_585     larbin_2.6.2 (listonATccDOTgatechDOTedu)        Larbin indexer used as robot by Georgia Institute of Technology http://www.gatech.edu/  R               http://www.gatech.edu   http://larbin.sourceforge.net/index-eng.html
+id_g_m_586     larbin_2.6.2 (pimenas@systems.tuc.gr)   Larbin indexer used by Technical University of Crete    R               http://www.systems.tuc.gr       http://larbin.sourceforge.net/index-eng.html
+id_g_m_587     larbin_2.6.2 (tom@lemurconsulting.com)  Larbin indexer used as Lemur Consulting robot   R               http://www.lemurconsulting.com  http://larbin.sourceforge.net/index-eng.html
+id_g_m_588     larbin_2.6.2 (vitalbox1@hotmail.com)    Larbin indexer used as robot via cloud9.net (168.100.192.xxx)   R               http://larbin.sourceforge.net/index-eng.html    
+id_g_m_261205_1        larbin_2.6.3 (ltaa_web_crawler@groupes.epfl.ch) Unknown robot from EPFL Lausanne Switzerland (128.178.155.1xx)  R       reads robots.txt        http://www.epfl.ch/Eindex.html  
+id_g_m_589     larbin_2.6.3 (wgao@genieknows.com)      Larbin indexer used by GenieKnows.com search    R       s. also: - geniebot wgao@genieknows.com http://www.genieknows.com       http://larbin.sourceforge.net/index-eng.html
+id_g_m_590     larbin_2.6.3_for_(http://cosco.hiit.fi/search/) tsilande@hiit.fi        Larbin indexer used by Next Generation Information Retrieval (NGIR)     R               http://cosco.hiit.fi    http://larbin.sourceforge.net/index-eng.html
+id_g_m_580     larbin_2.6_basileocaml (basile.starynkevitch@cea.fr)    Larbin indexer used by CEA / DCom Rechercher    R               http://www.cea.fr       http://larbin.sourceforge.net/index-eng.html
+id_g_m_591     larbin_devel (http://pauillac.inria.fr/~ailleret/prog/larbin/)  Larbin indexer used as Inria robot      R               http://pauillac.inria.fr        http://larbin.sourceforge.net/index-eng.html
+id_g_m_160807_2        lawinfo-crawler/Nutch-0.9-dev (Crawler for lawinfo.com pages; http://www.lawinfo.com; webmaster@lawinfo.com)    LawInfo - Lawyer and attorney directory R       216.86.137.xx   http://www.lawinfo.com/ 
+id_g_m_020506_3        lc/$ROADS::Version libwww-perl/5.00     ROADS - Perl web based subject based gateway tool                       http://roads.opensource.ac.uk/  
+id_g_m_593     lcabotAccept: */*       unknown robot via MTT.ca / Aliant.ca            142.177.168.xxx         
+id_g_m_140408_1        LeapTag/0.8.1.beta081.r3750 (compatible; Mozilla 4.0; MSIE 5.5; robot@yoriwa.com)       LeapTag news reader and content discovery tool  B               http://www.leaptag.com/ 
+id_g_m_594     LECodeChecker/3.0 libgetdoc/1.0 Linkexchange crawler    R               http://www.linkexchange.com     
+id_g_m_595     LeechGet 200x (www.leechget.de) Leechget download manager       D               http://www.leechget.de  
+id_g_m_596     LEIA/2.90       Gseek.com (site is offline) robot       R                       
+id_g_m_597     LEIA/3.01pr (LEIAcrawler; [SNIP])       Gseek.com (site is offline) robot       R                       
+id_g_m_210106_2        LetsCrawl.com/1.0 +http://letscrawl.com/        Maybe logfile spamming for Lets crawl! search (Germany) S       website has no function http://letscrawl.com/   
+id_g_m_598     LexiBot/1.00    Lexibot (exMataHari) search software    R               http://www.lexibot.com/index.asp        
+id_g_m_140209_2        LG-LX260 POLARIS-LX260/2.0 MMP/2.0 Profile/MIDP-2.0 Configuration/CLDC-1.1      Polaris mobile browser on LG LX 260 Sprint Rumor phone  B               http://www.infraware.co.kr/eng/01_product/product10.asp 
+id_g_m_599     LG/U8138/v1.0   LG 8138 Mobile Phone browser    B                       
+id_g_m_600     Libby_1.1/libwww-perl/5.47      About.com robot R               http://www.about.com/   
+id_g_m_100306_1        libcurl-agent/1.0       libcurl's (multiprotocol file transfer library) standard user-agent name        D               http://curl.haxx.se/libcurl/    
+id_g_m_080507_1        LibertyW (+http://www.lw01.com) LibertyW search for mobile (France)     R       213.251.135.2xx http://www.lw01.com/en/ 
+id_g_m_601     libWeb/clsHTTP -- hiongun@kt.co.kr      Korea Telecom Search robot      R               http://www.kt.co.kr/kt_home/eng/index.jsp       
+id_g_m_602     libwww-perl/5.41        CMP United Media robot  R               http://www.cmpnet.com   
+id_g_m_603     libwww-perl/5.45        SplatSearch robot (207.44.142.xx)       R               http://www.splatsearch.com      
+id_g_m_604     libwww-perl/5.48        Alexa robot     R               http://www.alexa.com    
+id_g_m_605     libwww-perl/5.50        diff. IPs / services    R C P   ie.: - secure-netz.de link checking (in conjunction w. LWP::Simple/5.50) -N2H2 Internet filtering       http://www.n2h2.com     
+id_g_m_606     libwww-perl/5.52 FP/2.1 Fast Search robot       R               http://www.alltheweb.com        
+id_g_m_607     libwww-perl/5.52 FP/4.0 Fast Search robot       R               http://www.alltheweb.com        
+id_g_m_608     libwww-perl/5.53        diff. IPs / services    R C P   ie.: -iPrism Web filtering software - softclub.net link checking        http://www.stbernard.com/default.asp    
+id_g_m_609     libwww-perl/5.63        Profile for You internet profiling (?)  R C             http://www.profile4u.com        
+id_g_m_610     libwww-perl/5.64        unknown link checking from Wanadoo.fr (193.253.33.xxx)  R C                     
+id_g_m_611     libwww-perl/5.65        Amidalla search engine robot (62.241.33.xx)     R       s. also amibot  http://www.amidalla.com 
+id_g_m_612     libwww-perl/5.800       SplatSearch robot (72.36.210.xx)        R               http://www.splatsearch.com/     
+id_g_m_613     libwww/5.3.2    Mediater Rechercher robot       R               http://www.mediater.net 
+id_g_m_160206_1        Liferea/0.x.x (Linux; en_US.UTF-8; http://liferea.sf.net/)      Liferea - Linux feed reader     B               http://liferea.sourceforge.net/ 
+id_g_m_140508_4        Liferea/1.x.x (Linux; es_ES.UTF-8; http://liferea.sf.net/)      Liferea (Linux Feed Reader) news aggregator for Unix and Linux  B               http://liferea.sourceforge.net/ 
+id_g_m_614     LightningDownload/1.0beta2      Lightning Download manager      D               http://www.lightningdownload.com        
+id_g_m_615     LightningDownload/1.x.x Lightning Download manager      D               http://www.lightningdownload.com        
+id_g_m_616     LightningDownload/1.x.x [Accelerated x] Lightning Download manager      D               http://www.lightningdownload.com        
+id_g_m_131207_1        LijitSpider/Nutch-0.9 (Reports crawler; http://www.lijit.com/; info(a)lijit(d)com)      Lijit blog search spider        R       216.24.131.1xx  http://www.lijit.com/   
+id_g_m_617     Lincoln State Web Browser       Some spam bot   S       s. this Guestbook http://www.donotenter.com/guestbook/gbook.html        http://www.donotenter.com/guestbook/gbook.html  
+id_g_m_618     Link Valet Online 1.x   Link Valet online link checking C               http://www.htmlhelp.com 
+id_g_m_620     LinkAlarm/2.x   Linkalarm link validation       C               http://www.linkalarm.com        
+id_g_m_621     Linkbot Linkbot Pro link checking software      C               http://www.watchfire.com        
+id_g_m_622     linkbot Rpsoft 2000 Site-Crawler        R               http://www.rpsoft2000.com/rps-site-crawler.htm  
+id_g_m_623     Linkbot x.0     Linkbot Pro link checking software      C               http://www.watchfire.com        
+id_g_m_624     LinkCheck (linkcheck@inter7.com http://www.inter7.com/linkcheck)        Linkcheck - linkchecking tool for Unix/Linux    C               http://www.inter7.com   
+id_g_m_625     LinkLint-checkonly/2.x.x        Linklint - Perl html link checker       C               http://www.linklint.org 
+id_g_m_626     LinkLint-spider/2.x.x   Linklint - Perl html link checker       C               http://www.linklint.org 
+id_g_m_627     linknzbot       Linknz - The Kiwi Search Engine (New Zealand)   R               http://www.linknz.co.nz 
+id_g_m_280606_1        LinkPimpin v1.0 Link-Pimp web directory link checking   C       216.89.111.x    http://www.link-pimp.com/       
+id_g_m_628     LinkProver 2.1  TafWeb link checking program    C               http://www.tafweb.com   
+id_g_m_630     Links (0.9x; Linux 2.4.7-10 i686)       Links text browser for Unix & OS/2      B               http://artax.karlin.mff.cuni.cz/%7Emikulas/links/       
+id_g_m_631     Links (0.9xpre12; Linux 2.2.14-5.0 i686; 80x24) Links text browser for Unix & OS/2      B               http://artax.karlin.mff.cuni.cz/%7Emikulas/links/       
+id_g_m_632     Links (2.xpre7; Linux 2.4.18 i586; x)   Links text browser for Unix & OS/2      B               http://artax.karlin.mff.cuni.cz/%7Emikulas/links/       
+id_g_m_629     Links - http://gossamer-threads.com/scripts/links/      Links SQL directory management program  C               http://gossamer-threads.com/scripts/links/      
+id_g_m_633     Links 2.0 (http://gossamer-threads.com/scripts/links/)  Links SQL directory management program  R               http://gossamer-threads.com/scripts/links/      
+id_g_m_634     Links SQL (http://gossamer-threads.com/scripts/links-sql/)      Links SQL directory management program  R               http://gossamer-threads.com/scripts/links-sql/  
+id_g_m_280406_3        Links4US-Crawler, (+http://links4us.com/)       Links4us ODP based directory link checking      C       209.190.5.2xx   http://links4us.com/    
+id_g_m_635     LinkScan/11.0beta2 UnixShareware robot from Elsop.com (used by Indiafocus/Indiainfo)    Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)        R               http://www.elsop.com    http://indiafocus.indiainfo.com/
+id_g_m_636     LinkScan/9.0g Unix      Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)        R               http://www.elsop.com    http://indiafocus.indiainfo.com/
+id_g_m_637     LinkScan/x.x Unix       Shareware robot from Elsop.com  R               http://www.elsop.com    
+id_g_m_638     LinksManager.com (http://linksmanager.com/linkchecker.html)     Linksmanager bookmark checking  C       s.also Mozilla/5.0 (compatible; LinksManager.com_bot... http://linksmanager.com/linkchecker.html        
+id_g_m_639     LinkSonar/1.35  LinkSonar (Japan) link checking tool    C               http://hp.vector.co.jp/authors/VA014575/chicchi/linksonar/readme.html   
+id_g_m_640     LinkSweeper/1.x Left Side Software's LinkSweeper (ceased) bookmark utility      C               http://www.lss.com.au/lss/lss_main.htm  
+id_g_m_641     LinkWalker      Seventwentyfour link checking robot     C               http://www.seventwentyfour.com  
+id_g_m_619     link_check3.plx libwww-perl/5.65        link check 3 - Perl HTML link checker (from Perl for Web Site Management)       C               http://www.elanus.net/cgi/examples.cgi/view/ex_1102.txt 
+id_g_m_642     ListBidBot (freelance job spider http://listbid.com)<a href=http://listbid.com>Freelance</a>    Listbid.com / Directnic.com link checking ?     R C             http://listbid.com      
+id_g_m_031107_3        LiveTrans/Nutch-0.9 (maintainer: cobain at iis dot sinica dot edu dot tw; http://wkd.iis.sinica.edu.tw/LiveTrans/)      WKD Lab: LiveTrans - Online query and terminology translation service   R       140.109.19.1xx  http://wkd.iis.sinica.edu.tw/LiveTrans/ 
+id_g_m_643     Llaut/1.0 (http://mnm.uib.es/~gallir/llaut/bot.html)    llaut robot - Universitat de les Illes Balears (Spain)  R               http://mnm.uib.es       
+id_g_m_200307_2        LMQueueBot/0.2  E-Mail harvesting robot - same as ContactBot    S       64.124.152.xx           
+id_g_m_644     lmspider (lmspider@scansoft.com)        lmspider from Scansoft (192.133.61.xx) - Web text collector     R       see here        http://www.kahunaburger.com/blog/archives/000117.html   
+id_g_m_645     LNSpiderguy     Lexis-Nexis robot       R               http://www.lexis-nexis.com/     
+id_g_m_300106_4        LocalBot/1.0 ( http://www.localbot.co.uk/)      LocalBot company information collector  R               http://www.localbot.co.uk/      
+id_g_m_646     LocalcomBot/1.2.x ( http://www.local.com/bot.htm)       Local.com local search robot (216.52.252.xxx)   R               http://www.local.com/   
+id_g_m_647     Lockstep Spider/1.0     Lockstep (website content protection tool) user agent   R               http://www.lockstep.com 
+id_g_m_648     Look.com        GlobalQueue spider (64.40.105.xxx)      R               http://www.multi-mode.com/      
+id_g_m_649     Lotus-Notes/4.5 ( Windows-NT )  Lotus Notes browser     B                       
+id_g_m_650     LotusDiscovery/x.0 (compatible; Mozilla 4.0; MSIE 4.01; Windows NT)     IBM Lotus Discovery Server                      http://www-142.ibm.com/software/sw-lotus/products/product3.nsf/wdocs/644012e0434859b585256ec9006d37b8   
+id_g_m_051207_1        Lovel as 1.0 ( +http://www.everatom.com)        Everatom.com song lyrics search R       80.91.191.2xx   http://www.everatom.com 
+id_g_m_100308_2        LTI/LemurProject Nutch Spider/Nutch-1.0-dev (lti crawler for CMU; http://www.lti.cs.cmu.edu; changkuk at cmu dot edu)   LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo       R       68.180.139.12x  http://www.lemurproject.org/    http://www.yahoo.com/
+id_g_m_050208_3        LTI/LemurProject Nutch Spider/Nutch-1.0-dev (Research spider using Nutch; http://www.lemurproject.org; mhoy@cs.cmu.edu) LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo       R       68.180.139.12x  http://www.lemurproject.org/    http://www.yahoo.com/
+id_g_m_651     luchs.at URL checker    Luchs.at (Linux Wiki) link checking     C               http://web.luchs.at/information/linkchecker.php 
+id_g_m_090106_1        Lunascape       Lunascape IE based browser (Japan)      B       s. also Mozilla/4.0 (... Lunascape ...) http://www2.lunascape.jp/index.aspx     
+id_g_m_652     lwp-trivial/1.32        Ultimate Search / Smartdesk (no website) robot  R                       
+id_g_m_653     lwp-trivial/1.34        Search4free robot       R               http://www.search4free.com      
+id_g_m_654     lwp-trivial/1.34        Search4free robot       R               http://www.search4free.com      
+id_g_m_656     lwp-trivial/1.35        Expert HTML online source viewer        B               http://www.expert-html.com/     
+id_g_m_655     lwp-trivial/1.35        Expert HTML online source viewer        B               http://www.expert-html.com/     
+id_g_m_657     LWP::Simple/5.22        Perl LWP:Collective module      R               http://www.thatrobotsite.com    
+id_g_m_658     LWP::Simple/5.36        Perl LWP:Collective module      R               http://www.thatrobotsite.com    
+id_g_m_659     LWP::Simple/5.48        Perl LWP:Collective module - Linkomatic robot   R               http://www.linkomatic.com/      http://www.thatrobotsite.com
+id_g_m_660     LWP::Simple/5.50        Perl LWP:Collective module - secure-netz.de link checking (in conjunction w. libwww-perl/5.50)  R               http://www.secure-netz.de       http://www.thatrobotsite.com
+id_g_m_661     LWP::Simple/5.51        Perl LWP:Collective module - Inktomi (62.253.64.x) robot        R               http://www.inktomi.com/ http://www.thatrobotsite.com
+id_g_m_662     LWP::Simple/5.53        Perl LWP:Collective module - Only.com   R       in conjunction w. Spida/0.1     http://www.only.com     http://www.thatrobotsite.com
+id_g_m_663     LWP::Simple/5.63        Perl LWP:Collective module      R               http://www.thatrobotsite.com    
+id_g_m_291105_3        LWP::Simple/5.803       ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx        S       appears also as Poirot - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)      http://spamhuntress.com/wiki/Manila_Industries  
+id_g_m_664     Lycos_Spider_(modspider)        Lycos spider    R               http://www.lycos.com    
+id_g_m_665     Lycos_Spider_(T-Rex)    Lycos spider    R               http://www.lycos.com    
+id_g_m_200308_2        Lynx/2-4-2 (Bobcat/0.5 [DOS] Jp Beta04) Bobcat - Text and Lynx based DOS browser        B               http://www.fdisk.com/doslynx/bobcat.htm 
+id_g_m_666     Lynx/2.6 libwww-FM/2.14 Lynx 2.x text mode browser      B               http://lynx.browser.org/        
+id_g_m_180108_1        Lynx/2.8 (;http://seebot.org)   seebot.org online service - uses lynx browser for crawlers view of web pages    B       208.113.176.x[xx]       http://seebot.org/      
+id_g_m_667     Lynx/2.8.3dev.9 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6       Lynx 2.x text mode browser      B               http://lynx.browser.org/        
+id_g_m_668     Lynx/2.8.4rel.1 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6c (human-guided@lerly.net)     Lynx 2.x text mode browser used as robot via cogentco.com       R                       
+id_g_m_669     Mac Finder 1.0.xx       Some spam bot   S               http://www.kloth.net/internet/badbots.php       
+id_g_m_670     Mackster( http://www.ukwizz.com )       UKWizz search robot     R       s. also UKWizz/Nutch    http://www.ukwizz.com   
+id_g_m_671     Mag-Net Wind.it client user-agent ?                             
+id_g_m_180606_3        MagicWML/1.0 (forcewml) All Magic/Wap wml service for mobile devices    P               http://allmagic3.com/wap/       
+id_g_m_061206_1        MagpieRSS/0.7x (+http://magpierss.sf.net)       Magpie RSS - PHP RSS Parser     B               http://magpierss.sourceforge.net/       
+id_g_m_030308_1        Mahiti.Com/Mahiti Crawler-1.0 (Mahiti.Com; http://mahiti.com ; mahiti.com)      Mahiti.com India search crawler R       72.167.143.1x   http://mahiti.com/      
+id_g_m_020707_2        Mail.Ru/1.0     Mail.ru search  R       194.186.55.2xx  http://www.mail.ru/     
+id_g_m_672     mailto:webcraft@bea.com Unknown Bea robot       R               http://www.beasys.com   
+id_g_m_673     mammoth/1.0 ( http://www.sli-systems.com/)      SLI Systems mammoth robot       R       s. also Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1  http://www.sli-systems.com/     http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M
+id_g_m_674     MantraAgent     Looksmart robot R               http://www.looksmart.com        
+id_g_m_675     MapoftheInternet.com ( http://MapoftheInternet.com)     Map of the Internet visual search engine index robot    R               http://MapoftheInternet.com     
+id_g_m_676     Mariner/5.1b [de] (Win95; I ;Kolibri gncwebbot) Kolibri.de robot        R               http://www.kolibri.de   
+id_g_m_677     Marketwave Hit List     Pilot Hitlist web site analysis R               http://www.marketwave.com/products_solutions/hitlist.html       
+id_g_m_678     Martini Looksmart directory page analysis       R               http://www.looksmart.com        
+id_g_m_679     MARTINI Looksmart directory page analysis       R               http://www.looksmart.com        
+id_g_m_680     Marvin v0.3     Marvin Medhunt robot    R               http://www.hon.ch/MedHunt/Marvin.html   
+id_g_m_270606_1        MaSagool/1.0 (MaSagool; http://sagool.jp/; info@sagool.jp)      Sagool search Japan robot       R       124.32.246.xx   http://sagool.jp/       
+id_g_m_681     Mass Downloader 2.x     Mass Downloader download manager        D               http://www.metaproducts.com     
+id_g_m_682     MasterSeek      Masterseek (Scandinavia) Beta business search ? R               http://www.masterseek.com       
+id_g_m_683     Mata Hari/2.00  Lexibot (exMataHari) search software    R               http://www.lexibot.com  
+id_g_m_684     Matrix S.p.A. - FAST Enterprise Crawler 6 (Unknown admin e-mail address)        Virgilio Italy robot (212.48.11.xxx) using Fast Enterprise Search       R               http://www.virgilio.it  
+id_g_m_685     maxomobot/dev-20051201 (maxomo; http://67.102.134.34:4047/MAXOMO/MAXOMObot.html; maxomobot@maxomo.com)  Maxomo multimedia search robot  R               http://www.maxomo.com   
+id_g_m_686     McBot/5.001 (windows; U; NT4.0; en-us)  Unknown robot from McAfee Austria (80.123.144.xx)                               
+id_g_m_290108_1        MDbot/1.0 (+http://www.megadownload.net/bot.html)       MegaDownload files search robot R       91.121.83.19x   http://www.megadownload.net/    http://www.megadownload.net/bot.html
+id_g_m_170306_1        Media Player Classic    Substitute for Windows Media Player     B               http://sourceforge.net/projects/guliverkli/     
+id_g_m_687     MediaCrawler-1.0 (Experimental) Media Find crawler      R               http://www.mediacrawler.de      
+id_g_m_688     Mediapartners-Google/2.1 ( http://www.googlebot.com/bot.html)   Google AdSense robot    R               http://www.google.com/ads/      
+id_g_m_689     MediaSearch/0.1 WWW.fi Media Search     R               http://www.fi/haku/     
+id_g_m_690     MegaSheep v1.0 (www.searchuk.com internet sheep)        Search UK robot R               http://www.searchuk.com 
+id_g_m_131107_1        Megite2.0 (http://www.megite.com)       Megite web2.0 RSS and news service software     R               http://www.megite.com/  
+id_g_m_691     Mercator-1.x    Mercator crawler software (used by Altavista)   R               http://www.research.compaq.com  
+id_g_m_692     Mercator-2.0    Mercator crawler software (used by Altavista)   R               http://www.research.compaq.com  
+id_g_m_693     Mercator-Scrub-1.1      Mercator crawler software (used by Altavista)   R               http://www.research.compaq.com  
+id_g_m_070207_1        Metaeuro Web Crawler/0.2 (MetaEuro Web Search Clustering Engine; http://www.metaeuro.com; crawler at metaeuro dot com)  MetaEuro.com Clustering Web Search Engine crawler       R       83.97.31.1xx    http://www.metaeuro.com/        
+id_g_m_694     MetaGer-LinkChecker     MetaGer search robot (Germany)  R       130.75.2.xx     http://www.metager.de/  
+id_g_m_270706_1        MetagerBot/0.8-dev (MetagerBot; http://metager.de; )    MetaGer search robot (Germany)  R       130.75.2.xx     http://www.metager.de/  
+id_g_m_060307_1        MetaGer_PreChecker0.1   MetaGer search robot (Germany)  R       130.75.2.xx     http://www.metager.de/  
+id_g_m_695     MetaProducts Download Express/1.x       Download Express download manager       D               http://www.metaproducts.com     
+id_g_m_696     Metaspinner/0.01 (Metaspinner; http://www.meta-spinner.de/; support@meta-spinner.de/)   Metaspinner search robot - Germany      R               http://www.meta-spinner.de/     
+id_g_m_300407_1        metatagsdir/0.7 (+http://metatagsdir.com/directory/)    Metatagsdir.com directory index spider  R       206.196.111.2xx http://metatagsdir.com/directory/       
+id_g_m_697     MFC Foundation Class Library 4.0        Microsoft Foundation Class Library - i.e. used for e-mail harvesting from 68.154.96.xx (bellsouth.net)  S       appears also as Full Web Bot 0516B or Demo Bot Z 16b            
+id_g_m_698     MFC_Tear_Sample Microsoft.com user agent                                
+id_g_m_699     MFHttpScan      Advanced Site Crawler web site ripper and extractor     D               http://www.innovative.go.ro/sitecrawler/index.htm       
+id_g_m_700     MicroBaz        GigaBaz Brainbot (Germany) robot (213.139.152.xx)       R       s. also - gigabaz/3.1x ...      http://brainbot.com//site3      
+id_g_m_701     Microsoft Data Access Internet Publishing Provider Cache Manager        MS Office 2000 acting as WebDAV client  B P                     
+id_g_m_702     Microsoft Data Access Internet Publishing Provider DAV  MS Office 2000 acting as WebDAV client  B                       
+id_g_m_704     Microsoft Data Access Internet Publishing Provider Protocol Discovery   Server probe for data access operations using MS Frontpage with OPTION header   B C                     
+id_g_m_703     Microsoft Data Access Internet Publishing Provider Protocol Discovery   MS Office 2000 acting as WebDAV client  B C                     
+id_g_m_190807_2        Microsoft Log Parser 2.2        Microsoft Log Parser text query tool    D               http://www.microsoft.com/technet/scriptcenter/tools/logparser/default.mspx      
+id_g_m_180306_1        Microsoft Small Business Indexer        MS Small Business Server content indexer        R       Indexing from Microsoft: 204.71.191.xx  http://www.microsoft.com/windowsserver2003/sbs/default.mspx     
+id_g_m_705     Microsoft URL Control - 6.00.8xxx       user agent looks for form-mail components (spam-bot)    S                       
+id_g_m_707     MicrosoftPrototypeCrawler (How's my crawling? mailto:newbiecrawler@hotmail.com) Unknown robot from Microsoft.com (131.107.163.xx)       R                       
+id_g_m_706     Microsoft_Internet_Explorer_5.00.438 (fjones@isd.net)   Secure Computing SmartFilterWhere / Bess web filter (192.55.214.xx)     P               http://www.securecomputing.com/index.cfm?skey=22        
+id_g_m_708     MIIxpc/4.2      xpc-mii.net HTTP server message P                       
+id_g_m_130807_2        Mindjet MindManager     The Mindjet blog MindManager category   D       80.229.1xx      http://blog.mindjet.com/category/mindjet/mindmanager/   
+id_g_m_709     minibot unknown robot via Korea Telecom (211.218.xxx.xxx)                               
+id_g_m_110506_2        miniRank/1.6 (Website ranking; www.minirank.com; robot) mini- Rank website popularity tool      C       64.230.71.2xx   http://www.minirank.com/        
+id_g_m_710     MiracleAlphaTest        unknown robot via nec.co.jp Telecom (210.143.35.xx)                             
+id_g_m_711     Missauga Locate 1.0.0   Some spam bot   S               http://www.neilgunton.com/spambot_trap/appendix/        
+id_g_m_712     Missigua Locator 1.9    Some spam bot   S               http://www.neilgunton.com/spambot_trap/appendix/        
+id_g_m_713     Missouri College Browse Some spam bot   S                       
+id_g_m_714     Mister Pix II 2.02a     Mister PiX picture finding software     D R             http://www.mister-pix.com/      
+id_g_m_715     Mister PiX version.dll  Mister PiX picture finding software     D R             http://www.mister-pix.com/      
+id_g_m_110206_3        Misterbot-Nutch/0.7.1 (Misterbot-Nutch; http://www.misterbot.fr; admin@misterbot.fr)    Misterbot search France robot   R               http://www.misterbot.fr/        
+id_g_m_716     Miva (AlgoFeedback@miva.com)    Miva / ex Findwhat.com search robot (66.150.55.2xx)     R               http://www.miva.com/    
+id_g_m_141105_2        Mizzu Labs 2.2  Some spam bot from Jasmine Internet - Bangkok (203.147.0.xx)    S       s. link http://www.projecthoneypot.org/ip_inspector.php?iph=7bc2eae614063a45b0e1d0786dbe6a2e    
+id_g_m_080706_3        MJ12bot/vx.x.x (http://majestic12.co.uk/bot.php?+)      Majestic-12 DSearch MJ12bot (Experimental distributed crawler)  R               http://www.majestic12.co.uk/projects/dsearch/   
+id_g_m_717     MJ12bot/vx.x.x (http://www.majestic12.co.uk/projects/dsearch/mj12bot.php)       Majestic-12 DSearch MJ12bot (Experimental distributed crawler)  R               http://www.majestic12.co.uk/projects/dsearch/mj12bot.php        
+id_g_m_200108_1        MJBot (SEO assessment)  MJB SEO Club MJBot      R       217.8.248.19x   http://www.mjbdata.com/information/     
+id_g_m_030308_2        MLBot (www.metadatalabs.com)    MLBot - metadata labs web crawler for building a media index (beta)     R               http://www.metadatalabs.com/    
+id_g_m_718     MnogoSearch/3.2.xx      mnoGoSearch (ex UdmSearch) software robot       R               http://mnogosearch.org/ 
+id_g_m_260306_3        Mo College 1.9  Unknown bad bot - maybe guestbook spamming or email harvesting  S       see link:       http://www.kloth.net/internet/badbots.php       
+id_g_m_719     moget/x.x (moget@goo.ne.jp)     Goo Japan / Inktomi robot (210.173.179.xx)      R       s. also ichiro  http://www.goo.ne.jp    
+id_g_m_720     mogimogi/1.0    Goo Japan / Inktomi robot (210.173.179.xx)      R       s. also ichiro  http://www.goo.ne.jp    
+id_g_m_721     moiNAG 0.02     moiNag - net.art generator      R D             http://soundwarez.org/generator/moiNAG/ 
+id_g_m_722     MojeekBot/0.x (archi; http://www.mojeek.com/bot.html)   Mojeek Search Preview robot (217.155.205.xx)    R       s.also Mozilla/5.0 (compatible; MojeekBot/2.0 ...       http://www.mojeek.com   
+id_g_m_150407_1        monkeyagent     Greasemonkey Firefox extension  D               http://www.greasespot.net/      http://diveintogreasemonkey.org/install/what-is-greasemonkey.html
+id_g_m_090106_2        MoonBrowser (version 0.41 Beta4)        Moonbrowser - IE based browser (Japan)  B               http://www.geocities.co.jp/SiliconValley-Cupertino/8986/        
+id_g_m_010307_2        Moreoverbot/x.00 (+http://www.moreover.com)     Moreover / FeedDirect RSS feed robot    C       72.13.32.x      http://w.moreover.com/  http://www.feeddirect.com/
+id_g_m_723     Morris - Mixcat Crawler ( http://mixcat.com)    MixCat robot s. also Felix      R               http://mixcat.com       
+id_g_m_100206_2        Motoricerca-Robots.txt-Checker/1.0 (http://tool.motoricerca.info/robots-checker.phtml)  Robots.txt online checker       C               http://tool.motoricerca.info/robots-checker.phtml       
+id_g_m_240108_1        Motorola-V3m Obigo      Obigo WAP browser for mobiles on Motorola V3    B               http://www.obigo.com/   http://en.wikipedia.org/wiki/Obigo_Browser
+id_g_m_724     Mouse-House/7.4 (spider_monkey spider info at www.mobrien.com/sm.shtml) MPRM Group Ltd. Spider Monkey robot     R               http://www.spidermonkey.ca/sm.shtml     
+id_g_m_725     MovableType/x.x Movable Type web-based personal publishing system       B               http://www.movabletype.org      
+id_g_m_726     mozDex/0.xx-dev (mozDex; http://www.mozdex.com/en/bot.html; spider@mozdex.com)  Mozdex Open search engine spider (65.98.100.2xx)        R               http://www.mozdex.com/  
+id_g_m_727     Mozi!   Bell Nexxia / Sympatico Canada user robot & spoofed referer from diff. IPs                              
+id_moz_728     Mozilla Unknown robots from diff. IPs                           
+id_moz_100109_3        Mozilla (libwhisker/2.4)        libwhisker - HTTP client and utility - Perl library                     http://www.wiretrip.net/rfp/lw.asp      
+id_moz_729     Mozilla (Mozilla@somewhere.com) http://www.somewhere.com robot  R               http://www.somewhere.com        
+id_moz_041007_1        Mozilla 4.0(compatible; BotSeer/1.0; +http://botseer.ist.psu.edu)       BotSeer search engine for robots.txt    R       130.203.154.2xx http://botseer.ist.psu.edu/     http://botseer.ist.psu.edu/about.html
+id_moz_731     Mozilla/1.1 (compatible; MSPIE 2.0; Windows CE) PDA Pocket IE 2.x Windows CE    B                       
+id_moz_732     Mozilla/1.10 [en] (Compatible; RISC OS 3.70; Oregano 1.10)      Oregano browser for RISC OS     B               http://www.crashnet.org.uk      
+id_moz_730     Mozilla/1.22 (compatible; MSIE 2.0d; Windows NT)        IE 2.x WinNT    B                       
+id_moz_733     Mozilla/1.22 (compatible; MSIE 5.01; PalmOS 3.0) EudoraWeb 2    EudoraWeb 2.0 browser (Eudora Internet Suite) for PalmOS        B               http://www.eudora.com/products/unsupported/internetsuite/       
+id_moz_1552    Mozilla/2.0     Dummy user agent - i.e. used by Namo Web Editor B               http://www.namo.com/    
+id_moz_734     Mozilla/2.0 (compatible; AOL 3.0; Mac_PowerPC)  AOL Mac B                       
+id_moz_735     Mozilla/2.0 (Compatible; AOL-IWENG 3.0; Win16)  AOL Win 3.x     B                       
+id_moz_736     Mozilla/2.0 (compatible; Ask Jeeves)    Ask Jeeves /Teoma robot R       65.214.45.[x]xx http://sp.ask.com       
+id_moz_040707_2        Mozilla/2.0 (compatible; Ask Jeeves/Teoma)      Ask Jeeves /Teoma robot R       65.214.45.[x]xx http://sp.ask.com       
+id_moz_160506_3        Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) Ask Jeeves /Teoma robot R       65.214.45.[x]xx http://sp.ask.com       
+id_moz_737     Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://sp.ask.com/docs/about/tech_crawling.html)     Ask Jeeves /Teoma robot R       65.214.45.[x]xx http://sp.ask.com       
+id_moz_738     Mozilla/2.0 (compatible; EZResult -- Internet Search Engine)    Direct Hit Robot        R               http://www.directhit.com        
+id_moz_739     Mozilla/2.0 (compatible; MS FrontPage x.0)      MS Frontpage x.x web editor     B                       
+id_moz_740     Mozilla/2.0 (compatible; MSIE 2.1; Mac_PowerPC) IE 2.x Mac Power PC     B                       
+id_moz_743     Mozilla/2.0 (compatible; MSIE 3.02; Update a; AK; Windows NT)   IE 3.x WinNT    B                       
+id_moz_744     Mozilla/2.0 (compatible; MSIE 3.02; Update a; AOL 3.0; Windows 95)      IE 3.x AOL Win95        B                       
+id_moz_741     Mozilla/2.0 (compatible; MSIE 3.0; AK; Windows 95)      IE 3.x Win95    B                       
+id_moz_742     Mozilla/2.0 (compatible; MSIE 3.0; Windows 3.1) IE 3.x Win 3.1  B                       
+id_moz_745     Mozilla/2.0 (compatible; MSIE 3.0B; Win32)      IE 3.x WinXP    B                       
+id_moz_746     Mozilla/2.0 (compatible; NEWT ActiveX; Win32)   Borland Delphi .OCX component used by WebCollector email harverster     S                       
+id_moz_747     Mozilla/2.0 (compatible; T-H-U-N-D-E-R-S-T-O-N-E)       Thunderstone's Webinator Web indexing program   R               http://www.thunderstone.com/texis/site/pages/Products.html      
+id_moz_748     Mozilla/2.0 compatible; Check&Get 1.1x (Windows 98)     Check&Get bookmark and link checking tool       C               http://www.activeurls.com       
+id_moz_749     Mozilla/2.01 (Win16; I) Netscape 2.x Win3.x International       B                       
+id_moz_750     Mozilla/2.02Gold (Win95; I)     Netscape 2.x Gold Win95 B                       
+id_moz_771     Mozilla/3.0 (compatible)        Faked user agent for diff. purposes i.e.: - some download manager - E-mail harvesting   S D                     
+id_moz_751     Mozilla/3.0 (compatible; AvantGo 3.2)   AvantGo PDA browser     B               http://avantgo.com/products/solutions/sfa.html  
+id_moz_752     Mozilla/3.0 (compatible; Fluffy the spider; http://www.searchhippo.com/; info@searchhippo.com)  Searchhippo robot       R               http://www.searchhippo.com      
+id_moz_753     Mozilla/3.0 (compatible; HP Web PrintSmart 04b0 1.0.1.34)       HP Web PrintSmart (discontinued) - web page printing software   B D                     
+id_moz_754     Mozilla/3.0 (compatible; Indy Library)  Internet Direct Library for Borland (often used as e-mail address collector and mass mailing tool)      S               http://forge.novell.com/modules/xfmod/project/?indy-net http://www.indyproject.org/
+id_moz_755     Mozilla/3.0 (compatible; Linkman)       Outertechs Linkman bookmark tool        C               http://www.outertech.com        
+id_moz_757     Mozilla/3.0 (compatible; MuscatFerret/1.5.4; claude@euroferret.com)     Euroferret robot        R               http://www.euroferret.com       
+id_moz_756     Mozilla/3.0 (compatible; MuscatFerret/1.5; olly@muscat.co.uk)   Euroferret robot        R               http://www.euroferret.com       
+id_moz_758     Mozilla/3.0 (compatible; MuscatFerret/1.6.x; claude@euroferret.com)     Euroferret robot        R               http://www.euroferret.com       
+id_moz_759     Mozilla/3.0 (compatible; netart generator/1.0; libwww-perl/5.64)        Netart Generator - script generated random websites     R D             http://www.obn.org/generator/   
+id_moz_760     Mozilla/3.0 (compatible; NetPositive/2.2)       NetPositive BEOS browser        B               http://www.tunetrackersystems.com/bedocs/documentation/User's%20Guide/03_network/Network07_NetPositive.html     
+id_moz_761     Mozilla/3.0 (compatible; Opera/3.0; Windows 3.1) v3.1   Opera 3.x Win3.x        B                       
+id_moz_762     Mozilla/3.0 (compatible; Opera/3.0; Windows 95/NT4) 3.2 Opera 3.x Win95/NT      B                       
+id_moz_763     Mozilla/3.0 (compatible; PerMan Surfer 3.0; Win95)      Perman Surfer bookmark tool     C               http://www.bug.co.jp/nami-nori/ 
+id_moz_764     Mozilla/3.0 (compatible; REL Software Web Link Validator 2.x)   Web Link Validator link validation software     C               http://www.relsoftware.com      
+id_moz_765     Mozilla/3.0 (compatible; scan4mail (advanced version) http://www.peterspages.net/?scan4mail)    Scan4Mail online mail extraction service        S               http://www.peterspages.net      
+id_moz_220606_2        Mozilla/3.0 (compatible; ScollSpider; http://www.webwobot.com)  WebWobot UK search engine robot (82.43.129.2xx) R       s. also ScollSpider     http://www.webwobot.com/        
+id_moz_766     Mozilla/3.0 (compatible; Web Link Validator 2.x)Web Link Validator http://www.relsoftware.com/ link validation software Web Link Validator link validation software     C               http://www.relsoftware.com      
+id_moz_767     Mozilla/3.0 (compatible; WebCapture x.x; Auto; Windows) Xelios Web Capture (now Wysigot) website downloading tool (Discontinued)        D               http://www.xelios.com/  http://www.wysigot.com/int/about.html
+id_moz_768     Mozilla/3.0 (compatible; Webinator-DEV01.home.iprospect.com/2.56)       Iprospect search engine positioning using Thunderstone's Webinator      R               http://www.iprospect.com        http://www.thunderstone.com/texis/site/pages/Products.html
+id_moz_769     Mozilla/3.0 (compatible; Webinator-indexer.cyberalert.com/2.56) CyberAlert's Media Monitor using Thunderstone's Webinator       R               http://www.cyberalert.com       http://www.thunderstone.com/texis/site/pages/Products.html
+id_moz_770     Mozilla/3.0 (Compatible;Viking/1.8)     Viking server user/client       P               http://www.robtex.com   
+id_moz_772     Mozilla/3.0 (DreamPassport/3.0) One of DC-Sakuras download manager user-agent names     D               http://www.dc-sakura.com        
+id_moz_773     Mozilla/3.0 (INGRID/3.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints) Ilse Netherlands robot (62.69.178.xx)   R       s. also - INGRID/3.0 .. / IlseBot/1.0 ..        http://www.ilse.nl/     
+id_moz_774     Mozilla/3.0 (Liberate DTV 1.1)  Liberate DTV server suite / TV-emulator B P             http://www.liberate.com 
+id_moz_775     Mozilla/3.0 (Planetweb/2.100 JS SSL US; Dreamcast US)   Planetweb 2.1 Browser (discontinued) for Dreamcast      B               http://www.planetweb.com        
+id_moz_776     Mozilla/3.0 (Slurp.so/Goo; slurp@inktomi.com; http://www.inktomi.com/slurp.html)        http://www.goo.ne.jp /Inktomi robot     R               http://www.goo.ne.jp    
+id_moz_777     Mozilla/3.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)   Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)      R       s. also Slurpy Verifier ...     http://www.inktomi.com/ 
+id_moz_778     Mozilla/3.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)    Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)      R       s. also Slurpy Verifier ...     http://www.inktomi.com/ 
+id_moz_779     Mozilla/3.0 (Vagabondo/1.1 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)    WiseGuys robot Netherland - 82.94.216.2 R       s. also Vagabondo       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_780     Mozilla/3.0 (Vagabondo/1.x MT; webagent@wise-guys.nl; http://webagent.wise-guys.nl/)    WiseGuys robot Netherland - 82.94.216.2 R       s. also Vagabondo       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_781     Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints)      Ilse Netherlands robot  R               http://www.ilse.nl      
+id_moz_782     Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)    WiseGuys robot Netherland - 82.94.216.2 R       s. also Vagabondo       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_783     Mozilla/3.0 (Win16; I)  Netscape 3.x Win3.x     B                       
+id_moz_784     Mozilla/3.0 (Win95; I)  Netscape 3.x Win95      B                       
+id_moz_785     Mozilla/3.0 (WinNT; I)  Netscape 3.x WinNT      B                       
+id_moz_786     Mozilla/3.0 (WorldGate Gazelle 3.5.1 build 11; FreeBSD2.2.8-STABLE)     Netscape 3.x FreeBSD    B                       
+id_moz_787     Mozilla/3.0 (X11; I; OSF1 V4.0 alpha)   Netscape 3.x OSF1 V4.0 alpha    B                       
+id_moz_788     Mozilla/3.0 NAVIO_AOLTV (11; 13; Philips; PH200; 1; R2.0C36_AOL.0110OPTIK; R2.0.0139d_OPTIK)    AOL Web TV      B                       
+id_moz_789     Mozilla/3.0 WebTV/1.2 (compatible; MSIE 2.0)    WebTV   B                       
+id_moz_790     Mozilla/3.01 (compatible; AmigaVoyager/2.95; AmigaOS/MC680x0)   Amiga Voyager Browser Amiga     B                       
+id_moz_791     Mozilla/3.01 (Compatible; Links2Go Similarity Engine)   Links2Go robot  R               http://www.links2go.com 
+id_moz_792     Mozilla/3.01 (compatible; Netbox/3.5 R92; Linux 2.2)    Netgem Netbox cable modem TV Box Linux  B               http://www.netgem.com   
+id_moz_793     Mozilla/3.01-C-MACOS8 (Macintosh; I; PPC)       Netscape 3.x Mac        B                       
+id_moz_794     Mozilla/3.01Gold (X11; I; Linux 2.0.32 i486)    Netscape 3.x Linux      B                       
+id_moz_795     Mozilla/3.01Gold (X11; I; SunOS 5.5.1 sun4m)    Netscape 3.x SunOS      B                       
+id_moz_796     Mozilla/3.01SGoldC-SGI (X11; I; IRIX 6.3 IP32)  Netscape 3.x Irix       B                       
+id_moz_797     Mozilla/3.04 (compatible; ANTFresco/2.13; RISC OS 4.02) ANT Fresco Browser Risc OS      B               http://www.antlimited.com       
+id_moz_798     Mozilla/3.04 (compatible; NCBrowser/2.35; ANTFresco/2.17; RISC OS-NC 5.13 Laz1UK1309)   NCBrowser ANT Fresco Browser Risc OS    B               http://www.antlimited.com       
+id_moz_281106_1        Mozilla/3.04 (compatible;QNX Voyager 2.03B ;Photon)     QNX OS Voyager embedded browser B               http://www.qnx.com/products/browsers/   
+id_moz_799     Mozilla/3.x (I-Opener 1.1; Netpliance)  I-Opener (was www.netpliance.com/) web PC       B                       
+id_moz_100406_3        Mozilla/4.0     Yahoo Mindset: Intent-driven Search (66.228.182.1xx)    R       s. also Yahoo! Mindset  http://mindset.research.yahoo.com/      
+id_moz_800     Mozilla/4.0 (agadine3.0) www.agada.de   Agada search (Germany) robot    R       s. also agadine/1.x.x   http://www.agada.de     
+id_moz_290406_1        Mozilla/4.0 (Compatible); URLBase 6     URLBase 6 bookmark manager      C       s. also URLBase/6.x     http://www.terriadev.com/products/urlbase/      
+id_moz_895     Mozilla/4.0 (compatible: AstraSpider V.2.1 : astrafind.com)     Astrafind! adult search robot (66.98.252.xx)    R               http://www.astrafind.com        
+id_moz_021205_1        Mozilla/4.0 (compatible; Vagabondo/2.2; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)  WiseGuys robot Netherland - 82.94.216.2 R       s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..        http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_240906_1        Mozilla/4.0 (compatible; Vagabondo/4.0Beta; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)      WiseGuys robot Netherland - 82.94.216.2 R       s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..        http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_100208_1        Mozilla/4.0 (compatible; <a href=http://www.reget.com>ReGet Deluxe 5.1</a>; Windows NT 5.1)     ReGet Deluxe! download manager  D               http://deluxe.reget.com/en/     
+id_moz_801     Mozilla/4.0 (compatible; Advanced Email Extractor v2.xx)        Advanced Email Extractor e-mail collector (spam bot)    S               http://www.mailutilities.com    
+id_moz_802     Mozilla/4.0 (compatible; Arachmo)       Arachmo Spider - web site file extraction tool  D               http://bbbearchan.hp.infoseek.co.jp/    
+id_moz_804     Mozilla/4.0 (compatible; BorderManager 3.0)     Novell Border Manager security suite    P                       
+id_moz_090807_3        Mozilla/4.0 (compatible; BOTW Spider; +http://botw.org) Best of the Web directory link checking C       209.11.177.1xx  http://botw.org/        
+id_moz_803     Mozilla/4.0 (compatible; B_L_I_T_Z_B_O_T)       Blitzsuche Germany robot        R       s. BlitzBOT@tricus.net  http://blitzsuche.rp-online.de/ 
+id_moz_805     Mozilla/4.0 (compatible; Cerberian Drtrs Version-3.2-Build-0)   Content Control from Blue Coat  P               http://www.cerberian.com        
+id_moz_080706_1        Mozilla/4.0 (compatible; Check&Get 3.0; Windows NT)     Check&Get bookmark manager, web change monitor and archiver     C               http://activeurls.com/en/       
+id_moz_806     Mozilla/4.0 (compatible; ChristCrawler.com ChristCrawler@ChristCENTRAL.com)     Christcentral.com Christcrawler (was www.christcrawler.com)     R       s.also ChristCRAWLER            
+id_moz_301105_4        Mozilla/4.0 (compatible; crawlx, crawler@trd.overture.com)      Yahoo Search Marketing crawler (68.142.211.1xx) R               http://www.content.overture.com/d/      
+id_moz_011207_1        Mozilla/4.0 (compatible; DAUMOA-video; +http://ws.daum.net/aboutkr.html)        DAUMOA - Daum search Korea robot (211.115.109.xxx)      R       s. also RaBot   http://www.daum.net/    http://ws.daum.net/abouten.html
+id_moz_131206_1        Mozilla/4.0 (compatible; DepSpid/5.0x; +http://about.depspid.net)       DepSpid distributed web crawler for link dependencies   C               http://depspid.net/     http://about.depspid.net/
+id_moz_807     Mozilla/4.0 (compatible; DnloadMage 1.0)        Download Mage download manager  D               http://www.dlmage.com   
+id_moz_808     Mozilla/4.0 (compatible; FastCrawler3 support-fastcrawler3@fast.no)     Fast/Alltheweb crawler  R               http://www.alltheweb.com        
+id_moz_809     Mozilla/4.0 (compatible; FDSE robot)    Fluid Dynamics Search Engine (FDSE) robot used by Abadoor.de    R               http://www.xav.com/scripts/search/      http://www.abadoor.de/
+id_moz_161105_2        Mozilla/4.0 (compatible; GPU p2p crawler http://gpu.sourceforge.net/search_engine.php)  GPU Distributed Search Engine crawler   R               http://gpu.sourceforge.net/search_engine.php    
+id_moz_810     Mozilla/4.0 (compatible; grub-client-0.2.x; Crawl your stuff with http://grub.org)      Grub open source crawler        R               http://www.grub.org     
+id_moz_811     Mozilla/4.0 (compatible; grub-client-0.3.x; Crawl your own stuff with http://grub.org)  Grub open source crawler        R               http://www.grub.org     
+id_moz_812     Mozilla/4.0 (compatible; grub-client-2.x)       Grub open source crawler used by Looksmart ( 64.241.242.xx)     R               http://www.grub.org     
+id_moz_261205_2        Mozilla/4.0 (compatible; ibisBrowser)   ibisBrowser Japanese mobile browser     B               http://www.ibis.ne.jp/products/ibisBrowser/index.html   
+id_moz_813     Mozilla/4.0 (compatible; ICS 1.2.xxx)   Novell iChain Cool Solutions caching    P               http://www.novell.com   
+id_moz_220206_1        Mozilla/4.0 (compatible; IE-Favorites-Check-0.5)        IE Favorites Check - Bookmark manager   C               http://secure.sintraweb.net/public/soft/iefc/   
+id_moz_814     Mozilla/4.0 (compatible; Iplexx Spider/1.0 http://www.iplexx.at)        Iplexx Austria (webhosting company) logfile spamming bot        S               http://www.iplexx.at    
+id_moz_020208_1        Mozilla/4.0 (compatible; KeepNI web site monitor)       KeepNi Monitors - Web site monitoring / link checking tool      C               http://www.keepni.com/  
+id_moz_815     Mozilla/4.0 (compatible; Link Utility; http://net-promoter.com) NetPromoter Link Utility link checking tool     C       s. also - Mozilla/4.0 (compatible; NetPromoter Spider ...       http://www.net-promoter.com/    
+id_moz_816     Mozilla/4.0 (compatible; Lotus-Notes/5.0; Windows-NT)   Lotus Notes 5.0 browser B               http://www-10.lotus.com/ldd/whatisnotes#Release%205.0%3A%20Web%20integration%20by%20d   
+id_moz_819     Mozilla/4.0 (compatible; MSIE 4.01; AOL 4.0; Windows 98)        IE 4.x AOL Win98        B                       
+id_moz_820     Mozilla/4.0 (compatible; MSIE 4.01; Mac_PowerPC)        IE 4.x Mac Power PC     B                       
+id_moz_821     Mozilla/4.0 (compatible; MSIE 4.01; MSIECrawler; Windows 95)    Internet Explorer 4.0 URL check B C                     
+id_moz_090506_1        Mozilla/4.0 (compatible; MSIE 4.01; Vonna.com b o t)    Vonna search robot      R               http://www.vonna.com/   
+id_moz_822     Mozilla/4.0 (compatible; MSIE 4.01; Windows 95) IE 4.x Win95    B                       
+id_moz_823     Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; MSN Companion 2.0; 800x600; Compaq)     IE PDA Browser Windows CE       B                       
+id_moz_100109_4        Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPC; 240x320; SPV M700; OpVer 19.123.2.733) OrangeBot-Mobile 2008.0 (mobilesearch.support@orange-ftgroup.com)   Orange France robot for mobiles R       81.52.143.xx    http://www.orange.com/en_EN/    
+id_moz_010308_2        Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPS; 240x320)   IE for Windows CE on a PocketPC (HP iPAQ)       B               http://www.hp.com/      
+id_moz_824     Mozilla/4.0 (compatible; MSIE 4.01; Windows NT Windows CE)      IE PDA Browser Windows CE       B                       
+id_moz_826     Mozilla/4.0 (compatible; MSIE 4.01; Windows NT) IE 4.x WinNT    B                       
+id_moz_825     Mozilla/4.0 (compatible; MSIE 4.01; Windows NT; MS Search 4.0 Robot) Microsoft  diff. IPs / services i.e.: - Microsoft server information robot (see link) - Okanagan Internet Junction web filter (robot)                      http://www.webmasterworld.com/forum11/841.htm   http://www.junction.net/
+id_moz_010406_3        Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) ACR       Unknown robot from American College of Radiology (ACR) running MS Site Server   R C     208.236.180.xx  http://www.acr.org/s_acr/index.asp      http://www.microsoft.com/commerceserver/default.mspx
+id_moz_817     Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) Indonesia Interactive     Indonesia Interactive Web-portal robot on MS Site Server        R               http://www.i-2.co.id/   http://www.microsoft.com/commerceserver/default.mspx
+id_moz_818     Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) WebQuest Designs  Webquestdesigns hosting                 http://www.webquestdesigns.com  
+id_moz_841     Mozilla/4.0 (compatible; MSIE 5.01; Windows 95) via <B>Avirt Gateway Server</B> v4.0    Avirt Gateway proxy server      P               http://www.avirt.com/products/gateway.html      
+id_moz_843     Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0) (samualt9@bigfoot.com)      Metacarta.com (66.28.xx.xxx) robot      R       s. Larbin....   http://www.metacarta.com/       
+id_moz_842     Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0; NetCaptor 6.5.0RC1) NetCaptor IE browser addon      B               http://www.netcaptor.com        
+id_moz_827     Mozilla/4.0 (compatible; MSIE 5.0; AOL 5.0; Windows 95; DigExt; Gateway2000; sureseeker.com)    IE 5.x AOL Win95 Sureseeker search plugin       B               http://www.sureseeker.com       
+id_moz_828     Mozilla/4.0 (compatible; MSIE 5.0; Mac_PowerPC; AtHome021)      IE 5.x Mac PowerPC AtHome user  B                       
+id_moz_829     Mozilla/4.0 (compatible; MSIE 5.0; NetNose-Crawler 2.0; A New Search Experience: http://www.netnose.com)        www.netnose.com crawler R       parked domain   http://www.netnose.com/ 
+id_moz_830     Mozilla/4.0 (compatible; MSIE 5.0; Win32) via proxy gateway CERN-HTTPD/3.0 libwww/2.17  WinXP via CERN httpd proxy server       P               http://www.w3.org       
+id_moz_831     Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) TrueRobot; 1.5   Echo.com robot  R               http://www.echo.com     
+id_moz_832     Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot BETA 1.2 (http://www.voila.com/)        Voila.fr robot  R               http://www.voila.fr     
+id_moz_833     Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot; 1.6    Voila.fr robot  R               http://www.voila.fr     
+id_moz_835     Mozilla/4.0 (compatible; MSIE 5.0; Windows ME) Opera 5.11 [en]  WinME Opera 5.x B                       
+id_moz_834     Mozilla/4.0 (compatible; MSIE 5.0; Windows ME; Link Checker 2.x.xx http://www.kyosoft.com)      Kyosoft's Link Checker  C               http://www.kyosoft.com  
+id_moz_836     Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; DigExt; DTS Agent        Beijing Express Email Address Extractor via DHCP Data Transport Services (DTS)  S       site is closed  http://www.zstools.com  http://esupport.ca.com/index.html?/public/dto_transportit/infodocs/dto1013.asp
+id_moz_837     Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; Girafabot; girafabot at girafa dot com; http://www.girafa.com)   Girafa (browser plug-in) robot  B R             http://www.girafa.com   
+id_moz_838     Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com) Galaxy robot (63.121.41.xxx)    R       s. also GalaxyBot..     http://www.galaxy.com/  
+id_moz_839     Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com/; http://www.galaxy.com/info/crawler.html)       Galaxy robot (63.121.41.xxx)    R       s. also GalaxyBot..     http://www.galaxy.com/  
+id_moz_840     Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)      Yandex Search Russia link checking (213.180.206.2xx)    R       s. also Yandex/1...     http://www.yandex.ru    
+id_moz_844     Mozilla/4.0 (compatible; MSIE 5.5; AOL 4.0; Windows 98; GoBeez (www.gobeez.com))        Gobeez starting page plugin     C       site is offline http://www.gobeez.com/  
+id_moz_845     Mozilla/4.0 (compatible; MSIE 5.5; Windows 95; Transmission Segment; Hotbar 2.0)        IE 5.5 Win95 Hotbar plug-in                     http://hotbar.com/install/firstvisit.asp        
+id_moz_846     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Crazy Browser 1.x.x)     Crazy Browser - IE based tabbed Browser B               http://www.crazybrowser.com     
+id_moz_847     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; KITV4.7 Wanadoo) Wanadoo Internet services       B                       
+id_moz_848     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SAFEXPLORER TL)  Safexplorer (safexplorer.com - site is offline) kids browser    B                       
+id_moz_849     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SYMPA; Katiesoft 7; SimulBrowse 3.0)     Katiesoft Scroll (ex www.katiesoft.com now discarded) & SimulBrowse (ex www.simulbrowse.com now dead) IE browser plugins        B                       
+id_moz_850     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; BTinternet V8.1)    Windows ME BTOpenworld Internet services        B                       
+id_moz_851     Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; MSIECrawler)        Windows ME Internet Explorer URL check  B C                     
+id_moz_852     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; obot)        Cobion Germany Brand Protection Services robot  R               http://www.cobion.com   
+id_moz_853     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; QXW03018)    Cobion Germany Brand Protection Services robot  R               http://www.cobion.com   
+id_moz_858     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Active Cache Request IE 5.5 Win2000 / user agent     B                       
+id_moz_859     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Fetch API Request    Maybe: - MS Internet Security & Acceleration Server (ISA) cache refreshing request (see link) or - IE 5.5 Win2000 probably with some (website) API request component (see 2nd link) - suspected as email-harvester / site scanning tool (see http://www.byte.com/documents/s=493/byt20010208s0001/index.htm     P S ?           http://groups.google.com/groups?hl=en&lr=&ie=UTF-8&safe=off&threadm=uGoenyodBHA.1472%40tkmsftngp07&rnum=1&prev=/groups%3Fq%3DFetch%2BAPI%26hl%3Den%26lr%3D%26ie%3DUTF-8%26safe%3Doff%26selm%3DuGoenyodBHA.1472%2540tkmsftngp07%26rnum%3D1       http://groups.google.de/groups?q=%22fetch+api+request%22&hl=de&lr=&ie=UTF-8&oe=UTF-8&selm=3CAD577B.C29BA3B2%40execpc.com&rnum=2
+id_moz_854     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; .NET CLR 1.0.3705)   IE 5.5 Win2000 with MS.NET SDK  B                       
+id_moz_855     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AIRF)        IE 5.5 Win2000 / user agent w. AI RoboForm (AIRF) password manager      B               http://www.roboform.com 
+id_moz_856     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AspTear 1.5) AspTear URL fetching program component / Download32.com spider  R D             http://www.alphasierrapapa.com/IisDev/Components/AspTear/       http://www.download32.com
+id_moz_857     Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; N_o_k_i_a)   Nokia.com network       B                       
+id_moz_051102_1        Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; T312461) RPT-HTTPClient/0.3-3E       Unknown Object Sciences Corp. robot using the HTTPClient                        http://www.objectsciences.com   http://www.innovation.ch/java/HTTPClient/
+id_moz_060406_2        Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler v4; +http://www.singingfish.com/help/spider.html; webmaster@singingfish.com); SpiderThread Revision: 3.10        Singingfish media spider (64.12.186.2xx) via AOL search R       s. also asterias/2.0    http://search.singingfish.com/sfw/home.jsp      
+id_moz_200108_2        Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows 98; .NET CLR 1.1.4322; MEGAUPLOAD 2.0)      Megaupload Mega Manager - Download manager toolbar for IE       D               http://www.megaupload.com/manager/de/   
+id_moz_010106_1        Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows NT 5.1; SV1; HbTools 4.7.2) Hotbar IE graphical skin        B       Adware / Spyware component      http://hotbar.com/Installation/Browsing/WhatIs/Hotbar.htm       
+id_moz_860     Mozilla/4.0 (compatible; MSIE 6.0; MSIE 5.5; Windows NT 5.1) Skampy/0.9.x [en]  Skaffe.com directory link checker       R       s. also Skampy  http://www.skaffe.com   
+id_moz_100606_1        Mozilla/4.0 (compatible; MSIE 6.0; TargetSeek/1.0; +http://www.targetgroups.net/TargetSeek.html)        TargetSeek Crawler concerning electronics industry product announcements        R       71.161.205.2xx  http://www.targetgroups.net/TargetSeek.html     
+id_moz_861     Mozilla/4.0 (compatible; MSIE 6.0; Win32) WebWasher 3.0 IE 6.0 WebWasher ad filter      B P             http://www.webwasher.com        
+id_moz_864     Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) REL Software Web Link Validator 2.x)     Web Link Validator link validation software     C               http://www.relsoftware.com      
+id_moz_865     Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) Web Link Validator 2.x)  Web Link Validator link validation software     C               http://www.relsoftware.com      
+id_moz_862     Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Net M@nager V3.02 - www.vinn.com.au)     IE 6.0 Netmanager IE add-on     B               http://www.vinn.com.au  
+id_moz_290306_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com; http://www.illumit.com/Products/weblight/)  WebLight web analyzer & link checker    C       s. also WebLight/4.x.x ...      http://www.illumit.com/Products/weblight/       
+id_moz_863     Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Win 9x 4.90; http://www.Abolimba.de)     Abolimba Multibrowser - IE based browser        C               http://www.autag.com    
+id_moz_866     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; .NET CLR 1.1.4322; Lunascape 2.1.3)  Lunascape IE based browser (Japan)      B       s. also Lunascape       http://www2.lunascape.jp/index.aspx     
+id_moz_290708_4        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; Google Wireless Transcoder;) Google wireless transcoder (GWT) proxy for rewriting websites for mobiles       P       209.85.136.xxx  http://www.google.com/gwt/n     
+id_moz_150906_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP entries t_st; http://tuezilla.de/t_st-odp-entries-agent.html)    Tüzilla (Germany) - ODP link checking using Robozilla  R       81.169.154.xx   http://tuezilla.de      http://dmoz.org/profiles/robozilla.html
+id_moz_867     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP links test; http://tuezilla.de/test-odp-links-agent.html)        Tüzilla (Germany) - ODP link checking using Robozilla  R       81.169.154.xx   http://tuezilla.de      http://dmoz.org/profiles/robozilla.html
+id_moz_080606_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ZoomSpider.net bot; .NET CLR 1.1.4322)       ZoomSpider.Net indexing robot for several directorys    R       70.94.232.2xx   http://www.zoomspider.net/      
+id_moz_882     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) (dns_admin@c-a-s-h.com)      unknown robot from 64.246.44.xx                         
+id_moz_280408_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Covac UPPS Cathan 1.2.5;)    Covac Software UPPS (Universal PHP Proxy Server) - free public proxy server     P               http://www.covac-software.com/proxy/    
+id_moz_160406_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Crayon Crawler; snprtz|T04056566514940; (R1 1.5))    GetNetWise Crayon Crawler web filter    P               http://kids.getnetwise.org/tools/tool_info.php?tool_id=931919301.7202   
+id_moz_868     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Deepnet Explorer)    Deepnet Explorer - IE based browser     B               http://deepnetexplorer.com/     
+id_moz_869     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; heritrix/1.3.0 http://www.cs.washington.edu/research/networking/websys/)     Heritrix Internet Archive's open-source web project used by Analysis Projects at UW     R               http://crawler.archive.org/     http://www.cs.washington.edu/research/networking/websys/
+id_moz_870     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Hotbar 3.0)  IE 6x WinXP Hotbar plug-in      B               http://hotbar.com/install/firstvisit.asp        
+id_moz_871     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iOpus-I-M)   IE 6x WinXP iOpus Internet Macros - Internet-based macro recorder       B               http://www.iopus.com    
+id_moz_872     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iRider 2.21.1108; FDM)       iRider - IE based browser / Free Download Manager (FDM) D               http://www.irider.com/irider/index.htm  http://www.freedownloadmanager.org/
+id_moz_873     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; KKman3.0)    KKman http://www.kkman.com/ - Japanese IE based browser B               http://www.kkman.com    
+id_moz_874     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MathPlayer2.0)       IE 6x WinXP MathPlayer mathematical notation plugin     B               http://www.mathtype.com/en/products/mathplayer/ 
+id_moz_875     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Maxthon)     Maxton (ex MyIE2) - IE based browser    B               http://www.maxthon.com  
+id_moz_876     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; PeoplePal 3.0; MSIECrawler)  IE 6x WinXP peoplepc online PeoplePal IE toolbar        B               http://home.vfw-online.com/peoplepal/default.asp        
+id_moz_877     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Q312461; IOpener Release 1.1.04)     IE 6x WinXP / I-Opener (was www.netpliance.com/) web PC B                       
+id_moz_050307_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; QihooBot 1.0 qihoobot@qihoo.net)     Qihoo search (China) robot      R       220.181.34.1xx  http://www.qihoo.com/   
+id_moz_070306_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SIMBAR Enabled; InfoPath.1)  SimBar IE toolbar for accessing The Sims sites / Infopath IE form & spreadsheet plugin  B               http://www.simstools.com/simbar.php     http://office.microsoft.com/en-us/fx010857921033.aspx
+id_moz_878     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; StumbleUpon.com 1.760; .NET CLR 1.1.4322)    IE 6x WinXP Stumble Upon IE toolbar     B               http://www.stumbleupon.com      
+id_moz_150807_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; Embedded Web Browser from: http://bsalsa.com/; MSIECrawler)     Balsa Productions embedded web browser package for Borland Delphi       B               http://bsalsa.com/product.html  
+id_moz_030807_2        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://www.changedetection.com/bot.html )       ChangeDetection robot for web page monitoring   C       68.166.223.x    http://www.changedetection.com/ http://www.changedetection.com/bot.html
+id_moz_879     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322)      IE 6x WinXP also used by WebSite Pro HTML editor        B               http://www.gtpcc.org/gtpcc/websitepro.htm       
+id_moz_880     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; DX-Browser 5.0.0.0)     DX-Browser - German IE based browser    B       was http://www.dx-soft.net/ (expired)   http://www.zdnet.de/downloads/prg/t/p/deDCTP-wc.html    
+id_moz_271006_1        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; FunWebProducts; ezPeer+ v1.0 Beta (0.4.1.98); ezPeer+ v1.0 (0.5.0.00); .NET CLR 1.1.4322; MSIECrawler)  ezPeer+ P2P IE addon    B               http://web.ezpeer.com/  
+id_moz_881     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; IBP; .NET CLR 1.1.4322) Axandra IBP website promotion software ?        C B             http://www.axandra-web-site-promotion-software-tool.com/index.htm       
+id_moz_290606_3        Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; MRA 4.3 (build 01218))  MRA = Mail.ru Agent - Instant Messenger / VoIP  B               http://agent.mail.ru/   
+id_moz_883     Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search 4.0 Robot)     MSN Search robot (207.46.89.xx) R       s. also: - MSNBOT               
+id_moz_170207_3        Mozilla/4.0 (compatible; MSIE 7.0; Win32) Link Commander 4.0    Link Commander bookmark manager C               http://www.resortlabs.com/bookmark-manager/linkcommander.php    
+id_moz_170706_2        Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; bgft)        IE 7.0 - WinXP  B               http://www.microsoft.com/windows/ie/default.mspx        
+id_moz_080209_1        Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; GTB5; User-agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://bsalsa.com) ; .NET CLR 2.0.50727)   GTB = Google Toolbar Internet Explorer add-on   B               http://toolbar.google.com/T4/index.html 
+id_moz_080209_2        Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; Tablet PC 2.0)  MSIE 7.0 *and* Trident token used by Internet Explorer 8 in compatibility view mode     B               http://blogs.msdn.com/ie/archive/2009/01/09/the-internet-explorer-8-user-agent-string-updated-edition.aspx      
+id_moz_080209_3        Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; .NET CLR 2.0.50727; .NET CLR 1.1.4322; .NET CLR 3.0.04506.30; .NET CLR 3.0.04506.648)   Internet Explorer 8     B               http://www.microsoft.com/windows/internet-explorer/beta/default.aspx    
+id_moz_150408_4        Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0)      IE 8.0 (beta) on Win Vista      B               http://www.microsoft.com/windows/products/winfamily/ie/ie8/default.mspx 
+id_moz_030110_1        Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0; Orange 8.0; GTB6.3; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ; Embedded Web Browser from: http://bsalsa.com/; SLCC1; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30618; OfficeLiveConnector.1.3; OfficeLivePatch.1.3)   Bsalsa embedded browser B               http://bsalsa.com/      
+id_moz_010108_4        Mozilla/4.0 (compatible; MSIE enviable; DAUMOA 2.0; DAUM Web Robot; Daum Communications Corp., Korea; +http://ws.daum.net/aboutkr.html) DAUMOA - Daum search Korea robot (211.115.109.xxx)      R       s. also RaBot   http://www.daum.net/    http://ws.daum.net/abouten.html
+id_moz_311206_1        Mozilla/4.0 (compatible; MSIE is not me; DAUMOA/1.0.1; DAUM Web Robot; Daum Communications Corp., Korea)        DAUMOA - Daum search Korea robot (211.115.109.xxx)      R       s. also RaBot   http://www.daum.net/    
+id_moz_281106_2        Mozilla/4.0 (compatible; NaverBot/1.0; http://help.naver.com/delete_main.asp)   Naver Search Korea Naverbot     R               http://www.naver.com/   
+id_moz_884     Mozilla/4.0 (compatible; Netcraft Web Server Survey)    Netcraft webserver info R C             http://www.netcraft.com 
+id_moz_885     Mozilla/4.0 (compatible; NetPromoter Spider;http://www.net-promoter.com/)       NetPromoter Link Utility link checking tool     C       s. also - Mozilla/4.0 (compatible; Link Utility ...     http://www.net-promoter.com/    
+id_moz_886     Mozilla/4.0 (compatible; Opera/3.0; Windows 4.10) 3.51 [en]     Opera 3.x WinNT B                       
+id_moz_887     Mozilla/4.0 (compatible; Powermarks/3.5; Windows 95/98/2000/NT) Powermarks bookmark manager     C               http://www.kaylon.com   
+id_moz_230607_1        Mozilla/4.0 (compatible; RSS Popper)    RSS Popper - MS Outlook RSS reader plugin       B               http://rsspopper.unknown/2004/10/home.html      
+id_moz_888     Mozilla/4.0 (compatible; SiteKiosk 4.0; MSIE 5.0; Windows 98; SiteCoach 1.0)    SiteKiosk public terminal browser       B               http://www.sitekiosk.com        
+id_moz_889     Mozilla/4.0 (compatible; SpeedySpider; www.entireweb.com)       Entireweb Search Speedyspider (62.13.25.xxx)    R       s. also Worldlight      http://www.entireweb.com        
+id_moz_890     Mozilla/4.0 (compatible; SPENG) SiteProbe - website status checking     R C             http://www.siteprobe.com        
+id_moz_891     Mozilla/4.0 (compatible; SuperCleaner 2.xx; Windows 98) Super Cleaner privacy tool (bookmark checking)  C               http://www.southbaypc.com/SuperCleaner/ 
+id_moz_020406_1        Mozilla/4.0 (compatible; Synapse)       Synapse - Apache web service for processing XML documents       P               http://wiki.apache.org/incubator/SynapseProposal        
+id_moz_150207_1        Mozilla/4.0 (compatible; WebCapture 3.0; Windows)       Web2PDF - Adobe Acrobat plugin for site traversal and other services for the Web Capture feature        D                       
+id_moz_892     Mozilla/4.0 (compatible; Win32; WinHttp.WinHttpRequest.5)       Windows HTTP Services (WinHTTP / XML-parser)                            
+id_moz_170108_1        Mozilla/4.0 (compatible; WSN Links)     WSN Links PHP directory software        C               http://scripts.webmastersite.net/wsnlinks/      
+id_moz_111205_6        Mozilla/4.0 (compatible; www.euro-directory.com; urlchecker1.0) Euro Directory (German / Austrian) directory link checking      R C             http://www.euro-directory.com/  
+id_moz_893     Mozilla/4.0 (compatible; www.galaxy.com)        Galaxy robot    R               http://www.galaxy.com   
+id_moz_894     Mozilla/4.0 (compatible; www.linkguard.com Linkguard Online 1.0; Windows NT)    Linkguard.com link validation (service is offline)      C                       
+id_moz_240106_1        Mozilla/4.0 (compatible; Y!J; for robot study; keyoshid)        Yahoo Search Japan robot (203.141.52.)  R       s. also Y!J-BSC/1.0...  http://www.yahoo.co.jp/ 
+id_moz_170706_1        Mozilla/4.0 (compatible; Yahoo Japan; for robot study; kasugiya)        Yahoo Japan robot (202.93.76.xx)        R               http://www.yahoo.co.jp/ 
+id_moz_210207_1        Mozilla/4.0 (compatible;MSIE 6.0; Windows NT 5.0; H010818)      Faked IE id string used by DeepTrawl link checking tool C               http://deeptrawl.com/   
+id_moz_896     Mozilla/4.0 (fantomBrowser)     spoofed referer by Fantomaster (Multiblocker) anonymity products        P               http://fantomaster.com  http://multiblocker.com/home.html
+id_moz_897     Mozilla/4.0 (fantomCrew Browser)        spoofed referer by Fantomaster (Multiblocker) anonymity products        P               http://fantomaster.com  http://multiblocker.com/home.html
+id_moz_898     Mozilla/4.0 (hhjhj@yahoo.com)   unknown robot from - 64.57.223.40 - 66.28.233.xxx (cogentco.com)                                
+id_moz_899     Mozilla/4.0 (JemmaTheTourist;http://www.activtourist.com)       Activtourist Jemma spider       R               http://www.activtourist.com     
+id_moz_900     Mozilla/4.0 (MobilePhone PM-8200/US/1.0) NetFront/3.x MMP/2.0   NetFront (v3.x) for Pocket PC (here on Sanyo PM-8200 cell phone)        B               http://nfppc.access.co.jp/english/      
+id_moz_901     Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html)      Google robot from 66.249.66.xxx R       s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...        http://www.google.com   
+id_moz_902     Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 FAKE (compatible; Googlebot/2.1; http://www.google.com/bot.html) Google robot from 66.249.66.xxx R       s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...        http://www.google.com   
+id_moz_081106_1        Mozilla/4.0 (Mozilla; http://www.mozilla.org/docs/en/bot.html; master@mozilla.com)      Unknown robot from Mozilla.org  R       63.209.222.xx   http://www.mozilla.org/ 
+id_moz_903     Mozilla/4.0 (Sleek Spider/1.2)  ASI - Any Search Info robot     R               http://search-info.com/ 
+id_moz_170406_1        Mozilla/4.0 compatible FurlBot/Furl Search 2.0 (FurlBot; http://www.furl.net; wn.furlbot@looksmart.net) Furl (Looksmart) online bookmark tool robot     R       64.242.88.xx    http://www.furl.net/    
+id_moz_905     Mozilla/4.0 compatible ZyBorg/1.0 (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)  Wisenut robot   R               http://www.wisenut.com/ 
+id_moz_906     Mozilla/4.0 compatible ZyBorg/1.0 (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)    Wisenut robot   R               http://www.wisenut.com/ 
+id_moz_907     Mozilla/4.0 compatible ZyBorg/1.0 Dead Link Checker (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)        Wisenut robot   R               http://www.wisenut.com/ 
+id_moz_908     Mozilla/4.0 compatible ZyBorg/1.0 for Homepage (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)       Wisenut robot   R               http://www.wisenut.com/ 
+id_moz_909     Mozilla/4.0 efp@gmx.net Unknown robot from 66.230.140.xx (argon.oxeo.com) maybe an e-mail collector     S       see also LARBIN-EXPERIMENTAL            
+id_moz_910     Mozilla/4.0 WebTV/2.6 (compatible; MSIE 4.0)    WebTV   B                       
+id_moz_904     Mozilla/4.0 [en] (Ask Jeeves Corporate Spider)  Ask / Ask Jeeves robot  R               http://www.Ask.com      
+id_moz_913     Mozilla/4.0(compatible; Zealbot 1.0)    LookSmart spider        R               http://www.looksmart.com        
+id_moz_290807_1        Mozilla/4.01 (compatible; NORAD National Defence Network)       HideMe - Web based anonymous proxy server service       P               http://www.hideme.biz/  http://www.cnn.com/TECH/computing/9901/25/hacktracts.idg/index.html
+id_moz_914     Mozilla/4.01 [en](Win95;I)      Some download manager spoofing Netscape 4.01    D                       
+id_moz_915     Mozilla/4.02 [en] (X11; I; SunOS 5.6 sun4u)     Netscape 4.x SunOS 5.6  B                       
+id_moz_161105_3        Mozilla/4.04 (compatible; Dulance bot; +http://www.dulance.com/bot.jsp) Dulance Bot - Dulance automated price comparison engine R               http://www.dulance.com/ 
+id_moz_916     Mozilla/4.04 [en] (X11; I; HP-UX B.10.20 9000/712)      Netscape 4.x HP-Unix    B                       
+id_moz_917     Mozilla/4.04 [en] (X11; I; IRIX 5.3 IP22)       Netscape 4.x IRIX       B                       
+id_moz_918     Mozilla/4.05 (Macintosh; I; 68K Nav)    Netscape 4.x Macintosh 68k      B                       
+id_moz_919     Mozilla/4.05 (Macintosh; I; PPC Nav)    Netscape 4.x Macintosh PowerPC  B                       
+id_moz_920     Mozilla/4.05 [en] (X11; I; SunOS 4.1.4 sun4m)   Netscape 4.x SunOS 4.1.4        B                       
+id_moz_921     Mozilla/4.08 [en] (Win98; U ;Nav)       Version 4.08 [en]-98306 Someone copied the help function in the referrer field ?                        
+id_moz_922     Mozilla/4.08 [en] (WinNT; U)    Netscape 4.x WinNT      B                       
+id_moz_911     Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_TrueRobot/1.4 libwww/5.2.8       Echo.com robot  R               http://www.echo.com     
+id_moz_912     Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_VoilaBot/1.6 libwww/5.3.2        Voila.fr robot  R               http://www.voila.fr     
+id_moz_923     Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98)      HTTrack Offline Browser B D             http://www.httrack.com/ 
+id_moz_924     Mozilla/4.5 (compatible; iCab 2.5.3; Macintosh; I; PPC) iCab MAC Web browser MAC Power PC       B               http://www.icab.de      
+id_moz_925     Mozilla/4.5 (compatible; OmniWeb/4.0.5; Mac_PowerPC)    OmniWeb 4.x.x Mac browser       B               http://www.omnigroup.com        
+id_moz_926     Mozilla/4.5 (compatible; OmniWeb/4.1-beta-1; Mac_PowerPC)       OmniWeb 4.x.x Mac browser       B               http://www.omnigroup.com        
+id_moz_928     Mozilla/4.5 RPT-HTTPClient/0.3-2        different IPs using the HTTPClient library (mostly link checking)       C R             http://www.innovation.ch        
+id_moz_927     Mozilla/4.5 [en]C-CCK-MCD {RuralNet} (Win98; I) RuralNet Internet Services      B               http://www.ruralnet.net.au      
+id_moz_929     Mozilla/4.5b1 [en] (X11; I; Linux 2.0.35 i586)  Netscape 4.x Linux      B                       
+id_moz_301105_3        Mozilla/4.6 [en] (http://www.cnet.com/) Cnet robot for Search.com (216.239.114.xx)      R               http://www.search.com/  http://www.cnet.com/
+id_moz_930     Mozilla/4.61 [de] (OS/2; I)     Netscape 4.x OS/2       B                       
+id_moz_931     Mozilla/4.61 [en] (X11; U; ) - BrowseX (2.0.0 Windows)  BrowseX cross-platform browser  B               http://browsex.com/     
+id_moz_932     Mozilla/4.7     Nameprotect (12.148.196.128 - 12.148.196.255) snoopbot  R               http://www.nameprotect.com      
+id_moz_933     Mozilla/4.7 (compatible; http://eidetica.com/spider)    Eidetica earch and text mining spider   R               http://eidetica.com/    
+id_moz_934     Mozilla/4.7 (compatible; Intelliseek; http://www.intelliseek.com)       Intelliseek (64.158.138.xx) robot       R               http://www.intelliseek.com      
+id_moz_935     Mozilla/4.7 (compatible; OffByOne; Windows 98) Webster Pro V3.2 OffByOne Browser        B               http://www.offbyone.com 
+id_moz_937     Mozilla/4.7 (compatible; Whizbang)      WhizBang! Labs information extraction robot     R       closed since May 2002   http://www.whizbang.com 
+id_moz_936     Mozilla/4.7 (compatible; WhizBang; http://www.whizbang.com/crawler)     WhizBang! Labs information extraction robot     R       closed since May 2002   http://www.whizbang.com 
+id_moz_938     Mozilla/4.7 [en](BecomeBot@exava.com)   BecomeBot - Becomecom shopping search (64.124.85.xx(x)) R       64.124.85.[x]xx http://www.become.com   
+id_moz_939     Mozilla/4.7 [en](Exabot@exava.com)      Exabot - exava shopping search (64.124.85.xx(x))        R               http://www.exava.com    
+id_moz_940     Mozilla/4.7 [en]C-CCK-MCD {Yahoo;YIP052400} (Win95; I)  unknown                         
+id_moz_941     Mozilla/4.72 [en] (BACS http://www.ba.be)       http://www.ba.be robot  R               http://www.ba.be        
+id_moz_942     Mozilla/4.72C-CCK-MCD Caldera Systems OpenLinux [en] (X11; U; Linux 2.2.14 i686)        Netscpape 4.7x Caldera Open Linux Pentium III   B                       
+id_moz_943     Mozilla/4.75C-ja [ja] (X11; U; OSF1 V5.1 alpha) Netscape 4.7x Japan OSF1 alpha  B                       
+id_moz_944     Mozilla/4.76 (Windows 98; U) Opera 5.12 [en]    Opera 5.x Win 98        B                       
+id_moz_945     Mozilla/4.76 [en] (X11; U; FreeBSD 4.4-STABLE i386)     Netscape 4.7x FreeBSD   B                       
+id_moz_946     Mozilla/4.76 [en] (X11; U; SunOS 5.7 sun4u)     Netscape 4.7x SunOS     B                       
+id_moz_947     Mozilla/4.77C-SGI [en] (X11; U; IRIX 6.5 IP32)  IRIX 6.5        B                       
+id_moz_948     Mozilla/5.0     GigaMedia / NTT DoCoMo robot    R               http://ir.giga.net.tw/products.htm      
+id_moz_040707_3        Mozilla/5.0 (+http://www.eurekster.com/mammoth) Mammoth/0.1     Eurekster Swicki community search using SLI-Systems site search engine Mammoth  R       64.106.253.1xx  http://www.eurekster.com/       http://www.sli-systems.com/
+id_moz_240306_2        Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1  SLI Systems mammoth robot       R       s. also mammoth/1.0 ... http://www.sli-systems.com/     http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M
+id_moz_949     Mozilla/5.0 (Clustered-Search-Bot/1.0; support@clush.com; http://www.clush.com/)        Clush search robot      R               http://www.clush.com    
+id_moz_020807_1        Mozilla/5.0 (compatible) GM RSS Panel X Greasemonkey RSS panel Firefox plugin   B               http://www.xs4all.nl/~jlpoutre/BoT/Javascript/RSSpanel/ 
+id_moz_140209_3        Mozilla/5.0 (compatible; +http://www.evri.com/evrinid)  Evri search robot       R       216.168.43.1xx  http://www.evri.com/    
+id_moz_250310_1        Mozilla/5.0 (compatible; 008/0.83; http://www.80legs.com/spider.html;) Gecko/2008032620 008 distributed crawler for 80legs      R               http://www.80legs.com/spider.html       
+id_moz_140209_4        Mozilla/5.0 (compatible; Abonti/0.8 - http://www.abonti.com)    Abonti WebSearch beta robot     R       77.233.225.11x  http://www.abonti.com/  
+id_moz_030110_4        Mozilla/5.0 (compatible; aiHitBot/1.0; +http://www.aihit.com/)  HitCompanies Aihit crawler      R       195.128.18.xx   http://hitcompanies.aihit.com/search.htm        
+id_moz_300406_1        Mozilla/5.0 (compatible; AnsearchBot/1.x; +http://www.ansearch.com.au/) Ansearch Australian search robot        R       203.206.162.x   http://www.ansearch.com.au/     
+id_moz_011107_1        Mozilla/5.0 (compatible; archive.org_bot/1.10.0 +http://www.loc.gov/minerva/crawl.html) The Library of Congress Minerva crawler R       207.241.232.1xx http://www.loc.gov/minerva/crawl.html   
+id_moz_230607_2        Mozilla/5.0 (compatible; archive.org_bot/1.13.1x http://crawler.archive.org)    Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R       s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...  http://www.archive.org/ 
+id_moz_141105_1        Mozilla/5.0 (compatible; archive.org_bot/1.5.0-200506132127 http://crawler.archive.org) Hurricane Katrina       Heritrix - The Internet Archive's open-source crawler   R       s. also - InternetArchive/0.8-dev... - mozilla/5.0 (compatible; heritrix/...    http://www.archive.org/ 
+id_moz_150207_2        Mozilla/5.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) Ask Jeeves /Teoma robot R       65.214.45.[x]xx http://sp.ask.com       
+id_moz_291205_2        Mozilla/5.0 (compatible; BanBots/2.0b; Fetch; +http://www.banbots.com)  Project BanBots Perl script robot       C       s. also BanBots/1.2...  http://www.banbots.com/ 
+id_moz_950     Mozilla/5.0 (compatible; BecomeBot/1.23; http://www.become.com/webmasters.html) BecomeBot - Become.com shopping search (64.124.85.xx(x))        R       64.124.85.[x]xx http://www.become.com   
+id_moz_951     Mozilla/5.0 (compatible; BecomeBot/1.xx; MSIE 6.0 compatible; http://www.become.com/webmasters.html)    BecomeBot - Become.com shopping search (64.124.85.xx(x))        R       64.124.85.[x]xx http://www.become.com   
+id_moz_952     Mozilla/5.0 (compatible; BecomeBot/2.0beta; http://www.become.com/webmasters.html)      BecomeBot - Become.com shopping search (64.124.85.xx(x))        R       64.124.85.[x]xx http://www.become.com   
+id_moz_953     Mozilla/5.0 (compatible; BecomeBot/2.x; MSIE 6.0 compatible; http://www.become.com/site_owners.html)    BecomeBot - Become.com shopping search (64.124.85.xx(x))        R       64.124.85.[x]xx http://www.become.com   
+id_moz_090506_2        Mozilla/5.0 (compatible; BecomeJPBot/2.3; MSIE 6.0 compatible; +http://www.become.co.jp/site_owners.html)       BecomeBot - Become.com shopping search (64.124.85.xx(x))        R       64.124.85.[x]xx http://www.become.com   
+id_moz_020907_1        Mozilla/5.0 (compatible; BlogRefsBot/0.1; http://www.blogrefs.com/about/bloggers)       BlogRefsBot.com blog robot      R       69.90.42.xx     http://www.blogrefs.com/        http://www.blogrefs.com/about/bloggers
+id_moz_171107_1        Mozilla/5.0 (compatible; Bot; +http://pressemitteilung.ws/spamfilter    Pressemitteilungen Webservice RSS / news crawler (Germany)      R       87.164.242.1xx  http://pressemitteilung.ws/     
+id_moz_031206_1        Mozilla/5.0 (compatible; BuzzRankingBot/1.0; +http://www.buzzrankingbot.com/)   BuzzRanking internet content analysis   R       213.251.187.1xx http://www.buzzrankingbot.com/  
+id_moz_310506_1        Mozilla/5.0 (compatible; Charlotte/1.0b; charlotte@betaspider.com)      Charlotte indexing spider for Searchme / Wikiseek       R       209.249.86.x    http://www.searchme.com/        http://www.wikiseek.com/
+id_moz_080307_1        Mozilla/5.0 (compatible; Charlotte/1.0b; http://www.searchme.com/support/)      Charlotte indexing spider for Searchme / Wikiseek       R       209.249.86.x    http://www.searchme.com/        http://www.wikiseek.com/
+id_moz_220106_1        Mozilla/5.0 (compatible; Crawling jpeg; http://www.yama.info.waseda.ac.jp)      Unknown graphics crawler or downloading agent from Yamana Laboratory - Waseda Univerity Japan (133.9.238.xx)    R       doesn't read robots.txt http://www.yama.info.waseda.ac.jp/eng/index.html        
+id_moz_954     Mozilla/5.0 (compatible; Custo 3 (Netwu.com); Windows NT 5.1)   Custo web site spidering tool (link checking)   C       s. also - Custo x.x (www.netwu.com)     http://www.netwu.com    
+id_moz_071207_1        Mozilla/5.0 (compatible; de/1.13.2 +http://www.de.com)  De.com German travel related search via Amazon Web Services     R       67.202.29.xx    http://www.de.com/start.php?homepage=true       http://www.amazon.com/gp/browse.html?node=3435361
+id_moz_170109_1        Mozilla/5.0 (compatible; Diffbot/0.1; +http://www.diffbot.com)  Diffbot beta - RSS and news feed crawler        R       64.71.190.13x   http://www.diffbot.com/ 
+id_moz_030207_1        Mozilla/5.0 (compatible; DNS-Digger-Explorer/1.0; +http://www.dnsdigger.com)    DNS-Digger - DNS server neighbourhood search    R       212.214.165.2xx http://www.dnsdigger.com/       
+id_moz_100606_2        Mozilla/5.0 (compatible; DNS-Digger/1.0; +http://www.dnsdigger.com)     DNS-Digger - DNS server neighbourhood search    R       212.214.165.2xx http://www.dnsdigger.com/       
+id_moz_020506_1        Mozilla/5.0 (compatible; EARTHCOM.info/2.01; http://www.earthcom.info)  Earthcom (Czech Republic) search robot (194.108.39.xx)  R       s. also EARTHCOM ..     http://www.earthcom.info        
+id_moz_190807_3        Mozilla/5.0 (compatible; EARTHCOM/2.2; +http://enter4u.eu)      enter4u / Earthcom.info search (Czech Republic) R               http://enter4u.eu/      http://www.earthcom.info
+id_moz_050107_1        Mozilla/5.0 (compatible; egothor/8.0g; +http://ego.ms.mff.cuni.cz/)     Prague Faculty of Mathematics and Physics using Egothor open source crawler     P       195.113.20.125  http://ego.ms.mff.cuni.cz/      http://www.egothor.org/
+id_moz_310507_1        Mozilla/5.0 (compatible; Exabot Test/3.0; +http://www.exabot.com/go/robot)      Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_moz_221207_1        Mozilla/5.0 (compatible; FatBot 2.0; http://www.thefind.com/main/CrawlerFAQs.fhtml)     TheFind.com - Shopping search robot     R       64.124.148.xx[x]        http://www.thefind.com/ 
+id_moz_170109_2        Mozilla/5.0 (compatible; Galbot/1.0; +http://www.galbot.com/bot.html)   Galbot tagging robot (beta) - Denmark   R               http://www.galbot.com/  
+id_moz_955     mozilla/5.0 (compatible; genevabot http://www.healthdash.com)   Geneva Single-Site Search Engine used by Healthdash health search       R               http://www.healthdash.com       
+id_moz_170207_4        Mozilla/5.0 (compatible; Google Desktop) Paros/3.2.12   Paros - a Java based HTTP/HTTPS proxy   P               http://sourceforge.net/projects/paros   
+id_moz_956     Mozilla/5.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html) Google robot    R       s. also: - Googlebot - Mozilla/4.0 (MobilePhone SCP ... http://www.google.com   
+id_moz_957     mozilla/5.0 (compatible; heritrix/1.0.4 http://innovationblog.com)      Unknown robot using Heritrix    R               http://innovationblog.com       http://crawler.archive.org/
+id_moz_280207_1        Mozilla/5.0 (compatible; heritrix/1.10.2 +http://i.stanford.edu/)       The Stanford University InfoLab robot using Heritrix    R       171.67.73.1x    http://i.stanford.edu/  http://www.archive.org/
+id_moz_280108_2        Mozilla/5.0 (compatible; heritrix/1.12.1 +http://newstin.com/)  Newstin news feed search using Heritrix R       195.39.35.1xx   http://www.newstin.com/ 
+id_moz_210807_1        Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com)    Page-store.com vertical search via Amazon Web Services  R       72.44.62.1xx    http://www.page-store.com/      http://www.amazonaws.com/
+id_moz_230108_1        Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com) [email:paul@page-store.com]        Page-store.com vertical search via Amazon Web Services  R       72.44.62.1xx    http://www.page-store.com/      http://www.amazonaws.com/
+id_moz_958     mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)     Heritrix Internet Archive's open-source web project     R               http://archive.crawler.org      
+id_moz_270106_2        Mozilla/5.0 (compatible; heritrix/1.4.0 +http://www.chepi.net)  Chepi Beta search Spain (194.116.240.1xx) using Heritrix        R               http://www.chepi.net/   http://lucene.apache.org
+id_moz_959     Mozilla/5.0 (compatible; heritrix/1.4t http://www.truveo.com/)  Truveo data mining robot using Heritrix R               http://www.truveo.com/home/     http://crawler.archive.org/
+id_moz_960     Mozilla/5.0 (compatible; heritrix/1.5.0 http://www.l3s.de/~kohlschuetter/projects/crawling/)    L3S WebCrawling Project (Germany) using Heritrix        R               http://www.l3s.de/~kohlschuetter/projects/crawling/     http://crawler.archive.org/
+id_moz_961     Mozilla/5.0 (compatible; heritrix/1.5.0-200506231921 http://pandora.nla.gov.au/crawl.html)      Pandora Internet Archive crawler (Australia) using Heritrix     R               http://pandora.nla.gov.au       http://crawler.archive.org/
+id_moz_250706_3        Mozilla/5.0 (compatible; heritrix/1.6.0 http://www.worio.com/)  WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler  R       137.82.84.xx    http://www.worio.com/   http://www.archive.org/
+id_moz_190607_1        Mozilla/5.0 (compatible; heritrix/1.7.0 +http://www.greaterera.com/)    greatarea.com website collection project using Heritrix R       63.209.222.     http://www.greaterera.com/      
+id_moz_230307_1        Mozilla/5.0 (compatible; Heritrix/1.8.0 http://www.hanzoarchives.com)   hanzo:web social web archiving service  D       216.182.238.    http://www.hanzoweb.com/        
+id_moz_151106_1        Mozilla/5.0 (compatible; heritrix/1.x.x +http://www.accelobot.com)      Accelobot - Accelovation Market Discovery software robot        R       72.20.99.xx     http://www.accelobot.com/       http://www.accelovation.com/solutions.html
+id_moz_030208_1        Mozilla/5.0 (compatible; heritrix/2.0.0-RC1 +http://www.aol.com)        Unknown AOL robot using Heritrix        R       64.236.128.x    http://www.aol.com/     
+id_moz_051207_2        Mozilla/5.0 (compatible; Hermit Search. Com; +http://www.hermitsearch.com)      Hermits Search.com - Products and service search robot  R       72.55.165.11x   http://www.hermitsearch.com/    
+id_moz_161006_2        Mozilla/5.0 (compatible; http://www.IsMySiteUp.Net/bot/ )       IsMySiteUp? - Online website monitoring service C       142.179.247.xx  http://www.ismysiteup.net/      
+id_moz_101106_2        Mozilla/5.0 (compatible; http://www.UptimeAuditor.com/bot/ )    UptimeAuditor - real time web monitoring        C       142.179.247.xx  http://www.uptimeauditor.com/   
+id_moz_180508_1        Mozilla/5.0 (compatible; HyperixScoop/1.3; +http://www.hyperix.com)     Hyperix vertical search crawler R       64.40.113.[x]xx http://www.hyperix.com/ 
+id_moz_070406_1        Mozilla/5.0 (compatible; iaskspider/1.0; MSIE 6.0)      Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)              Not from iask.com.cn - s. also iaskspider               
+id_moz_280607_1        Mozilla/5.0 (compatible; IDBot/1.0; +http://www.id-search.org/bot.html) ID-Search.org - Russian search project  R       67.159.44.2xx   http://id-search.org/bot.html   
+id_moz_962     Mozilla/5.0 (compatible; InterseekWeb/3.x)      Najdi.si (Slovenia) search using Interseek/Web Interseek/API Search Engine      R               http://www.najdi.si/pomoc/eng/index.jsp 
+id_moz_130807_4        Mozilla/5.0 (compatible; Jim +http://www.hanzoarchives.com)     hanzo:web social web archiving service  D       216.182.238.    http://www.hanzoweb.com/        
+id_moz_963     Mozilla/5.0 (compatible; Konqueror/2.0.1; X11); Supports MD5-Digest; Supports gzip encoding     Konqueror 2.0.x X11     B               http://www.konqueror.org/       
+id_moz_964     Mozilla/5.0 (compatible; Konqueror/2.1.1; X11)  Konqueror 2.1.x X11     B               http://www.konqueror.org/       
+id_moz_966     Mozilla/5.0 (compatible; Konqueror/2.2.2)       Konqueror 2.2.x B               http://www.konqueror.org/       
+id_moz_965     Mozilla/5.0 (compatible; Konqueror/2.2.2; Linux 2.4.14-xfs; X11; i686)  Konqueror 2.2.x Linux   B               http://www.konqueror.org/       
+id_moz_050108_2        Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)     Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_moz_967     Mozilla/5.0 (compatible; LemSpider 0.1) Lemur Consulting LemIR spider   R               http://www.lemurconsulting.com  
+id_moz_968     Mozilla/5.0 (compatible; LinksManager.com_bot http://linksmanager.com/linkchecker.html) Linksmanager.com online link checking service   C       s.also LinksManager.com http://www.linksmanager.com     
+id_moz_140408_2        Mozilla/5.0 (compatible; LinkStash Bookmark Manager; http://www.xrayz.co.uk/)   LinkStash Bookmark Manager      C               http://www.xrayz.co.uk/ 
+id_moz_060706_2        Mozilla/5.0 (compatible; MojeekBot/2.0; http://www.mojeek.com/bot.html) Mojeek Search Preview robot (217.155.205.xx)    R       s. also MojeekBot/0.x   http://www.mojeek.com   
+id_moz_290107_1        Mozilla/5.0 (compatible; MOSBookmarks/v2.6-Plus; Link Checker)  Joomla!/Mambo component - MosBookmarks (bot) link checking      C               http://www.tegdesign.ch/        
+id_moz_091007_1        Mozilla/5.0 (compatible; MSIE 6.0; Podtech Network; crawler_admin@podtech.net)  PodTech entertainment and video network crawler R       71.134.235.xx   http://www.podtech.net/home/    
+id_moz_969     Mozilla/5.0 (compatible; OnetSzukaj/5.0; http://szukaj.onet.pl) onet.pl Szukaj (Search) robot (213.180.128.1xx) R       s. also - Onet.pl SA    http://szukaj.onet.pl   
+id_moz_181207_1        Mozilla/5.0 (compatible; PagestackerBot; http://www.pagestacker.com)    Pagestacker online bookmark service     C       70.85.129.12x   http://www.pagestacker.com/     
+id_moz_020307_1        Mozilla/5.0 (compatible; PalmeraBot; http://www.links24h.com/help/palmera) Version 0.001        PalmeraBot - Links24h.com search engine robot   R       80.59.111.2xx   http://www.links24h.com/        http://www.links24h.com/help/palmera/
+id_moz_130806_1        Mozilla/5.0 (compatible; PEAR HTTP_Request class; http://feed.moo.jp/)  FeedMo feed search (Japan) using Pear HTTP      C ?     210.188.205.2xx http://feed.moo.jp/     http://pear.php.net/
+id_moz_190607_2        Mozilla/5.0 (compatible; Phonifier; +http://www.phonifier.com)  PHONifier mobile access to web content  D B             http://www.phonifier.com/       
+id_moz_240208_2        Mozilla/5.0 (compatible; pmoz.info ODP link checker; +http://pmoz.info/doc/botinfo.htm) pmoz.info ODP link checking bot C       74.208.25.118 / 216.15.74.85    http://pmoz.info/doc/botinfo.htm        http://www.dmoz.org/
+id_moz_970     Mozilla/5.0 (compatible; pogodak.ba/3.x)        Pogodak search (Slovenia) robot via Interseek   R       89.143.229.1xx  http://www.pogodak.hr   http://www.interseek.com/
+id_moz_100408_2        Mozilla/5.0 (compatible; Pogodak.hr/3.1)        Pogodak search (Slovenia) robot via Interseek   R       89.143.229.1xx  http://www.pogodak.hr   http://www.interseek.com/
+id_moz_101107_1        Mozilla/5.0 (compatible; Proximic crawler; +http://www.proximic.com/en/about-us/contact-us.html)        Proximic Publisher Widget - RSS and news content generator      C               http://www.proximic.com/        
+id_moz_230907_1        Mozilla/5.0 (compatible; PWeBot/3.1; http://www.programacionweb.net/robot.php)  ProgramacionWeb.net PWeBot crawler (Argentina)  R       62.149.236.2xx  http://www.programacionweb.net/robot-en.php     http://www.programacionweb.net/
+id_moz_130507_1        Mozilla/5.0 (compatible; Quantcastbot/1.0; www.quantcast.com)   Quantcast - Open Internet Ratings Service       R               http://www.quantcast.com/       
+id_moz_190706_1        Mozilla/5.0 (compatible; robtexbot/1.0; http://www.robtex.com/ )        robtex - Multi-RBL check and AS-numbercheck     C               http://www.robtex.com/  
+id_moz_050408_1        Mozilla/5.0 (compatible; ScoutJet; +http://www.scoutjet.com/)   ScoutJet (Blekko) search web crawler    R               http://www.scoutjet.com/        
+id_moz_300106_3        Mozilla/5.0 (compatible; Scrubby/2.2; http://www.scrubtheweb.com/)      Scrub the web robot (66.93.156.xx)      R       s.also Scrubby/2.x      http://www.scrubtheweb.com/     
+id_moz_031107_4        Mozilla/5.0 (compatible; ShunixBot/1.x.x +http://www.shunix.com/robot.htm)      Shunixbot (France) beta / test semantic web indexing robot      R               http://www.shunix.com/  
+id_moz_971     Mozilla/5.0 (compatible; ShunixBot/1.x; http://www.shunix.com/bot.htm)  Shunixbot (France) beta / test semantic web indexing robot      R               http://www.shunix.com/  
+id_moz_280607_2        Mozilla/5.0 (compatible; SkreemRBot +http://skreemr.com)        Skreemr - Audio search engine   R       64.15.69.x      http://skreemr.com/     
+id_moz_070207_2        Mozilla/5.0 (compatible; SnapPreviewBot; en-US; rv:1.8.0.9) Gecko/20061206 Firefox/1.5.0.9      Snap Firefox Search Plugin      B               http://www.snap.com/about/spa1A.php     
+id_moz_972     Mozilla/5.0 (compatible; SpurlBot/0.2)  Spurl.net bookmark service & search engine (84.40.30.xxx)       R C             http://www.spurl.net    
+id_moz_190108_1        Mozilla/5.0 (compatible; SummizeBot +http://www.summize.com)    Summize - Opinion and review search robot       R       208.79.17.x[x]  http://www.summize.com/ 
+id_moz_973     Mozilla/5.0 (compatible; SYCLIKControl/LinkChecker;)    Syclik Control web content management system    R C             http://www.syclik.com   
+id_moz_070607_1        Mozilla/5.0 (compatible; Synoobot/0.9; http://www.synoo.com/search/bot.html)    Synoo web directory robot       R       212.12.114.2xx  http://www.synoo.com/search/bot.html    
+id_moz_261105_1        Mozilla/5.0 (compatible; Theophrastus/x.x; http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php) Theophrastus Internet Spider for a basic search engine project  R               http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php     
+id_moz_030207_2        Mozilla/5.0 (compatible; TridentSpider/3.1)     Interseek - Java search engine technology used for Pogodak search       R       213.253.92.x    http://www.interseek.com/       http://www.pogodak.com/
+id_moz_974     Mozilla/5.0 (compatible; Vagabondo/2.1; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)  WiseGuys robot  R       s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..        http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_moz_280209_4        Mozilla/5.0 (compatible; Webduniabot/1.0; +http://search.webdunia.com/bot.aspx) Webdunia search (India) robot   R               http://www.webdunia.com/        
+id_moz_151205_1        Mozilla/5.0 (compatible; Windows NT 5.0; phpwebbrainBot/0.1 - http://www.monsterli.ch/phpwebbrain/)     phpwebbrain online bookmark service (Germany)   C               http://www.monsterli.ch/phpwebbrain/    
+id_moz_150307_1        Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)   WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler  R       137.82.84.xx    http://www.worio.com/   http://www.archive.org/
+id_moz_221008_1        Mozilla/5.0 (compatible; WoW Lemmings Kathune/2.0;http://www.wowlemmings.com/kathune.html)      Kathune spider for World of Warcraft guild data. Used to power WoW Lemmings     R       76.12.83.24x    http://www.wowlemmings.com/kathune.html http://www.wowlemmings.com/
+id_moz_260407_1        Mozilla/5.0 (compatible; XTbot/1.0v; +http://www.externaltest.com)      eXternalTest - Server and online services monitoring    C               http://www.externaltest.com/    
+id_moz_290606_2        Mozilla/5.0 (compatible; Yahoo! DE Slurp; http://help.yahoo.com/help/us/ysearch/slurp)  Yahoo / Inktomi search robot    R       66.196.77.1xx / 72.30.98.2xx            
+id_moz_181105_1        Mozilla/5.0 (compatible; Yahoo! Slurp China; http://misc.yahoo.com.cn/help.html)        Inktomi robot (202.160.180.xxx) for Yahoo China R               http://www.yahoo.com.cn/        http://www.inktomi.com/
+id_moz_975     Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)     Inktomi robot for Yahoo (via 66.196.xx.xxx)     R               http://www.inktomi.com  
+id_moz_061208_2        Mozilla/5.0 (compatible; YesupBot/1.0; +http://www.yesup.net/bot.html)  Yesup Seo - Toronto SEO Service C       66.48.78.1xx    http://yesupseo.com/    
+id_moz_250107_1        Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/)  Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)      R       s. also yoono/1.0 web-crawler - yoofind/yoofind ..      http://www.yoono.com/   
+id_moz_061208_3        Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; ) Youdao search (China) robot     R       202.108.7.1xx   http://www.youdao.com/  
+id_moz_050807_1        Mozilla/5.0 (compatible; Zenbot/1.3; +http://zen.co.za/webmasters/)     Zenbot robot for the Southern African Zen search service        R       196.46.116.x[x] / 196.23.180.x[x]       http://zen.co.za/       http://zen.co.za/webmasters/
+id_moz_110408_1        Mozilla/5.0 (compatible; zermelo +http://www.powerset.com) [email:paul@page-store.com,crawl@powerset.com]       Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services     R       67.202.34.xxx   http://www.powerset.com/        http://www.amazon.com/gp/browse.html?node=3435361
+id_moz_030606_1        Mozilla/5.0 (compatible;archive.org_bot/1.7.1; collectionId=316; Archive-It; +http://www.archive-it.org)        Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R       s.also - InternetArchive/0.8-dev - archive.org_bot      http://www.archive.org/ 
+id_moz_180906_2        Mozilla/5.0 (compatible;archive.org_bot/heritrix-1.9.0-200608171144 +http://pandora.nla.gov.au/crawl.html)      Wayback Machine Internet Archive crawler        R       207.241.233.2xx http://www.archive.org/index.php        
+id_moz_180107_1        Mozilla/5.0 (compatible;FindITAnswersbot/1.0;+http://search.it-influentials.com/bot.htm)        FindITAnswers - Search engine for software developers   B       74.93.15.249    http://www.finditanswers.com/   
+id_moz_170906_2        Mozilla/5.0 (compatible;MAINSEEK_BOT)   Mainseek search (Poland) robot  R       80.190.213.xx   http://www.mainseek.com/        
+id_moz_290708_1        Mozilla/5.0 (Gecko/20070310 Mozshot/0.0.20070628; http://mozshot.nemui.org/)    MozShot - Technical demo to take screenshot of any URL  B               http://mozshot.nemui.org/       
+id_moz_150408_2        Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10.4; en-US; rv:1.9b5) Gecko/2008032619 Firefox/3.0b5 Mozilla Firefox 3.0 beta (Gran Paradiso) for MacOS      B               http://developer.mozilla.org/en/docs/Firefox_3_for_developers   
+id_moz_976     Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20021219 Chimera/0.6     Chimera browser (Mozilla/Gecko engine) - now Camino Mac PowerPC B               http://www.mozilla.org  
+id_moz_977     Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20030306 Camino/0.7      Camino browser (Mozilla/Gecko engine) - ex Chimera Mac PowerPC  B               http://www.mozilla.org  
+id_moz_978     Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-US) AppleWebKit/xx (KHTML like Gecko) OmniWeb/v5xx.xx       OmniWeb 5.x.x Mac OS X browser  B               http://www.omnigroup.com        
+id_moz_979     Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-us) AppleWebKit/xxx.x (KHTML like Gecko) Safari/12x.x       Safari 1.2x browser (Mozilla/Gecko engine) MAC OS X     B               http://www.apple.com    
+id_moz_980     Mozilla/5.0 (Macintosh; U; PPC; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1   Netscape 6.x Mac PowerPC        B                       
+id_moz_981     Mozilla/5.0 (research@mediatrec.com)    unknown robot from gw.ocg-corp.com                              
+id_moz_260806_1        Mozilla/5.0 (Sage)      Sage - RSS and Atom feed reader extension for Mozilla Firefox   B               http://sage.mozdev.org/ 
+id_moz_982     Mozilla/5.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)   Inktomi (Hotbot-Lycos - NBCi etc.) robot        R               http://www.inktomi.com  
+id_moz_983     Mozilla/5.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)    Inktomi (Hotbot-Lycos - NBCi etc.) robot        R               http://www.inktomi.com  
+id_moz_984     Mozilla/5.0 (SunOS 5.8 sun4u; U) Opera 5.0 [en] Opera 5.x SunOS B                       
+id_moz_020507_1        Mozilla/5.0 (Twiceler-0.9 http://www.cuill.com/twiceler/robot.html)     Twiceler experimental web crawler       R       64.62.136.xxx   http://www.cuill.com/   
+id_moz_070106_2        Mozilla/5.0 (Version: xxxx Type:xx)     Some spambot from Romania (82.208.139.1xx & 86.123.65.xx) - Maybe email harvesting      S       UA sometimes have random letters like: vkfjkgo...               
+id_moz_985     Mozilla/5.0 (wgao@genieknows.com)       GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)        R               http://www.genieknows.com/      
+id_moz_986     Mozilla/5.0 (Windows; U; Win98; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1   Netscape 6.x Win98      B                       
+id_moz_987     Mozilla/5.0 (Windows; U; Win98; en-US; rv:x.xx) Gecko/20030423 Firebird Browser/0.6     Firebird browser (Mozilla/Gecko engine) - ex Phoenix Win98      B               http://www.mozilla.org  
+id_moz_988     Mozilla/5.0 (Windows; U; Win9x; en; Stable) Gecko/20020911 Beonex/0.8.1-stable  Beonex Communicator browser (Mozilla/Gecko engine)      B               http://www.beonex.com   
+id_moz_111205_1        Mozilla/5.0 (Windows; U; Windows NT 5.0; en-US; rv:1.7.7) NimbleCrawler 1.11 obeys UserAgent NimbleCrawler For problems contact: crawler_at_dataalchemy.com     Healthline health related search robot (72.5.115.xx)    R               http://www.healthline.com/      
+id_moz_171008_2        Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US) AppleWebKit/525.19 (KHTML, like Gecko) Chrome/0.2.153.1 Safari/525.19   Google Chrome browser based on WebKit (Safari)  B               http://www.google.com/chrome    
+id_moz_170207_1        Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.0.5) Gecko/20060731 Firefox/1.5.0.5 Flock/0.7.4.1        Flock web browser built on Mozilla technologies B               http://www.flock.com/   
+id_moz_190108_3        Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.11) Gecko/20071127 Firefox/2.0.0.4/Megaupload x.0      Megaupload Mega Manager - Download manager plugin for Firefox   D               http://www.megaupload.com/manager/de/   
+id_moz_171008_1        Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.0.1) Gecko/2008092215 Firefox/3.0.1 Orca/1.1 beta 3      Orca browser - based on Gecko   B               http://www.orcabrowser.com      
+id_moz_989     Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.x.x) Gecko/20041107 Firefox/x.x    Firefox browser (Mozilla/Gecko engine) - ex Firebird WinXP      B               http://www.mozilla.org  
+id_moz_990     Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xx) Gecko/20030504 Mozilla Firebird/0.6    Firebird browser (Mozilla/Gecko engine) - ex Phoenix WinXP      B               http://www.mozilla.org  
+id_moz_991     Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xxx) Gecko/20041027 Mnenhy/0.6.0.104       Mnenhy - enhanced mail & news Mozilla based browser     B               http://mnenhy.mozdev.org/index-de.html  
+id_moz_060508_2        Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)  Voila.fr robot  R               http://www.voila.fr     
+id_moz_080608_2        Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)  Voila.fr robot  R               http://www.voila.fr     
+id_moz_150408_3        Mozilla/5.0 (Windows; U; Windows NT 6.0; en-US; rv:1.9b5) Gecko/2008032620 Firefox/3.0b5        Mozilla Firefox 3.0 beta (Gran Paradiso) for Win        B               http://developer.mozilla.org/en/docs/Firefox_3_for_developers   
+id_moz_300407_2        Mozilla/5.0 (Windows; U;XMPP Tiscali Communicator v.10.0.1; Windows NT 5.1; it; rv:1.8.1.3) Gecko/20070309 Firefox/2.0.0.3      Tiscali Communicator - Online services suite    B               http://im.tiscali.com/index.html        
+id_moz_300106_1        Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@health    Healthline health related search robot (72.5.115.xx)    R               http://www.healthline.com/      
+id_moz_161205_2        Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@healthline.com    Healthline health related search robot (72.5.115.xx)    R               http://www.healthline.com/      
+id_moz_090807_2        Mozilla/5.0 (X11; Linux i686; U;rv: 1.7.13) Gecko/20070322 Kazehakase/0.4.4.1   Kazehakase - Gecko based browser (Japan)        B               http://kazehakase.sourceforge.jp/       
+id_moz_992     Mozilla/5.0 (X11; U; Linux 2.4.2-2 i586; en-US; m18) Gecko/20010131 Netscape6/6.01      Netscape 6.x Linux      B                       
+id_moz_160306_1        Mozilla/5.0 (X11; U; Linux i686; de-AT; rv:1.8.0.2) Gecko/20060309 SeaMonkey/1.0        SeaMonkey browser suite (ex Mozilla) on Linux   B               http://www.mozilla.org/projects/seamonkey/      
+id_moz_993     Mozilla/5.0 (X11; U; Linux i686; en-GB; rv:1.7.6) Gecko/20050405 Epiphany/1.6.1 (Ubuntu) (Ubuntu package 1.0.2) Epiphany (Mozilla/Gecko engine) browser Linux   B               http://www.gnome.org/projects/epiphany/ 
+id_moz_994     Mozilla/5.0 (X11; U; Linux i686; en-US; Nautilus/1.0Final) Gecko/20020408       Nautilus (developed by Eazel.com) 1.x Browser Linux     B               http://swin05.dyndns.biz/Doc/Docrh7.03us/DocRH7.3us/sunsite.mff.cuni.cz/pub/redhat/linux/7.3/fr/doc/RH-DOCS/rhl-gsg-en-7.3/s1-browsers-nautilus.html    
+id_moz_995     Mozilla/5.0 (X11; U; Linux i686; en-US; rv:0.9.3) Gecko/20010801        Mozilla (Gecko) 0.9x browser Linux      B                       
+id_moz_030110_5        Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2.1; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/20021130    Spinn3r social network crawler  R       64.34.195.1xx   http://spinn3r.com/     
+id_moz_996     Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2b) Gecko/20021007 Phoenix/0.3     Phoenix 0.3 browser (Mozilla/Gecko engine) - now Firebird Linux B               http://www.firebirdsql.org/     
+id_moz_997     Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.6) Gecko/20040413 Epiphany/1.2.1   Epiphany (Mozilla/Gecko engine) browser Linux   B               http://www.gnome.org/projects/epiphany/ 
+id_moz_190107_1        Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.0.7) Gecko/20060909 Firefox/1.5.0.7 SnapPreviewBot       Snap Firefox Search Plugin      B               http://www.snap.com/about/spa1A.php     
+id_moz_240107_2        Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1) Gecko/20061129 BonEcho/2.0    Bon Echo Alpha - developer preview of future Firefox browser    B               http://www.mozilla.org/projects/bonecho/releases/2.0a1.html     
+id_moz_240207_2        Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.1) Gecko/20061205 Iceweasel/2.0.0.1 (Debian-2.0.0.1+dfsg-2)    IceWeasel - the GNU version of the Firefox browser      B               http://www.gnu.org/software/gnuzilla/   
+id_moz_150408_1        Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9a8) Gecko/2007100619 GranParadiso/3.0a8 Mozilla Firefox 3.0 beta (Gran Paradiso) for Linux      B               http://developer.mozilla.org/en/docs/Firefox_3_for_developers   
+id_moz_999     Mozilla/5.0 Galeon/1.0.2 (X11; Linux i686; U;) Gecko/20011224   Galeon 1.x Browser Linux        B               http://galeon.sourceforge.net/  
+id_moz_1000    Mozilla/5.0 gURLChecker/0.x.x (Linux)   gURLChecker - GNOME link checking tool  C               http://www.nongnu.org   
+id_moz_1001    Mozilla/5.0 URL-Spider  URL Spider - used by usww.net   R               http://www.url-spider.com/      
+id_moz_1002    Mozilla/5.0 usww.com-Spider-for-w8.net  W8net spider    R               http://www.usww.com     
+id_moz_1003    Mozilla/5.0 wgao@genieknows.com GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)        R               http://www.genieknows.com       
+id_moz_111205_7        Mozilla/5.0 whoiam [http://www.axxus.de/]       axxus.de German business directory      R C             http://www.axxus.de/    
+id_moz_998     Mozilla/5.0 [en] (compatible; Gulper Web Bot 0.2.4 www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)        Yuntis : Collaborative Web Resource Categorization and Ranking Project robot    R               http://www.ecsl.cs.sunysb.edu/yuntis/   
+id_g_m_190606_1        MQbot metaquerier.cs.uiuc.edu/crawler   MetaExplorer project's MetaQuerier robot        R       192.17.11.xx    http://metaquerier.cs.uiuc.edu/ 
+id_g_m_251006_1        MQBOT/Nutch-0.9-dev (MQBOT Nutch Crawler; http://falcon.cs.uiuc.edu; mqbot@cs.uiuc.edu) MetaExplorer project's MetaQuerier robot        R       192.17.11.xx    http://metaquerier.cs.uiuc.edu/ 
+id_g_m_1004    MSFrontPage/4.0 MS Frontpage 4.x        B                       
+id_g_m_1005    MSIE 4.0 (Win95)        Some faked UA - maybe for a download manager    D                       
+id_g_m_1006    MSIE-5.13 (larbin@unspecified.mail)     unknown robot from gw.ocg-corp.com (209.126.176.x)              see also: - Opera/6.01 (larbin@.....) - WinampMPEG/2.00 larbin@....             
+id_g_m_190506_1        msnbot-media/1.0 (+http://search.msn.com/msnbot.htm)    MSN media search robot  R       65.55.235.1xx   http://search.msn.com   
+id_g_m_290806_1        msnbot-Products/1.0 (+http://search.msn.com/msnbot.htm) Windows Live product search (Beta) robot        R       207.68.157.xxx  http://products.live.com        http://productsearch.spaces.live.com/
+id_g_m_1007    MSNBOT/0.xx (http://search.msn.com/msnbot.htm)  MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx        R       s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...     http://search.msn.com   
+id_g_m_1008    msnbot/x.xx ( http://search.msn.com/msnbot.htm) MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx        R       s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...     http://search.msn.com   
+id_g_m_190108_2        MSNBOT_Mobile MSMOBOT Mozilla/2.0 (compatible; MSIE 4.02; Windows CE; Default)  Microsoft search for mobiles    R       65.55.241.2xx   http://livesearchmobile.com/?mid=1011   
+id_g_m_1009    MSNPTC/1.0      MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx        R       s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...     http://search.msn.com   
+id_g_m_1010    MSProxy/2.0     Microsoft proxy server  P               http://www.microsoft.com/isaserver/evaluation/previousversions/default.mspx     
+id_g_m_181205_3        MSRBOT  MacEdition CodeBitch link checking      C               http://www.macedition.com/cb/cb_20030310.php    
+id_g_m_270407_1        MSRBOT (http://research.microsoft.com/research/sv/msrbot)       Microsoft MSRBot        R               http://research.microsoft.com/research/sv/msrbot/       
+id_g_m_070406_3        Mulder, VCR-1.0 StreamBox VCR user agent        D               http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm      
+id_g_m_1011    multiBlocker browser    Multiblocker (Fantomaster) anonymity software user      P               http://multiblocker.com/home.html       http://fantomaster.com
+id_g_m_030807_1        multicrawler ( http://sw.deri.org/2006/04/multicrawler/robots.html)     MultiCrawler for DERI Galway's Semantic Web Search Engine cluster       R       140.203.154.1xx http://sw.deri.org/2006/04/multicrawler/robots.html     http://sw.deri.ie/
+id_g_m_1012    MultiText/0.1   Virginia Tech Digital Library Research Laboratory robot R               http://www.dlib.vt.edu  
+id_g_m_1013    MusicWalker2.0 ( http://www.somusical.com)      SoMusical! musical directory link checking      R               http://www.somusical.com        
+id_g_m_270306_1        MVAClient       Unknown bad bot from diff. Taiwanese IPs        S       see this blog:  http://www.tenspider.com/business-blog/weblog.php       
+id_g_m_241105_1        My WinHTTP Connection   Windows HTTP Services (WinHTTP)                 http://msdn.microsoft.com/library/?url=/library/en-us/winhttp/http/about_winhttp.asp    
+id_g_m_1014    myDaemon        unknown user robot (24.124.34.42)                               
+id_g_m_1015    MyGetRight/1.0.0        GetRight download manager       D               http://www.getright.com 
+id_g_m_1016    MyGetRight/1.0b GetRight download manager       D               http://www.getright.com 
+id_g_m_1017    Mylinea.com Crawler 2.0 Mylinea France web catalogue crawler    R               http://www.mylinea.com  
+id_g_m_040906_1        mylinkcheck/1.02        VDOG - SEO webdirecory (Germany) link checking  C               http://www.vdog.de/     
+id_n_s_1018    Naamah 1.0.1/Blogbot (http://blogbot.de/)       Blogbot (Germany) robot R               http://blogbot.de/      
+id_n_s_1019    Naamah 1.0a/Blogbot (http://blogbot.de/)        Blogbot (Germany) robot R               http://blogbot.de/      
+id_n_s_1021    NABOT/5.0       Naver Japan / Korea robot       R       s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot    http://www.naver.co.jp/ 
+id_n_s_1020    nabot_1.0       Naver Japan / Korea robot       R       s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot    http://www.naver.co.jp/ 
+id_n_s_180408_4        NameOfAgent (CMS Spider)        Badbot searching for Wordpress wp-login.php     S                       
+id_n_s_071205_1        naoFavicon4IE/1.xx      naoFavicon4IE   D               http://nao4u.com/software/naoFavicon4IE/        
+id_n_s_140506_2        NASA Search 1.0 Unknown spambot / harvester from diff. IPs      S               http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1    
+id_n_s_1022    NationalDirectory-WebSpider/1.3 Nationaldirectory spider        R               http://www.nationaldirectory.com/       
+id_n_s_1023    NationalDirectoryAddURL/1.0     Nationaldirectory spider        R               http://www.nationaldirectory.com/       
+id_n_s_1025    NaverBot-1.0 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)   Naver Japan / Korea robot       R       s. also Python-urllib/1.15- nabot- cowbot & dloader     http://www.naver.co.jp/ 
+id_n_s_1024    NaverBot_dloader/1.5    Naver Japan / Korea robot       R       s. also Python-urllib/1.15 - nabot - cowbot & dloader   http://www.naver.co.jp/ 
+id_n_s_181205_1        NavissoBot      Navisso closed beta robot (69.41.162.1xx)       R               http://navisso.com/     
+id_n_s_181205_2        NavissoBot/1.7 (+http://navisso.com/)   Navisso closed beta robot (69.41.162.1xx)       R               http://navisso.com/     
+id_n_s_1026    NCSA Beta 1 (http://vias.ncsa.uiuc.edu/viasarchivinginformation.html)   Vias Information Archival robot R               http://vias.ncsa.uiuc.edu/      
+id_n_s_250507_1        Nebullabot/2.2 (http://bot.nebulla.info)        Nebulla.info distributed crawler (Germany)      R       81.169.180.2xx  http://www.nebulla.info/        http://bot.nebulla.info/
+id_n_s_1027    NEC Research Agent -- compuman at research.nj.nec.com   NEC Researchindex robot - now CiteSeer.IST scientific document index    R               http://citeseer.ist.psu.edu/    
+id_n_s_1028    NEC-Hayek/1.0   rcn.com user agent ? NEC Researchindex robot ?          s. NEC Research Agent           
+id_n_s_291108_4        Net-Seekr Bot/Net-Seekr Bot V1 (http://www.net-seekr.com)       Net Seekr search robot  R       78.129.201.19x  http://www.net-seekr.com/       
+id_n_s_1029    NetAnts/1.2x    NetAnts download manager        D               http://www.netants.com/en/index.html    
+id_n_s_1030    NETCOMplete/x.xx        NetComplete IE browser package  B               http://www.netcom.net.uk/       
+id_n_s_010807_2        NetinfoBot/1.0 (http://netinfo.bg/netinfobot.html)      Netinfo.bg search (Bulgaria) robot      R       194.153.145.x[xx]       http://netinfo.bg/      
+id_n_s_1031    NetLookout/2.24 Netlookout internet notifier    R       site is offline http://www.frugalsoft.com       
+id_n_s_230406_3        Netluchs/0.8-dev ( ; http://www.netluchs.de/; ___don't___spam_me_@netluchs.de)  Netluchs (Germany) search (193.164.8.xx)        R       Same IP-range as Metager search - powered by Nutch      http://www.netluchs.de/ 
+id_n_s_1032    NetMechanic Vx.0        NetMechanic link checker        C               http://www.netmechanic.com/     
+id_n_s_030906_1        NetNewsWire/2.x (Mac OS X; http://ranchero.com/netnewswire/)    NewsGator NetNewsWire - Mac RSS feed reader     B               http://www.newsgator.com/NGOLProduct.aspx?ProdID=NetNewsWire    
+id_n_s_1033    NetNoseCrawler/v1.0     unknown InCom (216.0.107.xx) robot      R               http://www.incom.net/   
+id_n_s_1034    Netprospector JavaCrawler       Netprospector metasearch software       R               http://www.actaddons.com/products/netprospector.asp     
+id_n_s_1035    NetPumper/x.xx  Netpumper download manager      D               http://www.netpumper.com/       
+id_n_s_1036    NetResearchServer(http://www.look.com)  Look.com robot (209.87.232.x)   R               http://www.look.com/    
+id_n_s_1037    NetResearchServer/x.x(loopimprovements.com/robot.html)  IncyWincy search engine using DMOZ database     R               http://www.loopimprovements.com/        
+id_n_s_140209_5        NetSeer/Nutch-0.9 (NetSeer Crawler; http://www.netseer.com; crawler@netseer.com)        NetSeer search (beta) crawler via Amazon Web Services - see also Teemer R       67.202.26.1xx   http://www.netseer.com/ http://www.amazon.com/gp/browse.html?node=3435361
+id_n_s_150906_2        NetSprint -- 2.0        Wirtualna Polska / Netsprint search (Poland) robot      R       212.77.102.1xx  http://www.wp.pl/       http://www.netsprint.pl/serwis/
+id_n_s_190306_1        NetWhatCrawler/0.06-dev (NetWhatCrawler from NetWhat.com; http://www.netwhat.com; support@netwhat.com)  NetWhat Search crawler (69.9.167.1xx)   R               http://www.netwhat.com/ 
+id_n_s_1038    NetZippy        Netzippy robot  R       site is closed  http://www.netzippy.com/        
+id_n_s_1039    NeuralBot/0.2   unknown                         
+id_n_s_1040    newsearchengine (ThisUser@unspecified.mail)     Unknown (12.238.4.xxx) attbi.com client robot                           
+id_n_s_250707_3        NewsGator FetchLinks extension/0.2.0 (http://graemef.com)       FetchLinks plugin for NewsGator RSS reader      B               http://graemef.com/project/fetchlinks   
+id_n_s_250707_4        NewsGatorOnline/2.0 (http://www.newsgator.com; 1 subscribers)   NewsGator online RSS reader     B       64.78.155.1xx   http://www.newsgator.com/       
+id_n_s_1041    NextGenSearchBot 1 (for information visit http://www.eliyon.com/NextGenSearchBot)       Eliyon Crawler for Business People Search       R               http://www.eliyon.com/NextGenSearchBot  
+id_n_s_1042    NextopiaBOT (+http://www.nextopia.com) distributed crawler client beta v0.x     Nextopia crawler        R               http://www.nextopia.com/        
+id_n_s_060906_1        NG-Search/0.90 (NG-SearchBot; http://www.ng-search.com; )       find your keywords - semantic search (Germany) robot    R       84.56.87.1xx    http://www.ng-search.com/       
+id_n_s_1043    NG/1.0  Exalead (France) search robot (193.47.80.xx)    R       s. Harvest-NG/1.0.2 and Exalead NG...   http://www.exabot.com/  
+id_n_s_050406_3        NG/4.0.1229     Exalead Websearch image crawler (193.47.80.xx)  R       s. also Exabot-Images/1.0       http://www.exalead.com/search   
+id_n_s_071106_1        nicebot Unknown UA from PlanetLab distributed network           128.8.126.xx    http://planetlab2.cs.umd.edu/   
+id_n_s_1044    NICO/1.0        NicoZone childsafe search robot R P     -site is offline-       http://www.nicozone.net/        
+id_n_s_291007_2        Nikita the Spider (http://NikitaTheSpider.com/) Nikita the Spider - Online HTML validation , link checking      C       69.61.23.11x    http://nikitathespider.com/     
+id_n_s_1045    NITLE Blog Spider/0.01  Experimental LSI (?) robot from 140.233.69.xx (Middlebury.edu)  R               http://javelina.cet.middlebury.edu/lsa/out/lsa_intro.htm        
+id_n_s_1046    Nitro Downloader 1.x (www.klsofttools.com)      Download manager        D               http://www.klsofttools.com      
+id_n_s_1047    Noago Spider    Noago spider    R               http://www.noago.com/   
+id_n_s_1048    Nocilla/1.0     telefonica.es user robot                                
+id_n_s_1049    Nokia-WAPToolkit/1.2 googlebot(at)googlebot.com Google WAP robot        R               http://www.google.com/  
+id_n_s_290708_3        Nokia6300/2.0 (05.50) Profile/MIDP-2.0 Configuration/CLDC-1.1 (botmobi http://find.mobi/bot.html abuse@mtld.mobi)       Botmobi crawler for Find.mobi mobile search     C               http://find.mobi/bot.html       http://find.mobi/
+id_n_s_200108_3        Nokia6610/1.0 (3.09) Profile/MIDP-1.0 Configuration/CLDC-1.0 (compatible;YahooSeeker/M1A1-R2D2; http://help.yahoo.com/help/us/ysearch/crawling/crawling-01.html)        YahooSeeker/M1A1-R2D2 - Yahoo mobile web crawling robot R       68.180.2xx.[x]xx        http://help.yahoo.com/l/us/yahoo/search/mobilecrawler/mobilecrawler-01.html     
+id_n_s_1050    Nokia7110/1.0 (05.01) (Google WAP Proxy/1.0)    Google WAP proxy        P               http://www.google.com/  
+id_n_s_1051    NokodoBot/1.x (+http://nokodo.com/bot.htm)      Nokodo public beta search robot (67.18.222.xx)  R               http://www.nokodo.com/  
+id_n_s_1052    Norbert the Spider(Burf.com)    Burf.com UK Search Engine robot R               http://www.burf.com/    
+id_n_s_1053    noxtrumbot/1.0 (crawler@noxtrum.com)    noXtrum search robot (Spain)    R       194.224.199.xx  http://www.noxtrum.com/ 
+id_n_s_040506_2        noyona_0_1      Noyona job search (preview)     R       207.210.106.1xx http://www.noyona.com/index.pl  
+id_n_s_1054    NP/0.1 (NP; http://www.nameprotect.com; npbot@nameprotect.com)  Nameprotect copyright search robot (24.177.134.x)       R       s. also - aipbot/1.0 (aipbot; http://www.aipbot.com... - NPBot ...      http://www.nameprotect.com/     
+id_n_s_1553    NPBot (http://www.nameprotect.com/botinfo.html) Nameprotect copyright search robot (24.177.134.x)       R               http://www.nameprotect.com/     
+id_n_s_1552    NPBot-1/2.0     Nameprotect copyright search robot (24.177.134.x)       R               http://www.nameprotect.com/     
+id_n_s_291205_3        Nsauditor/1.x   Nsauditor Network Security Auditor      S               http://www.nsauditor.com/       
+id_n_s_1055    NSPlayer/10.0.0.xxxx WMFSDK/10.0        NetShow Media Player = Windows Media Player 10  B                       
+id_n_s_281207_2        nsyght.com/Nutch-1.0-dev (nsyght.com; Nsyght.com)       Nsyght social search application        R               http://search.nsyght.com/       
+id_n_s_161007_1        nsyght.com/Nutch-x.x (nsyght.com; search.nsyght.com)    Nsyght social search application        R               http://search.nsyght.com/       
+id_n_s_1056    nttdirectory_robot/0.9 (super-robot@super.navi.ocn.ne.jp)       NTT Directory robot     R               http://navi.ocn.ne.jp/  
+id_n_s_180206_1        Nucleus SiteList LinkChecker/1.1        Nucleus CMS SiteList link managing plugin       C               http://wakka.xiffy.nl/sitelist  
+id_n_s_1058    nuSearch Spider <a href='http://www.nusearch.com'>www.nusearch.com</a> (compatible; MSIE 4.01)  nuSearch spider (84.9.136.xxx)  R               http://www.nusearch.com/        
+id_n_s_1057    NuSearch Spider (compatible; MSIE 6.0)  nuSearch spider (84.9.136.xxx)  R               http://www.nusearch.com/        
+id_n_s_1059    NuSearch Spider www.nusearch.com        nuSearch spider (84.9.136.xxx)  R               http://www.nusearch.com/        
+id_n_s_1060    Nutch   Nutch open source robot R               http://www.nutch.org/docs/bot.html      
+id_n_s_211107_1        Nutch crawler/Nutch-0.9 (picapage.com; admin@picapage.com)      Picapage search for handheld devices using Nutch        R               http://picapage.biz/    
+id_n_s_230408_1        Nutch/Nutch-0.9 (Eurobot; http://www.ayell.eu ) Ayell Euronet business directory robot using Nutch      R               http://www.ayell.eu/    
+id_n_s_120406_1        NutchCVS/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)     Netsweeper content filtering engine (66.207.120.2xx) powered by Nutch   P       uses also: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.5) Gecko/20041107 Firefox/1.0 http://www.netsweeper.com/      
+id_n_s_1061    NutchCVS/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)        Nutch open source robot R               http://www.nutch.org/docs/bot.html      
+id_n_s_010406_1        NutchCVS/0.7.1 (Nutch running at UW; http://www.nutch.org/docs/en/bot.html; sycrawl@cs.washington.edu)  Robot from University of Washington Computer Science & Engineering (128.208.6.2xx)      R       powered by Nutch        http://qbert.cs.washington.edu/ 
+id_n_s_251006_2        NutchEC2Test/Nutch-0.9-dev (Testing Nutch on Amazon EC2.; http://lucene.apache.org/nutch/bot.html; ec2test at lucene.com)       Amazon Elastic Compute Cloud (Amazon EC2) robot R       216.182.236.xx  http://www.amazon.com/b/ref=sc_fe_l_2/104-6713356-1433533?ie=UTF8&node=201590011&no=3435361&me=A36L942TSJ2AJA   
+id_n_s_1062    NutchOrg/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)        Nutch open source robot R               http://www.nutch.org/docs/bot.html      
+id_n_s_210108_1        nutchsearch/Nutch-0.9 (Nutch Search 1.0; herceg_novi at yahoo dot com)  Unknown robot using Nutch (maybe private crawling) via Cox network (70.187.130.25x)     R       reads robots.txt        http://lucene.apache.org/nutch/ 
+id_n_s_041106_1        NutchVinegarCrawl/Nutch-0.8.1 (Vinegar; http://www.cs.washington.edu; eytanadar at gmail dot com)       Unknown crawler from University of Washington - Computer science        R       128.208.3.1xx   http://www.cs.washington.edu/   
+id_n_s_1063    obidos-bot (just looking for books.)    Weblog bookwatch robot  R               http://www.onfocus.com/bookwatch/       
+id_n_s_1064    ObjectsSearch/0.01-dev (ObjectsSearch;http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)    Objects Search robot    R               http://www.objectssearch.com/   
+id_n_s_1065    ObjectsSearch/0.0x (ObjectsSearch; http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)       Objects Search robot    R               http://www.objectssearch.com/   
+id_n_s_1066    oBot ((compatible;Win32))       Cobion Germany Brand Protection Services robot  R               http://www.cobion.com/  
+id_n_s_1067    Ocelli/1.x (http://www.globalspec.com/Ocelli)   GlobalSpec Engineering Search robot (66.194.55.xxx)     R               http://www.globalspec.com/      
+id_n_s_1068    Octopus Octopus download manager        D               http://moskalyuk.com/octopus/   
+id_n_s_230306_1        Octora Beta - www.octora.com    Octora blog or RSS information crawler - beta (66.228.114.xx)   R               http://www.octora.com/  
+id_n_s_230606_4        Octora Beta Bot - www.octora.com        Octora RSS feed search  R       66.228.114.xx   http://www.octora.com/  
+id_n_s_1069    Offline Explorer 1.*    Meta Products Offlinebrowser    B D             http://www.metaproducts.com/    
+id_n_s_1070    OliverPerry     Claymont robot / Internetseer Web Site Monitoring       R C             http://www.claymont.com/        
+id_n_s_1071    OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Internet CategorizerOmniExplorer http://www.omni-explorer.com/ car & shopping search (64.62.175.xxx)      OmniExplorer car & shopping search (64.62.175.xxx)      R       based on YottaCars... (see there)       http://www.omni-explorer.com    
+id_n_s_1072    OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Job Crawler       OmniExplorer car & shopping search (64.62.175.xxx)      R       based on YottaCars... (see there)       http://www.omni-explorer.com    
+id_n_s_1073    OmniExplorer_Bot/1.1x (+http://www.omni-explorer.com) Torrent Crawler   OmniExplorer car & shopping search (64.62.175.xxx)      R       based on YottaCars... (see there)       http://www.omni-explorer.com    
+id_n_s_1074    OmniExplorer_Bot/x.xx (+http://www.omni-explorer.com) WorldIndexer      OmniExplorer car & shopping search (64.62.175.xxx)      R       based on YottaCars... (see there)       http://www.omni-explorer.com    
+id_n_s_290106_3        onCHECK Linkchecker von www.scientec.de fuer www.onsinn.de      onsearch.de German web directory link checking  C       85.176.108.2xx  http://www.onsearch.de/ 
+id_n_s_290106_2        onCHECK-Robot, www.onsearch.de  onsearch.de German web directory link checking  C       85.176.108.2xx  http://www.onsearch.de/ 
+id_n_s_1075    Onet.pl SA- http://szukaj.onet.pl       onet.pl Szukaj (Search) robot (213.180.128.1xx) R       s. also - Mozilla/5.0 (compatible; OnetSzukaj/5.0....   http://szukaj.onet.pl/  
+id_n_s_1076    online link validator (http://www.dead-links.com/)      Dead-Links.com link validation spider   C               http://www.dead-links.com/      
+id_n_s_040206_3        Online24-Bot (Version: 1.0x, powered by www.online24.de)        Online24 shopping portal (Germany) link checking        C               http://www.online24.de/ 
+id_n_s_1077    OntoSpider/1.0 libwww-perl/5.65 OntoSpider - Dutch robot for a research project. (195.11.244.xx)        R               http://ontospider.i-n.info      
+id_n_s_030110_6        OOZBOT/0.20 ( http://www.setooz.com/oozbot.html ; agentname at setooz dot_com ) SeetooZ search crawler  R       67.215.230.xx   http://www.setooz.com/  
+id_g_m_280508_4        OpenAcoon v4.0.x (www.openacoon.de)     OpenAcoon open source search engine (used by Acoon search)      R       (80.237.209.xx) http://www.openacoon.de/        http://www.acoon.de/
+id_n_s_1078    Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)     Openfind.com.tw robot   R               http://www.openfind.com.tw/     
+id_n_s_1079    Openfind data gatherer- Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)     Openfind.com.tw robot   R               http://www.openfind.com.tw/     
+id_n_s_1080    Openfind Robot/1.1A2    Openfind.com.tw robot   R               http://www.openfind.com.tw/     
+id_n_s_250107_2        OpenISearch/1.x (www.openisearch.com)   open i search robot - search engine in development      R       216.182.236.1xx http://www.openisearch.com/     
+id_n_s_291105_4        OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm)     Opentagger social bookmarking system    R               http://www.opentagger.com/      
+id_n_s_1081    OpenTextSiteCrawler/2.9.2       OpenText crawler        R               http://www.opentext.net/        
+id_n_s_310806_1        OpenWebSpider/0.x.x (http://www.openwebspider.org)      OpenWebSpider - Open Source web search engine   R               http://www.openwebspider.org/   
+id_n_s_1082    OpenWebSpider/x OpenWebSpider - Open Source web search engine   R               http://www.openwebspider.org/   
+id_n_s_1083    Opera/5.0 (Linux 2.0.38 i386; U) [en]   Opera 5.0 Linux B                       
+id_n_s_1084    Opera/5.11 (Windows ME; U) [ru] Opera 5.11 faked WinME referer  B                       
+id_n_s_1085    Opera/5.12 (Windows 98; U) [en] Opera 5.12 Win98        B                       
+id_n_s_1086    Opera/6.01 (larbin@unspecified.mail)    unknown robot from gw.ocg-corp.com (209.126.176.x)              see also: - MSIE-5.13 (larbin@.....) - WinampMPEG/2.00 larbin@....              
+id_n_s_1087    Opera/6.x (Linux 2.4.8-26mdk i686; U) [en]      Opera 6.x- Mandrake Linux       B                       
+id_n_s_1088    Opera/6.x (Windows NT 4.0; U) [de]      Opera 6.x WinNT B                       
+id_n_s_1089    Opera/7.x (Windows NT 5.1; U) [en]      Opera 7.x WinXP B                       
+id_n_s_1090    Opera/8.xx (Windows NT 5.1; U; en)      Opera 8.x (Beta) WinXP  B                       
+id_n_s_141105_2        Opera/9.0 (Windows NT 5.1; U; en)       Opera 9 (Beta) Browser  B               http://snapshot.opera.com/      
+id_n_s_250606_1        Opera/9.00 (Windows NT 5.1; U; de)      Opera 9 (final) B               http://www.opera.com/   
+id_n_s_201008_1        Opera/9.60 (Windows NT 5.1; U; de) Presto/2.1.1 Opera browser 9.6x on WinXP (Presto = Operas rendering engine)  B               http://my.opera.com/ODIN/blog/a-look-under-the-hood-of-opera-9-6        
+id_n_s_1091    OpidooBOT (larbin2.6.3@unspecified.mail)        Opidoo Search Belgium robot (62.4.83.xxx)       R               http://www.opidoo.com/  
+id_n_s_080208_1        OPWV-SDK UP.Browser/7.0.2.3.119 (GUI) MMP/2.0 Push/PO   Open Wave Phone Simulator SDK   B               http://developer.openwave.com/dvl/tools_and_sdk/phone_simulator/        
+id_n_s_190406_2        Oracle Application Server Web Cache 10g Oracle Application Server cache P               http://www.oracle.com/appserver/index.html      
+id_n_s_1092    Oracle iMTCrawler       Oracle interMedia Text - Text and web documents indexing        D               http://www.oracle.com/technology//products/text/index.html      
+id_n_s_1093    Oracle Ultra Search     Oracle Search   R               http://www.oracle.com/  
+id_n_s_220306_1        OrangeSpider    Orangeslicer semantic search (Beta) Germany (193.201.52.1xx)    R               http://www.orangeslicer.com/    
+id_n_s_1094    Orbiter/T-2.0 (+http://www.dailyorbit.com/bot.htm)      Orbiter - DailyOrbit search spider      R               http://www.dailyorbit.com/      
+id_n_s_150206_1        Orca Browser (http://www.orcabrowser.com)       Orca browser - based on Gecko   B               http://www.orcabrowser.com      
+id_n_s_251205_1        OSSProxy 1.3.305.321 (Build 305.321 Win32 en-us)(Dec 21 2005 16:30:54)  Marketscore (was Netsetter) internet accelerator        P       Spyware proxy service   http://www.marketscore.com/Home.aspx    
+id_n_s_141105_1        OutfoxBot/0.x (For internet experiments; http://; outfox.agent@gmail.com)       Unknown robot from Chinanet (220.181.8.xxx)                             
+id_n_s_221106_1        OutfoxMelonBot/0.5 (for internet experiments; http://; outfoxbot@gmail.com)     Unknown robot from Chinanet (60.191.80.1)                               
+id_n_s_1095    Overture-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)  Overture/Fast/Alltheweb crawler (66.77.73.xxx)  R               http://www.alltheweb.com/       
+id_n_s_1096    OWR_Crawler 0.1 Unknown robot from 198.169.127.xx (innovationplace.com)                         
+id_n_s_090906_1        ozelot/2.7.3 (Search engine indexer; www.flying-cat.de/ozelot; ozelot@flying-cat.de)    Ozelot - Flying Cat's search engine robot (Germany)     R       87.139.106.xx   http://www.flying-cat.de/ozelot/        
+id_n_s_290108_2        PADLibrary Spider       PADLibrary.com - PAD file software robot for FindFiles.com      R       72.167.37.20x   http://padlibrary.com/  http://www.findfiles.com/
+id_n_s_150207_3        PageBitesHyperBot/600 (http://www.pagebites.com/)       Pagebites job search crawler    R       208.185.247.xx  http://www.pagebites.com/       
+id_n_s_111206_1        Pagebull http://www.pagebull.com/       Pagebull visual search engine   R       209.9.228.1xx   http://www.pagebull.com/        
+id_n_s_051207_3        Pagestacker Bot Pagestacker online bookmark service     C       70.85.129.12x   http://www.pagestacker.com/     
+id_n_s_290506_1        page_verifier (http://www.securecomputing.com/goto/pv)  Secure Computing SmartFilter Tools - malware crawler    R       206.169.110.xx  http://www.securecomputing.com/PageVerifier.cfm 
+id_n_s_1097    PagmIEDownload  Downloadmanager ?       D                       
+id_n_s_1098    parallelContextFocusCrawler1.1parallelContextFocusCrawler1.1    CFC crawler used by Italian academic and research network (GARR)        R               http://www.garr.it/     
+id_n_s_1099    ParaSite/1.0b (http://www.ianett.com/parasite/) http://www.ianett.com robot     R               http://www.ianett.com/  
+id_n_s_1100    Patwebbot (http://www.herz-power.de/technik.html)       Patsearch (Germany) robot       R               http://www.herz-power.de/       
+id_n_s_1101    pavuk/0.9pl29b i686-pc-linux-gnu        Pavuk web downloading program for Unix  D               http://www.idata.sk/%7Eondrej/pavuk/about.html  
+id_n_s_1102    PBrowse 1.4b    Some site scanning tool via diff. IPs- i.e.: - cox.net (68.4.xxx.xxx)   S       - UA sometimes DSurf15a         
+id_n_s_1103    pd02_1.0.0 pd02_1.0.0@dzimi@post.sk     Post.sk / Eurotel.sk robot      R                       
+id_n_s_1104    PEAR HTTP_Request class ( http://pear.php.net/ )        Pear HTTP_Request PHP extension package                 http://pear.php.net/    
+id_n_s_1105    PEERbot www.peerbot.com Peerbot - favicon search robot  R               http://www.peerbot.com/ 
+id_n_s_1106    PeopleChat/Search_Engine        Unknown robot from 64.5.48.xxx (Plethoric.net)                          
+id_n_s_1107    PEval 1.4b      Some site scanning tool via diff. IPs   S       s. DBrowse- PSurf etc.          
+id_n_s_1108    PHP/3.x.xx      diff. IPs / services                            
+id_n_s_1109    PHP/4.0.4pl1    diff. IPs / services                            
+id_n_s_1110    PHP/4.0.6       diff. IPs / services- i.e.: -NTT/Verio Inc. link checker        C       in conjunction w. Weblink's Checker UA  http://www.verio.com/   
+id_n_s_1111    PHP/4.1.1       diff. IPs / services- i.e.: - Phenominet.com link checking      C               http://www.phenominet.com       
+id_n_s_1112    PHP/4.1.2       diff. IPs / services- i.e.: - 209.114.200.xx = MyNetCrawler link checking - 216.139.207.xxx = Mixcat crawler            Mixcat s. also Felix and Morris http://mynetcrawler.com/        http://mixcat.com
+id_n_s_1113    PicoSearch/1.0  Pico Search robot       R               http://www.picosearch.com/      
+id_n_s_010506_3        Piffany_Web_Scraper_v0.x        Piffany targeted search web spider      R               http://www.piffany.com/ http://www.piffany.com/spider.html
+id_n_s_010506_2        Piffany_Web_Spider_v0.x Piffany targeted search web spider      R               http://www.piffany.com/ http://www.piffany.com/spider.html
+id_n_s_1114    PigeonBot1.0 BETA       Whois Source domain name information robot (66.249.26.xx)- s.also: - SurveyBot  R C             http://www.whois.sc/    
+id_n_s_1115    PingALink Monitoring Services 1.0       PingALink website monitoring    R C             http://www.pingalink.com/       
+id_n_s_1116    PingALink Monitoring Services 1.0 (http://www.pingalink.com)    PingALink website monitoring    R C             http://www.pingalink.com/       
+id_n_s_120607_1        Pingdom GIGRIB (http://www.pingdom.com) Pingdom web site monitoring     C       66.98.148.xx    http://www.pingdom.com/ 
+id_n_s_1117    pipeLiner/0.3a (PipeLine Spider;http://www.pipeline-search.com/webmaster.html; webmaster'at'pipeline-search.com)        pipeline search (DMOZ based) search robot (24.106.39. xxx)      R               http://www.pipeline-search.com/ 
+id_n_s_1118    pipeLiner/0.xx (PipeLine Spider; http://www.pipeline-search.com/webmaster.html) pipeline search (DMOZ based) search robot (24.106.39. xxx)      R               http://www.pipeline-search.com/ 
+id_n_s_1119    Pita    Pita crawler    R       now WebVac s. there     http://www-diglib.stanford.edu/~testbed/doc2/WebBase/webbase-pages.html 
+id_n_s_1120    Pizilla++ ver 2.45      Private user-agent via Hurricane Electric Internet Services     B ?             http://www.he.net/      
+id_n_s_1121    PJspider/3.0 (pjspider@portaljuice.com; http://www.portaljuice.com)     Portaljuice spider      R               http://www.portaljuice.com/     
+id_n_s_121106_1        Plagger/0.x.xx (http://plagger.org/)    Plagger - pluggable RSS/Atom feed aggregator written in Perl    B               http://plagger.org/trac 
+id_n_s_1122    PlagiarBot/1.0  unknown ucsd.edu robot  R                       
+id_n_s_1123    PlantyNet_WebRobot_V1.9 dhkang@plantynet.com    Plantynet web filtering services - Blacklist DB robot   R P             http://www.plantynet.com/       
+id_n_s_120106_1        plinki/0.1 (you got plinked! (thats a good thing..); http://www.plinki.com; crawl@plinki.com)   Unknown UA from 66.220.23.2xx           Doesn't read robots.txt - Plinki.com's website has no content   http://www.plinki.com/  
+id_n_s_061206_2        PluckFeedCrawler/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://www.pluck.com; 1 subscribers)   Pluck RSS feed crawler  R       66.179.81.1xx   http://www.pluck.com/   
+id_n_s_140807_1        Pluggd/Nutch-0.9 (automated crawler http://www.pluggd.com;support at pluggd dot com)    Pluggd Podcast search engine    R       209.85.62.1xx   http://www.pluggd.com/  
+id_n_s_1124    Pockey-GetHTML/4.12.0 (Win32; GUI; ix86)        Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan    D               http://www.vector.co.jp/soft/win95/net/se077067.html    
+id_n_s_1125    Pockey-GetHTML/x.xx     Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan    D               http://www.vector.co.jp/soft/win95/net/se077067.html    
+id_n_s_1126    Pockey/x.x.x    Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan    D               http://www.vector.co.jp/soft/win95/net/se077067.html    
+id_n_s_1127    Pockey7.x.x(WIN32GUI)   Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan    D               http://www.vector.co.jp/soft/win95/net/se077067.html    
+id_n_s_1128    POE-Component-Client-HTTP/0.64 (perl; N; POE; en; rv:0.640000)  HTTP user-agent for POE (portable networking framework for Perl )                       http://search.cpan.org/dist/POE-Component-Client-HTTP/HTTP.pm   
+id_n_s_291105_2        Poirot  ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx        S       appears also as LWP::Simple/5.803 - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)   http://spamhuntress.com/wiki/Manila_Industries  
+id_n_s_1129    polybot 1.0 (http://cis.poly.edu/polybot/)      Polybot webcrawler      R               http://cis.poly.edu/polybot/    
+id_n_s_1130    Pompos/1.x http://dir.com/pompos.html   Dir.com / Iliad French recherche robot  R               http://www.iliad.fr/    
+id_n_s_1131    Pompos/1.x pompos@iliad.fr      Iliad / Free French recherche robot     R               http://www.iliad.fr/    
+id_n_s_1132    Popdexter/1.0   Popdex - web site popularity crawler    R               http://www.popdex.com/  
+id_n_s_1133    Port Huron Labs Unknown spam bot / harvester (63.223.10.***)    S       s. also - Wells Search II               
+id_n_s_1134    PortalBSpider/2.0 (spider@portalb.com)  PortalB (now Alacra search) spider      R               http://www.portalb.com/alacra/index.htm 
+id_n_s_080706_2        portalmmm/2.0 S500i(c20;TB)     portalmmm IMode mobile browser  B                       
+id_n_s_1135    PostFavorites   Yahoo (66.94.237.1xx / 216.109.121.xx) favorites tracking robot C                       
+id_n_s_1136    potbot 1.0      Potbot : A simple IRC bot written in Perl       R               http://sourceforge.net/projects/potbot/ 
+id_n_s_050408_2        PRCrawler/Nutch-0.9 (data mining development project; crawler@projectrialto.com)        Project Rialto - data mining development project        R               http://projectrialto.com/index.html     
+id_n_s_1137    PrivacyFinder Cache Bot v1.0    CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements R               http://cups.cs.cmu.edu/ http://privacybird.com/
+id_n_s_111205_2        PrivacyFinder/1.1       CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements R               http://cups.cs.cmu.edu/ http://privacybird.com/
+id_n_s_1138    Privoxy/3.0 (Anonymous) Privoxy web proxy       P       s.also (Privoxy/1.0)    http://www.privoxy.org/ 
+id_n_s_1139    Production Bot 0116B    Some site scanning tool from diff. IPs- i.e.: - 67.99.33.x (lightningcon.broadwing.net) S                       
+id_n_s_1140    Production Bot 2016B    Some site scanning tool from diff. IPs- i.e.: - 216.232.64.xx (telus.net)       S                       
+id_n_s_1141    Production Bot DOT 3016B        Some site scanning tool from diff. IPs- i.e.: - 141.154.181.xxx (east.verizon.net)      S                       
+id_n_s_1142    Program Shareware 1.0.2 Some spam bot   S       - see here: http://www.kloth.net/internet/badbots-2004.php      http://www.kloth.net/internet/badbots-2004.php  
+id_n_s_1143    Progressive Download    unknown                         
+id_n_s_1144    Progressive Download HTTP check unknown                         
+id_n_s_1145    Project XP5 [2.03.07-111203]    XP5 robot       R               http://marty.anstey.ca/projects/robots/index.html       
+id_n_s_1146    PROve AnswerBot 4.0     Answerchase PROve Answerbot     R               http://www.answerchase.com/     
+id_n_s_1147    ProWebGuide Link Checker (http://www.prowebguide.com)   ProWebguide robot       R               http://www.prowebguide.com/     
+id_n_s_1148    psbot/0.1 (+http://www.picsearch.com/bot.html)  Picsearch robot (62.119.21.13x) R               http://www.picsearch.com/       
+id_n_s_1149    PSurf15a 11     Some site scanning tool via diff. IPs- i.e.: QWest Net  S                       
+id_n_s_1150    PSurf15a 51     Some site scanning tool via diff. IPs- i.e.: Optonline net (24.191.xxx.xxx)     S                       
+id_n_s_1151    PSurf15a VA     Some site scanning tool via diff. IPs- i.e.: - choiceone.net (216.153.xxx.xxx) - attbi.com (12.250.xxx.xxx) - optonline.net (24.191.xxx.xxx)    S       UA sometimes SSurf15a 11 or random letters like RXMYRCJ         
+id_n_s_160606_1        psycheclone     Unknown website grabbing / ripping for unknown purposes from 208.66.195.x - Digitalinfinity.org Russia  S       no active website               
+id_n_s_1152    PubCrawl (pubcrawl.stanford.edu)        Some robot from Stanford University (171.64.75.xxx = PubCrawl.Stanford.EDU)     R                       
+id_n_s_1153    puf/0.91beta6a (Linux 2.2.18; i686)     Parallel URL Fetcher downloading tool   D               http://puf.sourceforge.net/     
+id_n_s_1154    puf/0.93.2a (Linux 2.4.18; i686)        Parallel URL Fetcher downloading tool   D               http://puf.sourceforge.net/     
+id_n_s_130407_1        pulseBot (pulse Web Miner)      WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)    R       s. also RufusBot        http://www.webaroo.com/index    http://www.webaroo.com/company/site-owners
+id_n_s_1155    PureSight       PureSight Internet content filter       P               http://www.puresight.com/Products/PureSightHomeDescription.shtml        
+id_n_s_1156    PuxaRapido v1.0 Puxa Rapido download manager    D               http://www.puxarapido.com.br/   
+id_n_s_230907_2        PWeBot/1.2 Inspector (http://www.programacionweb.net/robot.php) ProgramacionWeb.net PWeBot link checking (Argentina)    R       62.149.236.2xx  http://www.programacionweb.net/robot-en.php     http://www.programacionweb.net/
+id_n_s_1157    PycURL  Fast Search robot (using PycURL Python component- s. below)     R               http://www.fastsearch.net/      http://pycurl.sourceforge.net/
+id_n_s_060107_1        PycURL/7.xx.x   PycURL - Python interface to libcurl    D               http://pycurl.sourceforge.net/  
+id_n_s_1158    Python-urllib/1.1x      Python URL fetcher - robot used by Naver Japan/Korea    R       s. also nabot- dloader- NaverBot & Cowbot       http://www.indyproject.org/     http://www.python.org/
+id_n_s_1159    Python-urllib/2.0a1     Python URL fetcher - robot used by Google       R               http://labs.google.com  http://www.python.org/
+id_n_s_1160    Qango.com Web Directory (http://www.qango.com/) Qango.com Web Directory robot   R               http://www.qango.com/   
+id_n_s_170408_1        QEAVis Agent/Nutch-0.9 (Quantitative Evaluation of Academic Websites Visibility; http://nlp.uned.es/qeavis      QEAVis: Quantitative Evaluation of Academic Websites Visibility using Nutch     R       83.33.209.10x   http://nlp.uned.es/qeavis/      
+id_n_s_1161    QPCreep Test Rig ( We are not indexing- just testing )  Quepasa!com (Latin American search) robot       R               http://www.quepasa.com/ 
+id_n_s_1162    QuepasaCreep ( crawler@quepasacorp.com )        Quepasa!com (Latin American search) robot       R               http://www.quepasa.com/ 
+id_n_s_1163    QuepasaCreep v0.9.1x    Quepasa!com (Latin American search) robot       R               http://www.quepasa.com/ 
+id_n_s_1164    QueryN Metasearch       QueryN Metasearch robot R               http://www.queryn.com/queryn/   
+id_n_s_230108_2        Quicksilver (Blacktree,MacOSX)  Blacktrees Quicksilver helper application for Mac       B               http://docs.blacktree.com/quicksilver/what_is_quicksilver       
+id_n_s_230606_3        QuickTime\xaa.7.0.4 (qtver=7.0.4;cpu=PPC;os=Mac 10.3.9) Quicktime for Macintosh B                       
+id_n_s_060107_4        QweeryBot/3.01 ( http://qweerybot.qweery.nl)    Qweerybot for the Qweery search engine (in development) - Netherland    R       85.158.204.2xx  http://qweerybot.qweery.nl/     
+id_n_s_060107_3        Qweery_robot.txt_CheckBot/3.01 (http://qweerybot.qweery.com)    Qweerybot for the Qweery search engine (in development) - Netherland    R       85.158.204.2xx  http://qweerybot.qweery.nl/     
+id_n_s_160208_1        R6_CommentReader_(www.radian6.com/crawler)      Radian6 RSS feed comment crawler        R               http://www.radian6.com/cms/index.php    http://www.radian6.com/crawler/
+id_n_s_160208_2        R6_FeedFetcher_(www.radian6.com/crawler)        Radian6 Rss feed crawler        R               http://www.radian6.com/cms/index.php    http://www.radian6.com/crawler/
+id_n_s_1165    rabaz (rabaz at gigabaz dot com)        gigaBaz - the brainbot (Germany) robot  R               http://brainbot.com//site3      
+id_n_s_1166    RaBot/1.0 Agent-admin/phortse@hanmail.net       DAUMOA - Daum search Korea robot (211.115.109.xxx)      R       s. also Mozilla/4.0 (compatible; MSIE is not me; DAUMOA ...     http://www.daum.net/    
+id_n_s_1167    Rainbot1.1      Bot Provider for the All Womans Bot Service?            - site is dead  http://bservice.org/bots/       
+id_n_s_1168    ramBot xtreme x.x       Intersearch.de (was www.intersearch.de) robot (Germany) R                       
+id_n_s_160406_2        RAMPyBot - www.giveRAMP.com/0.1 (RAMPyBot - www.giveRAMP.com; http://www.giveramp.com/bot.html; support@giveRAMP.com)   giveRAMP Search Engine robot (64.69.43.1xx)     R               http://www.giveramp.com/        
+id_n_s_260206_1        RAMPyBot/0.8-dev (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)        giveRAMP Search Engine robot (64.69.43.1xx)     R       powered by Nutch        http://www.giveramp.com/        http://lucene.apache.org/nutch/
+id_n_s_1169    Rank Exec (rankexec.com) Reciprocal Link Manager 1.x/bot        Rank Exec reciprocal link checking      C               http://www.rankexec.com/        
+id_n_s_180408_5        Rankivabot/3.2 (www.rankiva.com; 3.2; vzmxikn)  Rankiva website popularity robot        R               http://www.rankiva.com/ 
+id_n_s_1170    Rational SiteCheck (Windows NT) Innova/IBM Rational SiteCheck - Rational robot  R               http://www.rational.com.ar/defaultenglish.html  
+id_n_s_290708_2        RAYSPIDER/Nutch-0.9     Unknown spider from Raytheon Company - maybe Raytheon High Speed Guard proxy    P       199.46.198.xxx  http://www.raytheon.com/        
+id_n_s_230207_3        ReadABlog Spider (compatible; 1.1; feed update; www.readablog.com)      Read A Blog - RSS feed and blog search engine   C       70.85.24.xx     http://www.readablog.com/       
+id_n_s_1171    RealDownload/4.0.0.4x   RealDownload download manager   D               http://service.real.com/help/faq/rdown4/rdownfaqa01.html        
+id_n_s_100408_3        REAP-crawler Nutch/Nutch-1.0-dev (Reap Project; http://reap.cs.cmu.edu/REAP-crawler/; Reap Project)     The REAP Web Crawler for the REAP project       C               http://reap.cs.cmu.edu/REAP-crawler/    http://reap.cs.cmu.edu/
+id_n_s_1172    Reaper [2.03.10-031204] (http://www.sitesearch.ca/reaper/)      Reaper robot for SiteSearch     R               http://marty.anstey.ca/projects/robots/reaper.html      
+id_n_s_1173    Reaper/2.0x (+http://www.sitesearch.ca/reaper)  Reaper robot for SiteSearch     R               http://marty.anstey.ca/projects/robots/reaper.html      
+id_n_s_1174    REBOL Core 2.x.x.x.x    REBOL messaging language for distributed Internet apps                  http://www.rebol.com/   
+id_n_s_250307_1        REBOL View 1.x.x.x.x    REBOL/View - machine independent internet client application    B               http://www.rebol.com/prod-view.html     
+id_n_s_1175    RebusnetBot (+http://www.rebusnet.biz)  Rebusnet software site - link / submission checking     R C             http://www.rebusnet.biz 
+id_n_s_1176    RebusnetPADBot/1.5x (+http://www.rebusnet.biz)  Rebusnet software site - link / submission checking     R C             http://www.rebusnet.biz 
+id_n_s_171205_1        reciprocal links checker (http://www.recip-links.com/)  Online reciprocal link checker  C               http://www.recip-links.com/     
+id_n_s_110307_2        RedBot/redbot-1.0 (Rediff.com Crawler; redbot at rediff dot com)        rediff.com search link checking C       220.226.198.xx  http://www.rediff.com/  
+id_n_s_130106_1        RedCarpet/1.2 (http://www.redcarpet-inc.com/robots.html)        RedCarpet crawler for Pronto price comparison search(66.179.107.1xx)    R               http://www.redcarpet-inc.com/robots.html        http://www.pronto.com/
+id_n_s_171205_2        RedCell/0.1 (InfoSec Search Bot (Coming Soon); http://www.telegenetic.net/bot.html; lhall@telegenetic.net)      Der Bot for telegenetic.net's security related search (65.220.67.2xx)   R       Based on Nutch  http://www.telegenetic.net/bot.html     
+id_n_s_040106_1        RedCell/0.1 (RedCell; telegenetic.net/bot.html; lhall_at_telegenetic.net)       Der Bot for telegenetic.net's security related search (65.220.67.2xx)   R       Based on Nutch  http://www.telegenetic.net/bot.html     
+id_n_s_1177    RedKernel WWW-Spider 2/0 (+http://www-spider.redkernel-softwares.com/)  RedKernel Softwares robot       R               http://www.redkernel-softwares.com/     
+id_n_s_1178    REL Link Checker Lite x.x       REL Link Checker Lite free version of Web Link Validator        C               http://www.relsoftware.com/rlc/ 
+id_n_s_1179    RepoMonkey Bait & Tackle/v1.01  unknown                         
+id_n_s_1180    Rewebber/1.2 libwww-perl/5.41   Rewebber proxy service  P               http://www.rewebber.com/        
+id_n_s_1181    rico/0.1        Applied Semantics Auto-Categorizer for QWestDex Direct  R               http://www.dotcomdirectory.com  
+id_n_s_241105_2        RixBot (http://babelserver.org/rix)     RixBot Rebol Indexer for the RIX - Rebol related search (195.204.121.xx)        R               http://babelserver.org/rix      
+id_n_s_070406_2        RMA/1.0 (compatible; RealMedia) StreamBox VCR user agent        D               http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm      
+id_n_s_1182    RMA/1.0 (compatible; RealMedia) Real Media server acting as client      B P             http://service.real.com/help/library/whitepapers/wpaper.html    
+id_n_s_061206_4        RoboCrawl (http://www.canadiancontent.net)      Canadian Content search crawler R               http://www.canadiancontent.net/ 
+id_n_s_1183    RoboCrawl (www.canadiancontent.net)     Canadian Content Search (207.44.220.xx) robot   R               http://www.canadiancontent.net/ 
+id_n_s_1184    RoboPal (http://www.findpal.com/)       FindPal Australia metasearch robot (61.68.139.xx)       R               http://www.findpal.com/ 
+id_n_s_1187    Robot/www.pj-search.com PopJapanSearch robot    R               http://www.pj-search.com/       
+id_n_s_1185    Robot: NutchCrawler- Owner: wdavies@acm.org     Experimental robot using Wget via attbi.net     R                       
+id_n_s_1186    Robot@SuperSnooper.Com  Supersnooper robot      R               http://www.Supersnooper.com/    
+id_n_s_1188    Robozilla/1.0   Netscape Directory / DMOZ Open Directory link crawler   R               http://directory.mozilla.org/   
+id_n_s_220208_1        Rome Client (http://tinyurl.com/64t5n) Ver: 0.9 ROME - Open source Java tools for RSS and Atom feeds    B               https://rome.dev.java.net/      
+id_n_s_1189    Rotondo/3.1 libwww/5.3.1        Qualigo.de robot        R               http://www.qualigo.de/  
+id_n_s_1190    RPT-HTTPClient/0.3-x    different IPs using the HTTPClient library (mostly link checking)       C       Java1.4.0       http://www.innovation.ch/java/HTTPClient/       
+id_n_s_1191    RRC (crawler_admin@bigfoot.com) Metacarta.com (66.28.xx.xxx) robot      R       s. Larbin...    http://www.metacarta.com        
+id_n_s_250707_5        RssBandit/1.5.0.10 (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; http://www.rssbandit.org) (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; )    RSS Bandit RSS/Atom reader for .NET framework   B               http://www.rssbandit.org/       
+id_n_s_230607_3        RSSMicro.com RSS/Atom Feed Robot        RSS Micro Search - RSS feed search engine       R       209.216.63.xx   http://www.rssmicro.com/        
+id_n_s_080307_2        RSSOwl/1.2.3 2006-11-26 (Windows; U; zhtw)      RSSOwl embedded RSS feed reader B               http://www.rssowl.org/  
+id_n_s_060108_1        RSSOwl/1.2.4 Preview Release 2007-04-15 (Windows; U; zhtw)      RSSOwl embedded RSS feed reader B               http://www.rssowl.org/  
+id_n_s_181006_3        RssReader/1.0.xx.x (http://www.rssreader.com) Microsoft Windows NT 5.1.2600.0   Ykoon RssReader news feed reader        B               http://www.rssreader.com/       
+id_n_s_1192    RSurf15a 41     Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com      S                       
+id_n_s_1193    RSurf15a 51     Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com      S                       
+id_n_s_1194    RSurf15a 81     Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com      S                       
+id_n_s_080206_2        Rubbot/1.0 (+http://rubhub.com/)        rubhub blog spider      C       based on XFN relationship lookup engine http://rubhub.com/main/ http://gmpg.org/xfn/more
+id_n_s_191105_1        RufusBot (Rufus Web Miner; http://64.124.122.252/feedback.html) WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)    R       s. also pulseBot        http://www.webaroo.com/index    http://www.webaroo.com/company/site-owners
+id_n_s_020407_1        RufusBot (Rufus Web Miner; http://www.webaroo.com/rooSiteOwners.html)   WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)    R       s. also pulseBot        http://www.webaroo.com/index    http://www.webaroo.com/company/site-owners
+id_n_s_1195    Rumours-Agent   unknown robot from rumours.jp (202.214.69.xxx)                          
+id_n_s_1196    RX Bar  RX (Reflexive Search) Bar for IE        B               http://www.searchenginebar.com/ 
+id_n_s_160506_1        S&L Spider (http://search.hirners.com/) Search & Links directory spider C       80.108.7.xx     http://search.hirners.com/      
+id_n_s_1197    S.T.A.L.K.E.R. (http://www.seo-tools.net/en/bot.aspx)   SEO-Tools.net link checking ?   C               http://www.seo-tools.net/       
+id_n_s_1198    SafariBookmarkChecker (+http://www.coriolis.ch/)        SafariBookmarkChecker for Mac OS X      C               http://www.coriolis.ch/ 
+id_n_s_061107_1        sait/Nutch-0.9 (SAIT Research; http://www.samsung.com)  sait robot - unknown robot from Samsung International Korea     R       202.20.190.xx   http://samsungnetworks.co.kr/eng/index.jsp      
+id_n_s_191105_2        SandCrawler - Compatibility Testing     Sandcrawler robot from Microsoft (131.107.0.xx) R                       
+id_n_s_170109_3        SapphireWebCrawler/1.0 (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)       Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute  R               http://boston.lti.cs.cmu.edu/crawler/   
+id_n_s_170109_4        SapphireWebCrawler/Nutch-1.0-dev (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)     Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute  R               http://boston.lti.cs.cmu.edu/crawler/   
+id_n_s_021205_4        savvybot/0.2    WebSavvy Directory robot        R               http://www.websavvy.cc/bot.php  
+id_n_s_1199    SBIder/0.7 (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)      SiteSell SBIder Nutch based crawler     R               http://www.sitesell.com/        
+id_n_s_030106_2        SBIder/0.8-dev (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)  SiteSell SBIder Nutch based crawler     R               http://www.sitesell.com/        
+id_n_s_1200    SBL-BOT (http://sbl.net)        Softbyte Labs Black Widow web site ripper       D B             http://sbl.net/ 
+id_n_s_1201    ScanWeb ScanWeb - regular expression based web page searching tool      R               http://eserver.host.sk/ 
+id_n_s_301006_1        ScholarUniverse/0.8 (Nutch;+http://scholaruniverse.com/bot.jsp; fetch-agent@scholaruniverse.com)        ScholarUniverse - Scholarly experts search robot        R       209.216.243.xx  http://www.scholaruniverse.com/index.jsp        
+id_n_s_1202    schwarzmann.biz-Spider_for_paddel.org+(http://www.innerprise.net/usp-spider.asp)        URL Spider Pro (USP) used by German Schwarzmann GmbH    R               http://www.schwarzmann.biz/     
+id_n_s_1203    Science Traveller International 1X/1.0  1X Web Browser  B               http://www.scitrav.com/ 
+id_n_s_190407_1        ScollSpider/2.0 (+http://www.webwobot.com/ScollSpider.php)      WebWobot UK search engine robot (82.43.129.2xx) R       s. also Mozilla/3.0 (compatible; ScollSpider ...        http://www.webwobot.com/        
+id_n_s_1206    Scooter-3.0.EU  Altavista robot R               http://www.altavista.com/       
+id_n_s_1207    Scooter-3.0.FS  Altavista robot R               http://www.altavista.com/       
+id_n_s_1208    Scooter-3.0.HD  Altavista robot R               http://www.altavista.com/       
+id_n_s_1209    Scooter-3.0.VNS Altavista robot R               http://www.altavista.com/       
+id_n_s_1210    Scooter-3.0QI   Altavista robot R               http://www.altavista.com/       
+id_n_s_1211    Scooter-3.2     Altavista robot R               http://www.altavista.com/       
+id_n_s_1212    Scooter-3.2.BT  Altavista robot R               http://www.altavista.com/       
+id_n_s_1213    Scooter-3.2.DIL Altavista robot R               http://www.altavista.com/       
+id_n_s_1214    Scooter-3.2.EX  Altavista robot R               http://www.altavista.com/       
+id_n_s_1215    Scooter-3.2.JT  Altavista robot R               http://www.altavista.com/       
+id_n_s_1216    Scooter-3.2.NIV Altavista robot R               http://www.altavista.com/       
+id_n_s_1217    Scooter-3.2.SF0 Altavista robot R               http://www.altavista.com/       
+id_n_s_1218    Scooter-3.2.snippet     Altavista robot R               http://www.altavista.com/       
+id_n_s_1219    Scooter-3.3dev  Altavista robot R               http://www.altavista.com/       
+id_n_s_1220    Scooter-ARS-1.1 Altavista robot R               http://www.altavista.com/       
+id_n_s_1221    Scooter-ARS-1.1-ih      Altavista robot R               http://www.altavista.com/       
+id_n_s_1222    scooter-venus-3.0.vns   Altavista robot R               http://www.altavista.com/       
+id_n_s_1223    Scooter-W3-1.0  Altavista robot R               http://www.altavista.com/       
+id_n_s_1224    Scooter-W3.1.2  Altavista robot R               http://www.altavista.com/       
+id_n_s_1225    Scooter/1.0     Altavista robot R               http://www.altavista.com/       
+id_n_s_1226    Scooter/1.0 scooter@pa.dec.com  Altavista robot R               http://www.altavista.com/       
+id_n_s_1227    Scooter/1.1 (custom)    Altavista robot R               http://www.altavista.com/       
+id_n_s_1228    Scooter/2.0 G.R.A.B. V1.1.0     Altavista robot R               http://www.altavista.com/       
+id_n_s_1229    Scooter/2.0 G.R.A.B. X2.0       Altavista robot R               http://www.altavista.com/       
+id_n_s_1230    Scooter/3.3     Altavista robot R               http://www.altavista.com/       
+id_n_s_1232    Scooter/3.3.QA.pczukor  Altavista robot R               http://www.altavista.com/       
+id_n_s_1233    Scooter/3.3.vscooter    Altavista robot R               http://www.altavista.com/       
+id_n_s_1231    Scooter/3.3_SF  Altavista robot R               http://www.altavista.com/       
+id_n_s_1234    Scooter2_Mercator_x-x.0 Altavista using Mercator robot  R               http://www.altavista.com/       http://www.research.compaq.com/SRC/mercator/
+id_n_s_1204    Scooter_bh0-3.0.3       Altavista robot R               http://www.altavista.com/       
+id_n_s_1205    Scooter_trk3-3.0.3      Altavista robot R               http://www.altavista.com/       
+id_n_s_190306_3        Scope (Mars+)   Scope Navigator mobile browser (Japan)  B               http://www.programmer.co.jp/scope.shtml 
+id_n_s_1235    ScoutAbout      Some nec.com robot using Research Republic ScoutAbout Research Tool     R               http://www.researchrepublic.com/        
+id_n_s_051207_4        ScoutAnt/0.1; +http://www.ant.com/what_is_ant.com/      Ant.com search robot    R       66.230.171.17x  http://www.ant.com/     
+id_n_s_271105_3        scoutmaster     ScoutMaster information retrieval software      R               http://www.scoutmaster.de/      
+id_n_s_1236    Scrubby/2.x (http://www.scrubtheweb.com/)       Scrub the web robot (66.93.156.xx)      R       s.also Mozilla/5.0 (compatible; Scrubby/2.2 ... http://www.scrubtheweb.com/     
+id_n_s_030308_3        Scrubby/3.0 (+http://www.scrubtheweb.com/help/technology.html)  Scrub the web robot (66.93.156.xx)      R       s.also Mozilla/5.0 (compatible; Scrubby/2.2 ... http://www.scrubtheweb.com/     
+id_n_s_1240    Search+ URL Search+ search software     R               http://srchplus.chat.ru/index.htm       
+id_n_s_110606_3        Search-Engine-Studio    Xtreem Search Engine Studio - SE software       R               http://www.xtreeme.com/search-engine-studio/    
+id_n_s_1237    search.ch V1.4  Search.ch robot R               http://www.search.ch/   
+id_n_s_1238    search.ch V1.4.2 (spiderman@search.ch; http://www.search.ch)    Search.ch robot R               http://www.search.ch/   
+id_n_s_1239    Search/1.0 (http://www.innerprise.net/es-spider.asp)    Enterprise Search web indexing / site searching tool    R               http://www.innerprise.net/es-bi.asp     
+id_n_s_1241    searchbot admin@google.com      Unknown robot / website grabber from Chinatelecom (219.142.78.xxx)      S                       
+id_n_s_1242    SearchByUsa/2 (SearchByUsa; http://www.SearchByUsa.com/bot.html; info@SearchByUsa.com)  SearchByUSA robot (69.150.7.xxx)        R               http://www.searchbyusa.com/     
+id_n_s_231006_1        SearchdayBot    Searchday (Germany) search robot        R       85.25.131.1xx   http://www.searchday.de/        
+id_n_s_1243    SearchExpress Spider0.99        Searchexpress spider    R               http://www.searchexpress.com/   
+id_n_s_1245    SearchGuild/DMOZ/Experiment (searchguild@gmail.com)     Searchguild forum & directory robot (81.3.75.xxx)       R               http://searchguild.com/ 
+id_n_s_1244    SearchGuild_DMOZ_Experiment (chris@searchguild.com)     Searchguild forum & directory robot (81.3.75.xxx)       R               http://searchguild.com/ 
+id_n_s_1246    Searchit-Now Robot/2.2 (+http://www.searchit-now.co.uk) Searchit robot (69.93.107.xx)   R               http://www.searchit-now.co.uk   
+id_n_s_220906_3        Searchmee! Spider v0.98a        Searchmee! Search Engine (prototype) robot by findanisp.com     R       64.202.100.     http://www.searchmee.com/       
+id_n_s_100506_1        SearchSight/2.0 (http://SearchSight.com/)       SearchSight search robot        R               http://searchsight.com/ 
+id_n_s_1247    SearchSpider.com/1.1    SearchSpider robot      R               http://www.searchspider.com/    
+id_n_s_1248    Searchspider/1.2 (SearchSpider; http://www.searchspider.com; webmaster@searchspider.com)        SearchSpider robot      R               http://www.searchspider.com/    
+id_n_s_1249    SearchTone2.0 - IDEARE  Janas (Ideare.com / Tiscali.it) robot   R               http://www.ideare.com/  http://www.tiscali.it
+id_n_s_1250    Seekbot/1.0 (http://www.seekbot.net/bot.html) HTTPFetcher/0.3   seekport. beta search (Germany) robot   R       195.27.215.xx   http://www.seekbot.net/ 
+id_n_s_1251    Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.0 (XDF)        seekport. beta search (Germany) robot   R       195.27.215.xx   http://www.seekbot.net/ 
+id_n_s_1252    Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.2      seekport. beta search (Germany) robot   R       195.27.215.xx   http://www.seekbot.net/ 
+id_n_s_1253    Seeker.lookseek.com     Lookseek search robot / link checking   R       12.199.64.xx    http://www.lookseek.com/        
+id_n_s_011006_3        semaforo.net    semaforo.net web filtering software     P               http://www.semaforo.net/en/default.htm  
+id_n_s_020807_2        Semager/1.1 (http://www.semager.de/blog/semager-bots/)  Semager.de (was NG-Search) semantic search - Germany    R       212.114.209.2xx http://www.semager.de/  http://www.semager.de/blog/semager-bots/
+id_n_s_230507_2        Semager/1.x (http://www.semager.de)     Semager.de (was NG-Search) semantic search - Germany    R       212.114.209.2xx http://www.semager.de/  http://www.semager.de/blog/semager-bots/
+id_n_s_1254    semanticdiscovery/0.x   Semantic Discovery domain checking tool R C             http://www.semanticdiscovery.com/products.html  
+id_n_s_1255    Sensis Web Crawler (search_comments\at\sensis\dot\com\dot\au)   Sensis Australia search robot   R               http://www.sensis.com.au/       
+id_n_s_1256    Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au)    Sensis Australia search robot   R               http://www.sensis.com.au/       
+id_n_s_1257    SeznamBot/1.0   Seznam Search (Czech Republic) robot    R       212.80.76.xx    http://www.seznam.cz/   
+id_n_s_1258    SeznamBot/1.0 (+http://fulltext.seznam.cz/)     Seznam Search (Czech Republic) robot    R       212.80.76.xx    http://www.seznam.cz/   
+id_n_s_080907_2        SeznamBot/2.0-test (+http://fulltext.sblog.cz/) Seznam Search (Czech Republic) robot    R       212.80.76.xx    http://www.seznam.cz/   
+id_n_s_280208_2        ShablastBot 1.0 Unknown robot from Shablast.com - Website has no content - Ignores robots.txt   S       67.228.100.1xx / 67.228.102.2xx http://shablast.com/    
+id_n_s_1259    Shareaza v1.x.x.xx      Shareaza P2P peer-to-peer download client       D B             http://www.shareaza.com/        
+id_n_s_1260    SharewarePlazaFileCheckBot/1.0+(+http://www.SharewarePlaza.com) SharewarePlaza File Check Bot - link checking   R C             http://www.sharewareplaza.com/  
+id_n_s_1261    Shim Crawler    Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)  R       s. also Shim-Crawler ...        http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html       http://www.kototoi.org/index.html
+id_n_s_240106_2        Shim-Crawler(Mozilla-compatible; http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp)  Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)  R       s. also Shim Crawler    http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html       http://www.kototoi.org/index.html
+id_n_s_131205_1        ShopWiki/1.0 ( +http://www.shopwiki.com/)       ShopWiki shopping search based on LittleWiki search     R       4.78.166.1xx    http://www.shopwiki.com/        http://dev.littlewiki.com/wiki/Home
+id_n_s_250706_1        ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)  ShopWiki shopping search based on LittleWiki search     R       4.78.166.1xx    http://www.shopwiki.com/        http://dev.littlewiki.com/wiki/Home
+id_n_s_1262    Shoula.com Crawler 2.0  Shoula Search Engine crawler    R               http://www.shoula.com/  
+id_n_s_230107_1        SietsCrawler/1.1 (+http://www.siets.biz)        Siets Crawler - Web based site crawling application     R               http://www.siets.biz/products/crawler/  
+id_n_s_070308_1        Sigram/Nutch-1.0-dev (Test agent for Nutch development; http://www.sigram.com/bot.html; bot at sigram dot com)  Sigram's Nutch robot - crawler testing  R               http://www.sigram.com/bot.html  
+id_n_s_050906_1        Siigle Orumcex v.001 Turkey (http://www.siigle.com)     Siigle search (Turkey) robot    R       62.68.196.xx    http://www.siigle.com/  
+id_n_s_171006_1        silk/1.0        Slider Search directory robot (194.213.194.2xx) R       s. also Slider_Search...        http://www.slider.com/index.html        
+id_n_s_281205_1        silk/1.0 (+http://www.slider.com/silk.htm)/3.7  Slider Search directory robot (194.213.194.2xx) R       s. also Slider_Search...        http://www.slider.com/index.html        
+id_n_s_131206_2        SimpleFavPanel/1.2      SimpleFavPanel - IE newsfeed panel plugin       B               http://www.egrath.net/index.php?ExplorerBarPlus%2F%A5%D1%A5%CD%A5%EB%B0%EC%CD%F7%2FSimpleFavPanel       
+id_n_s_1263    Simpy 1.x; http://www.simpy.com/        Simpy bookmarking and personal search engine    R C     s. also Argus   http://www.simpy.com/   
+id_n_s_1264    Simpy/1.x (Simpy; http://www.simpy.com/?ref=bot; feedback at simpy dot com)     Simpy bookmarking and personal search engine    R C     s. also Argus   http://www.simpy.com/   
+id_n_s_180707_2        Sirketcebot/v.01 (http://www.sirketce.com/bot.html)     Sirketçe search - Turkey       R       88.255.173.xx   http://www.sirketce.com/        
+id_n_s_070207_3        SiteBar/3.x.x (Bookmark Server; http://sitebar.org/)    SiteBar online bookmark manager C               http://sitebar.org/     
+id_n_s_1265    SiteBar/x.x     SiteBar bookmark server C               http://sitebar.sourceforge.net/ 
+id_n_s_1266    SiteBar/x.x.x (Bookmark Server; http://sitebar.org/)    SiteBar bookmark server C               http://sitebar.sourceforge.net/ 
+id_n_s_1267    sitecheck.internetseer.com      Internetseer Web Site Monitoring / Claymont robot       R C             http://www.internetseer.com/    http://www.claymont.com/
+id_n_s_1268    sitecheck.internetseer.com (For more info see: http://sitecheck.internetseer.com)       Internetseer Web Site Monitoring        R C             http://www.internetseer.com/    
+id_n_s_1269    SiteRecon+(xx)  SiteRecon website monitoring spider at xx minute intervals      R C             http://www.siterecon.com/       
+id_n_s_1270    SiteSnagger     PC Magazin web site downloadmanager     D               http://www.zdnet.com/pcmag/pctech/content/17/04/ut1704.001.html 
+id_n_s_1271    SiteSpider +(http://www.SiteSpider.com/)        Site Spider robot (66.249.17.xx)        R               http://www.SiteSpider.com/      
+id_n_s_021205_3        SiteSucker/1.x.x        SiteSucker Mac website downloading tool D               http://www.sitesucker.us/       
+id_n_s_140306_2        SiteTaggerBot (http://www.sitetagger.com/bot.htm)       SiteTagger.com bookmark organizer       C               http://www.sitetagger.com/      
+id_n_s_030407_1        SiteTruth.com site rating system        SiteTruth - Automatic site legitimacy rating system     R       69.64.67.xx     http://www.sitetruth.com/       
+id_n_s_1272    SiteWinder      Webwasher.com (217.146.159.xx) internet filter  B P             http://www.webwasher.com/       
+id_n_s_1273    SiteXpert       Xtreeme SiteXpert sitemap & search engine builder       R               http://www.xtreeme.com/sitexpert/index.php      
+id_n_s_1274    Skampy/0.9.x (http://www.skaffe.com/skampy-info.html)   Skaffe.com directory link checker       R               http://www.skaffe.com/  
+id_n_s_1275    Skimpy/0.x (http://www.skaffe.com/skampy-info.html)     Skaffe.com directory link checker       R               http://www.skaffe.com/  
+id_n_s_090706_1        Skywalker/0.1 (Skywalker; anonymous; anonymous) Visvo distributed website crawler based on Nutch        R       63.133.162.xx   http://www.visvo.com/bot.html   
+id_n_s_1276    Slarp/0.1       Only.com robot  R               http://www.only.com/    
+id_n_s_1277    Sleipnir        Sleipnir - Japanese Explorer based browser & search bar B               http://www20.pos.to/~sleipnir/software/sleipnir/index.html      
+id_n_s_1278    Sleipnir Version 1.xx   Sleipnir - Japanese Explorer based browser & search bar B               http://www20.pos.to/~sleipnir/software/sleipnir/index.html      
+id_n_s_170207_5        Sleipnir Version2.x     Sleipnir - Japanese Explorer based browser & search bar B               http://www20.pos.to/~sleipnir/software/sleipnir/index.html      
+id_n_s_260706_1        Sleipnir/2.xx   Sleipnir - Japanese Explorer based browser & search bar B               http://www20.pos.to/~sleipnir/software/sleipnir/index.html      
+id_n_s_1279    Slider_Search_v1-de     Slider Search directory robot (194.213.194.2xx) R       s. also silk/1.0...     http://www.slider.com/index.html        
+id_n_s_1280    SlimBrowser     Slim Browser (IE based browser) - uses this user agent for favicon.ico only     B               http://www.flashpeak.com/sbrowser/      
+id_n_s_1281    Slurp/2.0 (slurp@inktomi.com; http://www.inktomi.com/slurp.html)        Inktomi (Hotbot-Lycos-NBCi) robot       R               http://www.inktomi.com/slurp.html       
+id_n_s_1282    Slurp/2.0-KiteWeekly (slurp@inktomi.com; http://www.inktomi.com/slurp.html)     Inktomi (Hotbot-Lycos-NBCi) robot       R               http://www.inktomi.com/slurp.html       
+id_n_s_1283    Slurp/si (slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot       R               http://www.inktomi.com/slurp.html       
+id_n_s_240806_1        Slurpy Verifier/1.0     Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)      R       s. also Mozilla/3.0 (Slurp/.....        http://www.inktomi.com/ 
+id_n_s_1284    SlySearch (slysearch@slysearch.com)     Slysearch robot (now Turnitin robot)    R               http://www.slysearch.com/       
+id_n_s_1285    SlySearch/1.0 http://www.plagiarism.org/crawler/robotinfo.html  Slysearch robot (now Turnitin robot)    R               http://www.slysearch.com/       
+id_n_s_1286    SlySearch/1.x http://www.slysearch.com  Slysearch robot (now Turnitin robot)    R               http://www.slysearch.com/       
+id_n_s_1287    SmartDownload/1.2.67 (Win32; Jan 12 1999)       Netzip/Smartdownload download manager   D               http://www.netzip.com/  
+id_n_s_1288    SmartDownload/1.2.77 (Win32; Feb 1 2000)        Netzip/Smartdownload download manager   D               http://www.netzip.com/  
+id_n_s_1289    SmartDownload/1.2.77 (Win32; Jun 19 2001)       Netzip/Smartdownload download manager   D               http://www.netzip.com/  
+id_n_s_1290    smartwit.com    Loop Improvements NRS Enterprise search (69.44.155.xx[x])       R               http://www.loopimprovements.com/        http://demo.loopimprovements.com/demo/
+id_n_s_020307_2        SmiffyDCMetaSpider/1.0  SmiffyDCMetaSpider - Robot to check the retro-adding of Dublin Core metadata    R       64.71.152.xx    http://www.smiffysplace.com     http://www.smiffysplace.com/smiffydcmetaspider
+id_n_s_1291    sna-0.0.1 (mikemuzio@msn.com)   Snoopy PHP-client               see Snoopy      http://sourceforge.net/projects/snoopy/ 
+id_n_s_1292    sna-0.0.1 mikeelliott@hotmail.com       Snoopy PHP-client               see Snoopy      http://sourceforge.net/projects/snoopy/ 
+id_n_s_080106_1        snap.com beta crawler v0        Unknown bot from bb2.net (66.234.139.xxx) also as Snapbot/1.0   S       Gets only the robots.txt - Not from Snap.com / Idealab (63.251.211.xxx) http://www.kloth.net/internet/badbots.php       
+id_n_s_250506_1        Snapbot/1.0     Unknown bot from bb2.net (66.234.139.xxx) - also as snap.com    S       Not from Snap.com / Idealab (63.251.211.xxx)    http://www.kloth.net/internet/badbots.php       
+id_n_s_250408_1        Snapbot/1.0 (Snap Shots, +http://www.snap.com)  Unknown bot from Psinet / Cogentco - not from Snap.com  S       38.98.19.6x             
+id_n_s_270906_2        Snappy/1.1 ( http://www.urltrends.com/ )        My UrlTrends online web ranking service C       205.138.199.1xx / 209.85.36.x   http://www.urltrends.com/       
+id_n_s_100707_1        Snarfer/0.x.x (http://www.snarfware.com/)       Snarfer RSS reader      B               http://www.snarfware.com/       
+id_n_s_1293    SnoopRob/x.x    Unknown robot from 217.229.156.xx (T-Online Germany)                            
+id_n_s_1294    Snoopy v1.xx    Snoopy PHP-client               s. also sna-x.x.x       http://sourceforge.net/projects/snoopy/ 
+id_n_s_1295    Snoopy v1.xx- : User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MyIE2)   Snoopy PHP-client               s. also sna-x.x.x       http://sourceforge.net/projects/snoopy/ 
+id_n_s_1296    Snoopy_v0.xx    Snoopy PHP-client               s. also sna-x.x.x       http://sourceforge.net/projects/snoopy/ 
+id_n_s_1297    SnykeBot/0.6 (http://www.snyke.com)     Snyke.com France robot  R               http://www.snyke.com/   
+id_n_s_250706_2        SocSciBot ()    Link crawler for the social sciences    R               http://socscibot.wlv.ac.uk/     
+id_n_s_170407_1        SoftBank/1.0/812SH/SHJ001 Browser/NetFront/3.3 Profile/MIDP-2.0 Configuration/CLDC-1.1  NetFront browser on Softbank mobile phone       B               http://www.access-company.com/products/netfrontmobile/browser/index.html        http://mb.softbank.jp/mb/en/product/
+id_n_s_1298    SoftHypermarketFileCheckBot/1.0+(+http://www.softhypermaket.com)        Soft Hypermarket link checking  R               http://www.softhypermarket.com/ 
+id_n_s_1299    Softizerbot (http://www.softizer.com)   Softizer.com software directory link checking   C       72.9.97.xx      http://www.softizer.com/        
+id_n_s_090208_1        sogou develop spider    Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot     S       s. also sohu agent & Sogou web spider           
+id_n_s_011207_2        Sogou Orion spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)       Unknown UA from Chinanet (220.181.18.xx) faking Sogou search robot      S       s. also sohu agent , Sogou web spider & sogou develop spider            
+id_n_s_150106_1        sogou spider    Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot     S       s. also sohu agent , Sogou web spider & sogou develop spider            
+id_n_s_280407_1        Sogou web spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07) Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot     S       s. also sohu agent , sogou spider & sogou develop spider                
+id_n_s_291105_1        sohu agent      Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot     S       s. also sogou spider , sogou spider & sogou develop spider              
+id_n_s_1300    sohu-search     Sohu (Search Fox) search robot China (61.135.131.xxx)   R       this UA also comes from 220.181.26.xxx (not Sohus IP range) as spam bot - s.also sohu agent     http://www.sohu.com/    
+id_n_s_160308_3        Sosospider+(+http://help.soso.com/webspider.htm)        SOSO search (China) spider      R               http://www.soso.com/    http://help.soso.com/webspider.htm
+id_n_s_1301    Space Bison/0.02 [fu] (Win67; X; SK)    Default Proxomitron (discontinued) filtering proxy user agent identifier        P B             http://duke.usask.ca/~macphed/prox/     
+id_n_s_1302    SpeedDownload/1.x       Speed Download (Mac) download manager   D               http://www.yazsoft.com/ 
+id_n_s_1303    speedfind ramBot xtreme 8.1     Speedfind.de robot      R               http://www.speedfind.de/        
+id_n_s_1304    Speedy Spider (Beta/x.x; speedy@entireweb.com)  Entireweb search robot  R       62.13.25.2xx    http://www.entireweb.com/       
+id_n_s_070906_1        Speedy Spider (Entireweb; Beta/1.0; http://www.entireweb.com/about/search_tech/speedyspider/)   Entireweb search spider R       62.13.25.2xx    http://www.entireweb.com/       
+id_n_s_1305    Speedy_Spider (http://www.entireweb.com)        Entireweb search robot  R       62.13.25.2xx    http://www.entireweb.com/       
+id_n_s_050208_4        Sphere Scout&v4.0 - scout at sphere dot com     Sphere blog and news search robot       R       64.40.11[7-8].[x]xx     http://www.sphere.com/  
+id_n_s_040106_3        Sphider Sphider - a lightweight search engine in PHP    R               http://www.cs.ioc.ee/~ando/sphider/     
+id_n_s_1306    Spida/0.1       Only.com robot  R       in conjunction with LWP::Simple/5.53    http://www.only.com/    
+id_n_s_1307    Spider-Sleek/2.0 (+http://search-info.com/linktous.html)        Search-Info ODP/DMOZ spider     R               http://search-info.com/ 
+id_n_s_1308    spider.batsch.com       Batsch robot    R       - site unreachable      http://www.batsch.com   
+id_n_s_110206_4        Spider.TerraNautic.net - v:1.04 TerraNautic spider for Schnellsuchen touristic search (Germany) C               http://www.terranautic.net/     http://www.schnellsuchen.com/
+id_n_s_1309    spider.yellopet.com - www.yellopet.com  Yellopet spider R               http://www.yellopet.com/        
+id_n_s_1310    Spider/maxbot.com admin@maxbot.com      Maxbot .gov .mil .edu indexing robot    R               http://www.maxbot.com/  
+id_n_s_1311    SpiderKU/0.x    Unknown robot from CPE at Kasetsart University (158.108.35.xxx) R               http://www.cpe.ku.ac.th/        
+id_n_s_1312    SpiderMan       Yahoo Search user agent or spider (202.165.102.xxx)     R               http://search.yahoo.com/        
+id_n_s_1313    SpiderMonkey/7.0x (SpiderMonkey.ca info at http://spidermonkey.ca/sm.shtml)     SpiderMonkey Canada robot       R               http://spidermonkey.ca/ 
+id_n_s_1314    Spinne/2.0      Spider.de robot R               http://www.spider.de/   
+id_n_s_1315    Spinne/2.0 med  Medkatalog (medical catalogue) Austria robot    R               http://www.medkatalog.com/      
+id_n_s_1316    Spinne/2.0 med_AH       Medkatalog (medical catalogue) Austria robot    R               http://www.medkatalog.com/      
+id_n_s_180707_3        Spock Crawler (http://www.spock.com/crawler)    Spock - people search application - via Amazon web services     R       72.44.62.1xx    http://www.spock.com/crawler    http://www.amazon.com/gp/browse.html?node=3435361
+id_n_s_1317    sportsuchmaschine.de-Robot (Version: 1.02- powered by www.sportsuchmaschine.de) Sportsuchmaschine (German sports related search) link checking / robot  R               http://www.sportsuchmaschine.de/        
+id_n_s_040306_1        sproose/0.1-alpha (sproose crawler; http://www.sproose.com/bot.html; crawler@sproose.com)       Sproose personalized search (38.100.225.xx)     R       powered by Nutch        http://www.sproose.com/ http://lucene.apache.org/nutch/
+id_n_s_1318    SQ Webscanner   SQ Webscanner Mac download manager      D       product is discontinued http://macinsearch.com/users/webscanner/        
+id_n_s_1319    Squid-Prefetch  Simple page-prefetch for Squid web proxy        P               http://packages.debian.org/stable/web/squid-prefetch    
+id_n_s_171105_2        squidclam       Squidclam is a replacement for SquidClamAV-Redirector   P       s.also SquidClamAV_Redirector 1.x.x     http://sourceforge.net/projects/squidclam       
+id_n_s_1320    SquidClamAV_Redirector 1.x.x    SCAVR - Squid helper script for scanning download URLs for viruses      P       s.also squidclam        http://www.jackal-net.at/tiki-read_article.php?articleId=1      
+id_n_s_1321    Sqworm/2.9.81-BETA (beta_release; 20011102-760; i686-pc-linux-gnu)      AOL Search / Pacific Internet Exchange robot    R               http://www.aol.com/     
+id_n_s_1322    Sqworm/2.9.85-BETA (beta_release; 20011115-775; i686-pc-linux-gnu)      diff. IPs / services i.e.: - Inria.fr robot - Websense (Internet filtering) robot       R               http://www.inria.fr/    http://www.websense.com/
+id_n_s_1323    Sqworm/2.9.89-BETA (beta_release; 20020130-839; i686-pc-linux-gnu)      Time Warner Telecom user robot ?                                
+id_n_s_1324    SSurf15a 11     Some site scanning tool via diff. IPs i.e.: - choiceone.net (216.153.xxx.xxx) - epix.net (216.108.198.xx)       S       see also - PSurf15a VA or random letters like - AWSCBA - URVUSLNAM              
+id_n_s_1325    StackRambler/x.x        Rambler search (Russia) robot (81.19.6x.xx)     R               http://www.rambler.ru   
+id_n_s_1326    Stamina/1.4     Stamina download manager        D               http://www.wildbits.com/stamina/        
+id_n_s_1327    Star Downloader Star Downloader download manager        D               http://www.stardownloader.com/  
+id_n_s_140106_3        StarDownloader/1.xx     Star Downloader download manager        D               http://www.stardownloader.com/  
+id_n_s_1328    stat statcrawler@gmail.com      Experimental search engine spider from 66.92.186.xxx    R       66.92.186.xxx           
+id_n_s_1329    Steeler/1.x (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)        Steeler crawler R               http://www.tkl.iis.u-tokyo.ac.jp/~crawler/      
+id_n_s_031107_5        Steeler/3.3 (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)        Steeler - University of Tokyo web crawler       R       157.82.156.xx[x]        http://www.tkl.iis.u-tokyo.ac.jp/~crawler/crawler.html.en       
+id_n_s_060106_1        Strategic Board Bot (+http://www.strategicboard.com)    Strategic Board blog & news search robot        R               http://www.strategicboard.com/  
+id_n_s_140906_2        Strategic Board Bot (+http://www.strategicboard.com)    Strategic Board blogs and news aggregator robot R       62.0.99.2xx     http://www.strategicboard.com/  
+id_n_s_1330    Submission Spider at surfsafely.com     Surfsafely submission verifier  R               http://www.surfsafely.com/      
+id_n_s_210106_4        suchbaer.de     Suchbaer.de (Germany) search robot      R               http://www.suchbaer.de/ 
+id_n_s_010206_3        suchbaer.de (CrawlerAgent v0.103)       Suchbaer.de (Germany) search robot      R               http://www.suchbaer.de/ 
+id_n_s_1331    suchbot Suchbot Germany robot   R               http://www.suchbot.de/  
+id_n_s_1332    Suchknecht.at-Robot     Suchknecht Austria robot        R               http://www.suchknecht.at/       
+id_n_s_120206_1        suchpadbot/1.0 (+http://www.suchpad.de) suchpad search Germany robot (213.239.194.xx)   R               http://www.suchpad.de/  
+id_n_s_160107_2        Sunrise XP/2.x  Sunrise XP handheld news / website reader and converter B               http://sourceforge.net/projects/sunrisexp       
+id_n_s_230406_4        Sunrise/0.42g (Windows XP)      Sunrise XP web sites and newsfeeds converter and handheld reader        B               http://www.sunrisexp.com/       
+id_n_s_1333    SuperBot/x.x (Win32)    SuperBot website copier D               http://www.sparkleware.com/superbot/index.html  
+id_n_s_260108_2        SuperBot/x.x.x.xx (Windows XP)  SuperBot website copier D               http://www.sparkleware.com/superbot/index.html  
+id_n_s_1334    Superdownloads Spiderman        Ubbi Superdownloads (Brazil) link checking      C               http://superdownloads.ubbi.com.br/      
+id_n_s_1335    SURF    SurfControl Web Filtering       P               http://www.surfcontrol.com/     
+id_n_s_1336    SurferF3 1/0    Wanadoo Rechereche robot        R               http://www.wanadoo.fr/qqo/      
+id_n_s_1337    SurfMaster      Maskbit Surfmaster bookmark tool        C               http://www.maskbit.com/surfmaster.htm   
+id_n_s_1338    SurveyBot/2.2 <a href='http://www.whois.sc'>Whois Source</a>    Whois Source domain name information robot (66.249.26.xx)       R C     s.also: PigeonBot       http://www.whois.sc/    
+id_n_s_1339    SurveyBot/2.3 (Whois Source)    Whois Source domain name information robot (66.249.26.xx)       R C     s.also: PigeonBot       http://www.whois.sc/    
+id_n_s_1340    suzuran Yokogao Search Engine robot (Kanazawa University)       R               http://web.kanazawa-u.ac.jp/esearch.html        
+id_n_s_1341    SWB/V1.4 (HP)   HP Secure Web Browser for OpenVMS       B               http://h71000.www7.hp.com/openvms/products/ips/cswb/cswb.html   
+id_n_s_1342    swbot/0.9c libwww/5.3.1 unknown                         
+id_n_s_1343    Swooglebot/2.0. (+http://swoogle.umbc.edu/swooglebot.htm)       Swooglebot Swoogle's semantic web crawler       R               http://swoogle.umbc.edu 
+id_n_s_060106_2        SWSBot-Images/1.2 http://www.smartwaresoft.com/swsbot12.html    SWSBot - SmartWareSoft (85.186.255.xx) software search engine created for Playfuls.com  R               http://www.smartwaresoft.com/swsbot12.html      http://www.playfuls.com/
+id_n_s_300106_2        SygolBot http://www.sygol.net   Sygol Search (Italy) robot      R       s.also <http://www.sygol.com/>  http://www.sygol.com/   
+id_n_s_1344    Sylera/1.2.x    Sylera browser (Japan)  B               http://tabbrowser.ktplan.jp/valinor/sylera.html 
+id_n_s_1345    SyncBot Mindspring.com user robot                       http://www.mindspring.com/      
+id_n_s_1346    SyncIT/x.x      SyncIT link validation  C               http://www.bookmarksync.com/    
+id_n_s_140906_1        Syndirella/0.91pre      Syndirella desktop information aggregator (beta)        B               http://www.yole.ru/projects/syndirella/ 
+id_n_s_1347    SynoBot Synomia (France) robot  R               http://www.synomia.fr/  
+id_n_s_150406_1        Syntryx ANT Scout Chassis Pheromone; Mozilla/4.0 compatible crawler     Syntryx Solution Suite - domain / keyword crawler (216.7.179.xx)        R               http://www.syntryx.com/ 
+id_n_s_1348    Szukacz/1.x     Szukacz.pl (Polish search) robot        R               http://www.szukacz.pl/  
+id_n_s_1349    Szukacz/1.x (robot; www.szukacz.pl/jakdzialarobot.html; szukacz@proszynski.pl)  Szukacz.pl (Polish search) robot        R               http://www.szukacz.pl/  
+id_t_z_220106_2        T-Online Browser        German T-Online browser & internet suite        B               http://service.t-online.de/c/06/52/67/652672.html       
+id_t_z_070807_1        tags2dir.com/0.8 (+http://tags2dir.com/directory/)      tags2dir.com directory index    R       74.115.102.1xx  http://tags2dir.com/directory/  
+id_t_z_1350    Tagword (http://tagword.com/dmoz_survey.php)    TAGword DMOZ survey - ODP link checking robot   R               http://tagword.com/dmoz_survey.php      
+id_t_z_271105_2        Tagyu Agent/1.0 Tagyu - del.icio.us bookmark collection online tag generator                    http://www.tagyu.com/   http://del.icio.us/
+id_t_z_1351    Talkro Web-Shot/1.0 (E-mail: webshot@daumsoft.com- Home: http://222.122.15.190/webshot) Daumsoft Talkro IR robot        R               http://www.daumsoft.com/        
+id_t_z_1352    TAMU_CS_IRL_CRAWLER/1.0 Texas A&M University - Dept. of Computer Science crawler (server or link checking ?)    R C             http://www.cs.tamu.edu/ 
+id_t_z_1353    targetblaster.com/0.9k  Targetblaster user link validation ?    R C             http://www.targetblaster.com/   
+id_t_z_230706_2        TargetYourNews.com bot  Target Your News - user submitted links C       72.36.160.xxx   http://targetyournews.com/      
+id_t_z_201006_1        TCDBOT/Nutch-0.8 (PhD student research;http://www.tcd.ie; mcgettrs at t c d dot IE)     Trinity College Dublin (Ireland) TCDBOT R       134.226.1.xx    http://www.tcd.ie/      
+id_t_z_1354    TE      HTTP header for transfer encoding used as user agent name ?                             
+id_t_z_1355    TeamSoft WinInet Component      WinInet Internet client app.                    http://www.winsoft.sk/wininet.htm       
+id_t_z_1356    TECOMAC-Crawler/0.x     Tecomac Gmbh (Germany) crawler software - now Arexera Information Technologies  R               http://www.arexera.de/  
+id_t_z_1357    Tecomi Bot (http://www.tecomi.com/bot.htm)      Tecomi (Germany) beta / test robot (84.201.65.xxx)      R               http://www.tecomi.com/Suchmaschine      
+id_t_z_101107_2        Teemer (NetSeer, Inc. is a Los Angeles based Internet startup company.; http://www.netseer.com/crawler.html; crawler@netseer.com)       Teemer crawler for NetSeer search (beta) via Amazon Web Services - see also NetSeer/Nutch       R       67.202.26.1xx   http://www.netseer.com/ http://www.amazon.com/gp/browse.html?node=3435361
+id_t_z_1358    Teleport Pro/1.2x(.1xxx)        Teleport (website) downloading tool     D               http://www.tenmax.com/teleport/pro/home.htm     
+id_t_z_1359    Teoma MP        Teoma crawler (65.214.36.xx[x]) R               http://www.teoma.com/   
+id_t_z_1361    teomaagent crawler-admin@teoma.com      Teoma crawler (65.214.36.xx[x]) R               http://www.teoma.com/   
+id_t_z_1362    teomaagent1 [crawler-admin@teoma.com]   Teoma crawler (65.214.36.xx[x]) R               http://www.teoma.com/   
+id_t_z_1360    teoma_agent1    Teoma crawler (65.214.36.xx[x]) R               http://www.teoma.com/   
+id_t_z_1363    Teradex Mapper; mapper@teradex.com; http://www.teradex.com      Teradex Directory robot R               http://directory.teradex.com/   
+id_t_z_010406_4        TeragramCrawler Teragram multilingual text & data processing software   D ?             http://www.teragram.com/        
+id_t_z_150807_2        terraminds-bot/1.0 (support@terraminds.de)      Terraminds blog search (Germany)        R       88.198.44.2xx   http://www.terraminds.de/       
+id_t_z_220406_1        TerrawizBot/1.0 (+http://www.terrawiz.com/bot.html)     Terrawiz Indian Search Engine robot     R       209.128.80.1xx  http://www.terrawiz.com/        
+id_t_z_1364    Test spider     Noceans Information Portfolio Manager (66.35.69.x)      R               http://www.noceans.com/ 
+id_t_z_160507_1        TestCrawler/Nutch-0.9 (Testing Crawler for Research ; http://balihoo.com/index.aspx; tgautier at balihoo dot com)       Balihoo - Search Engine for Advertising Media   R       204.228.230.xx  http://balihoo.com/     
+id_t_z_1365    The Expert HTML Source Viewer (http://www.expert-html.com)      Expert HTML online source viewer        D B     in conjunction with lwp-trivial/1.35    http://www.expert-html.net - site is offline    
+id_t_z_281207_3        TheRarestParser/0.2a (http://therarestwords.com/)       The Rarest Words - Linguistic experiment crawler via Amazon Web Services        R       67.202.27.19x   http://therarestwords.com/      http://www.amazon.com/gp/browse.html?node=3435361
+id_t_z_1366    TheSuBot/0.1 (www.thesubot.de)  TheSuBot robot (Germany) for an unknown theme based search engine       R               http://www.thesubot.de/ 
+id_t_z_171106_1        thumbshots-de-Bot (Version: 1.02, powered by www.thumbshots.de) ThumbShots website thumbnail service (Germany) robot    D       212.112.238.xx  http://www.thumbshots.de/       
+id_t_z_1367    thumbshots-de-Bot (Version: 1.02- powered by www.thumbshots.de) ThumbShots.de (Germany) robot   R               http://www.thumbshots.de/       
+id_t_z_250206_1        timboBot/0.9 http://www.breakingblogs.com/timbo_bot.html        Breaking Blogs timbo bot blog robot     R               http://www.breakingblogs.com/   
+id_t_z_140106_4        http://www.timelyweb.com/       TimelyWeb web page monitoring tool      C       s. also EldoS ...       http://www.eldos.org/timelyweb/timelyweb.html   
+id_t_z_180408_6        TinEye/1.1 (http://tineye.com/crawler.html)     TinEye crawler for an open image search project R               http://tineye.com/crawler.html  
+id_t_z_1368    tivraSpider/1.0 (crawler@tivra.com)     Tivra spider from AT&T Labs Research    R       see this document: http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps  http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps     
+id_t_z_1369    TJG/Spider      Tjgroup spider  R               http://www.tjgroup.com/ 
+id_t_z_1370    TJvMultiHttpGrabber Component   TJvHttpGrabber (JEDI Visual Component Library)          Possibly used by Bit Torrent Search     http://homepages.borland.com/jedi/jedihelp/item.php?Id=22015    http://www.btsearch.net/
+id_t_z_1371    Tkensaku/x.x(http://www.tkensaku.com/q.html)    Tkensaku Search (Japan) robot from 210.239.46.xxx (www.tken.com)        R               http://www.tkensaku.com/q.html  
+id_t_z_1372    toCrawl/UrlDispatcher   Unknown robot from 195.68.98.xx (coltfrance.com)                                
+id_t_z_200207_1        Topodia/1.2-dev (Topodia - Crawler for HTTP content indexing; http://www.topodia.com/; support@topodia.com)     Topodia search engine and personal information assistant (in development)       R       88.153.148.xx   http://www.topodia.com/ 
+id_t_z_160506_2        TOPOS robot/1.1 (http://www.topos.com.ua/)      Topos search (Russia) robot     C       193.17.73.1xx   http://www.topos.com.ua/        
+id_t_z_050806_2        traazibot/testengine (+http://www.traazi.de)    Traazi! search (Germany) robot  R       87.230.5.2xx    http://www.traazi.de/   
+id_t_z_041007_2        Trailfire-bot/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)     Trailfire web collection and annotating system  C               http://www.trailfire.com/       
+id_t_z_081207_2        Trailfire-bot/0.7.1 (Trailfire page content analyzer; http://trailfire.com; info@trailfire.com) Trailfire web collection and annotating system  C               http://www.trailfire.com/       
+id_t_z_260807_2        Trailfire/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) Trailfire web collection and annotating system  C               http://www.trailfire.com/       
+id_t_z_1376    Trampelpfad-Spider      Trampelpfad Webkatalog spider   R               http://www2.trampelpfad.de/     
+id_t_z_1377    Trampelpfad-Spider-v0.1 Trampelpfad Webkatalog spider   R               http://www2.trampelpfad.de/     
+id_t_z_1378    tricosMetaCheck 1.2216-08-1999 (http://www.tricos.com/metacheck)        Tricos meta tag validation      C               http://www.tricos.us/metaone.php        
+id_t_z_1379    TSurf15a 11     some bad user agent     S       - s. DBrowse- Dsurf etc.                
+id_t_z_1380    TulipChain/5.x (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://java.sun.com/) Linux/2.4.17   Tulip Chain browser / link checker for Dmoz.org directory       B C R           http://ostermiller.org/tulipchain/      
+id_t_z_1381    TulipChain/5.xx (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://apple.com/) Mac_OS_X/10.2.8  Tulip Chain browser / link checker for Dmoz.org directory       B C R           http://ostermiller.org/tulipchain/      
+id_t_z_101107_3        Tumblr/1.0 RSS syndication (+http://www.tumblr.com/) (support@tumblr.com)       Tumblr Tumblelogs RSS and news syndication crawler      R       72.32.6.15x     http://www.tumblr.com/  
+id_t_z_1382    TurnitinBot/x.x (http://www.turnitin.com/robot/crawlerinfo.html)        Turnitin (ex SlySearch) robot for helping educational institutions prevent plagiarism   R       64.140.49.xx    http://www.turnitin.com/robot/crawlerinfo.html  
+id_t_z_1383    Turnpike Emporium LinkChecker/0.1       TurnPike Emporium Directory (207.67.198.x) link checking        R               http://www.turnpike.net/directory.phtml 
+id_t_z_1384    TutorGig/1.5 (+http://www.tutorgig.com/crawler) TutorGig tutorial search robot  R               http://www.tutorgig.com/crawler/        
+id_t_z_1385    Tutorial Crawler 1.4 (http://www.tutorgig.com/crawler)  TutorGig tutorial search robot  R               http://www.tutorgig.com/crawler/        
+id_t_z_1386    Twiceler www.cuill.com/robots.html      Twiceler experimental web crawler       R       64.62.136.xxx   http://www.cuill.com/   
+id_t_z_290407_1        Twiceler-0.9 http://www.cuill.com/twiceler/robot.html   Twiceler experimental web crawler       R       64.62.136.xxx   http://www.cuill.com/   
+id_t_z_291105_5        Twisted PageGetter      File downloading component from Twisted Python  D               http://twistedmatrix.com/       
+id_t_z_140508_5        Twitturly / v0.x        Twitt(url)y URL tracking service for Twitter via Amazon Web Services    C       75.101.135.[x]xx        http://twitturly.com/   http://twitter.com/
+id_t_z_1387    Twotrees Reactive Filter V2.0   Twotrees content filter P               http://www.twotrees.com/        
+id_t_z_221207_2        Tycoon Agent/Nutch-1.0-dev      Tycoon - Hewlett-Packards distributed cluster solution robot    R       204.123.46.xx[x]        http://tycoon.hpl.hp.com/       
+id_t_z_1388    TygoBot Tygo Search robot       R               http://www.tygo.com/    
+id_t_z_1389    TygoProwler     Tygo Search robot       R               http://www.tygo.com/    
+id_t_z_1390    UCmore  UCMore - IE navigation and search plugin        B               http://www.ucmore.com/  
+id_t_z_1391    UCMore Crawler App      UCMore - IE navigation and search plugin        B               http://www.ucmore.com/  
+id_t_z_290208_1        UCWEB5.1        Ucweb mobile browser    B               http://www.ucweb.com/English/product.shtml      
+id_t_z_1392    UDM     user agent - maybe UdmSearch (see UdmSearch) ?                          
+id_t_z_1393    UdmSearch/3.1.x UdmSearch / MySearch (now mnoGoSeach) offline browser/search client     R B             http://mnogosearch.org/ 
+id_t_z_1394    UIowaCrawler/1.0        University of Iowa Crawler- possibly MySpiders  R               http://myspiders.biz.uiowa.edu/ 
+id_t_z_231106_1        UKWizz/Nutch-0.8.1 (UKWizz Nutch crawler; http://www.ukwizz.com/)       UKWizz search robot     R       s. also Mackster        http://www.ukwizz.com   
+id_t_z_1395    Ultraseek       Infoseek robot  R               http://www.infoseek.com/        
+id_t_z_1396    Under the Rainbow 2.2   Unknown mail harvester/spambot from 80.58.13.xxx (proxycache.rima-tde.net)      S               http://www.honeypot.be/ 
+id_a_f_140308_1        unknownght.com Web Server IIS vs Apache Survey. See Results at www.DNSRight.com DNS Right - Online DNS tools    C       203.161.71.17x  http://www.dnsright.com/        
+id_t_z_1397    UofTDB_experiment (leehyun@cs.toronto.edu)      Unknown robot from University of Toronto (128.100.5.1xx)        R                       
+id_t_z_1398    UP.Browser/3.01-IG01 UP.Link/3.2.3.4    Mobile phone browser    B                       
+id_t_z_050806_1        updated/0.1-alpha (updated crawler; http://www.updated.com; crawler@updated.com)        Updated! search robot   R       38.119.96.1xx   http://www.updated.com/ 
+id_t_z_1399    updated/0.1beta (updated.com; http://www.updated.com; crawler@updated.om)       Updated! search robot   R       38.119.96.1xx   http://www.updated.com/ 
+id_t_z_1400    UPG1 UP/4.0 (compatible; Blazer 1.0)    Handspring (PalmOS powered cellphone) Treo Blazer browser       B                       
+id_t_z_1401    Uptimebot       UptimeBot.com online link popularity check      R               http://www.uptimebot.com/       
+id_t_z_1402    UptimeBot(www.uptimebot.com)    UptimeBot.com online link popularity check      R               http://www.uptimebot.com/       
+id_t_z_160706_2        URI::Fetch/0.06 URI::Fetch - client for fetching HTTP pages and syndication feeds (RSS Atom)    D               http://search.cpan.org/dist/URI-Fetch/  
+id_t_z_1403    URL Spider Pro/x.xx (innerprise.net)    Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool       R               http://www.innerprise.net/      
+id_t_z_121106_2        URLBase/6.x     URLBase - Internet shortcut manager     C       s. also Mozilla/4.0 (Compatible); URLBase 6     http://www.terriadev.com/products/urlbase/      
+id_t_z_1406    URLBlaze        URLBlaze file sharing link toolkit      C               http://www.urlblaze.net/        
+id_t_z_011108_4        urlfan-bot/1.0; +http://www.urlfan.com/site/bot/350.html        ://URLFAN news crawler  R       70.165.48.16x   http://www.urlfan.com/  
+id_t_z_1407    URLGetFile      URLGetFile downloading tool     D               http://shazron.com/freeware/java-utils/ 
+id_t_z_1404    URL_Spider_Pro/x.x      Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool       R               http://www.innerprise.net/      
+id_t_z_1405    URL_Spider_Pro/x.x+(http://www.innerprise.net/usp-spider.asp)   Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool       R               http://www.innerprise.net/      
+id_t_z_291006_1        User-Agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com       BoardReader search favicon fetcher      D       208.65.71.xx    http://www.boardreader.com/     http://www.internetadsales.com/modules/news/article.php?storyid=4050
+id_t_z_081206_1        User-Agent: BoardReader Image Fetcher /1.0 info@boardreader.com BoardReader search image fetcher        D       208.65.71.xx    http://www.boardreader.com/     http://www.internetadsales.com/modules/news/article.php?storyid=4050
+id_t_z_060206_2        User-Agent: LjSEEK Picture-Bot /1.0 contact@ljseek.com  ljpic.com - LiveJournal picture feed search     C               http://www.ljpic.com/   
+id_t_z_1408    User-Agent: FileHeap! file downloader (http://www.fileheap.com) FileHeap download manager       D               http://www.fileheap.com 
+id_t_z_270306_2        User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)  Malformed UA header from some guestbook/forum spammer   S                       
+id_t_z_1409    User-Agent: Mozilla/4.0 (SKIZZLE! Distributed Internet Spider v1.0 - www.SKIZZLE.com)   Skizzle search robot    R               http://www.skizzle.com/ 
+id_t_z_1410    user-agent=Mozilla/3.01Gold     unknown robot (reads robots.txt) or sitegrabber. From different IPs- ie.: 62.98.8.xx (wind.it)  R D ?                   
+id_t_z_1411    USyd-NLP-Spider (http://www.it.usyd.edu.au/~vinci/bot.html)     University of Sydney NLP Spider for research in Natural Language Processing     R               http://www.it.usyd.edu.au/~vinci/bot.html       
+id_t_z_1412    UtilMind HTTPGet        Web Thief Site Grabber  D               http://www.utilmind.com/scripts/webthief.html   
+id_t_z_1413    Utopia WebWasher 3.0    WebWasher ad filter     P B             http://www.webwasher.com/       
+id_t_z_100406_1        uTorrent/1500   uTorrent BitTorrent client      D               http://www.utorrent.com/        
+id_t_z_060108_2        VadixBot        Unknown bad behaving bot via Road Runner - see link     S       67.78.34.1[6-7][0-9] - 70.112.211.2x    http://mikesblog.americasdebate.com/2007/06/06/vadixbot-look-out/       
+id_t_z_050406_4        Vagabondo-WAP/2.0 (webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)/1.0 Profile   WiseGuys WAP pages robot        R               http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_1414    Vagabondo/1.x MT (webagent@wise-guys.nl)        WiseGuys robot Netherland - 82.94.216.2 R       s. also Mozilla/3.0 (Vagabondo...       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_1415    Vagabondo/2.0 MT        WiseGuys robot Netherland - 82.94.216.2 R       s. also Mozilla/3.0 (Vagabondo...       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_1416    Vagabondo/2.0 MT (webagent at wise-guys dot nl) WiseGuys robot Netherland - 82.94.216.2 R       s. also Mozilla/3.0 (Vagabondo...       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_1417    Vagabondo/2.0 MT (webagent@NOSPAMwise-guys.nl)  WiseGuys robot Netherland - 82.94.216.2 R       s. also Mozilla/3.0 (Vagabondo...       http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_021205_2        Vagabondo/3.0 (webagent at wise-guys dot nl)    WiseGuys robot Netherland - 82.94.216.2 R       s.also - Mozilla/3.0 (Vagabondo...      http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk 
+id_t_z_1418    Vakes/0.01 (Vakes; http://www.vakes.com/; search@vakes.com)     Open Directory link checking from Vakes R               http://www.vakes.com/   
+id_t_z_1420    VayalaCreep-v0.0.1 (haploid@haploid.com)        unknown level3.net (63.214.172.xxx) robot                               
+id_t_z_1419    Vayala|Creep-v0.0.1 (codepoet@wildties.com)     unknown level3.net (63.214.172.xxx) robot                               
+id_t_z_1421    vb wininet      iNet Grabber - Internet content grabber D               http://www.aldostools.com/igrabber.html 
+id_t_z_1422    versus 0.2 (+http://versus.integis.ch)  Versus Project robot - Comparing methods for near-uniform URL sampling  R               http://versus.integis.ch/       
+id_t_z_1423    versus crawler eda.baykan@epfl.ch       Unknown robot from EPFL University Switzerland (128.178.155.xxx)        R               http://www.epfl.ch/Eindex.html  
+id_t_z_120408_1        Verticrawlbot   Verticrawl - Semantic search engine solution (French)   C               http://www.verticrawl.com/fr/homepage.php       
+id_t_z_1424    VeryGoodSearch.com.DaddyLongLegs        VeryGoodSearch.com link submission checking     R               http://www.verygoodsearch.com/  
+id_t_z_1425    verzamelgids.nl - Networking4all Bot/x.x        Verzamelgids NL link checking robot     R       213.247.50.xx   http://www.verzamelgids.nl/     
+id_t_z_181006_2        Verzamelgids/2.2 (http://www.verzamelgids.nl)   Verzamelgids NL link checking robot     R       213.247.50.xx   http://www.verzamelgids.nl/     
+id_t_z_030406_1        Vespa Crawler   Unknown robot from Yahoo Norway R       217.144.236.x   http://no.yahoo.com/    
+id_t_z_190206_1        virus_detector (virus_harvester@securecomputing.com)    Sidewinder G2 anti-virus and anti-spyware protection    D               http://www.securecomputing.com/sg2_antivirus.cfm?menu=solutions 
+id_t_z_140407_1        VisBot/2.0 (Visvo.com Crawler; http://www.visvo.com/bot.html; bot@visvo.com)    Visbot crawler for a search software under development  R       63.133.162..xx  http://www.visvo.com/bot.html   
+id_t_z_1426    Visicom Toolbar Some IE toolbar made with Visicom Media Dynamic Toolbar software        B               http://www.dynamictoolbar.com/en/products/toolbar/      
+id_t_z_1427    Vision Research Lab image spider at vision.ece.ucsb.edu Vision research lab's Cortina - content based image retrieval (128.111.60.xx)   R               http://vision.ece.ucsb.edu/multimedia/cortina.html      
+id_t_z_160906_1        VLC media player - version 0.8.5 Janus - (c) 1996-2006 the VideoLAN team        VLC - Cross-platform media player and streaming server  B               http://www.videolan.org/vlc/    
+id_t_z_140806_1        VMBot/0.x.x (VMBot; http://www.VerticalMatch.com/; vmbot@tradedot.com)  VM - Vertical Search Engine (China)     R       202.83.221.2xx  http://www.verticalmatch.com/   
+id_t_z_020106_1        Vortex/2.2 (+http://marty.anstey.ca/robots/vortex/)     Vortex Web Indexing Robot for a study on internet link distribution     R               http://marty.anstey.ca/projects/robots/vortex/  
+id_t_z_041207_1        voyager-hc/1.0  Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)    R       s. also - cfetch/1.x - carleson/1.x     http://www.kosmix.com/  
+id_t_z_231105_1        voyager/1.0     Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)    R       s. also - cfetch/1.x - carleson/1.x     http://www.kosmix.com/  
+id_t_z_301108_3        voyager/2.0 (http://www.kosmix.com/html/crawler.html)   Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)    R       s. also - cfetch/1.x - carleson/1.x     http://www.kosmix.com/  
+id_t_z_171105_3        VSE/1.0 (testcrawler@hotmail.com)       Vivisimo search crawler (206.210.89.xxx)        R               http://www.vivisimo.com/        
+id_t_z_171105_4        VSE/1.0 (testcrawler@vivisimo.com)      Vivisimo search crawler (206.210.89.xxx)        R               http://www.vivisimo.com/        
+id_t_z_1428    vspider Verity vspider indexing software        R               http://www.verity.com/  
+id_t_z_1429    vspider/3.x     Verity vspider indexing software        R               http://www.verity.com/  
+id_t_z_130707_1        VWBOT/Nutch-0.9-dev (VWBOT Nutch Crawler; http://vwbot.cs.uiuc.edu;+vwbot@cs.uiuc.edu   VWBot - MetaQuerier Crawler for the MetaQuerier project at the University of Illinois   R       192.17.240.xx   http://vwbot.cs.uiuc.edu/       http://metaquerier.cs.uiuc.edu/
+id_t_z_1431    W3C-checklink/3.x.x.x libwww-perl/5.xx  W3C Link Checker        C               http://validator.w3.org/checklink       
+id_t_z_1432    W3C-checklink/4.x [4.xx] libwww-perl/5.xxx      W3C Link Checker        C               http://validator.w3.org/checklink       
+id_t_z_080806_1        W3C-WebCon/5.x.x libwww/5.x.x   WebCon - the Libwww command line tool   D               http://www.w3.org/ComLine/      
+id_t_z_1433    W3CLineMode/5.4.0 libwww/5.x.x  W3C Line Mode (character based Web browser)     B               http://www.w3.org/LineMode/     
+id_t_z_1434    W3CRobot/5.4.0 libwww/5.4.0     Unknown link checking using Libwww via Korea Telecom (221.148.44.xxx)   C               http://www.w3.org/Library/      
+id_t_z_1430    W3C_Validator/1.xxx libwww-perl/5.xx    W3C HTML-Code Validator C               http://validator.w3.org/        
+id_t_z_1435    w3m/0.x.xx      w3m Linux pager / text-based browser    B               http://w3m.sourceforge.net/     
+id_t_z_1436    W3SiteSearch Crawler_v1.1 http://www.w3sitesearch.de    W3 Site Search (Germany) search engine solution R               http://www.w3sitesearch.de/     
+id_t_z_061206_3        wadaino.jp-crawler 0.2 (http://wadaino.jp/)     Wadain (Japan) Blog / RSS search crawler        R       202.51.14.1xx   http://wadaino.jp/      
+id_t_z_1437    WannaBe (Macintosh; PPC)        Wanna-Be text mode browser      B               http://mindstory.com/wb2/       
+id_t_z_270906_1        WapOnWindows 1.0        WapOnWindows WAP browser for PCs        B       Site is dead    http://www.waponwindows.com/    
+id_t_z_250206_2        Watchfire WebXM 1.0     Watchfire WebXM intranet solution       P               http://www.watchfire.com/products/webxm/default.aspx    
+id_t_z_200706_1        WAVcheck 1.0.x (http://www.webbanalys.se/apps/WAVcheck/)        WAVcheck - Simple Vendor Discovery Tool for detecting client-side tags from web analytics vendors       C               http://www.webbanalys.se/apps/WAVcheck/ 
+id_t_z_110106_1        Wavefire/0.8-dev (Wavefire; http://www.wavefire.com; info@wavefire.com) Wavefire local search community engine (64.141.15.1xx)  R               http://www.wavefire.com/        
+id_t_z_110206_5        Waypath development crawler - info at waypath dot com   Waypath blog discovery engine robot     R               http://www.waypath.com/ 
+id_t_z_110206_6        Waypath Scout v2.x - info at waypath dot com    Waypath blog discovery engine robot     R               http://www.waypath.com/ 
+id_t_z_1438    WDG_Validator/1.1       WDG HTML-code validator C               http://www.htmlhelp.tne.co.uk/tools/validator/  
+id_t_z_1439    Web Image Collector     Datafire.com's Web Image Collector (graphics downloading tool)  D               http://www.datafire.com/        
+id_t_z_1440    Web Link Validator 1.5  Relsoft link checking software  C               http://www.relsoftware.com/     
+id_t_z_1441    Web Snooper     RankMeter ranking software      R               http://www.searchutilities.com/ 
+id_t_z_010206_2        web-bekannt (Version: 1.02, powered by www.internetservice-franken.de)  Web-bekannt German web directory link checking  C               http://www.web-bekannt.de/      
+id_t_z_010206_1        web-bekannt (Version: 1.02, powered by www.web-bekannt.de)      Web-bekannt German web directory link checking  C               http://www.web-bekannt.de/      
+id_t_z_1442    Web-Bot V1.03   Unkown link or server checking from Würzburg University Germany (132.187.10.xx)        R C             http://informatik.uni-wuerzburg.de/     
+id_t_z_1443    Web-Robot/5.0 (en-US; web-robot.com/policy.html) Web-Robot Crawler/2.0.3        Unknown robot from 69.50.233.x (nectartech.com)         no active website               
+id_t_z_010107_2        web2express.org/Nutch-0.9-dev (leveled playing field; http://web2express.org/; info at web2express.org) Web2Express / Web2x - Open data searching tool  R               http://search.web2express.org/search/search.html        
+id_t_z_050206_1        WebAlta Crawler/1.2.1 (http://www.webalta.ru/bot.html)  WebAlta search Russia crawler (85.21.201.xx)    R               http://www.webalta.ru/  
+id_t_z_250806_1        WebarooBot (Webaroo Bot; http://64.124.122.252/feedback.html)   WebarooBot / RufusBot from webaroo offline search service       R       64.124.122.2xx  http://www.webaroo.com/ http://www.webaroo.com/company/site-owners
+id_t_z_210407_1        WebarooBot (Webaroo Bot; http://www.webaroo.com/rooSiteOwners.html)     WebarooBot / RufusBot from webaroo offline search service       R       64.124.122.2xx  http://www.webaroo.com/ http://www.webaroo.com/company/site-owners
+id_t_z_1444    WebAuto/3.4xxx (WinNT; I)       Yanasoft WebAuto website copier / downloading tool      D               http://www.yanasoft.co.jp/webauto.html  
+id_t_z_1445    webbandit/4.xx.0        Web Bandit personal search software     R               http://softwaresolutions.net/webbandit/ 
+id_t_z_140106_2        WebBug/5.x      Amansoft WebBug web server protocol test        C               http://www.cyberspyder.com/webbug.html  
+id_t_z_1446    Webclipping.com WebClipping.com - online news monitoring service        R               http://www.webclipping.com      
+id_t_z_1447    webcollage/1.xx WebCollage Syndicator graphics crawler/collector        R D     s. also collage.cgi/1.xx        http://www.webcollage.com/      
+id_t_z_1448    WebCompass 2.0  Quarterdecks WebCompass search tool     R                       
+id_t_z_1449    WebCopier vx.x  WebCopier offline browser       D B             http://www.maximumsoft.com/     
+id_t_z_1450    WebCopier vx.xa WebCopier offline browser       D B             http://www.maximumsoft.com/     
+id_t_z_210506_1        WebCorp/1.0     WebCorp linguistic search engine (UK)   R       193.60.130.xx   http://webcorp.uce.ac.uk/       
+id_t_z_1451    webcrawl.net    Webcrawl Search robot (64.40.105.xxx)   R               http://www.webcrawl.net/        
+id_t_z_1452    WebDownloader for X x.xx        Unix/Linux Web Downloader       D               http://www.krasu.ru/soft/chuchelo/      
+id_t_z_1453    Webdup/0.9      Unknown robot from china-netcom.com                             
+id_t_z_1454    WebFetch        WingFlyer WebFetch website downloading tool     D B             http://www.wingflyer.com/       
+id_t_z_1455    webfetch/5.x.x  webfetch - command line tool to fetch files via HTTP    D               http://tony.aiu.to/sa/webfetch/ 
+id_t_z_310806_2        WebFilter Robot 1.0     Verso NetSpective WebFilter     P               http://www.verso.com/enterprise/netspective/webfilter.asp       
+id_t_z_1456    WebFilter Robot 1.x     Telemate.net NetSpective WebFilter      P               http://www.telemate.net/        
+id_t_z_1457    WebFindBot(http://www.web-find.com)     Webfind search robot    R               http://www.web-find.com/        
+id_t_z_1458    Webglimpse 2.xx.x (http://webglimpse.net)       Webglimpse search engine software       R               http://www.webglimpse.net/      
+id_t_z_150306_2        webGobbler/1.x.x        webGobbler - Online random image generator      R D             http://sebsauvage.net/webgobbler/       
+id_t_z_1459    webhack fake ?                          
+id_t_z_290807_2        WebImages 0.3 ( http://herbert.groot.jebbink.nl/?app=WebImages )        herbert.groot.jebbink.nl Web Images collage generator   D       212.204.217.1xx http://herbert.groot.jebbink.nl/        
+id_t_z_280306_2        WebLight/4.x.x (support@illumit.com; http://www.illumit.com/Products/weblight/) WebLight web analyzer & link checker    C       s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com...   http://www.illumit.com/Products/weblight/       
+id_t_z_1460    Weblink's checker/      WebLink's link management system for HTTP- FTP and Mail hyperlinks      C       sometimes in conjunction w. PHP/4.0.6   http://www.harlequin.ch/technologien/tools/weblinks.php 
+id_t_z_140307_1        Weblog Attitude Diffusion 1.0   Los Alamos National Laboratory weblog research project  R               http://www.user-agents.org/agents/weblogattitude.shtml  http://www.lanl.gov/
+id_t_z_230606_1        webmeasurement-bot, http://rvs.informatik.uni-leipzig.de        Unknown robot from Leipzig University (Germany) faculty for computer science    R       139.18.38.1xx   http://rvs.informatik.uni-leipzig.de/   
+id_t_z_1461    WebMiner/x.x [en] (Win98; I)    WebMiner bulk file downloader   D               http://tribolic.com/webminer/   
+id_t_z_1462    WeBoX/0.xx      WeBoX (Japan) - Browser and web collector       B D             http://www-nishio.ise.eng.osaka-u.ac.jp/~nakamura/webox/        
+id_t_z_1463    WebPix 1.0 (www.netwu.com)      WebPix - picture downloading tool       D               http://www.netwu.com/webpix/    
+id_t_z_1464    WebQL   Caesius WebQL - Custom robot/agent generator / web extraction software  B D             http://www.caesius.com/ 
+id_t_z_1465    WebRACE/1.1 (University of Cyprus- Distributed Crawler) WebRACE - HTTP retrieval- annotation and caching engine P               http://www.cs.ucy.ac.cy/Projects/eRACE/webrace.html     
+id_t_z_130907_1        WebRankSpider/1.37 (+http://ulm191.server4you.de/crawler/)      WebRankSpider experimental web crawler  R       62.75.202.1xx   http://ulm191.server4you.de/crawler/    
+id_t_z_1468    WebReaper vx.x - www.webreaper.net      Webreaper download manager      D               http://www.webreaper.net/       
+id_t_z_1466    WebReaper [info@webreaper.net]  Webreaper download manager      D               http://www.webreaper.net/       
+id_t_z_1467    WebReaper [webreaper@webreaper.net]     Webreaper download manager      D               http://www.webreaper.net/       
+id_t_z_1469    WebSearch.COM.AU/3.0.1 (The Australian Search Engine; http://WebSearch.COM.AU; Search@WebSearch.COM.AU) Websearch Australia robot       R               http://WebSearch.COM.AU/        
+id_t_z_1470    WebSearchBench WebCrawler v0.1(Experimental)    Dortmund University WebSearchBench - Open source search software        R               http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de        
+id_t_z_1471    WebSearchBench WebCrawler V1.0 (Beta)- Prof. Dr.-Ing. Christoph Lindemann- Universität Dortmund- cl@cs.uni-dortmund.de- http://websearchbench.cs.uni-dortmund.de/      Dortmund University WebSearchBench - Open source search software        R               http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de        
+id_t_z_260806_2        Website Explorer/0.9.x.x        Web site downloading tool and offline browser (Japan)   D               http://www.umechando.com/webex/ 
+id_t_z_1472    Website eXtractor       Website eXtractor web site downloading tool     D               http://www.asona.org/   http://www.internet-soft.com/
+id_t_z_090606_1        WebsiteWorth v1.0       Sootle web directory Website Worth ranking tool R       216.89.111.x    http://directory.sootle.com/website-worth/      
+id_t_z_1473    Webspinne/1.0 webmaster@webspinne.de    Webspinne.de robot      R               http://www.webspinne.de/        
+id_t_z_1474    Websquash.com (Add url robot)   Websquash.com Search Engine robot / link checking       R               http://www.websquash.com/       
+id_t_z_1475    WebStat/1.0 (Unix; beta; 20040314)      WebStat - Java statistical computing environment for the web    R               http://www.math.psu.edu/babcock/webstat/version1.0/     
+id_t_z_091006_2        Webster v0.3 ( http://webster.healeys.net/ )    Webster - Rev. Healeys web crawler      R       24.99.22.xx     http://webster.healeys.net/     http://webster.healeys.net/search.php
+id_t_z_1476    webster-internet.de pad browser Websters Webmaster Archive (Germany) submission / pad checking  C B             http://webster.de/      
+id_t_z_1477    WebStripper/2.xx        WebStripper download manager    D               http://webstripper.net/index.html       http://www.netidea.it
+id_t_z_1478    WebTrafficExpress/x.0   WebTrafficExpress IBM server software   P                       
+id_t_z_1479    WebTrends/3.0 (WinNT)   Web Trends link analyzer        C               http://www.netiq.com/webtrends/default.asp      
+id_t_z_1480    WebVac (webmaster@pita.stanford.edu)    The Stanford WebBase Project crawler    R       ex Pita- s. there       http://www-diglib.stanford.edu/~testbed/doc2/WebBase/   
+id_t_z_1481    WebVal/1.0      webval - Python link checking tool      C               http://www.alcyone.com/pyos/webval/     
+id_t_z_171205_3        Webverzeichnis.de - Telefon: 01908 / 26005      Webverzeichnis.de (Germany) directory robot     R               http://www.webverzeichnis.de/   
+id_t_z_060306_1        WebVulnCrawl.unknown/1.0 libwww-perl/5.803      Web Vulnerability Crawler       S       Looking for excluded directories in robots.txt  http://webvulncrawl.blogspot.com/2005/12/what-am-i-doing.html   
+id_t_z_1482    WebWatcherMonitor/2.01  Studio Net.Idea's Web Watcher Monitor robot     R C             http://www.web-watcher.com/web-watcher-monitor.html     
+id_t_z_1483    WebZIP/x.x (http://www.spidersoft.com)  WebZip offline browser  B D             http://www.spidersoft.com/      
+id_t_z_1484    Wells Search II Unknown spam bot / harvester (62.163.**.** / 62.194.**.*)       S       s.also - Port Huron Labs                
+id_t_z_1485    WEP Search 00   Some spam bot- see link S               http://www.kloth.net/internet/badbots-2004.php  
+id_t_z_230606_2        West Wind Internet Protocols 4.xx       wwIPStuff - Internet client tools for Visual FoxPro     B D             http://www.west-wind.com/wwipstuff.asp  
+id_t_z_1486    WFARC   IBM's Almaden Research robot (Clever search project)    R       s. also: - http://www.almaden.ibm.com/cs/crawler - FocusedSampler       http://www.almaden.ibm.com/cs/k53/clever.html   
+id_t_z_1488    Wget/1.x(.x)GNU wget http://www.gnu.org/software/wget/wget.html - file downloader       GNU wget - file downloader      D               http://www.gnu.org/software/wget/wget.html      
+id_t_z_1489    Wget/1.x+cvs-stable (Red Hat modified)  GNU wget - file downloader      D               http://www.gnu.org/software/wget/wget.html      
+id_t_z_1487    Wget/1.x.x+cvs  GNU wget - file downloader      D               http://www.gnu.org/software/wget/wget.html      
+id_t_z_1490    Whatsup/x.x     Whatsup Gold network monitor    C               http://www.ipswitch.com/products/network-management.html        
+id_t_z_1491    whatUseek_winona/3.0    WhatUSeek / Chubba robot        R       166.90.205.x    http://www.whatuseek.com/       
+id_t_z_1492    WhizBang! Lab   WhizBang! Labs (closed since May 2002) information extraction robot     R                       
+id_t_z_1493    Wildsoft Surfer some download agent     D       - in conjunction w. dlman               
+id_t_z_1494    Willow Internet Crawler by Twotrees V2.1        Twotrees crawler        R               http://www.twotrees.com/        
+id_t_z_1495    WinampMPEG/2.00 (larbin@unspecified.mail)       unknown robot from gw.ocg-corp.com (209.126.176.x)              see also: - Opera/6.01 (larbin@.....) - MSIE-5.13 larbin@....           
+id_t_z_1496    WincerSong Agent v1.0   Super Affiliate Tracker agent by Wincer Song                    http://www.superaffiliatetracker.com/index.htm  
+id_t_z_191105_3        Windows-Media-Player/10.00.00.xxxx      Windows Media Player 10 B                       
+id_t_z_160107_1        WinGet 1.1      Nicksoft WinGet download manager        D       Domain is for sale              
+id_t_z_060406_1        WinHTTP Example/1.0     Example code for a WinHTTP C++ library crawler  R               http://www.codeguru.com/cpp/i-n/internet/http/article.php/c6237/        http://www.microsoft.com/msdownload/platformsdk/sdkupdate/update.htm
+id_t_z_260506_1        WinkBot/0.06 (Wink.com search engine web crawler; http://www.wink.com/Wink:WinkBot; winkbot@wink.com)   Wink beta search robot (64.13.136.x)    R               http://www.wink.com/    
+id_t_z_010607_1        WinPodder (http://winpodder.com)        WinPodder - Podcast player and RSS reader       B               http://winpodder.com/   
+id_t_z_251105_1        WinWAP/3.x (3.x.x.xx; Win32) (Google WAP Proxy/1.0)     WinWap - Windows PC WAP browser B               http://www.winwap.com/products_2_1.php  
+id_t_z_111206_2        Wir sind die Borg (Version: 1.03, Sie wurden Assimiliert +http://www.yammba.com/suchmaschine/bot.html)  Yammba web directory (Germany) link checking    C               http://www.yammba.com/  
+id_t_z_130506_2        WIRE/0.11 (Linux; i686; Bot,Robot,Spider,Crawler,aromano@cli.di.unipi.it)       WIRE crawler used by the University of Pisa - Italy     R       146.48.82.xx    http://www.cwr.cl/projects/WIRE/        http://www.unipi.it/english/index.htm
+id_t_z_1497    WIRE/0.x (Linux; i686; Bot,Robot,Spider,Crawler)        WIRE - Web information retrieval environment crawler    R       Used by different IPs for different purposes    http://www.cwr.cl/projects/WIRE/        
+id_t_z_1498    WISEbot/1.0 (WISEbot@koreawisenut.com; http://wisebot.koreawisenut.com) Korea Wisenut robot     R               http://www.koreawisenut.com/    
+id_t_z_1499    WiseWire-Spider2        Wisewire domain checker (Discontinued)  R C             http://www.wisewire.com/        
+id_t_z_110107_2        wish-project (http://wish.slis.tsukuba.ac.jp/)  WISH academic research project for link checking        C       133.51.22.xx    http://wish.slis.tsukuba.ac.jp/ 
+id_t_z_1500    WordChampBot    Wordchamp web page vocabulary / translation robot       B D             http://www.wordchamp.com/       
+id_t_z_301105_1        WordPress/x.x.x.x PHP/4.x.xx    WordPress personal Blog publishing platform     B               http://wordpress.org/   
+id_t_z_100207_1        worio heritrix bot (+http://worio.com/) WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler  R       137.82.84.xx    http://www.worio.com/   http://www.archive.org/
+id_t_z_291007_1        woriobot ( http://www.worio.com/)       WORIO (beta) search for computer scientists and programmers via Amazon Web Services     R       67.202.45.2xx   http://www.worio.com/   http://www.amazon.com/gp/browse.html?node=3435361
+id_t_z_1501    WorldLight      Entireweb Search robot (62.13.25.xxx)   R       s. also Mozilla/4.0 (compatible; SpeedySpider ....      http://www.entireweb.com/       
+id_t_z_1502    WorQmada/1.0    unknown link checking (from 4.18.57.126) ?      C                       
+id_t_z_1503    Wotbox/alpha0.6 (bot@wotbox.com; http://www.wotbox.com) Wotbox spider   R               http://www.wotbox.com/  
+id_t_z_1504    Wotbox/alpha0.x.x (bot@wotbox.com; http://www.wotbox.com) Java/1.4.1_02 Wotbox spider   R               http://www.wotbox.com/  
+id_t_z_1505    WSB WebCrawler V1.0 (Beta)- cl@cs.uni-dortmund.de       WebSearchBench crawler from Dortmund University- Germany        R               http://websearchbench.cs.uni-dortmund.de/       
+id_t_z_1506    WSB, http://websearchbench.cs.uni-dortmund.de   WebSearchBench crawler from Dortmund University- Germany        R               http://websearchbench.cs.uni-dortmund.de/       
+id_t_z_1507    wume_crawler/1.1 (http://wume.cse.lehigh.edu/~xiq204/crawler/)  WUME Lab's web crawler (128.180.121.xxx)        R               http://wume.cse.lehigh.edu/~xiq204/crawler/     
+id_t_z_1508    Wusage/x.0@boutell.com  Wusage log-file analysis        R C             http://www.boutell.com/wusage/  
+id_t_z_120106_2        Wwlib/Linux     WWLib - Wolverhampton University Web Library for classifying web documents      R               http://www.scit.wlv.ac.uk/wwlib/        
+id_t_z_1509    WWSBOT 1.x [--- http://www.analyzer.nu ---]     WWSBOT web server version checker       C               http://www.analyzer.nu/Perl/WWSBOT.html 
+id_t_z_170506_2        WWW-Mechanize/1.1x      Perl web page fetching module   D               http://search.cpan.org/dist/WWW-Mechanize/      
+id_t_z_1510    www.arianna.it  Arianna robot   R               http://arianna.libero.it/       
+id_t_z_1511    www.business-socket.com registry verify/1.x     Business-Socket.com link checking ?     C               http://www.business-socket.com  
+id_t_z_221006_2        www.doweb.co.uk crawler The DoWeb UK Business directory link checking   C       85.13.252.x     http://www.doweb.co.uk/action_home+page.htm     
+id_t_z_1512    www4mail/2.x libwww-FM/2.14 (Unix; I)   www4mail - web navigation & database search by e-mail                   http://www4mail.org/    
+id_t_z_1513    WWWC/1.0x       WWWC Updating check of Web pages. (Japanese only)       C               http://www.nakka.com/soft/index_eng.html        
+id_t_z_1514    WWWeasel Robot v1.00 (http://wwweasel.de)       World Wide Weasel Germany robot R               http://wwweasel.de/     
+id_t_z_1515    WWWOFFLE/2.x    WWWoffle download manager       D               http://www.gedanken.demon.co.uk/wwwoffle/       
+id_t_z_1516    wwwster/1.x (Beta- mailto:gue@cis.uni-muenchen.de)      Unknown robot from CIS at Munich University     R       129.187.254.xxx http://www.cis.uni-muenchen.de/ 
+id_t_z_050208_5        wxDownload Fast wxDownload Fast (wxDFast) open source download manager  D               http://dfast.sourceforge.net/index.html 
+id_t_z_1517    X-Crawler       Arexera (Germany) crawler software      R               http://www.arexera.de/de/products/crawler.php   
+id_t_z_1518    Xaldon WebSpider        Xaldon WebSpider offline browser        B D             http://www.xaldon.de/produkte_webspider.html    
+id_t_z_1519    Xenu Link Sleuth 1.xx   Xenu link checker       C               http://home.snafu.de/tilman/xenulink.html       
+id_t_z_1520    Xenu's Link Sleuth 1.x[a-z]     Xenu link checker       C               http://home.snafu.de/tilman/xenulink.html       
+id_t_z_270706_2        Xerka WebBot v1.0.0 [UPVOpenDir]        XerKa text mining and information retrieval software    D               http://www.diana-teknologia.com/www1/english/xerka.htm  
+id_t_z_250106_2        xine/1.0        xine - free Linux / OS/2 multimedia player      B               http://xinehq.de/       
+id_t_z_141205_3        xirq/0.1-beta (xirq; http://www.xirq.com; xirq@xirq.com)        XIRQ search (beta) robot (70.86.206.1xx)        R               http://www.xirq.com/    
+id_t_z_160806_1        XMLSlurp/0.1 libwww-perl/5.805  GPath / XMLSlurp - Expression language for tree structured data                 http://groovy.codehaus.org/GPath        
+id_t_z_070506_1        XRL/2.00b1 (Linux; i686; en-us) (+http://metamark.net/about)    Metamark URL Shorten Service    P               http://metamark.net/    
+id_t_z_200308_3        Xylix   Xylix Retrieval System software C               http://www.xylixsoftware.ch/retrievalsystem.php 
+id_t_z_1521    xyro_(xcrawler@cosmos.inria.fr) Inria Crawler   R               http://www.inria.fr/    
+id_t_z_081205_1        Y!J-BSC/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)  Yahoo Search Japan robot (211.14.8.2xx) R       s. also Mozilla/4.0 (compatible; Y!J... http://www.yahoo.co.jp/ 
+id_t_z_271006_2        Y!J-SRD/1.0     Yahoo Search Japan robot (203.216.197.xxx)      R       s. also DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0 ...  http://www.yahoo.co.jp/ 
+id_t_z_240106_3        Y!J/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)      Yahoo Search Japan robot (211.14.8.2xx) R       s. also Mozilla/4.0 (compatible; Y!J... http://www.yahoo.co.jp/ 
+id_t_z_220206_2        Y!OASIS/TEST no-ad Mozilla/4.08 [en] (X11; I; FreeBSD 2.2.8-STABLE i386)        Yahoo picture service for mobiles       P       217.12.4.xx             
+id_t_z_1522    Y!TunnelPro     Y!TunnelPro - Yahoo! Messenger companion user agent     B       s. YTunnelPro   http://www.ytunnelpro.com/      
+id_t_z_121205_1        yacy (www.yacy.net; v20040602; i386 Linux 2.4.26-gentoo-r13; java 1.4.2_06; MET/en)     Yacy distributed P2P web search engine robot    R               http://www.yacy.net/    
+id_t_z_260306_4        yacybot (x86 Windows XP 5.1; java 1.5.0_06; Europe/de) yacy.net Yacy distributed P2P web search engine robot    R               http://www.yacy.net/    
+id_t_z_300707_2        Yahoo Pipes 1.0 (Yahoo) Pipes interactive data aggregator robot R               http://pipes.yahoo.com/pipes/   
+id_t_z_100406_2        Yahoo! Mindset  Yahoo Mindset: Intent-driven Search (66.228.182.1xx)    R       s. also Mozilla/4.0     http://mindset.research.yahoo.com/      
+id_t_z_040106_2        Yahoo-Blogs/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )  Yahoo blog indexing robot (209.191.83.1xx)      R               http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html 
+id_t_z_1523    Yahoo-MMAudVid/1.0 (mms dash mmaudvidcrawler dash support at yahoo dash inc dot com)    Yahoo multimedia crawler (206.190.43.xx)        R                       
+id_t_z_080108_2        Yahoo-MMAudVid/2.0(mms dash mm aud vid crawler dash support at yahoo dash inc.com ;Mozilla 4.0 compatible; MSIE 7.0;Windows NT 5.0; .NET CLR 2.0)       Yahoo multimedia crawler        R                       
+id_t_z_1524    Yahoo-MMCrawler/3.x (mm dash crawler at trd dot overture dot com)       Yahoo multimedia crawler via Fastsearch.net (66.77.73.xx)       R       see also FAST-WebCrawler/3.x Multimedia...              
+id_t_z_110806_1        Yahoo-Test/4.0  Yahoo Search robot      R       216.145.49.xx           
+id_t_z_1525    Yahoo-VerticalCrawler-FormerWebCrawler/3.9 crawler at trd dot overture dot com; http://www.alltheweb.com/help/webmaster/crawler Yahoo crawler via Overture (66.77.73.3x)        R                       
+id_t_z_010906_2        YahooFeedSeeker/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://publisher.yahoo.com/rssguide)    Yahoo Publisher Network RSS crawler     R               http://publisher.yahoo.com/rssguide     
+id_t_z_1526    YahooSeeker-Testing/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/)  Yahoo Product Search crawler ( 68.142.195..x)   R                       
+id_t_z_1527    YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)       Yahoo Product Search crawler ( 66.196.93.x)     R                       
+id_t_z_1528    YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/yahooseeker.html)   Yahoo Product Search crawler ( 66.196.93.x)     R                       
+id_t_z_1529    YahooSeeker/1.1 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)       Yahoo Product Search crawler ( 66.196.93.x)     R                       
+id_t_z_1530    YahooSeeker/bsv3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )        Yahoo Product Search crawler ( 68.142.195..x)   R                       
+id_t_z_1531    YahooSeeker/CafeKelsa-dev (compatible; Konqueror/3.2; FreeBSD ;cafekelsa-dev-webmaster@yahoo-inc.com )  Yahoo robot     R       64.157.137.xxx          
+id_t_z_231106_2        Yandex/1.01.001 (compatible; Win16; I)  Yandex Search Russia link checking (213.180.206.2xx)    R       s. also Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)      http://www.yandex.ru    
+id_t_z_301108_2        Yanga WorldSearch Bot v1.1/beta (http://www.yanga.co.uk/)       Yanga search robot by Gigabase (Russian Federation)     R       91.205.124.x    http://www.yanga.co.uk/ 
+id_t_z_1532    yarienavoir.net/0.2     Yarienavoir search (Belgium) robot      R       217.71.121.xx   http://www.yarienavoir.net/     
+id_t_z_300506_1        Yeti    1noon.com search Korea robot (222.231.21.xxx)   R       uses also a blank UA field      http://www.1noon.com/   
+id_t_z_040407_1        Yeti/0.01 (nhn/1noon, yetibot@naver.com, check robots.txt daily and follows it) 1noon.com search Korea robot (222.231.21.xxx)   R       uses also a blank UA field      http://www.1noon.com/   
+id_t_z_301108_1        Yeti/1.0 (NHN Corp.; http://help.naver.com/robots/)     Naver search (Korea) robot      R       61.247.222.xx   http://www.naver.com/   
+id_t_z_290407_2        yggdrasil/Nutch-0.9 (yggdrasil biorelated search engine; www dot biotec dot tu minus dresden do de slash schroeder; heiko dot dietze at biotec dot tu minus dresden dot de)     yggdrasil spider for GoPubMed biorelated search engine  R       141.30.193.x[x] http://www.biotec.tu-dresden.de/schroeder       http://gopubmed.biotec.tu-dresden.de/
+id_t_z_211206_3        YodaoBot/1.0 (http://www.yodao.com/help/webmaster/spider/; )    Yodao search (China)    R       60.191.80.xx    http://www.yodao.com/   
+id_t_z_110308_1        yoofind/yoofind-0.1-dev (yoono webcrawler; http://www.yoono.com ; MyEmail)      Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)      R       s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoono/1.0 web-crawler ..       http://www.yoono.com/   
+id_t_z_210106_3        yoogliFetchAgent/0.1    Yoogli search (under development) agent R               http://www.yoogli.com/  
+id_t_z_120606_1        yoono/1.0 web-crawler/1.0       Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)      R       s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoofind/yoofind ..     http://www.yoono.com/   
+id_t_z_1533    YottaCars_Bot/4.12 (+http://www.yottacars.com) Car Search Engine        YottaCars bot - YottaCar car search engine ( 64.62.175.xxx)     R       s. also OmniExplorer_Bot        http://www.yottacars.com/       
+id_t_z_1534    YottaShopping_Bot/4.12 (+http://www.yottashopping.com) Shopping Search Engine   YottaShopping bot - YottaShopping search engine ( 64.62.175.xxx)        R       s. also OmniExplorer_Bot        http://www.yottashopping.com/   
+id_t_z_1535    YTunnelPro      Y!TunnelPro - Yahoo! Messenger companion user agent     B       s. Y!TunnelPro  http://www.ytunnelpro.com/      
+id_t_z_1536    Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/)   Z-Add online link checker       C               http://w3.z-add.co.uk/linkcheck/        
+id_t_z_1537    Zao-Crawler     Zao crawler for Kototoi Project R               http://www.kototoi.org/zao/     
+id_t_z_1538    Zao-Crawler 0.2b        Zao crawler for Kototoi Project R               http://www.kototoi.org/zao/     
+id_t_z_1539    Zao/0.1 (http://www.kototoi.org/zao/)   Zao crawler for Kototoi Project R               http://www.kototoi.org/zao/     
+id_t_z_1540    ZBot/1.00 (icaulfield@zeus.com) Zeus Internet Marketing Robot based on Webster Pro component    R               http://cyber-robotics.com/      http://www.homepagesw.com/
+id_t_z_111205_5        Zearchit        Zearchit German search / directory      R       212.227.109.1xx http://www.zearchit.de/ 
+id_t_z_130106_2        ZeBot_lseek.net (bot@ze.bz)     Ze.bz Moteur de Recherche robot R       213.251.135.xx  http://www.ze.bz/       
+id_t_z_1541    ZeBot_www.ze.bz (ze.bz@hotmail.com)     Ze.bz Moteur de Recherche robot R       213.251.135.xx  http://www.ze.bz/       
+id_t_z_130806_2        zedzo.digest/0.1 (http://www.zedzo.com/)        ZedZo Search (beta) robot       R       24.62.50.1xx    http://www.zedzo.com/   
+id_t_z_210807_2        Zend_Http_Client        Zend PHP frameworks Zend_Http_Client component  D               http://framework.zend.com/manual/en/zend.http.html      
+id_t_z_290208_2        zermelo Mozilla/5.0 compatible; heritrix/1.12.1 (+http://www.powerset.com) [email:crawl@powerset.com,email:paul@page-store.com] Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services     R       67.202.34.xxx   http://www.powerset.com/        http://www.amazon.com/gp/browse.html?node=3435361
+id_t_z_1542    zerxbot/Version 0.6 libwww-perl/5.79    Zerx search robot ?     R       138.88.147.xxx  http://www.zerx.com/    
+id_t_z_1543    Zeus ThemeSite Viewer Webster Pro V2.9 Win32    Zeus Internet Marketing Robot (based on Webster Pro)    R               http://cyber-robotics.com/      
+id_t_z_1544    Zeus xxxxx Webster Pro V2.9 Win32       Zeus Internet Marketing Robot (based on Webster Pro)    R               http://cyber-robotics.com/      
+id_t_z_281105_1        Zeusbot/0.07 (Ulysseek's web-crawling robot; http://www.zeusbot.com; agent@zeusbot.com) Zeusbot robot for building the Ulysseek.com index       R       powered by Nutch        http://www.zeusbot.com/ http://www.ulysseek.com/
+id_t_z_1545    Ziggy -- The Clown From Hell!!  Unknown agent (server- or link checking ?) from 198.173.158.xx  C                       
+id_t_z_1546    ZipppBot/0.xx (ZipppBot; http://www.zippp.net; webmaster@zippp.net)     Zipp.net web search robot       R               http://www.zippp.net/   
+id_t_z_1547    ZIPPPCVS/0.xx (ZipppBot/.xx;http://www.zippp.net; webmaster@zippp.net)  Zipp.net web search robot       R               http://www.zippp.net/   
+id_t_z_1548    Zippy v2.0 - Zippyfinder.com    Zippyfinder robot       R               http://www.zippyfinder.com/     
+id_t_z_1549    Zoo Tycoon 2 Client -- http://www.zootycoon.com Microsoft Zoo Tycoon 2 game client      B               http://www.zootycoon.com        
+id_t_z_1550    ZoomSpider - wrensoft.com       Zoom Search Engine software spider      R               http://www.wrensoft.com/        
+id_t_z_160110_1        Zscho.de Crawler/Nutch-1.0-Zscho.de-semantic_patch (Zscho.de Crawler    collecting for machine learning; http://zscho.de/ )     Zscho search crawler (Germany)  R       141.65.161.xx   http://www.zscho.de/
+id_t_z_280306_1        zspider/0.9-dev http://feedback.redkolibri.com/ zspider robot for a new search engine   R               http://feedback.redkolibri.com/ 
+id_t_z_1551    ZyBorg/1.0 (ZyBorg@WISEnut.com; http://www.WISEnut.com) Wisenut robot   R               http://www.wisenutbot.com/      
+id_new_190610_1        Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (FM Scene 4.6.1)  FM Scene soccer fan pages plugin        L               http://www.fmscene.de   
+id_new_190610_2        Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (.NET CLR 3.5.30729) (Prevx 3.0.5)        PrevX security plugin                   http://www.prevx.com    
\ No newline at end of file
index ba581c82afab6a96cdcb009d18d43e0d5c4a9a0f..1c34ad7e3b1d1d94c42320453c89ea14b9b4a9ca 100644 (file)
@@ -1,3 +1,30 @@
+-- Type:
+-- B = Browser
+-- C = Link-, bookmark-, server- checking; D = Downloading tool
+-- P = Proxy server, web filtering
+-- R = Robot, crawler, spider
+-- S = Spam or bad bot
+
+CREATE TEMPORARY TABLE _useragent (
+  id INT PRIMARY KEY,
+  string VARCHAR(500),
+  description VARCHAR(2000),
+  type VARCHAR(20),
+  comment VARCHAR(100),
+  link1 VARCHAR(1000),
+  link2 VARCHAR(1000)
+);
+
+CREATE TEMPORARY TABLE new_useragent (
+  id INT PRIMARY KEY,
+  string VARCHAR(500),
+  description VARCHAR(2000),
+  type VARCHAR(20),
+  comment VARCHAR(100),
+  link1 VARCHAR(1000),
+  link2 VARCHAR(1000)
+);
+
 DROP TABLE IF EXISTS useragent;
 CREATE TABLE IF NOT EXISTS useragent (
   id INT PRIMARY KEY,
@@ -11,5 +38,6 @@ CREATE TABLE IF NOT EXISTS useragent (
 
 BEGIN TRANSACTION;
 .separator \t
+.import "useragent.csv" _useragent
 .import "useragent.csv" useragent
 COMMIT;