From 51d47fda355a86df49a8d2fbb6f9e6ed1dd714cb Mon Sep 17 00:00:00 2001 From: Nicolas Boisselier Date: Fri, 12 Jan 2018 02:06:36 +0000 Subject: [PATCH] share/db/shell_replace.sh --- lib/php/db/table.php | 1 - lib/php/db/types/pgsql.php | 12 +- lib/postgres/lang.sql | 6 +- share/db/0-pre.sql | 22 - share/db/adservers | 2 - share/db/country | 17 - share/db/country.csv | 252 ---- share/db/country.sql | 48 - share/db/http_status | 13 - share/db/http_status.sql | 6 - share/db/mime.sql | 5 - share/db/mime_type.csv | 686 ---------- share/db/mime_type.sql | 12 - share/db/port | 9 - share/db/port.sql | 8 - share/db/shell_function | 56 - share/db/shell_function.sql | 5 - share/db/shell_replace.sh | 4 +- share/db/timezone | 13 - share/db/timezone.csv | 424 ------ share/db/timezone.sql | 12 - share/db/update.sh | 87 +- share/db/useragent | 3 - share/db/useragent.csv | 2459 ---------------------------------- share/db/useragent.sql | 64 - www/dbq/html/default.min.css | 2 +- 26 files changed, 20 insertions(+), 4208 deletions(-) delete mode 100644 share/db/0-pre.sql delete mode 100755 share/db/adservers delete mode 100755 share/db/country delete mode 100644 share/db/country.csv delete mode 100644 share/db/country.sql delete mode 100755 share/db/http_status delete mode 100644 share/db/http_status.sql delete mode 100644 share/db/mime.sql delete mode 100644 share/db/mime_type.csv delete mode 100644 share/db/mime_type.sql delete mode 100755 share/db/port delete mode 100644 share/db/port.sql delete mode 100755 share/db/shell_function delete mode 100644 share/db/shell_function.sql delete mode 100755 share/db/timezone delete mode 100644 share/db/timezone.csv delete mode 100644 share/db/timezone.sql delete mode 100755 share/db/useragent delete mode 100644 share/db/useragent.csv delete mode 100644 share/db/useragent.sql diff --git a/lib/php/db/table.php b/lib/php/db/table.php index 22f8c258..65c7a25a 100644 --- a/lib/php/db/table.php +++ b/lib/php/db/table.php @@ -953,7 +953,6 @@ Class Table extends nb { public function buttons() { if (!$this->show_buttons or empty(self::$params)) return false; if (!preg_match('/(table|view)/',$this->type())) return false; - if ($fct = $this->db()->conf_type('print_buttons')) { $r = $fct($this); if ($r!==null) return $r; } return true; } diff --git a/lib/php/db/types/pgsql.php b/lib/php/db/types/pgsql.php index c7f03217..d55b4261 100644 --- a/lib/php/db/types/pgsql.php +++ b/lib/php/db/types/pgsql.php @@ -1,17 +1,17 @@ [ + 'BEGIN TRANSACTION', +], +'sql.post' => [ + 'COMMIT', +], 'delete_no_limit' => true, -# NB 19.12.17 'print_buttons' => function(&$t) { -# NB 19.12.17 if ($t->type = 'view' and preg_match('/GROUP BY/i',$t->sql())) return false; -# NB 19.12.17 return true; -# NB 19.12.17 }, 'replace_insert' => function(&$sql,&$table,$fields=[]) { $keys = $table->fields_keys($others); - #if ($table->p('debug')) { if (!empty($fields)) $others = $fields; $sql .= ' ON CONFLICT ('.join(',',array_keys($keys)).') DO UPDATE'; $sql .= ' SET ' . join(',',$table->ar_map('"$a=:$a"',array_keys($others))); - #$info['debug'] = [$keys,$others]; }, 'like_nocase' => 'ILIKE', 'cast_text' => function($name) { return "$name::text"; }, diff --git a/lib/postgres/lang.sql b/lib/postgres/lang.sql index 9af851c1..a892c1fe 100644 --- a/lib/postgres/lang.sql +++ b/lib/postgres/lang.sql @@ -8,5 +8,9 @@ GRANT ALL ON TABLE lang TO nico; GRANT ALL ON TABLE lang TO root; BEGIN TRANSACTION; DELETE FROM lang; -COPY lang FROM PROGRAM 'curl -s http://download.geonames.org/export/dump/iso-languagecodes.txt | tail -n +2 | cut -f 1,4' WITH (format 'text', NULL ''); +COPY lang FROM PROGRAM 'curl -s http://download.geonames.org/export/dump/iso-languagecodes.txt \ +| tail -n +2 \ +| cut -f 1,4 \ +| sed -e "s/ *(.*$//" -e "s/\tModern /\t/" +' WITH (format 'text', NULL ''); COMMIT; diff --git a/share/db/0-pre.sql b/share/db/0-pre.sql deleted file mode 100644 index b49af9be..00000000 --- a/share/db/0-pre.sql +++ /dev/null @@ -1,22 +0,0 @@ --- NB 05.12.17 DROP TABLE IF EXISTS service; --- NB 25.10.17 CREATE TABLE IF NOT EXISTS service ( --- NB 25.10.17 name VARCHAR(100), --- NB 25.10.17 description VARCHAR(200), --- NB 25.10.17 PRIMARY KEY (port,name) --- NB 25.10.17 ); - --- NB 25.10.17 DROP TABLE IF EXISTS service_port; - --- NB 25.10.17 DROP TABLE IF EXISTS ovh_dedicated; --- NB 25.10.17 CREATE TABLE ovh_dedicated ( --- NB 25.10.17 offer VARCHAR(80), --- NB 25.10.17 proc VARCHAR(150), --- NB 25.10.17 cpu VARCHAR(150), --- NB 25.10.17 ram VARCHAR(150), --- NB 25.10.17 disk VARCHAR(150), --- NB 25.10.17 option VARCHAR(100), --- NB 25.10.17 price float(5,2) --- NB 25.10.17 ); - -PRAGMA encoding="UTF-8"; -PRAGMA foreign_keys=OFF; diff --git a/share/db/adservers b/share/db/adservers deleted file mode 100755 index 42d32082..00000000 --- a/share/db/adservers +++ /dev/null @@ -1,2 +0,0 @@ -#!/usr/bin/env sh -curl -s http://pgl.yoyo.org/adservers/serverlist.php?hostformat=nohtml diff --git a/share/db/country b/share/db/country deleted file mode 100755 index 9d60ae94..00000000 --- a/share/db/country +++ /dev/null @@ -1,17 +0,0 @@ -#!/usr/bin/env perl -use strict; -use warnings; -@ARGV = ('curl -s http://download.geonames.org/export/dump/countryInfo.txt |'); - -while (<>) { - #s/^#ISO/ISO/; - next if /^#/; - chomp($_); - #for postgres s,\\,\\\\,g; - my @r = split("\t",$_); - unshift @r,$r[0]; - while (@r<20) { - push @r,''; - } - print join("\t",@r)."\n"; -} diff --git a/share/db/country.csv b/share/db/country.csv deleted file mode 100644 index 169ba045..00000000 --- a/share/db/country.csv +++ /dev/null @@ -1,252 +0,0 @@ -AD AD AND 020 AN Andorra Andorra la Vella 468 84000 EU .ad EUR Euro 376 AD### ^(?:AD)*(\d{3})$ ca 3041565 ES,FR -AE AE ARE 784 AE United Arab Emirates Abu Dhabi 82880 4975593 AS .ae AED Dirham 971 ar-AE,fa,en,hi,ur 290557 SA,OM -AF AF AFG 004 AF Afghanistan Kabul 647500 29121286 AS .af AFN Afghani 93 fa-AF,ps,uz-AF,tk 1149361 TM,CN,IR,TJ,PK,UZ -AG AG ATG 028 AC Antigua and Barbuda St. John's 443 86754 NA .ag XCD Dollar +1-268 en-AG 3576396 -AI AI AIA 660 AV Anguilla The Valley 102 13254 NA .ai XCD Dollar +1-264 en-AI 3573511 -AL AL ALB 008 AL Albania Tirana 28748 2986952 EU .al ALL Lek 355 sq,el 783754 MK,GR,ME,RS,XK -AM AM ARM 051 AM Armenia Yerevan 29800 2968000 AS .am AMD Dram 374 ###### ^(\d{6})$ hy 174982 GE,IR,AZ,TR -AO AO AGO 024 AO Angola Luanda 1246700 13068161 AF .ao AOA Kwanza 244 pt-AO 3351879 CD,NA,ZM,CG -AQ AQ ATA 010 AY Antarctica 14000000 0 AN .aq 6697173 -AR AR ARG 032 AR Argentina Buenos Aires 2766890 41343201 SA .ar ARS Peso 54 @####@@@ ^[A-Z]?\d{4}[A-Z]{0,3}$ es-AR,en,it,de,fr,gn 3865483 CL,BO,UY,PY,BR -AS AS ASM 016 AQ American Samoa Pago Pago 199 57881 OC .as USD Dollar +1-684 #####-#### 96799 en-AS,sm,to 5880801 -AT AT AUT 040 AU Austria Vienna 83858 8205000 EU .at EUR Euro 43 #### ^(\d{4})$ de-AT,hr,hu,sl 2782113 CH,DE,HU,SK,CZ,IT,SI,LI -AU AU AUS 036 AS Australia Canberra 7686850 21515754 OC .au AUD Dollar 61 #### ^(\d{4})$ en-AU 2077456 -AW AW ABW 533 AA Aruba Oranjestad 193 71566 NA .aw AWG Guilder 297 nl-AW,es,en 3577279 -AX AX ALA 248 Aland Islands Mariehamn 1580 26711 EU .ax EUR Euro +358-18 ##### ^(?:FI)*(\d{5})$ sv-AX 661882 FI -AZ AZ AZE 031 AJ Azerbaijan Baku 86600 8303512 AS .az AZN Manat 994 AZ #### ^(?:AZ)*(\d{4})$ az,ru,hy 587116 GE,IR,AM,TR,RU -BA BA BIH 070 BK Bosnia and Herzegovina Sarajevo 51129 4590000 EU .ba BAM Marka 387 ##### ^(\d{5})$ bs,hr-BA,sr-BA 3277605 HR,ME,RS -BB BB BRB 052 BB Barbados Bridgetown 431 285653 NA .bb BBD Dollar +1-246 BB##### ^(?:BB)*(\d{5})$ en-BB 3374084 -BD BD BGD 050 BG Bangladesh Dhaka 144000 156118464 AS .bd BDT Taka 880 #### ^(\d{4})$ bn-BD,en 1210997 MM,IN -BE BE BEL 056 BE Belgium Brussels 30510 10403000 EU .be EUR Euro 32 #### ^(\d{4})$ nl-BE,fr-BE,de-BE 2802361 DE,NL,LU,FR -BF BF BFA 854 UV Burkina Faso Ouagadougou 274200 16241811 AF .bf XOF Franc 226 fr-BF 2361809 NE,BJ,GH,CI,TG,ML -BG BG BGR 100 BU Bulgaria Sofia 110910 7148785 EU .bg BGN Lev 359 #### ^(\d{4})$ bg,tr-BG,rom 732800 MK,GR,RO,TR,RS -BH BH BHR 048 BA Bahrain Manama 665 738004 AS .bh BHD Dinar 973 ####|### ^(\d{3}\d?)$ ar-BH,en,fa,ur 290291 -BI BI BDI 108 BY Burundi Bujumbura 27830 9863117 AF .bi BIF Franc 257 fr-BI,rn 433561 TZ,CD,RW -BJ BJ BEN 204 BN Benin Porto-Novo 112620 9056010 AF .bj XOF Franc 229 fr-BJ 2395170 NE,TG,BF,NG -BL BL BLM 652 TB Saint Barthelemy Gustavia 21 8450 NA .gp EUR Euro 590 ### ### fr 3578476 -BM BM BMU 060 BD Bermuda Hamilton 53 65365 NA .bm BMD Dollar +1-441 @@ ## ^([A-Z]{2}\d{2})$ en-BM,pt 3573345 -BN BN BRN 096 BX Brunei Bandar Seri Begawan 5770 395027 AS .bn BND Dollar 673 @@#### ^([A-Z]{2}\d{4})$ ms-BN,en-BN 1820814 MY -BO BO BOL 068 BL Bolivia Sucre 1098580 9947418 SA .bo BOB Boliviano 591 es-BO,qu,ay 3923057 PE,CL,PY,BR,AR -BQ BQ BES 535 Bonaire, Saint Eustatius and Saba 328 18012 NA .bq USD Dollar 599 nl,pap,en 7626844 -BR BR BRA 076 BR Brazil Brasilia 8511965 201103330 SA .br BRL Real 55 #####-### ^\d{5}-\d{3}$ pt-BR,es,en,fr 3469034 SR,PE,BO,UY,GY,PY,GF,VE,CO,AR -BS BS BHS 044 BF Bahamas Nassau 13940 301790 NA .bs BSD Dollar +1-242 en-BS 3572887 -BT BT BTN 064 BT Bhutan Thimphu 47000 699847 AS .bt BTN Ngultrum 975 dz 1252634 CN,IN -BV BV BVT 074 BV Bouvet Island 49 0 AN .bv NOK Krone 3371123 -BW BW BWA 072 BC Botswana Gaborone 600370 2029307 AF .bw BWP Pula 267 en-BW,tn-BW 933860 ZW,ZA,NA -BY BY BLR 112 BO Belarus Minsk 207600 9685000 EU .by BYR Ruble 375 ###### ^(\d{6})$ be,ru 630336 PL,LT,UA,RU,LV -BZ BZ BLZ 084 BH Belize Belmopan 22966 314522 NA .bz BZD Dollar 501 en-BZ,es 3582678 GT,MX -CA CA CAN 124 CA Canada Ottawa 9984670 33679000 NA .ca CAD Dollar 1 @#@ #@# ^([ABCEGHJKLMNPRSTVXY]\d[ABCEGHJKLMNPRSTVWXYZ]) ?(\d[ABCEGHJKLMNPRSTVWXYZ]\d)$ en-CA,fr-CA,iu 6251999 US -CC CC CCK 166 CK Cocos Islands West Island 14 628 AS .cc AUD Dollar 61 ms-CC,en 1547376 -CD CD COD 180 CG Democratic Republic of the Congo Kinshasa 2345410 70916439 AF .cd CDF Franc 243 fr-CD,ln,kg 203312 TZ,CF,SS,RW,ZM,BI,UG,CG,AO -CF CF CAF 140 CT Central African Republic Bangui 622984 4844927 AF .cf XAF Franc 236 fr-CF,sg,ln,kg 239880 TD,SD,CD,SS,CM,CG -CG CG COG 178 CF Republic of the Congo Brazzaville 342000 3039126 AF .cg XAF Franc 242 fr-CG,kg,ln-CG 2260494 CF,GA,CD,CM,AO -CH CH CHE 756 SZ Switzerland Bern 41290 7581000 EU .ch CHF Franc 41 #### ^(\d{4})$ de-CH,fr-CH,it-CH,rm 2658434 DE,IT,LI,FR,AT -CI CI CIV 384 IV Ivory Coast Yamoussoukro 322460 21058798 AF .ci XOF Franc 225 fr-CI 2287781 LR,GH,GN,BF,ML -CK CK COK 184 CW Cook Islands Avarua 240 21388 OC .ck NZD Dollar 682 en-CK,mi 1899402 -CL CL CHL 152 CI Chile Santiago 756950 16746491 SA .cl CLP Peso 56 ####### ^(\d{7})$ es-CL 3895114 PE,BO,AR -CM CM CMR 120 CM Cameroon Yaounde 475440 19294149 AF .cm XAF Franc 237 en-CM,fr-CM 2233387 TD,CF,GA,GQ,CG,NG -CN CN CHN 156 CH China Beijing 9596960 1330044000 AS .cn CNY Yuan Renminbi 86 ###### ^(\d{6})$ zh-CN,yue,wuu,dta,ug,za 1814991 LA,BT,TJ,KZ,MN,AF,NP,MM,KG,PK,KP,RU,VN,IN -CO CO COL 170 CO Colombia Bogota 1138910 47790000 SA .co COP Peso 57 es-CO 3686110 EC,PE,PA,BR,VE -CR CR CRI 188 CS Costa Rica San Jose 51100 4516220 NA .cr CRC Colon 506 ##### ^(\d{5})$ es-CR,en 3624060 PA,NI -CU CU CUB 192 CU Cuba Havana 110860 11423000 NA .cu CUP Peso 53 CP ##### ^(?:CP)*(\d{5})$ es-CU 3562981 US -CV CV CPV 132 CV Cape Verde Praia 4033 508659 AF .cv CVE Escudo 238 #### ^(\d{4})$ pt-CV 3374766 -CW CW CUW 531 UC Curacao Willemstad 444 141766 NA .cw ANG Guilder 599 nl,pap 7626836 -CX CX CXR 162 KT Christmas Island Flying Fish Cove 135 1500 AS .cx AUD Dollar 61 #### ^(\d{4})$ en,zh,ms-CC 2078138 -CY CY CYP 196 CY Cyprus Nicosia 9250 1102677 EU .cy EUR Euro 357 #### ^(\d{4})$ el-CY,tr-CY,en 146669 -CZ CZ CZE 203 EZ Czechia Prague 78866 10476000 EU .cz CZK Koruna 420 ### ## ^\d{3}\s?\d{2}$ cs,sk 3077311 PL,DE,SK,AT -DE DE DEU 276 GM Germany Berlin 357021 81802257 EU .de EUR Euro 49 ##### ^(\d{5})$ de 2921044 CH,PL,NL,DK,BE,CZ,LU,FR,AT -DJ DJ DJI 262 DJ Djibouti Djibouti 23000 740528 AF .dj DJF Franc 253 fr-DJ,ar,so-DJ,aa 223816 ER,ET,SO -DK DK DNK 208 DA Denmark Copenhagen 43094 5484000 EU .dk DKK Krone 45 #### ^(\d{4})$ da-DK,en,fo,de-DK 2623032 DE -DM DM DMA 212 DO Dominica Roseau 754 72813 NA .dm XCD Dollar +1-767 en-DM 3575830 -DO DO DOM 214 DR Dominican Republic Santo Domingo 48730 9823821 NA .do DOP Peso +1-809 and 1-829 ##### ^(\d{5})$ es-DO 3508796 HT -DZ DZ DZA 012 AG Algeria Algiers 2381740 34586184 AF .dz DZD Dinar 213 ##### ^(\d{5})$ ar-DZ 2589581 NE,EH,LY,MR,TN,MA,ML -EC EC ECU 218 EC Ecuador Quito 283560 14790608 SA .ec USD Dollar 593 @####@ ^([a-zA-Z]\d{4}[a-zA-Z])$ es-EC 3658394 PE,CO -EE EE EST 233 EN Estonia Tallinn 45226 1291170 EU .ee EUR Euro 372 ##### ^(\d{5})$ et,ru 453733 RU,LV -EG EG EGY 818 EG Egypt Cairo 1001450 80471869 AF .eg EGP Pound 20 ##### ^(\d{5})$ ar-EG,en,fr 357994 LY,SD,IL,PS -EH EH ESH 732 WI Western Sahara El-Aaiun 266000 273008 AF .eh MAD Dirham 212 ar,mey 2461445 DZ,MR,MA -ER ER ERI 232 ER Eritrea Asmara 121320 5792984 AF .er ERN Nakfa 291 aa-ER,ar,tig,kun,ti-ER 338010 ET,SD,DJ -ES ES ESP 724 SP Spain Madrid 504782 46505963 EU .es EUR Euro 34 ##### ^(\d{5})$ es-ES,ca,gl,eu,oc 2510769 AD,PT,GI,FR,MA -ET ET ETH 231 ET Ethiopia Addis Ababa 1127127 88013491 AF .et ETB Birr 251 #### ^(\d{4})$ am,en-ET,om-ET,ti-ET,so-ET,sid 337996 ER,KE,SD,SS,SO,DJ -FI FI FIN 246 FI Finland Helsinki 337030 5244000 EU .fi EUR Euro 358 ##### ^(?:FI)*(\d{5})$ fi-FI,sv-FI,smn 660013 NO,RU,SE -FJ FJ FJI 242 FJ Fiji Suva 18270 875983 OC .fj FJD Dollar 679 en-FJ,fj 2205218 -FK FK FLK 238 FK Falkland Islands Stanley 12173 2638 SA .fk FKP Pound 500 en-FK 3474414 -FM FM FSM 583 FM Micronesia Palikir 702 107708 OC .fm USD Dollar 691 ##### ^(\d{5})$ en-FM,chk,pon,yap,kos,uli,woe,nkr,kpg 2081918 -FO FO FRO 234 FO Faroe Islands Torshavn 1399 48228 EU .fo DKK Krone 298 ### ^(?:FO)*(\d{3})$ fo,da-FO 2622320 -FR FR FRA 250 FR France Paris 547030 64768389 EU .fr EUR Euro 33 ##### ^(\d{5})$ fr-FR,frp,br,co,ca,eu,oc 3017382 CH,DE,BE,LU,IT,AD,MC,ES -GA GA GAB 266 GB Gabon Libreville 267667 1545255 AF .ga XAF Franc 241 fr-GA 2400553 CM,GQ,CG -GB GB GBR 826 UK United Kingdom London 244820 62348447 EU .uk GBP Pound 44 @# #@@|@## #@@|@@# #@@|@@## #@@|@#@ #@@|@@#@ #@@|GIR0AA ^((?:(?:[A-PR-UWYZ][A-HK-Y]\d[ABEHMNPRV-Y0-9]|[A-PR-UWYZ]\d[A-HJKPS-UW0-9])\s\d[ABD-HJLNP-UW-Z]{2})|GIR\s?0AA)$ en-GB,cy-GB,gd 2635167 IE -GD GD GRD 308 GJ Grenada St. George's 344 107818 NA .gd XCD Dollar +1-473 en-GD 3580239 -GE GE GEO 268 GG Georgia Tbilisi 69700 4630000 AS .ge GEL Lari 995 #### ^(\d{4})$ ka,ru,hy,az 614540 AM,AZ,TR,RU -GF GF GUF 254 FG French Guiana Cayenne 91000 195506 SA .gf EUR Euro 594 ##### ^((97|98)3\d{2})$ fr-GF 3381670 SR,BR -GG GG GGY 831 GK Guernsey St Peter Port 78 65228 EU .gg GBP Pound +44-1481 @# #@@|@## #@@|@@# #@@|@@## #@@|@#@ #@@|@@#@ #@@|GIR0AA ^((?:(?:[A-PR-UWYZ][A-HK-Y]\d[ABEHMNPRV-Y0-9]|[A-PR-UWYZ]\d[A-HJKPS-UW0-9])\s\d[ABD-HJLNP-UW-Z]{2})|GIR\s?0AA)$ en,fr 3042362 -GH GH GHA 288 GH Ghana Accra 239460 24339838 AF .gh GHS Cedi 233 en-GH,ak,ee,tw 2300660 CI,TG,BF -GI GI GIB 292 GI Gibraltar Gibraltar 6.5 27884 EU .gi GIP Pound 350 en-GI,es,it,pt 2411586 ES -GL GL GRL 304 GL Greenland Nuuk 2166086 56375 NA .gl DKK Krone 299 #### ^(\d{4})$ kl,da-GL,en 3425505 -GM GM GMB 270 GA Gambia Banjul 11300 1593256 AF .gm GMD Dalasi 220 en-GM,mnk,wof,wo,ff 2413451 SN -GN GN GIN 324 GV Guinea Conakry 245857 10324025 AF .gn GNF Franc 224 fr-GN 2420477 LR,SN,SL,CI,GW,ML -GP GP GLP 312 GP Guadeloupe Basse-Terre 1780 443000 NA .gp EUR Euro 590 ##### ^((97|98)\d{3})$ fr-GP 3579143 -GQ GQ GNQ 226 EK Equatorial Guinea Malabo 28051 1014999 AF .gq XAF Franc 240 es-GQ,fr 2309096 GA,CM -GR GR GRC 300 GR Greece Athens 131940 11000000 EU .gr EUR Euro 30 ### ## ^(\d{5})$ el-GR,en,fr 390903 AL,MK,TR,BG -GS GS SGS 239 SX South Georgia and the South Sandwich Islands Grytviken 3903 30 AN .gs GBP Pound en 3474415 -GT GT GTM 320 GT Guatemala Guatemala City 108890 13550440 NA .gt GTQ Quetzal 502 ##### ^(\d{5})$ es-GT 3595528 MX,HN,BZ,SV -GU GU GUM 316 GQ Guam Hagatna 549 159358 OC .gu USD Dollar +1-671 969## ^(969\d{2})$ en-GU,ch-GU 4043988 -GW GW GNB 624 PU Guinea-Bissau Bissau 36120 1565126 AF .gw XOF Franc 245 #### ^(\d{4})$ pt-GW,pov 2372248 SN,GN -GY GY GUY 328 GY Guyana Georgetown 214970 748486 SA .gy GYD Dollar 592 en-GY 3378535 SR,BR,VE -HK HK HKG 344 HK Hong Kong Hong Kong 1092 6898686 AS .hk HKD Dollar 852 zh-HK,yue,zh,en 1819730 -HM HM HMD 334 HM Heard Island and McDonald Islands 412 0 AN .hm AUD Dollar 1547314 -HN HN HND 340 HO Honduras Tegucigalpa 112090 7989415 NA .hn HNL Lempira 504 @@#### ^([A-Z]{2}\d{4})$ es-HN 3608932 GT,NI,SV -HR HR HRV 191 HR Croatia Zagreb 56542 4284889 EU .hr HRK Kuna 385 ##### ^(?:HR)*(\d{5})$ hr-HR,sr 3202326 HU,SI,BA,ME,RS -HT HT HTI 332 HA Haiti Port-au-Prince 27750 9648924 NA .ht HTG Gourde 509 HT#### ^(?:HT)*(\d{4})$ ht,fr-HT 3723988 DO -HU HU HUN 348 HU Hungary Budapest 93030 9982000 EU .hu HUF Forint 36 #### ^(\d{4})$ hu-HU 719819 SK,SI,RO,UA,HR,AT,RS -ID ID IDN 360 ID Indonesia Jakarta 1919440 242968342 AS .id IDR Rupiah 62 ##### ^(\d{5})$ id,en,nl,jv 1643084 PG,TL,MY -IE IE IRL 372 EI Ireland Dublin 70280 4622917 EU .ie EUR Euro 353 @@@ @@@@ ^[A-Z]\d{2}$|^[A-Z]{3}[A-Z]{4}$ en-IE,ga-IE 2963597 GB -IL IL ISR 376 IS Israel Jerusalem 20770 7353985 AS .il ILS Shekel 972 ##### ^(\d{5})$ he,ar-IL,en-IL, 294640 SY,JO,LB,EG,PS -IM IM IMN 833 IM Isle of Man Douglas 572 75049 EU .im GBP Pound +44-1624 @# #@@|@## #@@|@@# #@@|@@## #@@|@#@ #@@|@@#@ #@@|GIR0AA ^((?:(?:[A-PR-UWYZ][A-HK-Y]\d[ABEHMNPRV-Y0-9]|[A-PR-UWYZ]\d[A-HJKPS-UW0-9])\s\d[ABD-HJLNP-UW-Z]{2})|GIR\s?0AA)$ en,gv 3042225 -IN IN IND 356 IN India New Delhi 3287590 1173108018 AS .in INR Rupee 91 ###### ^(\d{6})$ en-IN,hi,bn,te,mr,ta,ur,gu,kn,ml,or,pa,as,bh,sat,ks,ne,sd,kok,doi,mni,sit,sa,fr,lus,inc 1269750 CN,NP,MM,BT,PK,BD -IO IO IOT 086 IO British Indian Ocean Territory Diego Garcia 60 4000 AS .io USD Dollar 246 en-IO 1282588 -IQ IQ IRQ 368 IZ Iraq Baghdad 437072 29671605 AS .iq IQD Dinar 964 ##### ^(\d{5})$ ar-IQ,ku,hy 99237 SY,SA,IR,JO,TR,KW -IR IR IRN 364 IR Iran Tehran 1648000 76923300 AS .ir IRR Rial 98 ########## ^(\d{10})$ fa-IR,ku 130758 TM,AF,IQ,AM,PK,AZ,TR -IS IS ISL 352 IC Iceland Reykjavik 103000 308910 EU .is ISK Krona 354 ### ^(\d{3})$ is,en,de,da,sv,no 2629691 -IT IT ITA 380 IT Italy Rome 301230 60340328 EU .it EUR Euro 39 ##### ^(\d{5})$ it-IT,de-IT,fr-IT,sc,ca,co,sl 3175395 CH,VA,SI,SM,FR,AT -JE JE JEY 832 JE Jersey Saint Helier 116 90812 EU .je GBP Pound +44-1534 @# #@@|@## #@@|@@# #@@|@@## #@@|@#@ #@@|@@#@ #@@|GIR0AA ^((?:(?:[A-PR-UWYZ][A-HK-Y]\d[ABEHMNPRV-Y0-9]|[A-PR-UWYZ]\d[A-HJKPS-UW0-9])\s\d[ABD-HJLNP-UW-Z]{2})|GIR\s?0AA)$ en,pt 3042142 -JM JM JAM 388 JM Jamaica Kingston 10991 2847232 NA .jm JMD Dollar +1-876 en-JM 3489940 -JO JO JOR 400 JO Jordan Amman 92300 6407085 AS .jo JOD Dinar 962 ##### ^(\d{5})$ ar-JO,en 248816 SY,SA,IQ,IL,PS -JP JP JPN 392 JA Japan Tokyo 377835 127288000 AS .jp JPY Yen 81 ###-#### ^\d{3}-\d{4}$ ja 1861060 -KE KE KEN 404 KE Kenya Nairobi 582650 40046566 AF .ke KES Shilling 254 ##### ^(\d{5})$ en-KE,sw-KE 192950 ET,TZ,SS,SO,UG -KG KG KGZ 417 KG Kyrgyzstan Bishkek 198500 5776500 AS .kg KGS Som 996 ###### ^(\d{6})$ ky,uz,ru 1527747 CN,TJ,UZ,KZ -KH KH KHM 116 CB Cambodia Phnom Penh 181040 14453680 AS .kh KHR Riels 855 ##### ^(\d{5})$ km,fr,en 1831722 LA,TH,VN -KI KI KIR 296 KR Kiribati Tarawa 811 92533 OC .ki AUD Dollar 686 en-KI,gil 4030945 -KM KM COM 174 CN Comoros Moroni 2170 773407 AF .km KMF Franc 269 ar,fr-KM 921929 -KN KN KNA 659 SC Saint Kitts and Nevis Basseterre 261 51134 NA .kn XCD Dollar +1-869 en-KN 3575174 -KP KP PRK 408 KN North Korea Pyongyang 120540 22912177 AS .kp KPW Won 850 ###-### ^(\d{6})$ ko-KP 1873107 CN,KR,RU -KR KR KOR 410 KS South Korea Seoul 98480 48422644 AS .kr KRW Won 82 SEOUL ###-### ^(?:SEOUL)*(\d{6})$ ko-KR,en 1835841 KP -XK XK XKX 0 KV Kosovo Pristina 10908 1800000 EU EUR Euro sq,sr 831053 RS,AL,MK,ME -KW KW KWT 414 KU Kuwait Kuwait City 17820 2789132 AS .kw KWD Dinar 965 ##### ^(\d{5})$ ar-KW,en 285570 SA,IQ -KY KY CYM 136 CJ Cayman Islands George Town 262 44270 NA .ky KYD Dollar +1-345 en-KY 3580718 -KZ KZ KAZ 398 KZ Kazakhstan Astana 2717300 15340000 AS .kz KZT Tenge 7 ###### ^(\d{6})$ kk,ru 1522867 TM,CN,KG,UZ,RU -LA LA LAO 418 LA Laos Vientiane 236800 6368162 AS .la LAK Kip 856 ##### ^(\d{5})$ lo,fr,en 1655842 CN,MM,KH,TH,VN -LB LB LBN 422 LE Lebanon Beirut 10400 4125247 AS .lb LBP Pound 961 #### ####|#### ^(\d{4}(\d{4})?)$ ar-LB,fr-LB,en,hy 272103 SY,IL -LC LC LCA 662 ST Saint Lucia Castries 616 160922 NA .lc XCD Dollar +1-758 en-LC 3576468 -LI LI LIE 438 LS Liechtenstein Vaduz 160 35000 EU .li CHF Franc 423 #### ^(\d{4})$ de-LI 3042058 CH,AT -LK LK LKA 144 CE Sri Lanka Colombo 65610 21513990 AS .lk LKR Rupee 94 ##### ^(\d{5})$ si,ta,en 1227603 -LR LR LBR 430 LI Liberia Monrovia 111370 3685076 AF .lr LRD Dollar 231 #### ^(\d{4})$ en-LR 2275384 SL,CI,GN -LS LS LSO 426 LT Lesotho Maseru 30355 1919552 AF .ls LSL Loti 266 ### ^(\d{3})$ en-LS,st,zu,xh 932692 ZA -LT LT LTU 440 LH Lithuania Vilnius 65200 2944459 EU .lt EUR Euro 370 LT-##### ^(?:LT)*(\d{5})$ lt,ru,pl 597427 PL,BY,RU,LV -LU LU LUX 442 LU Luxembourg Luxembourg 2586 497538 EU .lu EUR Euro 352 L-#### ^(?:L-)?\d{4}$ lb,de-LU,fr-LU 2960313 DE,BE,FR -LV LV LVA 428 LG Latvia Riga 64589 2217969 EU .lv EUR Euro 371 LV-#### ^(?:LV)*(\d{4})$ lv,ru,lt 458258 LT,EE,BY,RU -LY LY LBY 434 LY Libya Tripoli 1759540 6461454 AF .ly LYD Dinar 218 ar-LY,it,en 2215636 TD,NE,DZ,SD,TN,EG -MA MA MAR 504 MO Morocco Rabat 446550 33848242 AF .ma MAD Dirham 212 ##### ^(\d{5})$ ar-MA,ber,fr 2542007 DZ,EH,ES -MC MC MCO 492 MN Monaco Monaco 1.95 32965 EU .mc EUR Euro 377 ##### ^(\d{5})$ fr-MC,en,it 2993457 FR -MD MD MDA 498 MD Moldova Chisinau 33843 4324000 EU .md MDL Leu 373 MD-#### ^MD-\d{4}$ ro,ru,gag,tr 617790 RO,UA -ME ME MNE 499 MJ Montenegro Podgorica 14026 666730 EU .me EUR Euro 382 ##### ^(\d{5})$ sr,hu,bs,sq,hr,rom 3194884 AL,HR,BA,RS,XK -MF MF MAF 663 RN Saint Martin Marigot 53 35925 NA .gp EUR Euro 590 ### ### fr 3578421 SX -MG MG MDG 450 MA Madagascar Antananarivo 587040 21281844 AF .mg MGA Ariary 261 ### ^(\d{3})$ fr-MG,mg 1062947 -MH MH MHL 584 RM Marshall Islands Majuro 181.3 65859 OC .mh USD Dollar 692 #####-#### ^969\d{2}(-\d{4})$ mh,en-MH 2080185 -MK MK MKD 807 MK Macedonia Skopje 25333 2062294 EU .mk MKD Denar 389 #### ^(\d{4})$ mk,sq,tr,rmm,sr 718075 AL,GR,BG,RS,XK -ML ML MLI 466 ML Mali Bamako 1240000 13796354 AF .ml XOF Franc 223 fr-ML,bm 2453866 SN,NE,DZ,CI,GN,MR,BF -MM MM MMR 104 BM Myanmar Nay Pyi Taw 678500 53414374 AS .mm MMK Kyat 95 ##### ^(\d{5})$ my 1327865 CN,LA,TH,BD,IN -MN MN MNG 496 MG Mongolia Ulan Bator 1565000 3086918 AS .mn MNT Tugrik 976 ###### ^(\d{6})$ mn,ru 2029969 CN,RU -MO MO MAC 446 MC Macao Macao 254 449198 AS .mo MOP Pataca 853 zh,zh-MO,pt 1821275 -MP MP MNP 580 CQ Northern Mariana Islands Saipan 477 53883 OC .mp USD Dollar +1-670 #####-#### ^9695\d{1}(-\d{4})$ fil,tl,zh,ch-MP,en-MP 4041468 -MQ MQ MTQ 474 MB Martinique Fort-de-France 1100 432900 NA .mq EUR Euro 596 ##### ^(\d{5})$ fr-MQ 3570311 -MR MR MRT 478 MR Mauritania Nouakchott 1030700 3205060 AF .mr MRO Ouguiya 222 ar-MR,fuc,snk,fr,mey,wo 2378080 SN,DZ,EH,ML -MS MS MSR 500 MH Montserrat Plymouth 102 9341 NA .ms XCD Dollar +1-664 en-MS 3578097 -MT MT MLT 470 MT Malta Valletta 316 403000 EU .mt EUR Euro 356 @@@ #### ^[A-Z]{3}\s?\d{4}$ mt,en-MT 2562770 -MU MU MUS 480 MP Mauritius Port Louis 2040 1294104 AF .mu MUR Rupee 230 en-MU,bho,fr 934292 -MV MV MDV 462 MV Maldives Male 300 395650 AS .mv MVR Rufiyaa 960 ##### ^(\d{5})$ dv,en 1282028 -MW MW MWI 454 MI Malawi Lilongwe 118480 15447500 AF .mw MWK Kwacha 265 ny,yao,tum,swk 927384 TZ,MZ,ZM -MX MX MEX 484 MX Mexico Mexico City 1972550 112468855 NA .mx MXN Peso 52 ##### ^(\d{5})$ es-MX 3996063 GT,US,BZ -MY MY MYS 458 MY Malaysia Kuala Lumpur 329750 28274729 AS .my MYR Ringgit 60 ##### ^(\d{5})$ ms-MY,en,zh,ta,te,ml,pa,th 1733045 BN,TH,ID -MZ MZ MOZ 508 MZ Mozambique Maputo 801590 22061451 AF .mz MZN Metical 258 #### ^(\d{4})$ pt-MZ,vmw 1036973 ZW,TZ,SZ,ZA,ZM,MW -NA NA NAM 516 WA Namibia Windhoek 825418 2128471 AF .na NAD Dollar 264 en-NA,af,de,hz,naq 3355338 ZA,BW,ZM,AO -NC NC NCL 540 NC New Caledonia Noumea 19060 216494 OC .nc XPF Franc 687 ##### ^(\d{5})$ fr-NC 2139685 -NE NE NER 562 NG Niger Niamey 1267000 15878271 AF .ne XOF Franc 227 #### ^(\d{4})$ fr-NE,ha,kr,dje 2440476 TD,BJ,DZ,LY,BF,NG,ML -NF NF NFK 574 NF Norfolk Island Kingston 34.6 1828 OC .nf AUD Dollar 672 #### ^(\d{4})$ en-NF 2155115 -NG NG NGA 566 NI Nigeria Abuja 923768 154000000 AF .ng NGN Naira 234 ###### ^(\d{6})$ en-NG,ha,yo,ig,ff 2328926 TD,NE,BJ,CM -NI NI NIC 558 NU Nicaragua Managua 129494 5995928 NA .ni NIO Cordoba 505 ###-###-# ^(\d{7})$ es-NI,en 3617476 CR,HN -NL NL NLD 528 NL Netherlands Amsterdam 41526 16645000 EU .nl EUR Euro 31 #### @@ ^(\d{4}[A-Z]{2})$ nl-NL,fy-NL 2750405 DE,BE -NO NO NOR 578 NO Norway Oslo 324220 5009150 EU .no NOK Krone 47 #### ^(\d{4})$ no,nb,nn,se,fi 3144096 FI,RU,SE -NP NP NPL 524 NP Nepal Kathmandu 140800 28951852 AS .np NPR Rupee 977 ##### ^(\d{5})$ ne,en 1282988 CN,IN -NR NR NRU 520 NR Nauru Yaren 21 10065 OC .nr AUD Dollar 674 na,en-NR 2110425 -NU NU NIU 570 NE Niue Alofi 260 2166 OC .nu NZD Dollar 683 niu,en-NU 4036232 -NZ NZ NZL 554 NZ New Zealand Wellington 268680 4252277 OC .nz NZD Dollar 64 #### ^(\d{4})$ en-NZ,mi 2186224 -OM OM OMN 512 MU Oman Muscat 212460 2967717 AS .om OMR Rial 968 ### ^(\d{3})$ ar-OM,en,bal,ur 286963 SA,YE,AE -PA PA PAN 591 PM Panama Panama City 78200 3410676 NA .pa PAB Balboa 507 es-PA,en 3703430 CR,CO -PE PE PER 604 PE Peru Lima 1285220 29907003 SA .pe PEN Sol 51 es-PE,qu,ay 3932488 EC,CL,BO,BR,CO -PF PF PYF 258 FP French Polynesia Papeete 4167 270485 OC .pf XPF Franc 689 ##### ^((97|98)7\d{2})$ fr-PF,ty 4030656 -PG PG PNG 598 PP Papua New Guinea Port Moresby 462840 6064515 OC .pg PGK Kina 675 ### ^(\d{3})$ en-PG,ho,meu,tpi 2088628 ID -PH PH PHL 608 RP Philippines Manila 300000 99900177 AS .ph PHP Peso 63 #### ^(\d{4})$ tl,en-PH,fil 1694008 -PK PK PAK 586 PK Pakistan Islamabad 803940 184404791 AS .pk PKR Rupee 92 ##### ^(\d{5})$ ur-PK,en-PK,pa,sd,ps,brh 1168579 CN,AF,IR,IN -PL PL POL 616 PL Poland Warsaw 312685 38500000 EU .pl PLN Zloty 48 ##-### ^\d{2}-\d{3}$ pl 798544 DE,LT,SK,CZ,BY,UA,RU -PM PM SPM 666 SB Saint Pierre and Miquelon Saint-Pierre 242 7012 NA .pm EUR Euro 508 ##### ^(97500)$ fr-PM 3424932 -PN PN PCN 612 PC Pitcairn Adamstown 47 46 OC .pn NZD Dollar 870 en-PN 4030699 -PR PR PRI 630 RQ Puerto Rico San Juan 9104 3916632 NA .pr USD Dollar +1-787 and 1-939 #####-#### ^00[679]\d{2}(?:-\d{4})?$ en-PR,es-PR 4566966 -PS PS PSE 275 WE Palestinian Territory East Jerusalem 5970 3800000 AS .ps ILS Shekel 970 ar-PS 6254930 JO,IL,EG -PT PT PRT 620 PO Portugal Lisbon 92391 10676000 EU .pt EUR Euro 351 ####-### ^\d{4}-\d{3}\s?[a-zA-Z]{0,25}$ pt-PT,mwl 2264397 ES -PW PW PLW 585 PS Palau Melekeok 458 19907 OC .pw USD Dollar 680 96940 ^(96940)$ pau,sov,en-PW,tox,ja,fil,zh 1559582 -PY PY PRY 600 PA Paraguay Asuncion 406750 6375830 SA .py PYG Guarani 595 #### ^(\d{4})$ es-PY,gn 3437598 BO,BR,AR -QA QA QAT 634 QA Qatar Doha 11437 840926 AS .qa QAR Rial 974 ar-QA,es 289688 SA -RE RE REU 638 RE Reunion Saint-Denis 2517 776948 AF .re EUR Euro 262 ##### ^((97|98)(4|7|8)\d{2})$ fr-RE 935317 -RO RO ROU 642 RO Romania Bucharest 237500 21959278 EU .ro RON Leu 40 ###### ^(\d{6})$ ro,hu,rom 798549 MD,HU,UA,BG,RS -RS RS SRB 688 RI Serbia Belgrade 88361 7344847 EU .rs RSD Dinar 381 ###### ^(\d{6})$ sr,hu,bs,rom 6290252 AL,HU,MK,RO,HR,BA,BG,ME,XK -RU RU RUS 643 RS Russia Moscow 17100000 140702000 EU .ru RUB Ruble 7 ###### ^(\d{6})$ ru,tt,xal,cau,ady,kv,ce,tyv,cv,udm,tut,mns,bua,myv,mdf,chm,ba,inh,tut,kbd,krc,av,sah,nog 2017370 GE,CN,BY,UA,KZ,LV,PL,EE,LT,FI,MN,NO,AZ,KP -RW RW RWA 646 RW Rwanda Kigali 26338 11055976 AF .rw RWF Franc 250 rw,en-RW,fr-RW,sw 49518 TZ,CD,BI,UG -SA SA SAU 682 SA Saudi Arabia Riyadh 1960582 25731776 AS .sa SAR Rial 966 ##### ^(\d{5})$ ar-SA 102358 QA,OM,IQ,YE,JO,AE,KW -SB SB SLB 090 BP Solomon Islands Honiara 28450 559198 OC .sb SBD Dollar 677 en-SB,tpi 2103350 -SC SC SYC 690 SE Seychelles Victoria 455 88340 AF .sc SCR Rupee 248 en-SC,fr-SC 241170 -SD SD SDN 729 SU Sudan Khartoum 1861484 35000000 AF .sd SDG Pound 249 ##### ^(\d{5})$ ar-SD,en,fia 366755 SS,TD,EG,ET,ER,LY,CF -SS SS SSD 728 OD South Sudan Juba 644329 8260490 AF SSP Pound 211 en 7909807 CD,CF,ET,KE,SD,UG -SE SE SWE 752 SW Sweden Stockholm 449964 9828655 EU .se SEK Krona 46 ### ## ^(?:SE)?\d{3}\s\d{2}$ sv-SE,se,sma,fi-SE 2661886 NO,FI -SG SG SGP 702 SN Singapore Singapore 692.7 4701069 AS .sg SGD Dollar 65 ###### ^(\d{6})$ cmn,en-SG,ms-SG,ta-SG,zh-SG 1880251 -SH SH SHN 654 SH Saint Helena Jamestown 410 7460 AF .sh SHP Pound 290 STHL 1ZZ ^(STHL1ZZ)$ en-SH 3370751 -SI SI SVN 705 SI Slovenia Ljubljana 20273 2007000 EU .si EUR Euro 386 #### ^(?:SI)*(\d{4})$ sl,sh 3190538 HU,IT,HR,AT -SJ SJ SJM 744 SV Svalbard and Jan Mayen Longyearbyen 62049 2550 EU .sj NOK Krone 47 #### ^(\d{4})$ no,ru 607072 -SK SK SVK 703 LO Slovakia Bratislava 48845 5455000 EU .sk EUR Euro 421 ### ## ^\d{3}\s?\d{2}$ sk,hu 3057568 PL,HU,CZ,UA,AT -SL SL SLE 694 SL Sierra Leone Freetown 71740 5245695 AF .sl SLL Leone 232 en-SL,men,tem 2403846 LR,GN -SM SM SMR 674 SM San Marino San Marino 61.2 31477 EU .sm EUR Euro 378 4789# ^(4789\d)$ it-SM 3168068 IT -SN SN SEN 686 SG Senegal Dakar 196190 12323252 AF .sn XOF Franc 221 ##### ^(\d{5})$ fr-SN,wo,fuc,mnk 2245662 GN,MR,GW,GM,ML -SO SO SOM 706 SO Somalia Mogadishu 637657 10112453 AF .so SOS Shilling 252 @@ ##### ^([A-Z]{2}\d{5})$ so-SO,ar-SO,it,en-SO 51537 ET,KE,DJ -SR SR SUR 740 NS Suriname Paramaribo 163270 492829 SA .sr SRD Dollar 597 nl-SR,en,srn,hns,jv 3382998 GY,BR,GF -ST ST STP 678 TP Sao Tome and Principe Sao Tome 1001 175808 AF .st STD Dobra 239 pt-ST 2410758 -SV SV SLV 222 ES El Salvador San Salvador 21040 6052064 NA .sv USD Dollar 503 CP #### ^(?:CP)*(\d{4})$ es-SV 3585968 GT,HN -SX SX SXM 534 NN Sint Maarten Philipsburg 21 37429 NA .sx ANG Guilder 599 nl,en 7609695 MF -SY SY SYR 760 SY Syria Damascus 185180 22198110 AS .sy SYP Pound 963 ar-SY,ku,hy,arc,fr,en 163843 IQ,JO,IL,TR,LB -SZ SZ SWZ 748 WZ Swaziland Mbabane 17363 1354051 AF .sz SZL Lilangeni 268 @### ^([A-Z]\d{3})$ en-SZ,ss-SZ 934841 ZA,MZ -TC TC TCA 796 TK Turks and Caicos Islands Cockburn Town 430 20556 NA .tc USD Dollar +1-649 TKCA 1ZZ ^(TKCA 1ZZ)$ en-TC 3576916 -TD TD TCD 148 CD Chad N'Djamena 1284000 10543464 AF .td XAF Franc 235 fr-TD,ar-TD,sre 2434508 NE,LY,CF,SD,CM,NG -TF TF ATF 260 FS French Southern Territories Port-aux-Francais 7829 140 AN .tf EUR Euro fr 1546748 -TG TG TGO 768 TO Togo Lome 56785 6587239 AF .tg XOF Franc 228 fr-TG,ee,hna,kbp,dag,ha 2363686 BJ,GH,BF -TH TH THA 764 TH Thailand Bangkok 514000 67089500 AS .th THB Baht 66 ##### ^(\d{5})$ th,en 1605651 LA,MM,KH,MY -TJ TJ TJK 762 TI Tajikistan Dushanbe 143100 7487489 AS .tj TJS Somoni 992 ###### ^(\d{6})$ tg,ru 1220409 CN,AF,KG,UZ -TK TK TKL 772 TL Tokelau 10 1466 OC .tk NZD Dollar 690 tkl,en-TK 4031074 -TL TL TLS 626 TT East Timor Dili 15007 1154625 OC .tl USD Dollar 670 tet,pt-TL,id,en 1966436 ID -TM TM TKM 795 TX Turkmenistan Ashgabat 488100 4940916 AS .tm TMT Manat 993 ###### ^(\d{6})$ tk,ru,uz 1218197 AF,IR,UZ,KZ -TN TN TUN 788 TS Tunisia Tunis 163610 10589025 AF .tn TND Dinar 216 #### ^(\d{4})$ ar-TN,fr 2464461 DZ,LY -TO TO TON 776 TN Tonga Nuku'alofa 748 122580 OC .to TOP Pa'anga 676 to,en-TO 4032283 -TR TR TUR 792 TU Turkey Ankara 780580 77804122 AS .tr TRY Lira 90 ##### ^(\d{5})$ tr-TR,ku,diq,az,av 298795 SY,GE,IQ,IR,GR,AM,AZ,BG -TT TT TTO 780 TD Trinidad and Tobago Port of Spain 5128 1228691 NA .tt TTD Dollar +1-868 en-TT,hns,fr,es,zh 3573591 -TV TV TUV 798 TV Tuvalu Funafuti 26 10472 OC .tv AUD Dollar 688 tvl,en,sm,gil 2110297 -TW TW TWN 158 TW Taiwan Taipei 35980 22894384 AS .tw TWD Dollar 886 ##### ^(\d{5})$ zh-TW,zh,nan,hak 1668284 -TZ TZ TZA 834 TZ Tanzania Dodoma 945087 41892895 AF .tz TZS Shilling 255 sw-TZ,en,ar 149590 MZ,KE,CD,RW,ZM,BI,UG,MW -UA UA UKR 804 UP Ukraine Kiev 603700 45415596 EU .ua UAH Hryvnia 380 ##### ^(\d{5})$ uk,ru-UA,rom,pl,hu 690791 PL,MD,HU,SK,BY,RO,RU -UG UG UGA 800 UG Uganda Kampala 236040 33398682 AF .ug UGX Shilling 256 en-UG,lg,sw,ar 226074 TZ,KE,SS,CD,RW -UM UM UMI 581 United States Minor Outlying Islands 0 0 OC .um USD Dollar 1 en-UM 5854968 -US US USA 840 US United States Washington 9629091 310232863 NA .us USD Dollar 1 #####-#### ^\d{5}(-\d{4})?$ en-US,es-US,haw,fr 6252001 CA,MX,CU -UY UY URY 858 UY Uruguay Montevideo 176220 3477000 SA .uy UYU Peso 598 ##### ^(\d{5})$ es-UY 3439705 BR,AR -UZ UZ UZB 860 UZ Uzbekistan Tashkent 447400 27865738 AS .uz UZS Som 998 ###### ^(\d{6})$ uz,ru,tg 1512440 TM,AF,KG,TJ,KZ -VA VA VAT 336 VT Vatican Vatican City 0.44 921 EU .va EUR Euro 379 ##### ^(\d{5})$ la,it,fr 3164670 IT -VC VC VCT 670 VC Saint Vincent and the Grenadines Kingstown 389 104217 NA .vc XCD Dollar +1-784 en-VC,fr 3577815 -VE VE VEN 862 VE Venezuela Caracas 912050 27223228 SA .ve VEF Bolivar 58 #### ^(\d{4})$ es-VE 3625428 GY,BR,CO -VG VG VGB 092 VI British Virgin Islands Road Town 153 21730 NA .vg USD Dollar +1-284 en-VG 3577718 -VI VI VIR 850 VQ U.S. Virgin Islands Charlotte Amalie 352 108708 NA .vi USD Dollar +1-340 #####-#### ^008\d{2}(?:-\d{4})?$ en-VI 4796775 -VN VN VNM 704 VM Vietnam Hanoi 329560 89571130 AS .vn VND Dong 84 ###### ^(\d{6})$ vi,en,fr,zh,km 1562822 CN,LA,KH -VU VU VUT 548 NH Vanuatu Port Vila 12200 221552 OC .vu VUV Vatu 678 bi,en-VU,fr-VU 2134431 -WF WF WLF 876 WF Wallis and Futuna Mata Utu 274 16025 OC .wf XPF Franc 681 ##### ^(986\d{2})$ wls,fud,fr-WF 4034749 -WS WS WSM 882 WS Samoa Apia 2944 192001 OC .ws WST Tala 685 sm,en-WS 4034894 -YE YE YEM 887 YM Yemen Sanaa 527970 23495361 AS .ye YER Rial 967 ar-YE 69543 SA,OM -YT YT MYT 175 MF Mayotte Mamoudzou 374 159042 AF .yt EUR Euro 262 ##### ^(\d{5})$ fr-YT 1024031 -ZA ZA ZAF 710 SF South Africa Pretoria 1219912 49000000 AF .za ZAR Rand 27 #### ^(\d{4})$ zu,xh,af,nso,en-ZA,tn,st,ts,ss,ve,nr 953987 ZW,SZ,MZ,BW,NA,LS -ZM ZM ZMB 894 ZA Zambia Lusaka 752614 13460305 AF .zm ZMW Kwacha 260 ##### ^(\d{5})$ en-ZM,bem,loz,lun,lue,ny,toi 895949 ZW,TZ,MZ,CD,NA,MW,AO -ZW ZW ZWE 716 ZI Zimbabwe Harare 390580 13061000 AF .zw ZWL Dollar 263 en-ZW,sn,nr,nd 878675 ZA,MZ,BW,ZM -CS CS SCG 891 YI Serbia and Montenegro Belgrade 102350 10829175 EU .cs RSD Dinar 381 ##### ^(\d{5})$ cu,hu,sq,sr 8505033 AL,HU,MK,RO,HR,BA,BG -AN AN ANT 530 NT Netherlands Antilles Willemstad 960 300000 NA .an ANG Guilder 599 nl-AN,en,es 8505032 GP diff --git a/share/db/country.sql b/share/db/country.sql deleted file mode 100644 index ecef737d..00000000 --- a/share/db/country.sql +++ /dev/null @@ -1,48 +0,0 @@ --- ISO --- ISO3 --- ISO-Numeric --- fips --- Country --- Capital --- Area(in sq km) --- Population --- Continent --- tld --- CurrencyCode --- CurrencyName --- Phone --- Postal Code Format --- Postal Code Regex --- Languages --- geonameid --- neighbours --- EquivalentFipsCode -DROP TABLE IF EXISTS country; -CREATE TABLE IF NOT EXISTS country ( - id varchar(2) PRIMARY KEY, - iso varchar(2) UNIQUE, - iso3 varchar(3) UNIQUE, - isonum varchar(3) UNIQUE, - fips varchar(2), - name varchar(50), - capital varchar(30), - area_km varchar(9), - population bigint, - continent varchar(2), - tld varchar(10), - currency_code varchar(3), - currency_name varchar(20), - phone varchar(30), - zip_format varchar(60), - zip_regexp varchar(150), - languages varchar(100), - geonameid integer, - neighbours varchar(60), - eqfips varchar(2) -); -CREATE INDEX IF NOT EXISTS country_geonameid_idx ON country (geonameid); -BEGIN TRANSACTION; -DELETE FROM country; -.import "country.csv" country -COMMIT; - diff --git a/share/db/http_status b/share/db/http_status deleted file mode 100755 index 1d8837ee..00000000 --- a/share/db/http_status +++ /dev/null @@ -1,13 +0,0 @@ -#!/usr/bin/env perl -use strict; -use warnings; -@ARGV = ('bash --login -c "html2txt https://en.wikipedia.org/wiki/List_of_HTTP_status_codes" |'); - -while (<>) { - next unless /^\d\d\d / .. /^ /; - s/.\[\d+\]//g; - s/^ *//; - s/\t/ /g; - s/^(\d+) ([\w _-]+).*?\n$/$1\t$2\t/; - print; -} diff --git a/share/db/http_status.sql b/share/db/http_status.sql deleted file mode 100644 index fa699ae3..00000000 --- a/share/db/http_status.sql +++ /dev/null @@ -1,6 +0,0 @@ --- DROP TABLE IF EXISTS http_status; -CREATE TABLE IF NOT EXISTS http_status ( - id int PRIMARY KEY, - name varchar(100), - description varchar(1000) -); diff --git a/share/db/mime.sql b/share/db/mime.sql deleted file mode 100644 index 8d3b086f..00000000 --- a/share/db/mime.sql +++ /dev/null @@ -1,5 +0,0 @@ -CREATE TABLE IF NOT EXISTS mime ( - id varchar(32) NOT NULL PRIMARY KEY, - name varchar(128), - cmd_check varchar(300) -); diff --git a/share/db/mime_type.csv b/share/db/mime_type.csv deleted file mode 100644 index 904248a0..00000000 --- a/share/db/mime_type.csv +++ /dev/null @@ -1,686 +0,0 @@ -3D Crossword Plugin application/vnd.hzn-3d-crossword x3d -3GP2 video/3gpp2 3g2 -3GPP MSEQ File application/vnd.mseq mseq -3GP video/3gpp 3gp -3M Post It Notes application/vnd.3m.post-it-notes pwn -3rd Generation Partnership Project - Pic Large application/vnd.3gpp.pic-bw-large plb -3rd Generation Partnership Project - Pic Small application/vnd.3gpp.pic-bw-small psb -3rd Generation Partnership Project - Pic Var application/vnd.3gpp.pic-bw-var pvb -3rd Generation Partnership Project - Transaction Capabilities Application Part application/vnd.3gpp2.tcap tcap -7-Zip application/x-7z-compressed 7z -AbiWord application/x-abiword abw -Ace Archive application/x-ace-compressed ace -Active Content Compression application/vnd.americandynamics.acc acc -ACU Cobol application/vnd.acucobol acu -ACU Cobol application/vnd.acucorp atc -Adaptive differential pulse-code modulation audio/adpcm adp -Adobe AIR Application application/vnd.adobe.air-application-installer-package+zip air -Adobe Flash application/x-shockwave-flash swf -Adobe Flex Project application/vnd.adobe.fxp fxp -Adobe (Macropedia) Authorware - Binary File application/x-authorware-bin aab -Adobe (Macropedia) Authorware - Map application/x-authorware-map aam -Adobe (Macropedia) Authorware - Segment File application/x-authorware-seg aas -Adobe Portable Document Format application/pdf pdf -Adobe PostScript Printer Description File Format application/vnd.cups-ppd ppd -Adobe Shockwave Player application/x-director dir -Adobe XML Data Package application/vnd.adobe.xdp+xml xdp -Adobe XML Forms Data Format application/vnd.adobe.xfdf xfdf -Advanced Audio Coding (AAC) audio/x-aac aac -Ahead AIR Application application/vnd.ahead.space ahead -AirZip FileSECURE application/vnd.airzip.filesecure.azf azf -AirZip FileSECURE application/vnd.airzip.filesecure.azs azs -Amazon Kindle eBook format application/vnd.amazon.ebook azw -AmigaDE application/vnd.amiga.ami ami -Android Package Archive application/vnd.android.package-archive apk -ANSER-WEB Terminal Client - Certificate Issue application/vnd.anser-web-certificate-issue-initiation cii -ANSER-WEB Terminal Client - Web Funds Transfer application/vnd.anser-web-funds-transfer-initiation fti -Antix Game Player application/vnd.antix.game-component atx -Apple Installer Package application/vnd.apple.installer+xml mpkg -Application Php text/x-php php -Applixware application/applixware aw -Archipelago Lesson Player application/vnd.hhe.lesson-player les -Arista Networks Software Image application/vnd.aristanetworks.swi swi -Assembler Source File text/x-asm s -Atom Publishing Protocol application/atomcat+xml atomcat -Atom Publishing Protocol Service Document application/atomsvc+xml atomsvc -Attribute Certificate application/pkix-attr-cert ac -Audiograph application/vnd.audiograph aep -Audio Interchange File Format audio/x-aiff aif -Audio Video Interleave (AVI) video/x-msvideo avi -AutoCAD DXF image/vnd.dxf dxf -Autodesk Design Web Format (DWF) model/vnd.dwf dwf -BAS Partitur Format text/plain-bas par -Binary CPIO Archive application/x-bcpio bcpio -Binary Data application/octet-stream bin -Bitmap Image File image/bmp bmp -BitTorrent application/x-bittorrent torrent -Blackberry COD File application/vnd.rim.cod cod -Blueice Research Multipass application/vnd.blueice.multipass mpm -BMI Drawing Data Interchange application/vnd.bmi bmi -Bourne Shell Script application/x-sh sh -BTIF image/prs.btif btif -BusinessObjects application/vnd.businessobjects rep -Bzip2 Archive application/x-bzip2 bz2 -Bzip Archive application/x-bzip bz -CambridgeSoft Chem Draw application/vnd.chemdraw+xml cdxml -Cascading Style Sheets (CSS) text/css css -ChemDraw eXchange file chemical/x-cdx cdx -Chemical Markup Language chemical/x-cml cml -Chemical Style Markup Language chemical/x-csml csml -CIM Database application/vnd.contact.cmsg cdbcmsg -Claymore Data Files application/vnd.claymore cla -Clonk Game application/vnd.clonk.c4group c4g -Close Captioning - Subtitle image/vnd.dvb.subtitle sub -Cloud Data Management Interface (CDMI) - Capability application/cdmi-capability cdmia -Cloud Data Management Interface (CDMI) - Contaimer application/cdmi-container cdmic -Cloud Data Management Interface (CDMI) - Domain application/cdmi-domain cdmid -Cloud Data Management Interface (CDMI) - Object application/cdmi-object cdmio -Cloud Data Management Interface (CDMI) - Queue application/cdmi-queue cdmiq -ClueTrust CartoMobile - Config application/vnd.cluetrust.cartomobile-config c11amc -ClueTrust CartoMobile - Config Package application/vnd.cluetrust.cartomobile-config-pkg c11amz -CMU Image image/x-cmu-raster ras -COLLADA model/vnd.collada+xml dae -Comma-Seperated Values text/csv csv -Compact Pro application/mac-compactpro cpt -Compiled Wireless Markup Language (WMLC) application/vnd.wap.wmlc wmlc -Computer Graphics Metafile image/cgm cgm -CoolTalk x-conference/x-cooltalk ice -Corel Metafile Exchange (CMX) image/x-cmx cmx -CorelXARA application/vnd.xara xar -CosmoCaller application/vnd.cosmocaller cmc -CPIO Archive application/x-cpio cpio -CrickSoftware - Clicker application/vnd.crick.clicker clkx -CrickSoftware - Clicker - Keyboard application/vnd.crick.clicker.keyboard clkk -CrickSoftware - Clicker - Palette application/vnd.crick.clicker.palette clkp -CrickSoftware - Clicker - Template application/vnd.crick.clicker.template clkt -CrickSoftware - Clicker - Wordbank application/vnd.crick.clicker.wordbank clkw -Critical Tools - PERT Chart EXPERT application/vnd.criticaltools.wbs+xml wbs -CryptoNote application/vnd.rig.cryptonote cryptonote -Crystallographic Interchange Format chemical/x-cif cif -CrystalMaker Data Format chemical/x-cmdf cmdf -C Shell Script application/x-csh csh -C Source File text/x-c c -CURL Applet application/vnd.curl.car car -CURL Applet application/vnd.curl.pcurl pcurl -Curl - Applet text/vnd.curl curl -Curl - Detached Applet text/vnd.curl.dcurl dcurl -Curl - Manifest File text/vnd.curl.mcurl mcurl -Curl - Source Code text/vnd.curl.scurl scurl -CU-SeeMe application/cu-seeme cu -CustomMenu application/vnd.yellowriver-custom-menu cmp -CU-Writer application/prs.cww cww -Data Structure for the Security Suitability of Cryptographic Algorithms application/dssc+der dssc -Data Structure for the Security Suitability of Cryptographic Algorithms application/dssc+xml xdssc -Debian Package application/x-debian-package deb -DECE Audio audio/vnd.dece.audio uva -DECE Graphic image/vnd.dece.graphic uvi -DECE High Definition Video video/vnd.dece.hd uvh -DECE Mobile Video video/vnd.dece.mobile uvm -DECE MP4 video/vnd.uvvu.mp4 uvu -DECE PD Video video/vnd.dece.pd uvp -DECE SD Video video/vnd.dece.sd uvs -DECE Video video/vnd.dece.video uvv -Device Independent File Format (DVI) application/x-dvi dvi -Digital Siesmograph Networks - SEED Datafiles application/vnd.fdsn.seed seed -Digital Talking Book application/x-dtbook+xml dtb -Digital Talking Book - Resource File application/x-dtbresource+xml res -Digital Video Broadcasting application/vnd.dvb.ait ait -Digital Video Broadcasting application/vnd.dvb.service svc -Digital Winds Music audio/vnd.digital-winds eol -DjVu image/vnd.djvu djvu -Document Type Definition application/xml-dtd dtd -Dolby Meridian Lossless Packing application/vnd.dolby.mlp mlp -Doom Video Game application/x-doom wad -DPGraph application/vnd.dpgraph dpg -DRA Audio audio/vnd.dra dra -DreamFactory application/vnd.dreamfactory dfac -DTS Audio audio/vnd.dts dts -DTS High Definition Audio audio/vnd.dts.hd dtshd -DWG Drawing image/vnd.dwg dwg -DynaGeo application/vnd.dynageo geo -ECMAScript application/ecmascript es -EcoWin Chart application/vnd.ecowin.chart mag -EDMICS 2000 image/vnd.fujixerox.edmics-mmr mmr -EDMICS 2000 image/vnd.fujixerox.edmics-rlc rlc -Efficient XML Interchange application/exi exi -EFI Proteus application/vnd.proteus.magazine mgz -Electronic Publication application/epub+zip epub -Email Message message/rfc822 eml -Enliven Viewer application/vnd.enliven nml -Express by Infoseek application/vnd.is-xpr xpr -eXtended Image File Format (XIFF) image/vnd.xiff xif -Extensible Forms Description Language application/vnd.xfdl xfdl -Extensible MultiModal Annotation application/emma+xml emma -EZPix Secure Photo Album application/vnd.ezpix-album ez2 -EZPix Secure Photo Album application/vnd.ezpix-package ez3 -FastBid Sheet image/vnd.fastbidsheet fbs -FAST Search & Transfer ASA image/vnd.fst fst -FAST Search & Transfer ASA video/vnd.fvt fvt -FCS Express Layout Link application/vnd.denovo.fcselayout-link fe_launch -FlashPix image/vnd.fpx fpx -FlashPix image/vnd.net-fpx npx -Flash Video video/x-f4v f4v -Flash Video video/x-flv flv -FLEXSTOR text/vnd.fmi.flexstor flx -FLI/FLC Animation Format video/x-fli fli -FluxTime Clip application/vnd.fluxtime.clip ftc -Forms Data Format application/vnd.fdf fdf -Fortran Source File text/x-fortran f -FrameMaker Interchange Format application/vnd.mif mif -FrameMaker Normal Format application/vnd.framemaker fm -FreeHand MX image/x-freehand fh -Friendly Software Corporation application/vnd.fsc.weblaunch fsc -Frogans Player application/vnd.frogans.fnc fnc -Frogans Player application/vnd.frogans.ltf ltf -Fujitsu Oasys application/vnd.fujitsu.oasys2 oa2 -Fujitsu Oasys application/vnd.fujitsu.oasys3 oa3 -Fujitsu Oasys application/vnd.fujitsu.oasysgp fg5 -Fujitsu Oasys application/vnd.fujitsu.oasys oas -Fujitsu Oasys application/vnd.fujitsu.oasysprs bh2 -Fujitsu - Xerox 2D CAD Data application/vnd.fujixerox.ddd ddd -Fujitsu - Xerox DocuWorks application/vnd.fujixerox.docuworks xdw -Fujitsu - Xerox DocuWorks Binder application/vnd.fujixerox.docuworks.binder xbd -FutureSplash Animator application/x-futuresplash spl -FuzzySheet application/vnd.fuzzysheet fzs -G3 Fax Image image/g3fax g3 -GameMaker ActiveX application/vnd.gmx gmx -Genomatix Tuxedo Framework application/vnd.genomatix.tuxedo txd -Gen-Trix Studio model/vnd.gtw gtw -GeoGebra application/vnd.geogebra.file ggb -GeoGebra application/vnd.geogebra.tool ggt -Geometric Description Language (GDL) model/vnd.gdl gdl -GeoMetry Explorer application/vnd.geometry-explorer gex -GEONExT and JSXGraph application/vnd.geonext gxt -GeoplanW application/vnd.geoplan g2w -GeospacW application/vnd.geospace g3w -Ghostscript Font application/x-font-ghostscript gsf -Glyph Bitmap Distribution Format application/x-font-bdf bdf -Gnumeric application/x-gnumeric gnumeric -GNU Tar Files application/x-gtar gtar -GNU Texinfo Document application/x-texinfo texinfo -Google Earth - KML application/vnd.google-earth.kml+xml kml -Google Earth - Zipped KML application/vnd.google-earth.kmz kmz -GrafEq application/vnd.grafeq gqf -Graphics Interchange Format image/gif gif -Graphviz text/vnd.graphviz gv -Groove - Account application/vnd.groove-account gac -Groove - Help application/vnd.groove-help ghf -Groove - Identity Message application/vnd.groove-identity-message gim -Groove - Injector application/vnd.groove-injector grv -Groove - Tool Message application/vnd.groove-tool-message gtm -Groove - Tool Template application/vnd.groove-tool-template tpl -Groove - Vcard application/vnd.groove-vcard vcg -H.261 video/h261 h261 -H.263 video/h263 h263 -H.264 video/h264 h264 -Hewlett Packard Instant Delivery application/vnd.hp-hpid hpid -Hewlett-Packard's WebPrintSmart application/vnd.hp-hps hps -Hierarchical Data Format application/x-hdf hdf -Hit'n'Mix audio/vnd.rip rip -Homebanking Computer Interface (HBCI) application/vnd.hbci hbci -HP-GL/2 and HP RTL application/vnd.hp-hpgl hpgl -HP Indigo Digital Press - Job Layout Languate application/vnd.hp-jlyt jlt -HP Printer Command Language application/vnd.hp-pcl pcl -HV Script application/vnd.yamaha.hv-script hvs -HV Voice Dictionary application/vnd.yamaha.hv-dic hvd -HV Voice Parameter application/vnd.yamaha.hv-voice hvp -Hydrostatix Master Suite application/vnd.hydrostatix.sof-data sfd-hdstx -Hyperstudio application/hyperstudio stk -Hypertext Application Language application/vnd.hal+xml hal -HyperText Markup Language (HTML) text/html html -IBM DB2 Rights Manager application/vnd.ibm.rights-management irm -IBM Electronic Media Management System - Secure Container application/vnd.ibm.secure-container sc -iCalendar text/calendar ics -ICC profile application/vnd.iccprofile icc -Icon Image image/x-icon ico -igLoader application/vnd.igloader igl -Image Exchange Format image/ief ief -ImmerVision PURE Players application/vnd.immervision-ivp ivp -ImmerVision PURE Players application/vnd.immervision-ivu ivu -IMS Networks application/reginfo+xml rif -In3D - 3DML text/vnd.in3d.3dml 3dml -In3D - 3DML text/vnd.in3d.spot spot -Initial Graphics Exchange Specification (IGES) model/iges igs -Interactive Geometry Software application/vnd.intergeo i2g -Interactive Geometry Software Cinderella application/vnd.cinderella cdy -Intercon FormNet application/vnd.intercon.formnet xpw -International Society for Advancement of Cytometry application/vnd.isac.fcs fcs -Internet Protocol Flow Information Export application/ipfix ipfix -Internet Public Key Infrastructure - Certificate application/pkix-cert cer -Internet Public Key Infrastructure - Certificate Management Protocole application/pkixcmp pki -Internet Public Key Infrastructure - Certificate Revocation Lists application/pkix-crl crl -Internet Public Key Infrastructure - Certification Path application/pkix-pkipath pkipath -IOCOM Visimeet application/vnd.insors.igm igm -IP Unplugged Roaming Client application/vnd.ipunplugged.rcprofile rcprofile -iRepository / Lucidoc Editor application/vnd.irepository.package+xml irp -J2ME App Descriptor text/vnd.sun.j2me.app-descriptor jad -Java Archive application/java-archive jar -Java Bytecode File application/java-vm class -Java Network Launching Protocol application/x-java-jnlp-file jnlp -JavaScript application/javascript js -JavaScript Object Notation (JSON) application/json json -JavaScript Object Notation (JSON) text/json json -Java Serialized Object application/java-serialized-object ser -Java Source File text/x-java-source,java java -Joda Archive application/vnd.joost.joda-archive joda -JPEG 2000 Compound Image File Format video/jpm jpm -JPEG Image image/jpeg jpeg -JPEG Image image/jpeg jpg -JPGVideo video/jpeg jpgv -Kahootz application/vnd.kahootz ktz -Karaoke on Chipnuts Chipsets application/vnd.chipnuts.karaoke-mmd mmd -KDE KOffice Office Suite - Karbon application/vnd.kde.karbon karbon -KDE KOffice Office Suite - KChart application/vnd.kde.kchart chrt -KDE KOffice Office Suite - Kformula application/vnd.kde.kformula kfo -KDE KOffice Office Suite - Kivio application/vnd.kde.kivio flw -KDE KOffice Office Suite - Kontour application/vnd.kde.kontour kon -KDE KOffice Office Suite - Kpresenter application/vnd.kde.kpresenter kpr -KDE KOffice Office Suite - Kspread application/vnd.kde.kspread ksp -KDE KOffice Office Suite - Kword application/vnd.kde.kword kwd -Kenamea App application/vnd.kenameaapp htke -Kidspiration application/vnd.kidspiration kia -Kinar Applications application/vnd.kinar kne -Kodak Storyshare application/vnd.kodak-descriptor sse -Laser App Enterprise application/vnd.las.las+xml lasxml -LaTeX application/x-latex latex -Life Balance - Desktop Edition application/vnd.llamagraphics.life-balance.desktop lbd -Life Balance - Exchange Format application/vnd.llamagraphics.life-balance.exchange+xml lbe -Lightspeed Audio Lab application/vnd.jam jam -Lotus 1-2-3 application/vnd.lotus-1-2-3 123 -Lotus Approach application/vnd.lotus-approach apr -Lotus Freelance application/vnd.lotus-freelance pre -Lotus Notes application/vnd.lotus-notes nsf -Lotus Organizer application/vnd.lotus-organizer org -Lotus Screencam application/vnd.lotus-screencam scm -Lotus Wordpro application/vnd.lotus-wordpro lwp -Lucent Voice audio/vnd.lucent.voice lvp -M3U (Multimedia Playlist) audio/x-mpegurl m3u -M4v video/x-m4v m4v -Macintosh BinHex 4.0 application/mac-binhex40 hqx -MacPorts Port System application/vnd.macports.portpkg portpkg -MapGuide DBXML application/vnd.osgeo.mapguide.package mgp -MARC21 XML Schema application/marcxml+xml mrcx -MARC Formats application/marc mrc -Markdown text/x-markdown md -Material Exchange Format application/mxf mxf -Mathematical Markup Language application/mathml+xml mathml -Mathematica Notebook Player application/vnd.wolfram.player nbp -Mathematica Notebooks application/mathematica ma -Mbox database files application/mbox mbox -MedCalc application/vnd.medcalcdata mc1 -MediaRemote application/vnd.mediastation.cdkey cdkey -Media Server Control Markup Language application/mediaservercontrol+xml mscml -Medical Waveform Encoding Format application/vnd.mfer mwf -Melody Format for Mobile Platform application/vnd.mfmp mfm -Mesh Data Type model/mesh msh -Metadata Authority Description Schema application/mads+xml mads -Metadata Encoding and Transmission Standard application/mets+xml mets -Metadata Object Description Schema application/mods+xml mods -Metalink application/metalink4+xml meta4 -Micosoft PowerPoint - Macro-Enabled Template File application/vnd.ms-powerpoint.template.macroenabled.12 potm -Micosoft Word - Macro-Enabled Document application/vnd.ms-word.document.macroenabled.12 docm -Micosoft Word - Macro-Enabled Template application/vnd.ms-word.template.macroenabled.12 dotm -Micro CADAM Helix D&D application/vnd.mcd mcd -Micrografx application/vnd.micrografx.flo flo -Micrografx iGrafx Professional application/vnd.micrografx.igx igx -MICROSEC e-Szign¢ application/vnd.eszigno3+xml es3 -Microsoft Access application/x-msaccess mdb -Microsoft Advanced Systems Format (ASF) video/x-ms-asf asf -Microsoft Application application/x-msdownload exe -Microsoft Artgalry application/vnd.ms-artgalry cil -Microsoft Cabinet File application/vnd.ms-cab-compressed cab -Microsoft Class Server application/vnd.ms-ims ims -Microsoft ClickOnce application/x-ms-application application -Microsoft Clipboard Clip application/x-msclip clp -Microsoft Document Imaging Format image/vnd.ms-modi mdi -Microsoft Embedded OpenType application/vnd.ms-fontobject eot -Microsoft Excel - Add-In File application/vnd.ms-excel.addin.macroenabled.12 xlam -Microsoft Excel application/vnd.ms-excel xls -Microsoft Excel - Binary Workbook application/vnd.ms-excel.sheet.binary.macroenabled.12 xlsb -Microsoft Excel - Macro-Enabled Template File application/vnd.ms-excel.template.macroenabled.12 xltm -Microsoft Excel - Macro-Enabled Workbook application/vnd.ms-excel.sheet.macroenabled.12 xlsm -Microsoft Html Help File application/vnd.ms-htmlhelp chm -Microsoft Information Card application/x-mscardfile crd -Microsoft Learning Resource Module application/vnd.ms-lrm lrm -Microsoft MediaView application/x-msmediaview mvb -Microsoft Money application/x-msmoney mny -Microsoft Office Binder application/x-msbinder obd -Microsoft Office - OOXML - Presentation application/vnd.openxmlformats-officedocument.presentationml.presentation pptx -Microsoft Office - OOXML - Presentation (Slide) application/vnd.openxmlformats-officedocument.presentationml.slide sldx -Microsoft Office - OOXML - Presentation (Slideshow) application/vnd.openxmlformats-officedocument.presentationml.slideshow ppsx -Microsoft Office - OOXML - Presentation Template application/vnd.openxmlformats-officedocument.presentationml.template potx -Microsoft Office - OOXML - Spreadsheet application/vnd.openxmlformats-officedocument.spreadsheetml.sheet xlsx -Microsoft Office - OOXML - Spreadsheet Teplate application/vnd.openxmlformats-officedocument.spreadsheetml.template xltx -Microsoft Office - OOXML - Word Document application/vnd.openxmlformats-officedocument.wordprocessingml.document docx -Microsoft Office - OOXML - Word Document Template application/vnd.openxmlformats-officedocument.wordprocessingml.template dotx -Microsoft Office System Release Theme application/vnd.ms-officetheme thmx -Microsoft OneNote application/onenote onetoc -Microsoft PlayReady Ecosystem audio/vnd.ms-playready.media.pya pya -Microsoft PlayReady Ecosystem Video video/vnd.ms-playready.media.pyv pyv -Microsoft PowerPoint - Add-in file application/vnd.ms-powerpoint.addin.macroenabled.12 ppam -Microsoft PowerPoint application/vnd.ms-powerpoint ppt -Microsoft PowerPoint - Macro-Enabled Open XML Slide application/vnd.ms-powerpoint.slide.macroenabled.12 sldm -Microsoft PowerPoint - Macro-Enabled Presentation File application/vnd.ms-powerpoint.presentation.macroenabled.12 pptm -Microsoft PowerPoint - Macro-Enabled Slide Show File application/vnd.ms-powerpoint.slideshow.macroenabled.12 ppsm -Microsoft Project application/vnd.ms-project mpp -Microsoft Publisher application/x-mspublisher pub -Microsoft Schedule+ application/x-msschedule scd -Microsoft Silverlight application/x-silverlight-app xap -Microsoft Trust UI Provider - Certificate Trust Link application/vnd.ms-pki.stl stl -Microsoft Trust UI Provider - Security Catalog application/vnd.ms-pki.seccat cat -Microsoft Visio application/vnd.visio vsd -Microsoft Windows Media Audio audio/x-ms-wma wma -Microsoft Windows Media Audio Redirector audio/x-ms-wax wax -Microsoft Windows Media Audio/Video Playlist video/x-ms-wmx wmx -Microsoft Windows Media Player Download Package application/x-ms-wmd wmd -Microsoft Windows Media Player Playlist application/vnd.ms-wpl wpl -Microsoft Windows Media Player Skin Package application/x-ms-wmz wmz -Microsoft Windows Media Video Playlist video/x-ms-wvx wvx -Microsoft Windows Media Video video/x-ms-wmv wmv -Microsoft Windows Media video/x-ms-wm wm -Microsoft Windows Metafile application/x-msmetafile wmf -Microsoft Windows Terminal Services application/x-msterminal trm -Microsoft Word application/msword doc -Microsoft Wordpad application/x-mswrite wri -Microsoft Works application/vnd.ms-works wps -Microsoft XAML Browser Application application/x-ms-xbap xbap -Microsoft XML Paper Specification application/vnd.ms-xpsdocument xps -MIDI - Musical Instrument Digital Interface audio/midi mid -MiniPay application/vnd.ibm.minipay mpy -Mobile Information Device Profile application/vnd.jcp.javame.midlet-rms rms -MobileTV application/vnd.tmobile-livetv tmo -Mobipocket application/x-mobipocket-ebook prc -Mobius Management Systems - Basket file application/vnd.mobius.mbk mbk -Mobius Management Systems - Distribution Database application/vnd.mobius.dis dis -Mobius Management Systems - Policy Definition Language File application/vnd.mobius.plc plc -Mobius Management Systems - Query File application/vnd.mobius.mqy mqy -Mobius Management Systems - Script Language application/vnd.mobius.msl msl -Mobius Management Systems - Topic Index File application/vnd.mobius.txf txf -Mobius Management Systems - UniversalArchive application/vnd.mobius.daf daf -MO:DCA-P application/vnd.ibm.modcap afp -mod_fly / fly.cgi text/vnd.fly fly -Mophun Certificate application/vnd.mophun.certificate mpc -Mophun VM application/vnd.mophun.application mpn -Motion JPEG 2000 video/mj2 mj2 -MPEG-21 application/mp21 m21 -MPEG4 application/mp4 mp4 -MPEG-4 Audio audio/mp4 mp4a -MPEG-4 Video video/mp4 mp4 -MPEG Audio audio/mpeg mpga -MPEG Url video/vnd.mpegurl mxu -MPEG Video video/mpeg mpeg -Multimedia Playlist Unicode application/vnd.apple.mpegurl m3u8 -MUsical Score Interpreted Code Invented for the ASCII designation of Notation application/vnd.musician mus -Muvee Automatic Video Editing application/vnd.muvee.style msty -MXML application/xv+xml mxml -Navigation Control file for XML (for ePub) application/x-dtbncx+xml ncx -Network Common Data Form (NetCDF) application/x-netcdf nc -neuroLanguage application/vnd.neurolanguage.nlu nlu -New Moon Liftoff/DNA application/vnd.dna dna -N-Gage Game Data application/vnd.nokia.n-gage.data ngdat -N-Gage Game Installer application/vnd.nokia.n-gage.symbian.install n-gage -NobleNet Directory application/vnd.noblenet-directory nnd -NobleNet Sealer application/vnd.noblenet-sealer nns -NobleNet Web application/vnd.noblenet-web nnw -Nokia Radio Application - Preset application/vnd.nokia.radio-preset rpst -Nokia Radio Application - Preset application/vnd.nokia.radio-presets rpss -Notation3 text/n3 n3 -Novadigm's RADIA and EDM products application/vnd.novadigm.edm edm -Novadigm's RADIA and EDM products application/vnd.novadigm.edx edx -Novadigm's RADIA and EDM products application/vnd.novadigm.ext ext -NpGraphIt application/vnd.flographit gph -Nuera ECELP 4800 audio/vnd.nuera.ecelp4800 ecelp4800 -Nuera ECELP 7470 audio/vnd.nuera.ecelp7470 ecelp7470 -Nuera ECELP 9600 audio/vnd.nuera.ecelp9600 ecelp9600 -Office Document Architecture application/oda oda -Ogg application/ogg ogx -Ogg Audio audio/ogg oga -Ogg Video video/ogg ogv -OMA Download Agents application/vnd.oma.dd2+xml dd2 -OpenDocument Chart application/vnd.oasis.opendocument.chart odc -OpenDocument Chart Template application/vnd.oasis.opendocument.chart-template otc -OpenDocument Database application/vnd.oasis.opendocument.database odb -OpenDocument Formula application/vnd.oasis.opendocument.formula odf -OpenDocument Formula Template application/vnd.oasis.opendocument.formula-template odft -OpenDocument Graphics application/vnd.oasis.opendocument.graphics odg -OpenDocument Graphics Template application/vnd.oasis.opendocument.graphics-template otg -OpenDocument Image application/vnd.oasis.opendocument.image odi -OpenDocument Image Template application/vnd.oasis.opendocument.image-template oti -OpenDocument Presentation application/vnd.oasis.opendocument.presentation odp -OpenDocument Presentation Template application/vnd.oasis.opendocument.presentation-template otp -OpenDocument Spreadsheet application/vnd.oasis.opendocument.spreadsheet ods -OpenDocument Spreadsheet Template application/vnd.oasis.opendocument.spreadsheet-template ots -OpenDocument Text application/vnd.oasis.opendocument.text odt -OpenDocument Text Master application/vnd.oasis.opendocument.text-master odm -OpenDocument Text Template application/vnd.oasis.opendocument.text-template ott -Open Document Text Web application/vnd.oasis.opendocument.text-web oth -Open eBook Publication Structure application/oebps-package+xml opf -Open Financial Exchange application/vnd.intu.qbo qbo -OpenGL Textures (KTX) image/ktx ktx -OpenOffice - Calc (Spreadsheet) application/vnd.sun.xml.calc sxc -OpenOffice - Calc Template (Spreadsheet) application/vnd.sun.xml.calc.template stc -OpenOffice - Draw (Graphics) application/vnd.sun.xml.draw sxd -OpenOffice - Draw Template (Graphics) application/vnd.sun.xml.draw.template std -Open Office Extension application/vnd.openofficeorg.extension oxt -OpenOffice - Impress (Presentation) application/vnd.sun.xml.impress sxi -OpenOffice - Impress Template (Presentation) application/vnd.sun.xml.impress.template sti -OpenOffice - Math (Formula) application/vnd.sun.xml.math sxm -OpenOffice - Writer Template (Text - HTML) application/vnd.sun.xml.writer.template stw -OpenOffice - Writer (Text - HTML) application/vnd.sun.xml.writer.global sxg -OpenOffice - Writer (Text - HTML) application/vnd.sun.xml.writer sxw -Open Score Format application/vnd.yamaha.openscoreformat osf -OpenType Font File application/x-font-otf otf -Open Web Media Project - Audio audio/webm weba -Open Web Media Project - Video video/webm webm -OSFPVG application/vnd.yamaha.openscoreformat.osfpvg+xml osfpvg -OSGi Deployment Package application/vnd.osgi.dp dp -PalmOS Data application/vnd.palm pdb -Pascal Source File text/x-pascal p -PawaaFILE application/vnd.pawaafile paw -PCL 6 Enhanced (Formely PCL XL) application/vnd.hp-pclxl pclxl -Pcsel eFIF File application/vnd.picsel efif -PCX Image image/x-pcx pcx -Photoshop Document image/vnd.adobe.photoshop psd -PICSRules application/pics-rules prf -PICT Image image/x-pict pic -pIRCh application/x-chat chat -PKCS #10 - Certification Request Standard application/pkcs10 p10 -PKCS #12 - Personal Information Exchange Syntax Standard application/x-pkcs12 p12 -PKCS #7 - Cryptographic Message Syntax Standard application/pkcs7-mime p7m -PKCS #7 - Cryptographic Message Syntax Standard application/pkcs7-signature p7s -PKCS #7 - Cryptographic Message Syntax Standard (Certificate Request Response) application/x-pkcs7-certreqresp p7r -PKCS #7 - Cryptographic Message Syntax Standard (Certificates) application/x-pkcs7-certificates p7b -PKCS #8 - Private-Key Information Syntax Standard application/pkcs8 p8 -PocketLearn Viewers application/vnd.pocketlearn plf -Portable Anymap Image image/x-portable-anymap pnm -Portable Bitmap Format image/x-portable-bitmap pbm -Portable Compiled Format application/x-font-pcf pcf -Portable Font Resource application/font-tdpfr pfr -Portable Game Notation (Chess Games) application/x-chess-pgn pgn -Portable Graymap Format image/x-portable-graymap pgm -Portable Network Graphics (PNG) image/png png -Portable Pixmap Format image/x-portable-pixmap ppm -Portable Symmetric Key Container application/pskc+xml pskcxml -PosML application/vnd.ctc-posml pml -PostScript application/postscript ai -PostScript Fonts application/x-font-type1 pfa -PowerBuilder application/vnd.powerbuilder6 pbd -Pretty Good Privacy - Signature application/pgp-signature pgp -Preview Systems ZipLock/VBox application/vnd.previewsystems.box box -Princeton Video Image application/vnd.pvi.ptid1 ptid -Pronunciation Lexicon Specification application/pls+xml pls -Proprietary P&G Standard Reporting System application/vnd.pg.format str -Proprietary P&G Standard Reporting System application/vnd.pg.osasli ei6 -PRS Lines Tag text/prs.lines.tag dsc -PSF Fonts application/x-font-linux-psf psf -PubliShare Objects application/vnd.publishare-delta-tree qps -Qualcomm's Plaza Mobile Internet application/vnd.pmi.widget wg -QuarkXpress application/vnd.quark.quarkxpress qxd -QUASS Stream Player application/vnd.epson.esf esf -QUASS Stream Player application/vnd.epson.msf msf -QUASS Stream Player application/vnd.epson.ssf ssf -QuickAnime Player application/vnd.epson.quickanime qam -Quicken application/vnd.intu.qfx qfx -Quicktime Video video/quicktime qt -RAR Archive application/x-rar-compressed rar -Real Audio Sound audio/x-pn-realaudio-plugin rmp -Real Audio Sound audio/x-pn-realaudio ram -Really Simple Discovery application/rsd+xml rsd -RealMedia application/vnd.rn-realmedia rm -RealVNC application/vnd.realvnc.bed bed -Recordare Applications application/vnd.recordare.musicxml mxl -Recordare Applications application/vnd.recordare.musicxml+xml musicxml -Relax NG Compact Syntax application/relax-ng-compact-syntax rnc -RemoteDocs R-Viewer application/vnd.data-vision.rdz rdz -Resource Description Framework application/rdf+xml rdf -RetroPlatform Player application/vnd.cloanto.rp9 rp9 -RhymBox application/vnd.jisp jisp -Rich Text Format application/rtf rtf -Rich Text Format (RTF) text/richtext rtx -ROUTE 66 Location Based Services application/vnd.route66.link66+xml link66 -RSS - Really Simple Syndication application/rss+xml rss -SailingTracker application/vnd.sailingtracker.track st -Scalable Vector Graphics (SVG) image/svg+xml svg -ScheduleUs application/vnd.sus-calendar sus -Search/Retrieve via URL Response Format application/sru+xml sru -Secured eMail application/vnd.sema sema -Secured eMail application/vnd.semd semd -Secured eMail application/vnd.semf semf -Secure Electronic Transaction - Payment application/set-payment-initiation setpay -Secure Electronic Transaction - Registration application/set-registration-initiation setreg -SeeMail application/vnd.seemail see -Server-Based Certificate Validation Protocol - Validation Policies - Request application/scvp-vp-request spq -Server-Based Certificate Validation Protocol - Validation Policies - Response application/scvp-vp-response spp -Server-Based Certificate Validation Protocol - Validation Request application/scvp-cv-request scq -Server-Based Certificate Validation Protocol - Validation Response application/scvp-cv-response scs -Server Normal Format application/x-font-snf snf -Session Description Protocol application/sdp sdp -Setext text/x-setext etx -SGI Movie video/x-sgi-movie movie -Shana Informed Filler application/vnd.shana.informed.formdata ifm -Shana Informed Filler application/vnd.shana.informed.formtemplate itp -Shana Informed Filler application/vnd.shana.informed.interchange iif -Shana Informed Filler application/vnd.shana.informed.package ipk -Sharing Transaction Fraud Data application/thraud+xml tfi -Shell Archive application/x-shar shar -S Hexdump Format application/shf+xml shf -Silicon Graphics RGB Bitmap image/x-rgb rgb -SimpleAnimeLite Player application/vnd.epson.salt slt -Simply Accounting application/vnd.accpac.simply.aso aso -Simply Accounting - Data Import application/vnd.accpac.simply.imp imp -SimTech MindMapper application/vnd.simtech-mindmapper twd -Sixth Floor Media - CommonSpace application/vnd.commonspace csp -SMAF Audio application/vnd.yamaha.smaf-audio saf -SMAF File application/vnd.smaf mmf -SMAF Phrase application/vnd.yamaha.smaf-phrase spf -SMART Technologies Apps application/vnd.smart.teacher teacher -SourceView Document application/vnd.svd svd -SPARQL - Query application/sparql-query rq -SPARQL - Results application/sparql-results+xml srx -Speech Recognition Grammar Specification application/srgs gram -Speech Recognition Grammar Specification - XML application/srgs+xml grxml -Speech Synthesis Markup Language application/ssml+xml ssml -SSEYO Koan Play File application/vnd.koan skp -Standard Generalized Markup Language (SGML) text/sgml sgml -StarOffice - Calc application/vnd.stardivision.calc sdc -StarOffice - Draw application/vnd.stardivision.draw sda -StarOffice - Impress application/vnd.stardivision.impress sdd -StarOffice - Math application/vnd.stardivision.math smf -StarOffice - Writer application/vnd.stardivision.writer sdw -StarOffice - Writer (Global) application/vnd.stardivision.writer-global sgl -StepMania application/vnd.stepmania.stepchart sm -Stuffit Archive application/x-stuffit sit -Stuffit Archive application/x-stuffitx sitx -SudokuMagic application/vnd.solent.sdkm+xml sdkm -Sugar Linux Application Bundle application/vnd.olpc-sugar xo -Sun Audio - Au file format audio/basic au -SundaHus WQ application/vnd.wqd wqd -Symbian Install Package application/vnd.symbian.install sis -Synchronized Multimedia Integration Language application/smil+xml smi -SyncML application/vnd.syncml+xml xsm -SyncML - Device Management application/vnd.syncml.dm+wbxml bdm -SyncML - Device Management application/vnd.syncml.dm+xml xdm -Systems Biology Markup Language application/sbml+xml sbml -System V Release 4 CPIO Archive application/x-sv4cpio sv4cpio -System V Release 4 CPIO Checksum Data application/x-sv4crc sv4crc -Tab Seperated Values text/tab-separated-values tsv -Tagged Image File Format image/tiff tiff -Tao Intent application/vnd.tao.intent-module-archive tao -Tar File (Tape Archive) application/x-tar tar -Tcl Script application/x-tcl tcl -TeX application/x-tex tex -TeX Font Metric application/x-tex-tfm tfm -Text Encoding and Interchange application/tei+xml tei -Text File text/plain txt -TIBCO Spotfire application/vnd.spotfire.dxp dxp -TIBCO Spotfire application/vnd.spotfire.sfs sfs -Time Stamped Data Envelope application/timestamped-data tsd -Triscape Map Explorer application/vnd.triscape.mxs mxs -TRI Systems Config application/vnd.trid.tpt tpt -troff text/troff t -True BASIC application/vnd.trueapp tra -TrueType Font application/x-font-ttf ttf -Turtle (Terse RDF Triple Language) text/turtle ttl -UMAJIN application/vnd.umajin umj -Unique Object Markup Language application/vnd.uoml+xml uoml -Unity 3d application/vnd.unity unityweb -Universal Forms Description Language application/vnd.ufdl ufd -URI Resolution Services text/uri-list uri -User Interface Quartz - Theme (Symbian) application/vnd.uiq.theme utz -Ustar (Uniform Standard Tape Archive) application/x-ustar ustar -UUEncode text/x-uuencode uu -vCalendar text/x-vcalendar vcs -vCard text/x-vcard vcf -Video CD application/x-cdlink vcd -Viewport+ application/vnd.vsf vsf -VirtualCatalog application/vnd.vcx vcx -Virtual Reality Modeling Language model/vrml wrl -Virtue MTS model/vnd.mts mts -Virtue VTU model/vnd.vtu vtu -Visionary application/vnd.visionary vis -Vivo video/vnd.vivo viv -Voice Browser Call Control application/ccxml+xml, ccxml -VoiceXML application/voicexml+xml vxml -WAIS Source application/x-wais-source src -WAP Binary XML (WBXML) application/vnd.wap.wbxml wbxml -WAP Bitamp (WBMP) image/vnd.wap.wbmp wbmp -Waveform Audio File Format (WAV) audio/x-wav wav -Web Distributed Authoring and Versioning application/davmount+xml davmount -Web Open Font Format application/x-font-woff woff -WebP Image image/webp webp -Web Services Policy application/wspolicy+xml wspolicy -WebTurbo application/vnd.webturbo wtb -Widget Packaging and XML Configuration application/widget wgt -WinHelp application/winhlp hlp -Wireless Markup Language Script (WMLScript) text/vnd.wap.wmlscript wmls -Wireless Markup Language (WML) text/vnd.wap.wml wml -WMLScript application/vnd.wap.wmlscriptc wmlsc -Wordperfect application/vnd.wordperfect wpd -Worldtalk application/vnd.wt.stf stf -WSDL - Web Services Description Language application/wsdl+xml wsdl -X.509 Certificate application/x-x509-ca-cert der -X BitMap image/x-xbitmap xbm -Xfig application/x-xfig fig -XHTML - The Extensible HyperText Markup Language application/xhtml+xml xhtml -XML-Binary Optimized Packaging application/xop+xml xop -XML Configuration Access Protocol - XCAP Diff application/xcap-diff+xml xdf -XML Encryption Syntax and Processing application/xenc+xml xenc -XML - Extensible Markup Language application/xml xml -XML Patch Framework application/patch-ops-error+xml xer -XML Resource Lists application/resource-lists+xml rl -XML Resource Lists application/rls-services+xml rs -XML Resource Lists Diff application/resource-lists-diff+xml rld -XML Transformations application/xslt+xml xslt -XPInstall - Mozilla application/x-xpinstall xpi -X PixMap image/x-xpixmap xpm -XSPF - XML Shareable Playlist Format application/xspf+xml xspf -XUL - XML User Interface Language application/vnd.mozilla.xul+xml xul -X Window Dump image/x-xwindowdump xwd -XYZ File Format chemical/x-xyz xyz -YAML Ain't Markup Language / Yet Another Markup Language text/yaml yaml -YANG Data Modeling Language application/yang yang -YIN (YANG - XML) application/yin+xml yin -Zip Archive application/zip zip -Z.U.L. Geometry application/vnd.zul zir -ZVUE Media Manager application/vnd.handheld-entertainment+xml zmm -Zzazz Deck application/vnd.zzazz.deck+xml zaz diff --git a/share/db/mime_type.sql b/share/db/mime_type.sql deleted file mode 100644 index fd465cd0..00000000 --- a/share/db/mime_type.sql +++ /dev/null @@ -1,12 +0,0 @@ -DROP TABLE IF EXISTS mime_type; -CREATE TABLE IF NOT EXISTS mime_type ( - name varchar(128), - type varchar(128) NOT NULL DEFAULT '', - ext varchar(128), - PRIMARY KEY(type,ext) -); -CREATE INDEX IF NOT EXISTS mime_type_ext_idx ON mime_type (ext); -BEGIN TRANSACTION; -.separator \t -.import "mime_type.csv" mime_type -COMMIT; diff --git a/share/db/port b/share/db/port deleted file mode 100755 index 473aab60..00000000 --- a/share/db/port +++ /dev/null @@ -1,9 +0,0 @@ -#!/usr/bin/env perl -use strict; -use warnings; - -@ARGV = ('/etc/services'); -while (<>) { - m,^(\w+)\s+(\d+)/(\w+)\s+#\s*(.*?)$, or next; - print join(qq|\t|,map(/^\s*(.*?)\s*$/,$2,$3,$1)).qq|\n|; -} diff --git a/share/db/port.sql b/share/db/port.sql deleted file mode 100644 index eae612e5..00000000 --- a/share/db/port.sql +++ /dev/null @@ -1,8 +0,0 @@ -DROP TABLE IF EXISTS port; -CREATE TABLE IF NOT EXISTS port ( - port INT, - proto VARCHAR(3), - name VARCHAR(100), - PRIMARY KEY (port,proto,name), - FOREIGN KEY(name) REFERENCES service(name) -); diff --git a/share/db/shell_function b/share/db/shell_function deleted file mode 100755 index 8d3e03a6..00000000 --- a/share/db/shell_function +++ /dev/null @@ -1,56 +0,0 @@ -#!/usr/bin/env perl -use strict; -use warnings; -$|=1; - -my $TABLE = 'shell_function'; -my $q = chr(39); - -print '' - ."SELECT 'Update shell_function';\n" - ."DROP TABLE IF EXISTS $TABLE;\n" - ."CREATE TABLE $TABLE (name VARCHAR(255) PRIMARY KEY,code BLOB);\n" - ."BEGIN TRANSACTION;\n" -; -END { print "COMMIT;\n"; } - -#@ARGV = ("bash --login -c 'for f in `shell_functions`; do type \$f || continue; done' |"); -@ARGV = ("bash -norc -c 'for i in $ENV{NB_ROOT}/etc/profile.d/*; do . \$i; done; for f in `shell_functions`; do type \$f || continue; done' |"); -$? and die; -my @fct = ( '', () ); -while ( <> ) { - - if (/^(\S+) is a function$/) { - sql(@fct); - @fct = ( $1, () ); - next; - } - - next unless $fct[0]; - push @{$fct[1]}, $_; - -} -sql(@fct); - -exit 0; - -sub sql { - #use Data::Dumper; print Dumper(\@_),"\n"; return; - return if !@_ or !$_[0]; - my $k = $_[0]; - my $v = join('',map { - s/$q/$q.$q/ge; $_ - } @{ $_[1] }); - print qq|INSERT INTO $TABLE VALUES ($q$k$q,$q$v$q);\n|; - return; - - while (@{ $_[1] }) { - my $k = shift @{ $_[1] }; - next unless $k; - - my $v = shift @{ $_[1] }; - $v =~ s/$q/$q.$q/ge; - - #print qq|INSERT INTO $t VALUES ($q$k$q,$q$v$q);\n|; - } -} diff --git a/share/db/shell_function.sql b/share/db/shell_function.sql deleted file mode 100644 index 29e57826..00000000 --- a/share/db/shell_function.sql +++ /dev/null @@ -1,5 +0,0 @@ -DROP TABLE IF EXISTS shell_function; -CREATE TABLE shell_function ( - name VARCHAR(255) PRIMARY KEY, - code BLOB -); diff --git a/share/db/shell_replace.sh b/share/db/shell_replace.sh index ac33251c..61896b86 100644 --- a/share/db/shell_replace.sh +++ b/share/db/shell_replace.sh @@ -1,11 +1,11 @@ #!/bin/bash --login # # -# We want a new proper bash shell, we are going to search with `set` +# Find file to parse with shell_replace # # set +e -for f in $(shell_replace -find $NB_ROOT/*); do +[ "$NB_ROOT" = "" ] || for f in $(shell_replace -find $NB_ROOT/*); do echo "shell_replace $f" | sed "s; $NB_ROOT/; ;" shell_replace -i.shell_replace "$f" diff --git a/share/db/timezone b/share/db/timezone deleted file mode 100755 index 07238622..00000000 --- a/share/db/timezone +++ /dev/null @@ -1,13 +0,0 @@ -#!/usr/bin/env perl -use strict; -use warnings; -@ARGV = ('curl -s http://download.geonames.org/export/dump/timeZones.txt |'); - -my $i; -while (<>) { - next unless $i++; - chomp($_); - @_ = (split("\t",$_))[1,2,3,4]; - #$_[1] = join("\t",reverse split('/',$_[1])); - print join ("\t",@_)."\n"; -} diff --git a/share/db/timezone.csv b/share/db/timezone.csv deleted file mode 100644 index 29233ba3..00000000 --- a/share/db/timezone.csv +++ /dev/null @@ -1,424 +0,0 @@ -Africa/Abidjan 0.0 0.0 0.0 -Africa/Accra 0.0 0.0 0.0 -Africa/Addis_Ababa 3.0 3.0 3.0 -Africa/Algiers 1.0 1.0 1.0 -Africa/Asmara 3.0 3.0 3.0 -Africa/Bamako 0.0 0.0 0.0 -Africa/Bangui 1.0 1.0 1.0 -Africa/Banjul 0.0 0.0 0.0 -Africa/Bissau 0.0 0.0 0.0 -Africa/Blantyre 2.0 2.0 2.0 -Africa/Brazzaville 1.0 1.0 1.0 -Africa/Bujumbura 2.0 2.0 2.0 -Africa/Cairo 2.0 2.0 2.0 -Africa/Casablanca 0.0 1.0 0.0 -Africa/Ceuta 1.0 2.0 1.0 -Africa/Conakry 0.0 0.0 0.0 -Africa/Dakar 0.0 0.0 0.0 -Africa/Dar_es_Salaam 3.0 3.0 3.0 -Africa/Djibouti 3.0 3.0 3.0 -Africa/Douala 1.0 1.0 1.0 -Africa/El_Aaiun 0.0 1.0 0.0 -Africa/Freetown 0.0 0.0 0.0 -Africa/Gaborone 2.0 2.0 2.0 -Africa/Harare 2.0 2.0 2.0 -Africa/Johannesburg 2.0 2.0 2.0 -Africa/Juba 3.0 3.0 3.0 -Africa/Kampala 3.0 3.0 3.0 -Africa/Khartoum 3.0 3.0 3.0 -Africa/Kigali 2.0 2.0 2.0 -Africa/Kinshasa 1.0 1.0 1.0 -Africa/Lagos 1.0 1.0 1.0 -Africa/Libreville 1.0 1.0 1.0 -Africa/Lome 0.0 0.0 0.0 -Africa/Luanda 1.0 1.0 1.0 -Africa/Lubumbashi 2.0 2.0 2.0 -Africa/Lusaka 2.0 2.0 2.0 -Africa/Malabo 1.0 1.0 1.0 -Africa/Maputo 2.0 2.0 2.0 -Africa/Maseru 2.0 2.0 2.0 -Africa/Mbabane 2.0 2.0 2.0 -Africa/Mogadishu 3.0 3.0 3.0 -Africa/Monrovia 0.0 0.0 0.0 -Africa/Nairobi 3.0 3.0 3.0 -Africa/Ndjamena 1.0 1.0 1.0 -Africa/Niamey 1.0 1.0 1.0 -Africa/Nouakchott 0.0 0.0 0.0 -Africa/Ouagadougou 0.0 0.0 0.0 -Africa/Porto-Novo 1.0 1.0 1.0 -Africa/Sao_Tome 0.0 0.0 0.0 -Africa/Tripoli 2.0 2.0 2.0 -Africa/Tunis 1.0 1.0 1.0 -Africa/Windhoek 2.0 1.0 1.0 -America/Adak -10.0 -9.0 -10.0 -America/Anchorage -9.0 -8.0 -9.0 -America/Anguilla -4.0 -4.0 -4.0 -America/Antigua -4.0 -4.0 -4.0 -America/Araguaina -3.0 -3.0 -3.0 -America/Argentina/Buenos_Aires -3.0 -3.0 -3.0 -America/Argentina/Catamarca -3.0 -3.0 -3.0 -America/Argentina/Cordoba -3.0 -3.0 -3.0 -America/Argentina/Jujuy -3.0 -3.0 -3.0 -America/Argentina/La_Rioja -3.0 -3.0 -3.0 -America/Argentina/Mendoza -3.0 -3.0 -3.0 -America/Argentina/Rio_Gallegos -3.0 -3.0 -3.0 -America/Argentina/Salta -3.0 -3.0 -3.0 -America/Argentina/San_Juan -3.0 -3.0 -3.0 -America/Argentina/San_Luis -3.0 -3.0 -3.0 -America/Argentina/Tucuman -3.0 -3.0 -3.0 -America/Argentina/Ushuaia -3.0 -3.0 -3.0 -America/Aruba -4.0 -4.0 -4.0 -America/Asuncion -3.0 -4.0 -4.0 -America/Atikokan -5.0 -5.0 -5.0 -America/Bahia -3.0 -3.0 -3.0 -America/Bahia_Banderas -6.0 -5.0 -6.0 -America/Barbados -4.0 -4.0 -4.0 -America/Belem -3.0 -3.0 -3.0 -America/Belize -6.0 -6.0 -6.0 -America/Blanc-Sablon -4.0 -4.0 -4.0 -America/Boa_Vista -4.0 -4.0 -4.0 -America/Bogota -5.0 -5.0 -5.0 -America/Boise -7.0 -6.0 -7.0 -America/Cambridge_Bay -7.0 -6.0 -7.0 -America/Campo_Grande -3.0 -4.0 -4.0 -America/Cancun -5.0 -5.0 -5.0 -America/Caracas -4.0 -4.0 -4.0 -America/Cayenne -3.0 -3.0 -3.0 -America/Cayman -5.0 -5.0 -5.0 -America/Chicago -6.0 -5.0 -6.0 -America/Chihuahua -7.0 -6.0 -7.0 -America/Costa_Rica -6.0 -6.0 -6.0 -America/Creston -7.0 -7.0 -7.0 -America/Cuiaba -3.0 -4.0 -4.0 -America/Curacao -4.0 -4.0 -4.0 -America/Danmarkshavn 0.0 0.0 0.0 -America/Dawson -8.0 -7.0 -8.0 -America/Dawson_Creek -7.0 -7.0 -7.0 -America/Denver -7.0 -6.0 -7.0 -America/Detroit -5.0 -4.0 -5.0 -America/Dominica -4.0 -4.0 -4.0 -America/Edmonton -7.0 -6.0 -7.0 -America/Eirunepe -5.0 -5.0 -5.0 -America/El_Salvador -6.0 -6.0 -6.0 -America/Fort_Nelson -7.0 -7.0 -7.0 -America/Fortaleza -3.0 -3.0 -3.0 -America/Glace_Bay -4.0 -3.0 -4.0 -America/Godthab -3.0 -2.0 -3.0 -America/Goose_Bay -4.0 -3.0 -4.0 -America/Grand_Turk -4.0 -4.0 -4.0 -America/Grenada -4.0 -4.0 -4.0 -America/Guadeloupe -4.0 -4.0 -4.0 -America/Guatemala -6.0 -6.0 -6.0 -America/Guayaquil -5.0 -5.0 -5.0 -America/Guyana -4.0 -4.0 -4.0 -America/Halifax -4.0 -3.0 -4.0 -America/Havana -5.0 -4.0 -5.0 -America/Hermosillo -7.0 -7.0 -7.0 -America/Indiana/Indianapolis -5.0 -4.0 -5.0 -America/Indiana/Knox -6.0 -5.0 -6.0 -America/Indiana/Marengo -5.0 -4.0 -5.0 -America/Indiana/Petersburg -5.0 -4.0 -5.0 -America/Indiana/Tell_City -6.0 -5.0 -6.0 -America/Indiana/Vevay -5.0 -4.0 -5.0 -America/Indiana/Vincennes -5.0 -4.0 -5.0 -America/Indiana/Winamac -5.0 -4.0 -5.0 -America/Inuvik -7.0 -6.0 -7.0 -America/Iqaluit -5.0 -4.0 -5.0 -America/Jamaica -5.0 -5.0 -5.0 -America/Juneau -9.0 -8.0 -9.0 -America/Kentucky/Louisville -5.0 -4.0 -5.0 -America/Kentucky/Monticello -5.0 -4.0 -5.0 -America/Kralendijk -4.0 -4.0 -4.0 -America/La_Paz -4.0 -4.0 -4.0 -America/Lima -5.0 -5.0 -5.0 -America/Los_Angeles -8.0 -7.0 -8.0 -America/Lower_Princes -4.0 -4.0 -4.0 -America/Maceio -3.0 -3.0 -3.0 -America/Managua -6.0 -6.0 -6.0 -America/Manaus -4.0 -4.0 -4.0 -America/Marigot -4.0 -4.0 -4.0 -America/Martinique -4.0 -4.0 -4.0 -America/Matamoros -6.0 -5.0 -6.0 -America/Mazatlan -7.0 -6.0 -7.0 -America/Menominee -6.0 -5.0 -6.0 -America/Merida -6.0 -5.0 -6.0 -America/Metlakatla -9.0 -8.0 -9.0 -America/Mexico_City -6.0 -5.0 -6.0 -America/Miquelon -3.0 -2.0 -3.0 -America/Moncton -4.0 -3.0 -4.0 -America/Monterrey -6.0 -5.0 -6.0 -America/Montevideo -3.0 -3.0 -3.0 -America/Montserrat -4.0 -4.0 -4.0 -America/Nassau -5.0 -4.0 -5.0 -America/New_York -5.0 -4.0 -5.0 -America/Nipigon -5.0 -4.0 -5.0 -America/Nome -9.0 -8.0 -9.0 -America/Noronha -2.0 -2.0 -2.0 -America/North_Dakota/Beulah -6.0 -5.0 -6.0 -America/North_Dakota/Center -6.0 -5.0 -6.0 -America/North_Dakota/New_Salem -6.0 -5.0 -6.0 -America/Ojinaga -7.0 -6.0 -7.0 -America/Panama -5.0 -5.0 -5.0 -America/Pangnirtung -5.0 -4.0 -5.0 -America/Paramaribo -3.0 -3.0 -3.0 -America/Phoenix -7.0 -7.0 -7.0 -America/Port-au-Prince -5.0 -4.0 -5.0 -America/Port_of_Spain -4.0 -4.0 -4.0 -America/Porto_Velho -4.0 -4.0 -4.0 -America/Puerto_Rico -4.0 -4.0 -4.0 -America/Punta_Arenas -3.0 -3.0 -3.0 -America/Rainy_River -6.0 -5.0 -6.0 -America/Rankin_Inlet -6.0 -5.0 -6.0 -America/Recife -3.0 -3.0 -3.0 -America/Regina -6.0 -6.0 -6.0 -America/Resolute -6.0 -5.0 -6.0 -America/Rio_Branco -5.0 -5.0 -5.0 -America/Santarem -3.0 -3.0 -3.0 -America/Santiago -3.0 -4.0 -4.0 -America/Santo_Domingo -4.0 -4.0 -4.0 -America/Sao_Paulo -2.0 -3.0 -3.0 -America/Scoresbysund -1.0 0.0 -1.0 -America/Sitka -9.0 -8.0 -9.0 -America/St_Barthelemy -4.0 -4.0 -4.0 -America/St_Johns -3.5 -2.5 -3.5 -America/St_Kitts -4.0 -4.0 -4.0 -America/St_Lucia -4.0 -4.0 -4.0 -America/St_Thomas -4.0 -4.0 -4.0 -America/St_Vincent -4.0 -4.0 -4.0 -America/Swift_Current -6.0 -6.0 -6.0 -America/Tegucigalpa -6.0 -6.0 -6.0 -America/Thule -4.0 -3.0 -4.0 -America/Thunder_Bay -5.0 -4.0 -5.0 -America/Tijuana -8.0 -7.0 -8.0 -America/Toronto -5.0 -4.0 -5.0 -America/Tortola -4.0 -4.0 -4.0 -America/Vancouver -8.0 -7.0 -8.0 -America/Whitehorse -8.0 -7.0 -8.0 -America/Winnipeg -6.0 -5.0 -6.0 -America/Yakutat -9.0 -8.0 -9.0 -America/Yellowknife -7.0 -6.0 -7.0 -Antarctica/Casey 11.0 11.0 11.0 -Antarctica/Davis 7.0 7.0 7.0 -Antarctica/DumontDUrville 10.0 10.0 10.0 -Antarctica/Macquarie 11.0 11.0 11.0 -Antarctica/Mawson 5.0 5.0 5.0 -Antarctica/McMurdo 13.0 12.0 12.0 -Antarctica/Palmer -3.0 -3.0 -3.0 -Antarctica/Rothera -3.0 -3.0 -3.0 -Antarctica/Syowa 3.0 3.0 3.0 -Antarctica/Troll 0.0 2.0 0.0 -Antarctica/Vostok 6.0 6.0 6.0 -Arctic/Longyearbyen 1.0 2.0 1.0 -Asia/Aden 3.0 3.0 3.0 -Asia/Almaty 6.0 6.0 6.0 -Asia/Amman 2.0 3.0 2.0 -Asia/Anadyr 12.0 12.0 12.0 -Asia/Aqtau 5.0 5.0 5.0 -Asia/Aqtobe 5.0 5.0 5.0 -Asia/Ashgabat 5.0 5.0 5.0 -Asia/Atyrau 5.0 5.0 5.0 -Asia/Baghdad 3.0 3.0 3.0 -Asia/Bahrain 3.0 3.0 3.0 -Asia/Baku 4.0 4.0 4.0 -Asia/Bangkok 7.0 7.0 7.0 -Asia/Barnaul 7.0 7.0 7.0 -Asia/Beirut 2.0 3.0 2.0 -Asia/Bishkek 6.0 6.0 6.0 -Asia/Brunei 8.0 8.0 8.0 -Asia/Chita 9.0 9.0 9.0 -Asia/Choibalsan 8.0 8.0 8.0 -Asia/Colombo 5.5 5.5 5.5 -Asia/Damascus 2.0 3.0 2.0 -Asia/Dhaka 6.0 6.0 6.0 -Asia/Dili 9.0 9.0 9.0 -Asia/Dubai 4.0 4.0 4.0 -Asia/Dushanbe 5.0 5.0 5.0 -Asia/Famagusta 3.0 3.0 3.0 -Asia/Gaza 2.0 3.0 2.0 -Asia/Hebron 2.0 3.0 2.0 -Asia/Ho_Chi_Minh 7.0 7.0 7.0 -Asia/Hong_Kong 8.0 8.0 8.0 -Asia/Hovd 7.0 7.0 7.0 -Asia/Irkutsk 8.0 8.0 8.0 -Asia/Jakarta 7.0 7.0 7.0 -Asia/Jayapura 9.0 9.0 9.0 -Asia/Jerusalem 2.0 3.0 2.0 -Asia/Kabul 4.5 4.5 4.5 -Asia/Kamchatka 12.0 12.0 12.0 -Asia/Karachi 5.0 5.0 5.0 -Asia/Kathmandu 5.75 5.75 5.75 -Asia/Khandyga 9.0 9.0 9.0 -Asia/Kolkata 5.5 5.5 5.5 -Asia/Krasnoyarsk 7.0 7.0 7.0 -Asia/Kuala_Lumpur 8.0 8.0 8.0 -Asia/Kuching 8.0 8.0 8.0 -Asia/Kuwait 3.0 3.0 3.0 -Asia/Macau 8.0 8.0 8.0 -Asia/Magadan 11.0 11.0 11.0 -Asia/Makassar 8.0 8.0 8.0 -Asia/Manila 8.0 8.0 8.0 -Asia/Muscat 4.0 4.0 4.0 -Asia/Nicosia 2.0 3.0 2.0 -Asia/Novokuznetsk 7.0 7.0 7.0 -Asia/Novosibirsk 7.0 7.0 7.0 -Asia/Omsk 6.0 6.0 6.0 -Asia/Oral 5.0 5.0 5.0 -Asia/Phnom_Penh 7.0 7.0 7.0 -Asia/Pontianak 7.0 7.0 7.0 -Asia/Pyongyang 8.5 8.5 8.5 -Asia/Qatar 3.0 3.0 3.0 -Asia/Qyzylorda 6.0 6.0 6.0 -Asia/Riyadh 3.0 3.0 3.0 -Asia/Sakhalin 11.0 11.0 11.0 -Asia/Samarkand 5.0 5.0 5.0 -Asia/Seoul 9.0 9.0 9.0 -Asia/Shanghai 8.0 8.0 8.0 -Asia/Singapore 8.0 8.0 8.0 -Asia/Srednekolymsk 11.0 11.0 11.0 -Asia/Taipei 8.0 8.0 8.0 -Asia/Tashkent 5.0 5.0 5.0 -Asia/Tbilisi 4.0 4.0 4.0 -Asia/Tehran 3.5 4.5 3.5 -Asia/Thimphu 6.0 6.0 6.0 -Asia/Tokyo 9.0 9.0 9.0 -Asia/Tomsk 7.0 7.0 7.0 -Asia/Ulaanbaatar 8.0 8.0 8.0 -Asia/Urumqi 6.0 6.0 6.0 -Asia/Ust-Nera 10.0 10.0 10.0 -Asia/Vientiane 7.0 7.0 7.0 -Asia/Vladivostok 10.0 10.0 10.0 -Asia/Yakutsk 9.0 9.0 9.0 -Asia/Yangon 6.5 6.5 6.5 -Asia/Yekaterinburg 5.0 5.0 5.0 -Asia/Yerevan 4.0 4.0 4.0 -Atlantic/Azores -1.0 0.0 -1.0 -Atlantic/Bermuda -4.0 -3.0 -4.0 -Atlantic/Canary 0.0 1.0 0.0 -Atlantic/Cape_Verde -1.0 -1.0 -1.0 -Atlantic/Faroe 0.0 1.0 0.0 -Atlantic/Madeira 0.0 1.0 0.0 -Atlantic/Reykjavik 0.0 0.0 0.0 -Atlantic/South_Georgia -2.0 -2.0 -2.0 -Atlantic/St_Helena 0.0 0.0 0.0 -Atlantic/Stanley -3.0 -3.0 -3.0 -Australia/Adelaide 10.5 9.5 9.5 -Australia/Brisbane 10.0 10.0 10.0 -Australia/Broken_Hill 10.5 9.5 9.5 -Australia/Currie 11.0 10.0 10.0 -Australia/Darwin 9.5 9.5 9.5 -Australia/Eucla 8.75 8.75 8.75 -Australia/Hobart 11.0 10.0 10.0 -Australia/Lindeman 10.0 10.0 10.0 -Australia/Lord_Howe 11.0 10.5 10.5 -Australia/Melbourne 11.0 10.0 10.0 -Australia/Perth 8.0 8.0 8.0 -Australia/Sydney 11.0 10.0 10.0 -Europe/Amsterdam 1.0 2.0 1.0 -Europe/Andorra 1.0 2.0 1.0 -Europe/Astrakhan 4.0 4.0 4.0 -Europe/Athens 2.0 3.0 2.0 -Europe/Belgrade 1.0 2.0 1.0 -Europe/Berlin 1.0 2.0 1.0 -Europe/Bratislava 1.0 2.0 1.0 -Europe/Brussels 1.0 2.0 1.0 -Europe/Bucharest 2.0 3.0 2.0 -Europe/Budapest 1.0 2.0 1.0 -Europe/Busingen 1.0 2.0 1.0 -Europe/Chisinau 2.0 3.0 2.0 -Europe/Copenhagen 1.0 2.0 1.0 -Europe/Dublin 0.0 1.0 0.0 -Europe/Gibraltar 1.0 2.0 1.0 -Europe/Guernsey 0.0 1.0 0.0 -Europe/Helsinki 2.0 3.0 2.0 -Europe/Isle_of_Man 0.0 1.0 0.0 -Europe/Istanbul 3.0 3.0 3.0 -Europe/Jersey 0.0 1.0 0.0 -Europe/Kaliningrad 2.0 2.0 2.0 -Europe/Kiev 2.0 3.0 2.0 -Europe/Kirov 3.0 3.0 3.0 -Europe/Lisbon 0.0 1.0 0.0 -Europe/Ljubljana 1.0 2.0 1.0 -Europe/London 0.0 1.0 0.0 -Europe/Luxembourg 1.0 2.0 1.0 -Europe/Madrid 1.0 2.0 1.0 -Europe/Malta 1.0 2.0 1.0 -Europe/Mariehamn 2.0 3.0 2.0 -Europe/Minsk 3.0 3.0 3.0 -Europe/Monaco 1.0 2.0 1.0 -Europe/Moscow 3.0 3.0 3.0 -Europe/Oslo 1.0 2.0 1.0 -Europe/Paris 1.0 2.0 1.0 -Europe/Podgorica 1.0 2.0 1.0 -Europe/Prague 1.0 2.0 1.0 -Europe/Riga 2.0 3.0 2.0 -Europe/Rome 1.0 2.0 1.0 -Europe/Samara 4.0 4.0 4.0 -Europe/San_Marino 1.0 2.0 1.0 -Europe/Sarajevo 1.0 2.0 1.0 -Europe/Saratov 4.0 4.0 4.0 -Europe/Simferopol 3.0 3.0 3.0 -Europe/Skopje 1.0 2.0 1.0 -Europe/Sofia 2.0 3.0 2.0 -Europe/Stockholm 1.0 2.0 1.0 -Europe/Tallinn 2.0 3.0 2.0 -Europe/Tirane 1.0 2.0 1.0 -Europe/Ulyanovsk 4.0 4.0 4.0 -Europe/Uzhgorod 2.0 3.0 2.0 -Europe/Vaduz 1.0 2.0 1.0 -Europe/Vatican 1.0 2.0 1.0 -Europe/Vienna 1.0 2.0 1.0 -Europe/Vilnius 2.0 3.0 2.0 -Europe/Volgograd 3.0 3.0 3.0 -Europe/Warsaw 1.0 2.0 1.0 -Europe/Zagreb 1.0 2.0 1.0 -Europe/Zaporozhye 2.0 3.0 2.0 -Europe/Zurich 1.0 2.0 1.0 -Indian/Antananarivo 3.0 3.0 3.0 -Indian/Chagos 6.0 6.0 6.0 -Indian/Christmas 7.0 7.0 7.0 -Indian/Cocos 6.5 6.5 6.5 -Indian/Comoro 3.0 3.0 3.0 -Indian/Kerguelen 5.0 5.0 5.0 -Indian/Mahe 4.0 4.0 4.0 -Indian/Maldives 5.0 5.0 5.0 -Indian/Mauritius 4.0 4.0 4.0 -Indian/Mayotte 3.0 3.0 3.0 -Indian/Reunion 4.0 4.0 4.0 -Pacific/Apia 14.0 13.0 13.0 -Pacific/Auckland 13.0 12.0 12.0 -Pacific/Bougainville 11.0 11.0 11.0 -Pacific/Chatham 13.75 12.75 12.75 -Pacific/Chuuk 10.0 10.0 10.0 -Pacific/Easter -5.0 -6.0 -6.0 -Pacific/Efate 11.0 11.0 11.0 -Pacific/Enderbury 13.0 13.0 13.0 -Pacific/Fakaofo 13.0 13.0 13.0 -Pacific/Fiji 13.0 12.0 12.0 -Pacific/Funafuti 12.0 12.0 12.0 -Pacific/Galapagos -6.0 -6.0 -6.0 -Pacific/Gambier -9.0 -9.0 -9.0 -Pacific/Guadalcanal 11.0 11.0 11.0 -Pacific/Guam 10.0 10.0 10.0 -Pacific/Honolulu -10.0 -10.0 -10.0 -Pacific/Kiritimati 14.0 14.0 14.0 -Pacific/Kosrae 11.0 11.0 11.0 -Pacific/Kwajalein 12.0 12.0 12.0 -Pacific/Majuro 12.0 12.0 12.0 -Pacific/Marquesas -9.5 -9.5 -9.5 -Pacific/Midway -11.0 -11.0 -11.0 -Pacific/Nauru 12.0 12.0 12.0 -Pacific/Niue -11.0 -11.0 -11.0 -Pacific/Norfolk 11.0 11.0 11.0 -Pacific/Noumea 11.0 11.0 11.0 -Pacific/Pago_Pago -11.0 -11.0 -11.0 -Pacific/Palau 9.0 9.0 9.0 -Pacific/Pitcairn -8.0 -8.0 -8.0 -Pacific/Pohnpei 11.0 11.0 11.0 -Pacific/Port_Moresby 10.0 10.0 10.0 -Pacific/Rarotonga -10.0 -10.0 -10.0 -Pacific/Saipan 10.0 10.0 10.0 -Pacific/Tahiti -10.0 -10.0 -10.0 -Pacific/Tarawa 12.0 12.0 12.0 -Pacific/Tongatapu 14.0 13.0 13.0 -Pacific/Wake 12.0 12.0 12.0 -Pacific/Wallis 12.0 12.0 12.0 diff --git a/share/db/timezone.sql b/share/db/timezone.sql deleted file mode 100644 index db67672a..00000000 --- a/share/db/timezone.sql +++ /dev/null @@ -1,12 +0,0 @@ -DROP TABLE IF EXISTS timezone; -CREATE TABLE IF NOT EXISTS timezone ( - id varchar(2) PRIMARY KEY, - -- capital varchar(300), - -- continent varchar(300), - gmt float(1,1), - dst float(1,1), - raw float(1,1) -); -BEGIN TRANSACTION; -.import "timezone.csv" timezone -COMMIT; diff --git a/share/db/update.sh b/share/db/update.sh index 62035681..ff9b6918 100755 --- a/share/db/update.sh +++ b/share/db/update.sh @@ -1,90 +1,15 @@ #!/bin/bash --login # # -# We want a new proper bash shell, we are going to search with `set` +# Update $NB_DB # # set +e -TMP=`mktemp -d` -DIR=$(dirname "$0") -cd "$DIR" +cd "$(dirname "$0")" && ( -main() { -( - -$(dbq f=txt a=db.sql db-type=sqlite db=pub 'table-name=!~^(zipcode|geo)') -$(echo "VACUUM;") + echo 'PRAGMA encoding="UTF-8";' + echo 'PRAGMA foreign_keys=OFF;' + dbq2sqlite db=pub 'table-name=!~^(zipcode|geo)' + echo 'VACUUM;' ) | sqlite3 "nb.db" - -rm -rf "$TMP" -} - -update_csv() { - local t=$1 - ./$t > $TMP/$t.csv - [ -s $TMP/$t.csv ] && mv $TMP/$t.csv $t.csv && echo Update $t.csv 1>&2 -} - -csv2table() { - local name="$1"; shift - local file="$1"; shift - - cat << EOF -CREATE TEMPORARY TABLE IF NOT EXISTS _var (k varchar(10),v varhcar(10)); -DELETE FROM _var; - -DROP TABLE IF EXISTS ${name}_tmp; -CREATE TEMPORARY TABLE ${name}_tmp AS SELECT * FROM $name WHERE 0; - -INSERT INTO _var VALUES('pre',(SELECT count(*) FROM ${name})); - --- SELECT 'Update $name ('||(SELECT count(*) FROM ${name})||')'; - -BEGIN TRANSACTION; -.import "$file" ${name}_tmp -COMMIT; -INSERT INTO _var VALUES('import',(SELECT count(*) FROM ${name}_tmp)); - -INSERT OR IGNORE INTO $name SELECT * FROM ${name}_tmp; -INSERT INTO _var VALUES('post',(SELECT count(*) FROM ${name})); - -SELECT 'Update $name (' - || ((SELECT v FROM _var WHERE k='post')-(SELECT v FROM _var WHERE k='pre')) - || '/' - ||(SELECT v FROM _var WHERE k='import') -||')' -||' = ('||(SELECT count(*) FROM ${name})||')' -; -EOF -} - -shell_functions2sql() { - local t="$1"; shift - local f - ( - for f in `shell_functions`; do - type "$f" || continue - done - ) | perl -MData::Dumper -e ' -BEGIN{$t=shift @ARGV and print qq|PRAGMA encoding="UTF-8";\n| -."DROP TABLE IF EXISTS $t;\n" -."CREATE TABLE $t (name VARCHAR(255) PRIMARY KEY,code BLOB);\n" -and $t="INSERT INTO $t "; -$|=1; -} -$_=join("",<>);@_=(map{s/^\s*(.*?)\s*$/$1/m;$_}split(/^(.*?) is a function$/m,$_)); -0&&die Dumper(\\@_); -0&&die Dumper($_[2]); -$q=chr(39); -while (@_) { - $k=shift @_; - next unless $k; - $v=shift @_; - $v =~ s/$q/$q.$q/ge; - print $t.qq|VALUES ($q$k$q,$q$v$q);\n|; -} -' "$t" -} - -main diff --git a/share/db/useragent b/share/db/useragent deleted file mode 100755 index c410f15e..00000000 --- a/share/db/useragent +++ /dev/null @@ -1,3 +0,0 @@ -#!/usr/bin/env bash -[ -n "$NB_ROOT" ] || . "$(dirname "$0")/../../etc/profile" || exit -xml2csv http://www.user-agents.org/allagents.xml diff --git a/share/db/useragent.csv b/share/db/useragent.csv deleted file mode 100644 index 6aa9f83d..00000000 --- a/share/db/useragent.csv +++ /dev/null @@ -1,2459 +0,0 @@ -id_a_f_3 !Susie (http://www.sync2it.com/susie) Sync2It bookmark management & clustering engine C R http://www.sync2it.com -id_a_f_6 UnChaos From Chaos To Order Hybrid Web Search Engine.(vadim_gonchar@unchaos.com) UnCHAOS search robot R Site is dead http://www.unchaos.com/ -id_a_f_7 UnChaos Bot Hybrid Web Search Engine. (vadim_gonchar@unchaos.com) UnCHAOS search robot R Site is dead http://www.unchaos.com/ -id_a_f_8 UnChaosBot From Chaos To Order UnChaos Hybrid Web Search Engine at www.unchaos.com (info@unchaos.com) UnCHAOS search robot R Site is dead http://www.unchaos.com/ -id_a_f_9 http://www.sygol.com Sygol Search (Italy) robot R s.also SygolBot http://www.sygol.com/ -id_a_f_4 ( Robots.txt Validator http://www.searchengineworld.com/cgi-bin/robotcheck.cgi ) SearchEngineWorld's robots.txt validator C Services is no more available http://www.searchengineworld.com/cgi-bin/robotcheck.cgi -id_a_f_171105_1 (DreamPassport/3.0; isao/MyDiGiRabi) DreamCast DreamPassport browser B http://www.dricas.com/dp/ -id_a_f_290606_1 (Privoxy/1.0) Privoxy web proxy P s.also Privoxy/3.0 (Anonymous) http://www.privoxy.org/ -id_a_f_230507_1 */Nutch-0.9-dev Unknown Yahoo robot R 123.113.184.2xx http://www.yahoo.com -id_a_f_5 +SitiDi.net/SitiDiBot/1.0 (+Have Good Day) SitiDi.net search (Germany) robot R http://www.sitidi.net/ -id_a_f_1 -DIE-KRAEHE- META-SEARCH-ENGINE/1.1 http://www.die-kraehe.de Die Kraehe Meta-Search-Engine (Germany) link checking R http://www.die-kraehe.de -id_a_f_060206_1 123spider-Bot (Version: 1.02, powered by www.123spider.de 123spider.de (Germany) web directory link checking C http://www.123spider.de/ -id_a_f_180806_1 192.comAgent 192.com - UK web directory R 217.160.75.2xx http://www.192.com/ -id_a_f_060606_1 1st ZipCommander (Net) - http://www.zipcommander.com/ 1st ZipCommander Net - IE based browser B http://www.zipcommander.com/ -id_a_f_10 2Bone_LinkChecker/1.0 libwww-perl/5.64 2Bone online link checker C http://www.2bone.com/links/linkchecker.shtml -id_a_f_11 4anything.com LinkChecker v2.0 4Anything robot R http://www.4anything.com -id_a_f_110207_1 8484 Boston Project v 1.0 Unknown guestbook spamming or harvesting tool from diff. IPs S s. various honey pot sites http://www.projecthoneypot.org/bsh_X19tb2RlPWdsb2JhbCZfX2J5PWMmY3RyeT11cyZ1YWc9ODQ4NCtCb3N0b24rUHJvamVjdCt2KzEuMA.. -id_a_f_2 :robot/1.0 (linux) ( admin e-mail: undefined http://www.neofonie.de/loesungen/search/robot.html ) neofonie search robot Germany R http://www.neofonie.de/loesungen/search/ -id_a_f_12 A-Online Search A-Online.at robot - now Jet2Web Search R http://www.jet2web.net/portal -id_a_f_090707_1 A1 Keyword Research/1.0.2 (+http://www.micro-sys.dk/products/keyword-research/) miggibot/2007.03.27 A1 Keyword Research - search engine and keyword optimization software C http://www.micro-sys.dk/products/keyword-research/ -id_a_f_100906_1 A1 Sitemap Generator/1.0 (+http://www.micro-sys.dk/products/sitemap-generator/) miggibot/2006.01.24 MiggiBot website crawler engine - A1 Sitemap Generator R http://www.micro-sys.dk/products/sitemap-generator/ http://www.micro-sys.dk/developer/miggibot/ -id_a_f_250408_2 aardvark-crawler Aardvark web crawler for Sun's Blog recommendations R 192.9.71.7x http://blogs.sun.com/plamere/ -id_a_f_13 AbachoBOT Abacho / Crawler.de robot R http://www.abacho.com -id_a_f_14 AbachoBOT (Mozilla compatible) Abacho / Crawler.de robot R http://www.abacho.com -id_a_f_15 ABCdatos BotLink/5.xx.xxx#BBL ABCdatos - Castilian program & tutorial directory R http://www.abcdatos.com -id_a_f_16 Aberja Checkomat Aberja Hybridsuchmaschine (Germany) link checking R http://www.aberja.de -id_a_f_17 abot/0.1 (abot; http://www.abot.com; abot@abot.com) Nameprotect copyright search robot (24.177.134.x) R s. also - np/0.1_(np;_http://www.nameprotect.com... - aipbot/1.0 (aipbot; http://www.aipbot.com... http://www.nameprotect.com/ -id_a_f_18 About/0.1libwww-perl/5.47 About robot R http://www.about.com -id_a_f_051206_3 Accelatech RSSCrawler/0.4 Accela Technology RSS feed crawler R 125.100.242.2xx http://www.accelatech.com/ -id_a_f_19 accoona Accoona Search robot R 65.17.255.xx http://www.accoona.com -id_a_f_20 Accoona-AI-Agent/1.1.1 (crawler at accoona dot com) Accoona Search robot R 65.17.255.xx http://www.accoona.com -id_a_f_140906_3 Accoona-AI-Agent/1.1.2 (aicrawler at accoonabot dot com) Accoona Search robot R 65.17.255.xx http://www.accoona.com -id_a_f_21 Ace Explorer Ace Explorer - IE based browser B http://www.aceexplorer.com -id_a_f_280806_1 Ack (http://www.ackerm.com/) Ackerm search robot R 64.74.153.xx http://www.ackerm.com/ -id_a_f_22 AcoiRobot Acoi picture finder robot R http://monetdb.cwi.nl/acoi/projects.html -id_a_f_23 Acoon Robot v1.50.001 Acoon.de search (Germany) robot R 80.237.153.10x http://www.acoon.de -id_a_f_24 Acoon Robot v1.52 (http://www.acoon.de) Acoon.de search (Germany) robot R 80.237.153.10x http://www.acoon.de -id_a_f_100508_1 Acoon-Robot 4.0.x.[xx] (http://www.acoon.de) Acoon.de search (Germany) robot R 80.237.209.xx http://www.acoon.de -id_a_f_010108_1 Acoon-Robot v3.xx (http://www.acoon.de and http://www.acoon.com) Acoon.de search (Germany) robot R 80.237.153.10x http://www.acoon.de -id_a_f_110507_1 Acorn/Nutch-0.9 (Non-Profit Search Engine; acorn.isara.org; acorn at isara dot org) Acorn Search Project R 124.157.145.1xx http://acorn.no-ip.org/ -id_a_f_25 ActiveBookmark 1.x LibMaster.com Active Bookmark HTML page creator C B http://www.libmaster.com/software.php -id_a_f_060806_2 Activeworlds Activeworlds 3D homepage browser B http://www.activeworlds.com -id_a_f_26 ActiveWorlds/3.xx (xxx) Activeworlds 3D homepage browser B http://www.activeworlds.com -id_a_f_27 Ad Muncher v4.xx.x Ad Muncher - banner killer P http://www.admuncher.com/ -id_a_f_28 Ad Muncher v4x Build xxxxx Ad Muncher - banner killer P http://www.admuncher.com/ -id_a_f_061006_1 Adaxas Spider (http://www.adaxas.net/) website directory adaxas link checking C 85.10.199.xx http://www.adaxas.net/ -id_a_f_29 Advanced Browser (http://www.avantbrowser.com) Avant Browser - IE based browser B http://www.avantbrowser.com -id_a_f_30 AESOP_com_SpiderMan Aesop robot R http://www.aesop.com -id_a_f_31 agadine/1.x.x (+http://www.agada.de) Agada search (Germany) robot R s. also Mozilla/4.0 (agadine3.0) http://www.agada.de -id_a_f_32 Agent-SharewarePlazaFileCheckBot/2.0+(+http://www.SharewarePlaza.com) SharewarePlaza link checking R http://www.sharewareplaza.com -id_a_f_33 AgentName/0.1 libwww-perl/5.48 Linkomatic submission verifier R http://www.linkomatic.com/ -id_a_f_34 AIBOT/2.1 By +(www.21seek.com A Real artificial intelligence search engine China) 21seek.com (China) robot (218.17.90.xxx) R http://www.21seek.com -id_a_f_130807_1 AideRSS/1.0 (aiderss.com) AideRss - Postrank RSS and Blog filtering C 72.44.35.2xx http://www.aiderss.com/ -id_a_f_35 aipbot/1.0 (aipbot; http://www.aipbot.com; aipbot@aipbot.com) Nameprotect copyright search robot (24.177.134.x) R s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com... http://www.nameprotect.com/ -id_a_f_36 aipbot/2-beta (aipbot dev; http://aipbot.com; aipbot@aipbot.com) Nameprotect copyright search robot (24.177.134.x) R s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com... http://www.nameprotect.com/ -id_a_f_291108_1 Akregator/1.2.9; librss/remnants Akregator news feed reader for KDE B http://akregator.kde.org/ -id_a_f_37 Aladin/3.324 Aladin robot R http://www.aladin.de -id_a_f_180408_1 Alcatel-BG3/1.0 UP.Browser/5.0.3.1.2 Phone.com UP.Browser for mobiles on Alcatel cellphone B http://www.openwave.com -id_a_f_38 Aleksika Spider/1.0 (+http://www.aleksika.com/) Aleksika Danmark - Search engine optimization spider R http://www.aleksika.com -id_a_f_291108_2 AlertInfo 2.0 (Powered by Newsbrain) Alertinfo - French version of Feedreader 3.xx B http://www.feedreader.com/ http://www.geste.fr/alertinfo/home.html -id_a_f_39 AlkalineBOT/1.3 Vestris robot R http://alkaline.vestris.com/ -id_a_f_40 AlkalineBOT/1.4 (1.4.0326.0 RTM) Vestris robot R http://alkaline.vestris.com/ -id_a_f_41 Allesklar/0.1 libwww-perl/5.46 Allesklar.de robot R http://www.allesklar.de -id_a_f_42 Alligator 1.31 (www.nearsoftware.com) Alligator download manager D http://www.nearsoftware.com -id_a_f_011108_1 Allrati/1.1 (+) Unknown robot from Allrati.com R 67.205.96.xxx/67.205.104.xx http://www.allrati.com/ -id_a_f_43 AltaVista Intranet V2.0 AVS EVAL search@freeit.com Altavista robot R http://www.altavista.com -id_a_f_44 AltaVista Intranet V2.0 Compaq Altavista Eval sveand@altavista.net Altavista robot R http://www.altavista.com -id_a_f_45 AltaVista Intranet V2.0 evreka.com crawler@evreka.com Altavista robot R http://www.altavista.com -id_a_f_46 AltaVista V2.0B crawler@evreka.com Altavista robot R http://www.altavista.com -id_a_f_280209_1 amaya/x.xx libwww/x.x.x Amaya - W3C's Editor/Browser B http://www.w3.org/Amaya/ -id_a_f_47 AmfibiBOT Amfibi Search robot R 64.111.217.9x http://www.amfibi.com/ -id_a_f_48 Amfibibot/0.06 (Amfibi Web Search; http://www.amfibi.com; agent@amfibi.com) Amfibi Search robot R 64.111.217.9x http://www.amfibi.com/ -id_a_f_141105_2 Amfibibot/0.07 (Amfibi Robot; http://www.amfibi.com; agent@amfibi.com) Amfibi Search robot R 64.111.217.9x http://www.amfibi.com/ -id_a_f_49 amibot amibot - Amidalla search engine robot (62.241.33.xx) R s. also libwww-perl/5.65 http://www.amidalla.com/ -id_a_f_50 Amiga-AWeb/3.4.167SE AWeb Amiga browser B http://www.amitrix.com/aweb.html -id_a_f_51 AmigaVoyager/3.4.4 (MorphOS/PPC native) Voyager - Amiga browser B http://www.vapor.com/voyager/ -id_a_f_091205_1 AmiTCP Miami (AmigaOS 2.04) Amiga Miami TCP Stack http://home.ptd.net/~strdustr/amirc/Netware.html -id_a_f_210608_1 Amoi 8512/R21.0 NF-Browser/3.3 NF embedded browser on Amois Skypephone B http://3skypephone.com/ -id_a_f_190206_3 amzn_assoc Amazon.com robot for checking their affiliate sites C s. also aranhabot -id_a_f_52 AnnoMille spider 0.1 alpha - http://www.annomille.it Annomille Italian historical oriented robot R http://www.annomille.it -id_a_f_53 annotate_google; http://ponderer.org/download/annotate_google.user.js annotate Google - Firefox extension for annotating Google search results B http://ponderer.org/annotate_google -id_a_f_54 Anonymized by ProxyOS: http://www.megaproxy.com Megaproxy user P http://www.megaproxy.com -id_a_f_55 Anonymizer/1.1 faked user agent -id_a_f_56 AnswerBus (http://www.answerbus.com/) AnswerBus natural language search using COLLATE technology R http://www.answerbus.com http://collate.dfki.de/kurzdarstellung.html -id_a_f_57 AnswerChase PROve x.0 AnswerChase search tool http://www.answerchase.com -id_a_f_58 AnswerChase x.0 AnswerChase search tool http://www.answerchase.com -id_a_f_59 ANTFresco/x.xx ANT Fresco Browser B s. also Mozilla/x.xx (compatible; ANTFresco....) http://www.antlimited.com/products/fresco.htm -id_a_f_60 antibot-V1.1.5/i586-linux-2.2 Antibot (discontinued) robot R http://www.antidot.net -id_a_f_61 AnzwersCrawl/2.0 (anzwerscrawl@anzwers.com.au;Engine) Anzwers (Yahoo) Australia robot R http://au.anzwers.yahoo.com/ -id_a_f_030206_1 Apexoo Spider 1.x Apexoo Search spider R 216.240.143.xx http://www.apexoo.com/ -id_a_f_62 Aplix HTTP/1.0.1 JavaOS app. for SEGA Saturn Internet and Sanyo Internet-TV B -id_a_f_63 Aplix_SANYO_browser/1.x (Japanese) JavaOS app. for Sanyo Internet-TV B -id_a_f_64 Aplix_SEGASATURN_browser/1.x (Japanese) JavaOS app. for SEGA Saturn Internet B -id_a_f_65 Aport Aport robot R http://www.aport.ru -id_a_f_66 appie 1.1 (www.walhello.com) Walhello Internet Search robot R http://www.walhello.com -id_a_f_140608_1 Apple iPhone v1.1.4 CoreMedia v1.0.0.4A102 CoreMedia player on Apple iPhone B http://www.apple.com/iphone/ -id_a_f_070209_1 Apple-PubSub/65.1.1 PubSub - Mac OS X utility for managing RSS/Atom subscriptions via the PubSub framework B http://developer.apple.com/documentation/Darwin/Reference/ManPages/man1/pubsub.1.html -id_a_f_120707_1 ArabyBot (compatible; Mozilla/5.0; GoogleBot; FAST Crawler 6.4; http://www.araby.com;) Araby search - Arabia R 209.85.31.2xx http://www.araby.com/ -id_a_f_260608_1 ArachBot Covac Arachnid Web Crawler R s.also Covac TexAs Arachbot http://www.covac-software.com/ -id_a_f_67 Arachnoidea (arachnoidea@euroseek.com) Euroseek spider R http://www.euroseek.com -id_a_f_190206_2 aranhabot Amazon.com robot for checking their affiliate sites C s. also amzn_assoc -id_a_f_68 ArchitextSpider Excite spider R http://www.excite.com -id_a_f_69 archive.org_bot Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/... http://www.archive.org/ -id_a_f_70 Argus/1.1 (Nutch; http://www.simpy.com/bot.html; feedback at simpy dot com) Simpy Bookmarklet crawler (69.55.233.xx) C s. also Simpy http://www.simpy.com/ -id_a_f_031205_1 Arikus_Spider Arikus inContext search engine software R http://www.arikus.com/inContext-enterprise.html -id_a_f_210208_1 Arquivo-web-crawler (compatible; heritrix/1.12.1 +http://arquivo-web.fccn.pt) Tomba project: the Portuguese web archive R 193.136.192.xx http://arquivo-web.fccn.pt/ http://arquivo-web.fccn.pt/crawler?set_language=en -id_a_f_251007_1 ASAHA Search Engine Turkey V.001 (http://www.asaha.com/) Asaha search robot (Turkey) R 62.68.194.2xx http://www.asaha.com/ -id_a_f_71 Asahina-Antenna/1.x ASAHINA Antenna information detecting agent R http://masshy.fastwave.gr.jp/hina/release/ -id_a_f_72 Asahina-Antenna/1.x (libhina.pl/x.x ; libtime.pl/x.x) ASAHINA Antenna information detecting agent R http://masshy.fastwave.gr.jp/hina/release/ -id_a_f_73 ask.24x.info Ask 24x Info robot R http://ask.24x.info/ -id_a_f_74 AskAboutOil/0.06-rcp (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@askaboutoil.com) Ask About Oil - Petroleum related search (24.227.212.xxx) using Nutch R http://askaboutoil.com/search.jsp http://www.nutch.org -id_a_f_120806_1 asked/Nutch-0.8 (web crawler; http://asked.jp; epicurus at gmail dot com) askEd! / Inferret search (Japan) robot using Nutch R 131.112.125.1xx http://asked.jp/ -id_a_f_75 ASPSeek/1.2.5 ASPSeek search engine software -Yahoo-Inc. / Telecom Canada robot R http://www.aspseek.org -id_a_f_76 ASPseek/1.2.9d Swsoft.net robot using Aspseek R http://www.aspseek.com -id_a_f_77 ASPSeek/1.2.x ASPSeek search engine software R http://www.aspseek.org -id_a_f_78 ASPSeek/1.2.xa ASPSeek search engine software R http://www.aspseek.org -id_a_f_79 ASPseek/1.2.xx ASPSeek search engine software R http://www.aspseek.org -id_a_f_80 ASPSeek/1.2.xxpre ASPSeek search engine software R http://www.aspseek.org -id_a_f_81 ASSORT/0.10 Associative Sort robot R site is down http://pcmath126.unice.fr/assort-robot.html -id_a_f_82 asterias/2.0 Singingfish media spider (64.12.186.2xx) via AOL search R s. also Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler ... http://search.singingfish.com/sfw/home.jsp -id_a_f_83 AtlocalBot/1.1 +(http://www.atlocal.com/local-web-site-owner.html) Atlocal local business search robot R http://www.atlocal.com/ -id_a_f_041207_2 Atomic_Email_Hunter/4.0 Atomic Email Hunter email extracing and harvesting S -id_a_f_84 Atomz/1.0 Atomz robot R http://www.atomz.com -id_a_f_85 atSpider/1.0 atSpider (ceased) email harvester / spambot S -id_a_f_060707_1 Attentio/Nutch-0.9-dev (Attentio's beta blog crawler; www.attentio.com; info@attentio.com) Attentio social media monitoring and analysing R 85.88.35.xx http://www.attentio.com/ -id_a_f_231105_2 AU-MIC/2.0 MMP/2.0 Samsung SPH-A660 phone with Sprint software B http://www1.sprintpcs.com/explore/showcase/Showcase.jsp?scTopic=pcsVision -id_a_f_240208_1 AUDIOVOX-SMT5600 Audiovox SMT5600 (AT&T) Smartphone mobile phone browser B http://www.audiovox.com/ http://www.audiovox.com/manuals/owners/SMT%205600%20QSG%209-7%20FINAL.pdf -id_a_f_86 augurfind Augurnet Swiss (was www.augurnet.ch) search robot R -id_a_f_87 augurnfind V-1.x Augurnet Swiss (was www.augurnet.ch) search robot R -id_a_f_88 autoemailspider Auto Email Pro Email harvester S was http://autoemailspider.com - site is dead -id_a_f_89 autohttp Linkscan tool from Elsop C s. Linkscan/x ? http://www.elsop.com/linkscan/ -id_a_f_050208_1 autowebdir 1.1 (www.autowebdir.com) Autowebdir - The Automatically Generated Web Directory R 84.104.43.x http://www.autowebdir.com/ -id_a_f_90 AV Fetch 1.0 Altavista robot ?? R http://www.altavista.com/ -id_a_f_91 Avant Browser (http://www.avantbrowser.com) Avant Browser - IE based browser B http://www.avantbrowser.com -id_a_f_92 AVSearch-1.0(peter.turney@nrc.ca) National Research Council Canada robot R http://www.nrc-cnrc.gc.ca/main_e.html -id_a_f_93 AVSearch-2.0-fusionIdx-14-CompetitorWebSites Unknown robot from 205.203.108.xx (telerate.com) -id_a_f_94 AVSearch-3.0(AltaVista/AVC) Altavista robot R http://www.altavista.com/ -id_a_f_95 AWeb AWeb Amiga browser B http://aweb.sunsite.dk/ -id_a_f_96 axadine/ (Axadine Crawler; http://www.axada.de/; ) Axada search Germany robot R http://www.axada.de -id_a_f_97 AxmoRobot - Crawling your site for better indexing on www.axmo.com search engine. Axmo search robot R http://www.axmo.com -id_a_f_250306_1 Azureus 2.x.x.x Azureus Java BitTorrent Client D http://azureus.sourceforge.net/ -id_a_f_131208_1 BabalooSpider/1.3 (BabalooSpider; http://www.babaloo.si; spider@babaloo.si) Babaloo search robot (Slovenia) R 84.255.237.2xx http://www.babaloo.si/ -id_a_f_98 BaboomBot/1.x.x (+http://www.baboom.us) BaBoom Web Portal (ODP) robot (66.98.254.xx) R http://www.baboom.us -id_a_f_050406_1 BackStreet Browser 3.x BackStreet Browser - Offline browser / website downloader D http://www.spadixbd.com/backstreet/ -id_a_f_140508_1 BaiduImagespider+(+http://www.baidu.jp/search/s308.html) Baidu search (Japan) image crawler R 119.63.193.94.[x]xx http://www.baidu.jp/ -id_a_f_99 BaiDuSpider Baidu spidering engine - used by diff. IPs R http://www.baidu.com -id_a_f_080608_1 Baiduspider+(+http://help.baidu.jp/system/05.html) Baidu spidering engine - used by diff. IPs R http://www.baidu.com -id_a_f_100 Baiduspider+(+http://www.baidu.com/search/spider.htm) Baidu spidering engine - used by diff. IPs R http://www.baidu.com -id_a_f_080407_1 Baiduspider+(+http://www.baidu.com/search/spider_jp.html) Baidu search (Japan) crawler R 119.63.193.[x]xx http://www.baidu.jp -id_a_f_031107_1 Balihoo/Nutch-1.0-dev (Crawler for Balihoo.com search engine - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com) Balihoo - Vertical search engine crawler (beta) R http://www.balihoo.com/ http://www.balihoo.com/pdfs/BalihooFactSheet.pdf -id_a_f_101 BanBots/1.2 (spider@banbots.com) Project BanBots Perl script robot C s. also Mozilla/5.0 (compatible; BanBots/2.0b.. http://www.banbots.com/ -id_a_f_140506_3 Barca/2.0.xxxx Barca Pro email & PIM software B http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54 -id_a_f_120206_2 BarcaPro/1.4.xxxx Barca Pro email & PIM software B http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54 -id_a_f_102 BarraHomeCrawler (albertof@barrahome.org) Barrahome crawler R 64.246.56.xx http://www.barrahome.org -id_a_f_011006_1 bCentral Billing Post-Process Unknown user agent from Microsoft 204.71.191.1xx -id_a_f_103 bdcindexer_2.6.2 (research@bdc) Business.com robot R 208.144.233.xxx http://www.business.com -id_a_f_104 BDFetch Brandimensions Brand Protection robot R http://www.brandimensions.com/ -id_a_f_105 BDNcentral Crawler v2.3 [en] (http://www.bdncentral.com/robot.html) (X11; I; Linux 2.0.44 i686) Bdncentral Sitesearch robot R http://www.bdncentral.com -id_a_f_111205_3 BeamMachine/0.5 (dead link remover of www.beammachine.net) beammachine web directory (Germany) link checking R C http://www.beammachine.net/de/ -id_a_f_106 beautybot/1.0 (+http://www.uchoose.de/crawler/beautybot/) Beauty robot for Cosmoty - German beauty and wellness search R http://www.cosmoty.de http://www.uchoose.de/Projekte/Lifestyle/beauty/ -id_a_f_230406_1 BebopBot/2.5.1 ( crawler http://www.apassion4jazz.net/bebopbot.html ) A Passion for Jazz music related search robot R 68.6.204.2xx http://www.apassion4jazz.net/ -id_a_f_107 BeebwareDirectory/v0.01 LinkcheckerBeepware (site is down) web directory link checking C http://directory.beebware.co.uk -id_a_f_108 Big Brother (http://pauillac.inria.fr/~fpottier/) Big Brother link checking tool C http://pauillac.inria.fr -id_a_f_130606_1 Big Fish v1.0 GoonGee.com link popularity checking C 216.89.111.x http://www.goongee.com/big-fish/ -id_a_f_109 BigBrother/1.6e BB4 network monitoring C http://www.bb4.com -id_a_f_110 BigCliqueBOT/1.03-dev (bigclicbot; http://www.bigclique.com; bot@bigclique.com) BigClique Search robot R http://www.bigclique.com -id_a_f_080206_4 BIGLOTRON (Beta 2;GNU/Linux) Biglotron search (France) robot R http://www.biglotron.com/ -id_a_f_171106_2 Bigsearch.ca/Nutch-x.x-dev (Bigsearch.ca Internet Spider; http://www.bigsearch.ca/; info@enhancededge.com) Bigsearch.ca search robot R 72.0.207.1xx http://www.bigsearch.ca/ -id_a_f_111 Bilbo/2.3b-UNIX Bilbo - web frontend for the Nessus Security Scanner C http://home.broadpark.no/%7Etnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html -id_a_f_170806_1 BilgiBetaBot/0.8-dev (bilgi.com (Beta) ; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) Bilgi.com (Beta) search robot - Turkey R 212.156.230.2xx http://www.bilgi.com/ -id_a_f_080607_1 BilgiBot/1.0(beta) (http://www.bilgi.com/; bilgi at bilgi dot com) Bilgi.com (Beta) search robot - Turkey R 212.156.230.2xx http://www.bilgi.com/ -id_a_f_112 billbot wjj@cs.cmu.edu Carnegie Mellon School robot/link checking ? C http://www.cs.cmu.edu -id_a_f_050206_3 Bitacle bot/1.1 Bitacle Blog Search Archive robot R http://bitacle.org/ -id_a_f_050206_2 Bitacle Robot (V:1.0;) (http://www.bitacle.com) Bitacle Blog Search Archive robot R http://bitacle.org/ -id_a_f_113 Biyubi/x.x (Sistema Fenix; G11; Familia Toledo; es-mx) Biyubi Navigator - Mexican browser for Fenix OS B http://www.biyubi.com -id_a_f_114 BlackBerry7520/4.0.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/5.0.3.3 UP.Link/5.1.2.12 (Google WAP Proxy/1.0) Blackberry Wireless Internet browser via Google WAP Proxy B P http://www.blackberry.com/products/service/web.shtml http://www.openwave.com -id_a_f_115 BlackWidow FS Consulting (was www.fsconsult.net) Black Widow web crawler R -id_a_f_010306_1 BlackWidow BlackWidow web site scanner / downloading tool D http://www.softbytelabs.com/BlackWidow -id_a_f_116 Blaiz-Bee/1.0 (+http://www.blaiz.net) Blaiz Enterprises RawGrunt search R 203.87.123.1xx http://www.rawgrunt.com/ http://www.blaiz.net -id_a_f_160307_1 Blaiz-Bee/2.00.8222 (BE Internet Search Engine http://www.rawgrunt.com) Blaiz Enterprises RawGrunt search R 203.87.123.1xx http://www.rawgrunt.com/ http://www.blaiz.net -id_a_f_240706_1 Blaiz-Bee/2.00.xxxx (+http://www.blaiz.net) Blaiz Enterprises RawGrunt search R 203.87.123.1xx http://www.rawgrunt.com/ http://www.blaiz.net -id_a_f_117 BlitzBOT@tricus.net Blitzsuche Germany robot R http://blitzsuche.rp-online.de/ -id_a_f_118 BlitzBOT@tricus.net (Mozilla compatible) Blitzsuche Germany robot R http://blitzsuche.rp-online.de/ -id_a_f_090307_1 BlockNote.Net BlockNote web page editor B http://blocknote.net/ -id_a_f_119 BlogBot/1.x blogdex robot from MIT.edu R http://blogdex.media.mit.edu/ -id_a_f_071206_1 BlogBridge 2.13 (http://www.blogbridge.com/) BlogBridge RSS reader B http://www.blogbridge.com/ -id_a_f_120 Bloglines Title Fetch/1.0 (http://www.bloglines.com) Bloglines article search R 65.214.44.xx http://www.bloglines.com -id_a_f_250907_1 Bloglines-Images/0.1 (http://www.bloglines.com) Bloglines graphics crawler R 65.214.44.xx http://www.bloglines.com -id_a_f_011108_2 Bloglines/3.1 (http://www.bloglines.com) Bloglines news crawler R 65.214.44.xx http://www.bloglines.com -id_a_f_071206_2 BlogMap (http://www.feedmap.net) FeedMap / BlogMap geo coding service C http://www.feedmap.net/BlogMap/ -id_a_f_121 Blogpulse (info@blogpulse.com) Intelliseek's BlogPulse blog search R 64.158.138.xx http://www.blogpulse.com -id_a_f_050208_2 BlogPulseLive (support@blogpulse.com) Intelliseek's BlogPulse blog search R 64.158.138.xx http://www.blogpulse.com -id_a_f_161206_2 BlogSearch/1.x +http://www.icerocket.com/ IceRocket Web search robot R s. also BlogzIce ... http://www.icerocket.com -id_a_f_020707_1 blogsearchbot-pumpkin-3 Art of Computing blog search project R 88.198.44.2xx http://artofcomputing.net/blog/?p=4 -id_a_f_241205_1 BlogsNowBot, V 2.01 (+http://www.blogsnow.com/) BlogsNow realtime link tracker robot R http://www.blogsnow.com/ -id_a_f_261107_1 BlogVibeBot-v1.1 (spider@blogvibe.nl) BlogVipe news and Blog crawler (Netherlands) R 212.61.21.xx http://www.blogvibe.nl -id_a_f_122 blogWatcher_Spider/0.1 (http://www.lr.pi.titech.ac.jp/blogWatcher/) blogWatcher robot from Okumura Group Tokyo (131.112.182.xxx) R http://www.lr.pi.titech.ac.jp -id_a_f_123 BlogzIce/1.0 (+http://icerocket.com; rhodes@icerocket.com) IceRocket Web search robot R s. also BlogSearch ... http://www.icerocket.com -id_a_f_124 BlogzIce/1.0 +http://www.icerocket.com/ IceRocket Web search robot R s. also BlogSearch ... http://www.icerocket.com -id_a_f_310108_1 BloobyBot Blooby search (beta) robot R 206.166.206.18x http://www.blooby.com/ -id_a_f_270507_1 Bloodhound/Nutch-0.9 (Testing Crawler for Research - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com) Balihoo - Search Engine for Advertising Media R 204.228.230.xx http://balihoo.com/ -id_a_f_125 bluefish 0.6 HTML editor Bluefish HTML-editor for Linux B http://bluefish.openoffice.nl/ -id_a_f_126 BMCLIENT Part of ButtMan remote access tool seems to be a Trojan - see link http://www.glocksoft.com/trojan_list/ButtMan.htm -id_a_f_120506_1 BMLAUNCHER Bookmark Express bookmark manager C Website is dead - was: http://www.bookmarkexpress.com/ -id_a_f_127 Bobby/4.0.x RPT-HTTPClient/0.3-3E Bobby web accessibility desktop testing tool C http://bobby.watchfire.com/bobby/html/en/index.jsp -id_a_f_128 boitho.com-dc/0.xx (http://www.boitho.com/dcbot.html) Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx R http://www.boitho.com -id_a_f_129 boitho.com-robot/1.x Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx R http://www.boitho.com -id_a_f_130 boitho.com-robot/1.x (http://www.boitho.com/bot.html) Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx R http://www.boitho.com -id_a_f_060806_1 Bookdog/x.x Bookdog - Mac bookmark manager C http://www.sheepsystems.com/bookdog/ -id_a_f_131 Bookmark Buddy bookmark checker (http://www.bookmarkbuddy.net/) Bookmark Buddy - favorite bookmark manager C http://www.bookmarkbuddy.net -id_a_f_132 Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/] Favourites managing program C http://www.bookmark.ne.jp -id_a_f_230807_1 Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/] (Version 2.0beta) Favourites managing program C http://www.bookmark.ne.jp -id_a_f_300408_1 BookmarkBase(2/;http://bookmarkbase.com) Bookmark Base bookmark manager C http://www.bookmarkbase.com/ -id_a_f_133 Bot mailto:craftbot@yahoo.com cybercity.fr user robot / faked user agent ? -id_a_f_160308_1 BPImageWalker/2.0 (www.bdbrandprotect.com) BD-Brandprotect copyright infringement crawler R 72.14.164.1xx http://www.bdbrandprotect.com/ http://www.bdbrandprotect.com/solutions_5.html -id_a_f_134 BravoBrian bstop.bravobrian.it BravoBrian bSTOP parental control P R s. also BStop http://bstop.bravobrian.it/ -id_a_f_135 BravoBrian SpiderEngine MarcoPolo Robot for BravoBrian bSTOP R s. also BStop http://bstop.bravobrian.it/ -id_a_f_220508_1 BrightCrawler (http://www.brightcloud.com/brightcrawler.asp) BrightCloud web filtering for classifying websites P R http://www.brightcloud.com/brightcrawler.asp -id_a_f_136 BruinBot (+http://webarchive.cs.ucla.edu/bruinbot.html) Webarchive Project Bruinbot crawler R http://webarchive.cs.ucla.edu -id_a_f_137 BSDSeek/1.0 Inktomi (Hotbot-Lycos NBCi) robot R http://www.inktomi.com/ -id_a_f_138 BStop.BravoBrian.it Agent Detector BravoBrian bSTOP parental control P R s. also BravoBrian .. http://bstop.bravobrian.it/ -id_a_f_139 BTbot/0.x (+http://www.btbot.com/btbot.html) BitTorrent Search Engine btbot robot R http://www.btbot.com -id_a_f_300408_2 BTWebClient/180B(9704) µTorrent BitTorrent Client D http://www.utorrent.com/ -id_a_f_080407_2 BuildCMS crawler (http://www.buildcms.com/crawler) BuildCMS crawler - market monitoring project of BuildCMS R 194.24.253.xx http://www.buildcms.com/index.php http://www.buildcms.com/about_us/crawler -id_a_f_051206_4 Bulkfeeds/r1752 (http://bulkfeeds.net/) Bulkfeeds: RSS directory link checking C 202.181.96.2xx http://bulkfeeds.net/ -id_a_f_140 BullsEye BullsEye/Intelliseek robot R http://www.intelliseek.com/be/bullseye.htm -id_a_f_141 bumblebee@relevare.com Relevare Portal software robot R http://www.relevare.com -id_a_f_142 BunnySlippers Microsoft server information robot (see link) C http://www.webmasterworld.com/forum11/841.htm -id_a_f_070606_1 BurstFindCrawler/1.1 (crawler.burstfind.com; http://crawler.burstfind.com; crawler@burstfind.com) BurstFind search crawler (64.34.172.xx) R http://www.burstfind.com/ -id_a_f_143 Buscaplus Robi/1.0 (http://www.buscaplus.com/robi/) Buscaplus (Spain) robot R http://www.buscaplus.com -id_a_f_050807_2 BW-C-2.0 Logitech Desktop Managers (LDM) Backweb (BW) update check D http://www.logitech.com/index.cfm/494/3041&cl=de,de -id_a_f_140508_2 bwh3_user_agent Basic Web Hacking 3 fake user-agent from Hellbound Hackers challenges S http://www.hellboundhackers.org/forum/_basic_web_hacking_3-7-6960_0.html http://vuau.wordpress.com/2008/03/12/hbh-basic-web-3-switch-user-agent/ -id_a_f_140508_3 Cabot/Nutch-0.9 (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com) Amfibi Search robot R 64.111.217.9x http://www.amfibi.com/ -id_a_f_280508_1 Cabot/Nutch-1.0-dev (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com) Amfibi Search robot R 64.111.217.9x http://www.amfibi.com/ -id_a_f_140506_4 CamelHttpStream/1.0 Evolution integrated mail solution Camel TCP stream class http://www.gnome.org/projects/evolution/ http://go-evolution.org/Camel.Stream -id_a_f_144 Cancer Information and Support International; Some user agent -id_a_f_110206_1 carleson/1.0 Cosmix project crawler (204.14.48.x / 38.113.234.xxx) R s. also - voyager/1.x - cfetch/1. http://www.cosmixcorp.com/ -id_a_f_145 Carnegie_Mellon_University_Research_WebBOT-->PLEASE READ-->http://www.andrew.cmu.edu/~brgordon/webbot/index.html http://www.andrew.cmu.edu/~brgordon/webbot/index.html Carnegie Mellon University WebBOT R http://www.andrew.cmu.edu -id_a_f_146 Carnegie_Mellon_University_WebCrawler http://www.andrew.cmu.edu/~brgordon/webbot/index.html Carnegie Mellon University WebBOT R http://www.andrew.cmu.edu -id_a_f_170206_1 Catall Spider Catall.de search & web directory (Germany) R http://www.catall.de/ -id_a_f_130807_3 CazoodleBot/CazoodleBot-0.1 (CazoodleBot Crawler; http://www.cazoodle.com/cazoodlebot; cazoodlebot@cazoodle.com) UIUCs Cazoodle search based on MetaQuerier R 72.36.94.1xx http://www.cazoodle.com/ http://metaquerier.cs.uiuc.edu/ -id_a_f_290308_1 CCBot/1.0 (+http://www.commoncrawl.org/bot.html) CommonCrawl Foundation search crawler R 38.103.63.1[6-8] http://www.commoncrawl.org/faq.htm -id_a_f_147 ccubee/x.x Empyreum Ccubee (Czech) search engine solution R http://empyreum.com/technologies/ccubee -id_a_f_010108_2 CDR/1.7.1 Simulator/0.7(+http://timewe.net) Profile/MIDP-1.0 Configuration/CLDC-1.0 Timewe mobile browser (WAP) simulator (Japan) B 61.142.xx.x[xx] http://timewe.net/ -id_a_f_291105_6 CE-Preload Cisco Content Engine P http://www.cisco.com/en/US/products/hw/contnetw/index.html -id_a_f_100408_4 CentiverseBot Nordic semantic search engine C 87.72.214.9x http://www.centiverse-project.net/post/Educating-the-bots.aspx -id_a_f_180408_2 CentiverseBot - investigator Nordic semantic search engine C 87.72.214.9x http://www.centiverse-project.net/post/Educating-the-bots.aspx -id_a_f_180408_3 CentiverseBot/3.0 (http://www.centiverse-project.net) Nordic semantic search engine C 87.72.214.9x http://www.centiverse-project.net/post/Educating-the-bots.aspx -id_a_f_148 Ceramic Tile Installation Guide (http://www.floorstransformed.com) Floortransformed.com robot (link ckecking ??) R http://www.floorstransformed.com -id_a_f_131208_2 CERN-LineMode/2.15 CERN Line Mode Browser B http://www.w3.org/LineMode/ -id_a_f_149 cfetch/1.0 Cosmix project crawler (204.14.48.x / 38.113.234.xxx) R s. also - voyager/1.x - carleson/1.x http://www.cosmixcorp.com -id_a_f_150 CFNetwork/x.x MaxOS X CoreFoundation CFNetwork API http://www.cocoadev.com/index.pl?CFNetwork -id_a_f_151 cg-eye interactive cg-eye CGI checker C http://www.htmlhelp.com -id_a_f_152 Charon/1.x (Amiga) Charon Amiga download manager D http://tesla.rcub.bg.ac.yu/%7Eantony/Charon/ -id_a_f_131208_3 Chat Catcher/1.0 Chat Catcher blog monitoring robot C 69.80.208.2xx http://chatcatcher.com/cc/ -id_a_f_153 Checkbot/1.xx LWP/5.xx Checkbot link validation C http://degraaff.org/checkbot/ -id_a_f_154 CheckLinks/1.x.x Checklinks - Perl link checker C http://www.jmarshall.com -id_a_f_155 CheckUrl NTL user agent http://www.ntl.com -id_a_f_156 CheckWeb CheckWeb link validation C http://p.duby.free.fr/chkweb.htm -id_a_f_030206_2 Chilkat/1.0.0 (+http://www.chilkatsoft.com/ChilkatHttpUA.asp) Chilkat HTTP component user-agent http://www.chilkatsoft.com/HttpDotNet.asp -id_a_f_230506_1 China Local Browse 2.6 Unknown spam bot from telekom.com.my (218.111.83.xxx) S see link: http://linuxreviews.org/webdesign/602_Apache_Webalizer/ -id_a_f_170408_2 Chitika ContentHit 1.0 Chitika Inc. Blog advertising C 67.15.219.[x]x http://chitika.com/ -id_a_f_157 ChristCRAWLER 2.0 Christcentral.com Christcrawler (was www.christcrawler.com) R - s. also Mozilla/4.0 (compatible; ChristCrawler..) -id_a_f_010607_2 CHttpClient by Open Text Corporation CHttpClient - C++ class using WinInet http://www.codeproject.com/library/lyoulhttpclient.asp -id_a_f_158 CipinetBot (http://www.cipinet.com/bot.html) CipinetBot -Cipinet Search Engine Web Crawler R http://www.cipinet.com -id_a_f_130108_1 Cityreview Robot (+http://www.cityreview.org/crawler/) Cityreview regional search (Germany) link checking C 88.198.212.5x http://www.cityreview.de/ http://www.cityreview.org/crawler/ -id_a_f_159 CJ Spider/ Commision Junction link checking spider C http://www.cj.com/ -id_a_f_050606_1 CJB.NET Proxy CJB Net anonymous socks proxy service (216.194.70.x) P http://proxy.cjb.net/ -id_a_f_160 ClariaBot/1.0 Claria (ex Gator) SearchScout robot (64.152.73.xx) R s. also Diamond http://www.searchscout.com -id_a_f_161 Claymont.com Claymont Search robot R http://www.claymont.com -id_a_f_100307_1 CloakDetect/0.9 (+http://fulltext.seznam.cz/) Seznam Search (Czech Republic) robot R 212.80.76.xx http://www.seznam.cz/ -id_a_f_162 Clushbot/2.x (+http://www.clush.com/bot.html) Clush clustered search robot R http://www.clush.com -id_a_f_163 Clushbot/3.x-BinaryFury (+http://www.clush.com/bot.html) Clush clustered search robot R http://www.clush.com -id_a_f_164 Clushbot/3.xx-Ajax (+http://www.clush.com/bot.html) Clush clustered search robot R http://www.clush.com -id_a_f_165 Clushbot/3.xx-Hector (+http://www.clush.com/bot.html) Clush clustered search robot R http://www.clush.com -id_a_f_166 Clushbot/3.xx-Peleus (+http://www.clush.com/bot.html) Clush clustered search robot R http://www.clush.com -id_a_f_070506_1 COAST WebMaster Pro/4.x.x.xx (Windows NT) COAST Webmaster - Web management and maintenance software C http://www.extablish.com/cwm.htm -id_a_f_150306_1 CoBITSProbe Proposed Content-Based Image Tracking System (CoBITS) P2P crawler R C http://www.iis.sinica.edu.tw/~hungchi/CBIT/ -id_a_f_167 Cocoal.icio.us/1.0 (v36) (Mac OS X; http://www.scifihifi.com/cocoalicious) Cocoa del.icio.us (social bookmarks manager) client for Mac OS X C http://www.scifihifi.com -id_a_f_070209_2 Cogentbot/1.X (+http://www.cogentsoftwaresolutions.com/bot.html) Cogent Search Bot from Cogent Software Solutions for unknown purposes R 72.81.252.9x http://www.cogentsoftwaresolutions.com/bot.html -id_a_f_168 ColdFusion Cold Fusion server used by various IPs i.e.: - NetWORLD web catalogue link checking P C http://www.networld.com http://www.macromedia.com/software/coldfusion/ -id_a_f_169 ColdFusion (BookmarkTracker.com) Cold Fusion server used by Bookmark Tracker - online favourites managment C http://www.bookmarktracker.com http://www.macromedia.com/software/coldfusion/ -id_a_f_170 collage.cgi/1.xx WebCollage Syndicator graphics crawler/collector R D http://www.webcollage.com -id_a_f_171 combine/0.0 Combine harvesting & indexing robot R 130.235.4.xx http://combine.it.lth.se/ -id_a_f_080406_1 Combine/2.0 http://combine.it.lth.se/ Combine harvesting & indexing robot R 130.235.4.xx http://combine.it.lth.se/ -id_a_f_160807_1 Combine/3 http://combine.it.lth.se/ Combine harvesting & indexing robot R 130.235.4.xx http://combine.it.lth.se/ -id_a_f_172 Combine/x.0 Combine harvesting & indexing robot R 130.235.4.xx http://combine.it.lth.se/ -id_a_f_280606_3 cometrics-bot, http://www.cometrics.de cometrics Web Content Mining solution - Germany R http://www.cometrics.de/ -id_a_f_173 Commerce Browser Center Wildsoft Germany (closed) Internet client system user-agent (was www.oskarweb.de) B -id_a_f_240107_1 complex_network_group/Nutch-0.9-dev (discovering the structure of the world-wide-web; http://cantor.ee.ucla.edu/~networks/crawl; nimakhaj@gmail.com) UCLA Complex Networks Groups Complex Network Analysis C 216.182.233.1xx http://cantor.ee.ucla.edu/~networks/ -id_a_f_174 Computer_and_Automation_Research_Institute_Crawler crawler@ilab.sztaki.hu Hungarian Academy of Sciences data mining search R http://www.ilab.sztaki.hu/websearch/ -id_a_f_010406_2 Comrite/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) ComRite Chinese Search Engine for Oversea Web Sites (69.248.26.xx) R powered by Nutch http://www.comrite.com/ http://meidong.comrite.com/ -id_a_f_175 Contact unknown -id_a_f_200307_1 ContactBot/0.2 Probably E-Mail harvesting robot - same as LMQueueBot S 64.124.152.xx -id_a_f_291105_7 ContentSmartz ContentSmartz e-mail harvesting tools S -id_a_f_176 contype Internet Explorer versions 4.x and 5 plugin content B NOT Contype mime type managment Perl script http://support.microsoft.com/default.aspx?scid=kb;en-us;293792 -id_a_f_177 Convera Internet Spider V6.x Converas RetrievalWare Internet Spider (63.241.61.x) R s. also - infoConveraCrawler... - CrawlConvera ... http://www.convera.com -id_a_f_178 ConveraCrawler/0.2 Converas RetrievalWare Internet Spider (63.241.61.x) R s. also - infoConveraCrawler... - CrawlConvera ... http://www.convera.com -id_a_f_051205_1 ConveraCrawler/0.9d (+http://www.authoritativeweb.com/crawl) Converas RetrievalWare Internet Spider (63.241.61.x) R s. also - infoConveraCrawler... - CrawlConvera ... http://www.convera.com/ -id_a_f_179 ConveraMultiMediaCrawler/0.1 (+http://www.authoritativeweb.com/crawl) Converas RetrievalWare Internet Spider (63.241.61.x) R s. also - infoConveraCrawler... - CrawlConvera ... http://www.convera.com -id_a_f_180 CoolBot Suchmaschine21 (Germany) robot R http://www.suchmaschine21.de/ -id_a_f_030110_2 Cooliris/1.5 CFNetwork/459 Darwin/10.0.0d3 Cooliris photo and video browser B http://www.cooliris.com/ -id_a_f_040406_1 CoralWebPrx/0.1.1x (See http://coralcdn.org/) Coral Content Distribution Network P C http://coralcdn.org/ -id_a_f_181 cosmos/0.8_(robot@xyleme.com) Xyleme SA France robot R http://www.xyleme.com/en/index.jsp -id_a_f_182 cosmos/0.9_(robot@xyleme.com) Xyleme SA France robot R http://www.xyleme.com/en/index.jsp -id_a_f_040607_1 CoteoNutchCrawler/Nutch-0.9 (info [at] coteo [dot] com) Coteo.com - local French directory link checking C http://www.coteo.com/ -id_a_f_030206_3 CougarSearch/0.x (+http://www.cougarsearch.com/faq.shtml) Cougarsearch.com robot R http://www.cougarsearch.com/ -id_a_f_280408_2 Covac TexAs Arachbot Covac Arachnid Web Crawler R s.also ArachBot http://www.covac-software.com/ -id_a_f_211208_1 CoverScout%203/3.0.1 CFNetwork/339.5 Darwin/9.5.0 (i386) (iMac5,1) CoverScout for iTunes - CD cover search tool B http://www.equinux.com/de/products/coverscout/index.html -id_a_f_183 Cowbot-0.1 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com) Naver Japan / Korea robot R s. also Python-urllib/1.15 - nabot - NaverBot & dloader http://www.naver.co.jp -id_a_f_184 Cowbot-0.1.x (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com) Naver Japan / Korea robot R s. also Python-urllib/1.15 - nabot - NaverBot & dloader http://www.naver.co.jp -id_a_f_185 CrawlConvera0.1 (CrawlConvera@yahoo.com) Converas RetrievalWare Internet Spider R s. also - Convera Internet Spider .. - infoConveraCrawler... http://www.convera.com -id_a_f_186 Crawler unknown robot via Level3.net -id_a_f_187 Crawler (cometsearch@cometsystems.com) Cometsystems Comet Search robot via Findwhat (now Miva) R http://www.cometsystems.com http://www.miva.com/ -id_a_f_188 Crawler admin@crawler.de Crawler.de / Abacho robot R http://www.crawler.de http://www.abacho.de/ -id_a_f_189 Crawler V 0.2.x admin@crawler.de Crawler.de / Abacho robot R http://www.crawler.de http://www.abacho.de/ -id_a_f_190 crawler@alexa.com Alexa crawler R http://www.alexa.com -id_a_f_191 CrawlerBoy Pinpoint.com Pinpoint WAP search robot R http://www.pinpoint.com -id_a_f_130506_1 Crawllybot/0.1 (Crawllybot; +http://www.crawlly.com; crawler@crawlly.com) Crawlly Beta search - Germany (72.232.194.2xx) R powered by Nutch http://www.crawlly.com/ -id_a_f_192 CreativeCommons/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net) Creatice Commons using Nutch open source robot R http://www.nutch.org -id_a_f_030110_3 Cricket-A100/1.0 UP.Browser/6.3.0.7 (GUI) MMP/2.0 Cricket A100 cell phone browser B http://www.mycricket.com/cell-phones/details/Cricket-A100 -id_a_f_193 CrocCrawler vx.3 [en] (http://www.croccrawler.com) (X11; I; Linux 2.0.44 i686) Croccrawler robot R http://www.croccrawler.com -id_a_f_090306_2 csci_b659/0.13 Web mining project from CSCI 659 (computer science course) at Indiana Univerity R http://informatics.indiana.edu/fil/Class/b659/ -id_a_f_180906_1 CSE HTML Validator Professional (http://www.htmlvalidator.com/) CSE HTML Validator for Windows C http://www.htmlvalidator.com/ -id_a_f_194 Cuam Ver0.050bx Cuam - IE based browser B site is dead http://cuam.virtualave.net -id_a_f_195 Cuasarbot/0.9b http://www.cuasar.com/spider_beta/ Cuasar (Spain) music / ringtone search spider R http://www.cuasar.com -id_a_f_196 curl/7.10.x (i386-redhat-linux-gnu) libcurl/7.10.x OpenSSL/0.9.7a ipv6 zlib/1.1.4 Curl file transferring tool D http://curl.haxx.se/ -id_a_f_197 curl/7.7.x (i386--freebsd4.3) libcurl 7.7.x (SSL 0.9.6) (ipv6 enabled) Curl file transferring tool D http://curl.haxx.se/ -id_a_f_198 curl/7.8 (i686-pc-linux-gnu) libcurl 7.8 (OpenSSL 0.9.6) Curl file transferring tool D http://curl.haxx.se/ -id_a_f_199 curl/7.9.x (win32) libcurl 7.9.x Curl file transferring tool D http://curl.haxx.se/ -id_a_f_200 CurryGuide SiteScan 1.1 CurryGuide UK link check robot R http://uk.curryguide.com/ -id_a_f_201 Custo x.x (www.netwu.com) Custo web site spidering tool (link checking) C s. also - - Mozilla/5.0 (compatible; Custo 3... http://www.netwu.com -id_a_f_202 Custom Spider www.bisnisseek.com /1.0 Bisnisseek (was www.bisnisseek.com) robot R -id_a_f_203 Cyberdog/2.0 (Macintosh; 68k) Cyberdog Mac Browser (was www.cyberdog.org) B -id_a_f_260608_2 CyberPatrol SiteCat Webbot (http://www.cyberpatrol.com/cyberpatrolcrawler.asp) CyberPatrol LLC robot for web filtering software R 38.103.17.16x http://www.cyberpatrol.com/cyberpatrolcrawler.asp -id_a_f_204 CyberSpyder Link Test/2.1.12 (admin@mspennyworth.com) CyberSpyder Link Test software C http://www.cyberspyder.com/cslnkts1.html -id_a_f_205 CydralSpider/1.x (Cydral Web Image Search; http://www.cydral.com) Cydral image & site search spider R http://www.cydral.com -id_a_f_060508_1 CydralSpider/3.0 (Cydral Image Search; http://www.cydral.com) Cydral image & site search spider R http://www.cydral.com -id_a_f_206 DA 3.5 (www.lidan.com) Downloadaccelerator download manager D http://www.downloadaccelerator.com -id_a_f_207 DA 4.0 Downloadaccelerator download manager D http://www.downloadaccelerator.com -id_a_f_208 DA 4.0 (www.downloadaccelerator.com) Downloadaccelerator download manager D http://www.downloadaccelerator.com -id_a_f_209 DA 5.0 Downloadaccelerator download manager D http://www.downloadaccelerator.com -id_a_f_210 DA 7.0 Downloadaccelerator download manager D http://www.downloadaccelerator.com -id_a_f_070209_3 DAP x.x Download Accelerator Plus download manager D http://www.speedbit.com/ -id_a_f_211 Dart Communications PowerTCP PowerTCP ActiveX control tool http://www.dart.com -id_a_f_212 DataCha0s/2.0 Unknown bot from Kornet Korea (218.149.129.xxx) scans for Perl Awstats S -id_a_f_101106_1 DataCha0s/2.0 Unknown UA looking for Awstats Perl components S from various IPs -id_a_f_213 DataFountains/DMOZ Downloader INFOMINE/iVia Scholary Internet Resource Collections robot R 138.23.85.xx http://infomine.ucr.edu/ http://ivia.ucr.edu/useragents.shtml -id_a_f_040307_1 DataFountains/Dmoz Downloader (http://ivia.ucr.edu/useragents.shtml) INFOMINE/iVia Scholary Internet Resource Collections robot R 138.23.85.xx http://infomine.ucr.edu/ http://ivia.ucr.edu/useragents.shtml -id_a_f_110307_1 DataFountains/DMOZ Feature Vector Corpus Creator (http://ivia.ucr.edu/useragents.shtml) INFOMINE/iVia Scholary Internet Resource Collections robot R 138.23.85.xx http://infomine.ucr.edu/ http://ivia.ucr.edu/useragents.shtml -id_a_f_050907_1 DataparkSearch/4.47 (+http://dataparksearch.org/bot) DataparkSearch open source search engine R http://www.dataparksearch.org -id_a_f_214 DataparkSearch/4.xx (http://www.dataparksearch.org/) DataparkSearch open source search engine R http://www.dataparksearch.org -id_a_f_080206_1 DataSpear/1.0 (Spider; http://www.dataspear.com/spider.html; spider@dataspear.com) DataSpear Directory robot (24.109.29.xx) R http://www.dataspear.com/ -id_a_f_215 DataSpearSpiderBot/0.2 (DataSpear Spider Bot; http://dssb.dataspear.com/bot.html; dssb@dataspear.com) DataSpear Directory robot (24.109.29.xx) R http://www.dataspear.com/ -id_a_f_161105_1 DatenBot( http://www.sicher-durchs-netz.de/bot.html) Sicher-durchs-Netz German security related search (62.75.220.xxx) R http://www.sicher-durchs-netz.de/suche -id_a_f_216 DaviesBot/1.7 (www.wholeweb.net) Wholeweb robot R site is closed http://www.wholeweb.net -id_a_f_217 daypopbot/0.x Daypop blog - weblog - online mag search spider R http://www.daypop.com/info/about.htm -id_a_f_218 dbDig(http://www.prairielandconsulting.com) dbDig search engine R http://www.prairielandconsulting.com -id_a_f_219 DBrowse 1.4b Some site scanning tool via diff. IPs i.e.: - wanweb.net (208.6.163.xxx) - cox.net (68.4.xxx.xxx) S UA sometimes - DSurf15a 01 - DBrowse 1.4d -id_a_f_220 DBrowse 1.4d Some site scanning tool via diff. IPs i.e.: - pacbell.net (67.112.xxx.xxx) S see also DSurf15a 01 - DBrowse 1.4b -id_a_f_221 DC-Sakura/x.xx DC-Sakura download manager D http://www.dc-sakura.com/ -id_a_f_222 dCSbot/1.1 unknown divine/Openmarket.com robot R http://www.openmarket.com/ -id_a_f_223 DDD some (website) downloading tool D -id_a_f_224 dds explorer v1.0 beta Unknown user agent -id_a_f_225 de.searchengine.comBot 1.2 (http://de.searchengine.com/spider) Searchengine.com (Germany) submission checking / robot (84.73.57.xx) R http://de.searchengine.com -id_a_f_226 DeadLinkCheck/0.4.0 libwww-perl/5.xx DLC Perl HTTP link checking C http://dlc.sourceforge.net/ -id_a_f_111206_3 Deep Link Calculator v1.0 Sootle Web Directory deep link checker C 216.89.111.x http://directory.sootle.com/deep-links/ -id_a_f_227 deepak-USC/ISI deepak-USC/ISI robot from USC/Information Science Institute R http://www.isi.edu/%7Eravichan/deepak-usc-isi.html http://www.isi.edu/ -id_a_f_228 DeepIndex Deepindex robot R http://www.deepindex.net/utilisateurs.php?referral=deepindex -id_a_f_229 DeepIndex ( http://www.zetbot.com ) Zetbot search Belgium (213.41.128.xx) using Deepindex robot R http://www.zetbot.com/ http://www.deepindex.net/utilisateurs.php?referral=deepindex -id_a_f_230 DeepIndex (www.en.deepindex.com) Deepindex robot R http://www.deepindex.net/utilisateurs.php?referral=deepindex -id_a_f_231 DeepIndexer.ca Deepindex robot (via Paragon.net Canada) R http://www.deepindex.net/utilisateurs.php?referral=deepindex -id_a_f_011006_2 del.icio.us-thumbnails/1.0 Mozilla/5.0 (compatible; Konqueror/3.4; FreeBSD) KHTML/3.4.2 (like Gecko) del.icio.us picture robot for thumbnail preview via Yahoo D 66.94.237.1xx http://del.icio.us/ -id_a_f_250106_1 DeleGate/9.0.5-fix1 DeleGate application level gateway / proxy server P http://www.delegate.org/delegate/ -id_a_f_232 Demo Bot DOT 16b Some site scanning tool from 217.34.59.xxx (btopenworld.com) S -id_a_f_233 Demo Bot Z 16b Some site scanning tool from 68.154.96.xx (bellsouth.net) S appears also as - MFC Foundation Class Library - Full Web Bot 0516B -id_a_f_234 Denmex websearch (http://search.denmex.com) Denmex Websearch robot/link checking R http://search.denmex.com -id_a_f_235 Der große BilderSauger 2.00u DataBecker Bilder Sauger (discontinued) web graphics downloader D http://www.databecker.de -id_a_f_230206_1 dev-spider2.searchpsider.com/1.3b Searchspider.com robot (72.245.225.xxx) R http://www.searchspider.com/ -id_a_f_236 DevComponents.com HtmlDocument Object DevComponents HTMLDocument Class Library for Visual Studio.net http://www.devcomponents.com -id_a_f_237 DiaGem/1.1 (http://www.skyrocket.gr.jp/diagem.html) DiaGem Japan web crawler R (site is offline) http://www.skyrocket.gr.jp -id_a_f_238 Diamond/x.0 Claria (ex Gator) SearchScout robot (64.152.73.xx) R s. also Claria http://www.searchscout.com -id_a_f_239 DiamondBot Claria (ex Gator) SearchScout robot (64.152.73.xx) R s. also Claria http://www.searchscout.com -id_a_f_240 Digger/1.0 JDK/1.3.0rc3 Diggit! robot R http://www.diggit.com -id_a_f_241 DigOut4U OpenPortal4U robot R http://www.arisem.com -id_a_f_242 DIIbot/1.2 Findsame.com (site is offline) / Digital-Integrity robot R http://www.digital-integrity.com/ -id_a_f_100206_1 Dillo/0.8.5-i18n-misc Dillo Web Browser B http://www.dillo.org/ -id_a_f_243 Dillo/0.x.x Dillo Web Browser B http://www.dillo.org/ -id_a_f_100109_1 disastrous/1.0.5 (running with Python 2.5.1; http://www.bortzmeyer.org/disastrous.html; archangel77@del.icio.us) disastrous - a del.icio.us link checker based on Python C http://www.bortzmeyer.org/disastrous.html -id_a_f_140306_1 DISCo Pump x.x DISCo Pump offline browser / website ripper D No active homepage http://www.arssoft.com/ http://www.filetransit.com/view.php?id=3870 -id_a_f_300907_1 disco/Nutch-0.9 (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com) Unkown robot from Discovery Engine Corp. R 208.96.54.xx http://www.discoveryengine.com/ -id_a_f_300907_2 disco/Nutch-1.0-dev (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com) Unkown robot from Discovery Engine Corp. R 208.96.54.xx http://www.discoveryengine.com/ -id_a_f_244 DittoSpyder Ditto picture search robot R http://www.ditto.com -id_a_f_245 dlman some download agent D Wildsoft Surfer -id_a_f_246 dloader(NaverRobot)/1.0 Naver Japan / Korea robot R s. also Python-urllib/1.15 - nabot - NaverBot & Cowbot http://www.naver.co.jp -id_a_f_100408_1 DNSRight.com WebBot Link Ckeck Tool. Report abuse to: dnsr@dnsright.com DNS Right - Online DNS tools C 203.161.71.17x http://www.dnsright.com/ -id_a_f_247 DoCoMo/1.0/Nxxxi/c10 NTT DoCoMo (Japan) robot R http://www.nttdocomo.co.jp/ -id_a_f_248 DoCoMo/1.0/Nxxxi/c10/TB NTT DoCoMo (Japan) robot R http://www.nttdocomo.co.jp/ -id_a_f_249 DoCoMo/1.0/P502i/c10 (Google CHTML Proxy/1.0) Google (216.239.39.x) proxy server P -id_a_f_250 DoCoMo/2.0 P900iV(c100;TB;W24H11) NTT DoCoMo (Japan) robot R http://www.nttdocomo.co.jp/ -id_a_f_141205_1 DoCoMo/2.0 SH901iS(c100;TB;W24H12),gzip(gfe) (via translate.google.com) NTT DoCoMo (Japan) proxy server (210.136.161.1xx) P http://www.nttdocomo.co.jp/ -id_a_f_081207_1 DoCoMo/2.0 SH902i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html) Yahoo Search Japan robot (203.216.197.xxx) R s. also Y!J-SRD/1.0 http://www.yahoo.co.jp/ -id_a_f_271006_3 DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html) Yahoo Search Japan robot (203.216.197.xxx) R s. also Y!J-SRD/1.0 http://www.yahoo.co.jp/ -id_a_f_251 DocZilla/1.0 (Windows; U; WinNT4.0; en-US; rv:1.0.0) Gecko/20020804 DocZilla - Mozilla-based SGML/XML/HTML- browser B http://www.doczilla.com -id_a_f_210607_1 dodgebot/experimental unknown robot from AGMLAB Information Technologies (Information retrieval system ?) R 212.174.130.1xx http://www.agmlab.com/agmlab_eng.html -id_a_f_180606_1 DonutP; Windows98SE Donut P - Japanese IE based browser B http://donutp.com/ -id_a_f_250907_2 Doubanbot/1.0 (bot@douban.com http://www.douban.com) Unknown robot from douban search (China) - maybe image crawling 59.151.41.xx http://www.douban.com/ -id_a_f_252 Download Demon/3.x.x.x Download Demon/Netzip download manager D http://www.netzip.com -id_a_f_191105_4 Download Druid 2.x Download Druid IE plugin download manager D http://www.xemico.com/druid/index.html -id_a_f_253 Download Express 1.0 Download Express download manager D http://www.metaproducts.com -id_a_f_254 Download Master Download Master download manager D http://www.westbyte.com/dm/index.phtml -id_a_f_191105_5 Download Ninja 3.0 Download Ninja download manager (Japan) D http://www.h-fd.org/mkro/mt/archives/2002/09/download_ninja_1.html -id_a_f_255 Download Wonder Download Wonder download manager D http://www.forty.com -id_a_f_256 Download-Tipp Linkcheck (http://download-tipp.de/) Download-Tipp Germany link checking R http://download-tipp.de/ -id_a_f_257 Download.exe(1.1) (+http://www.sql-und-xml.de/freeware-tools/) download.exe .NET based downloading tool D http://www.sql-und-xml.de/freeware-tools/ -id_a_f_300907_3 DownloadDirect.1.0 Download Direct download manager D http://senbit.com/ -id_a_f_258 Dr.Web (R) online scanner: http://online.drweb.com/ Dr.WEB online virus scanner http://online.drweb.com -id_a_f_259 Dragonfly File Reader Dragonfly CMS - Open Source content management system B http://www.cpgnuke.com -id_a_f_260 Drecombot/1.0 (http://career.drecom.jp/bot.html) Drecom Japan (210.233.67.xxx) - Blog search ?? R http://www.drecom.co.jp -id_a_f_3090906_1 Drupal (+http://drupal.org/) Drupal - open source content management platform C http://drupal.org/ -id_a_f_261 DSurf15a 01 Some site scanning tool via diff. IPs i.e.: - cox.net (68.5.xxx.xxx) - pacbell.net (64.16x.xxx.xxx) S DBrowse 1.4d -id_a_f_262 DSurf15a 71 Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx) S TRPMFHXE -id_a_f_263 DSurf15a 81 Some site scanning tool via diff. IPs i.e.: - verizon.net (4.47.xxx.xxx) S WFRIKXVNFL -id_a_f_264 DSurf15a VA Some site scanning tool via diff. IPs i.e.: - eastlink.ca (24.222.xxx.xxx) - cogeco.net (216.221.8x.xxx) S -id_a_f_020506_2 DTAAgent DTAAgent Java object for data collecting R D http://www.ibr.cs.tu-bs.de/courses/ss00/sep-vs/gruppe1/jdoc/DTA/agent/DTAAgent.html -id_a_f_265 dtSearchSpider dt Search Spider software R http://www.dtsearch.com/spider.html -id_a_f_266 Dual Proxy Fourelle Venturi proxy server P http://www.fourelle.com/news/articles/148457.htm -id_a_f_290308_2 DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html) Duck Duck Go search crawler R 72.94.249.34 http://duckduckgo.com/ http://duckduckgo.com/duckduckbot.html -id_a_f_267 Dumbot(version 0.1 beta - dumbfind.com) DumbFind.com robot R http://www.dumbfind.com -id_a_f_268 Dumbot(version 0.1 beta - http://www.dumbfind.com/dumbot.html) DumbFind.com robot R http://www.dumbfind.com -id_a_f_269 Dumbot(version 0.1 beta) DumbFind.com robot R http://www.dumbfind.com -id_a_f_270 e-sense 1.0 ea(www.vigiltech.com/esensedisclaim.html) Vigiltech e-Sense user research robot (website is offline) R -id_a_f_271 e-SocietyRobot(http://www.yama.info.waseda.ac.jp/~yamana/es/) e-Society Project (Japan) crawler (133.9.238.xx) R http://www.yama.info.waseda.ac.jp -id_a_f_280108_1 eApolloBot/2.0 (compatible; heritrix/2.0.0-SNAPSHOT-20071024.170148 +http://www.eapollo-opto.com) Global Opto's eApollo Flash based search engine - Taiwan R http://www.eapollo.com/eaSE.jsp?language=eng http://www.global-opto.com/ -id_a_f_272 EARTHCOM.info/1.x [www.earthcom.info] Earthcom (Czech Republic) search robot (194.108.39.xx) R s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ... http://www.earthcom.info -id_a_f_273 EARTHCOM.info/1.xbeta [www.earthcom.info] Earthcom (Czech Republic) search robot (194.108.39.xx) R s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ... http://www.earthcom.info -id_a_f_274 EasyDL/3.xx Keywen Encyclopedia Bot R http://keywen.com/Encyclopedia/Bot/ -id_a_f_275 EasyDL/3.xx http://keywen.com/Encyclopedia/Bot Keywen Encyclopedia Bot R http://keywen.com/Encyclopedia/Bot/ -id_a_f_276 EBrowse 1.4b Some site scanning tool via diff. IPs i.e.: - swbell.net (65.66.xxx.xxx) S -id_a_f_277 eCatch/3.0 eCatch (now Wysigot) offline browser B D http://www.ecatch.com -id_a_f_278 EchO!/2.0 Echo.fr robot R http://echo.fr/ -id_a_f_279 Educate Search VxB Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx) S s. also DSurf - 66.118.1xx.xxx (sagonet.com) - see also Full Web Bot - Industry Program 1.0.5 -id_a_f_280 egothor/3.0a (+http://www.xdefine.org/robot.html) Xdefine text search engine robot - based on Egothor open source crawler R http://www.xdefine.com/ http://www.egothor.org/ -id_a_f_281 EgotoBot/4.8 (+http://www.egoto.com/about.htm) Egoto Search robot R http://www.egoto.com -id_a_f_211105_1 ejupiter.com eJupiter searcg robot (206.191.49.xx) R http://search.ejupiter.com/ -id_a_f_282 EldoS TimelyWeb/3.x TimelyWeb web page monitoring tool C s. also TimelyWeb/... http://www.eldos.org/timelyweb/timelyweb.html -id_a_f_283 elfbot/1.0 (+http://www.uchoose.de/crawler/elfbot/) Elftales crawler for uChoose theme based search (Germany) R http://www.uchoose.de -id_a_f_300707_1 ELI/20070402:2.0 (DAUM RSS Robot, Daum Communications Corp.; +http://ws.daum.net/aboutkr.html) DAUMOA - RSS search robot of Daum R 211.115.109.1xx http://ws.daum.net/abouten.html -id_a_f_284 ELinks (0.x.x; Linux 2.4.20 i586; 132x60) ELinks text mode browser B http://elinks.or.cz/ -id_a_f_285 ELinks/0.x.x (textmode; NetBSD 1.6.2 sparc; 132x43) ELinks text mode browser B http://elinks.or.cz/ -id_a_f_286 EmailSiphon Sonic E-mail collector S http://www.americaint.com/superstore/elist.html -id_a_f_220508_2 EmailSpider EmailSpider E-mail harvesting software S http://www.emailspider.net/index.php?kat=11 -id_a_f_287 EmailWolf 1.00 Trellian EMailWolf E-mail collector S http://www.trellian.com -id_a_f_288 EmeraldShield.com WebBot EmeraldShield spam and web filtration services P R http://www.emeraldshield.com -id_a_f_289 EmeraldShield.com WebBot (http://www.emeraldshield.com/webbot.aspx) EmeraldShield spam and web filtration services P R http://www.emeraldshield.com -id_a_f_070606_2 EMPAS_ROBOT Empas search Korea robot (220.95.22x.xxx) R http://www.empas.com/ -id_a_f_280208_1 EnaBot/1.x (http://www.enaball.com/crawler.html) Enabot - Enaball semantic search project crawler R http://www.enaball.com/crawler.html -id_a_f_110506_4 endo/1.0 (Mac OS X; ppc i386; http://kula.jp/endo) endo - Mac news site and blog aggregator B http://kula.jp/software/endo/ -id_a_f_290 Enfish Tracker Enfish Personal search tool R http://www.enfish.com -id_a_f_291 Enterprise_Search/1.0 Enterprise Search engine software (64.202.165.xxx) R s. also - ES.NET_Crawler - InnerpriseBot http://www.innerprise.net -id_a_f_292 Enterprise_Search/1.0.xxx Enterprise Search engine software (64.202.165.xxx) R s. also - ES.NET_Crawler - InnerpriseBot http://www.innerprise.net -id_a_f_293 Enterprise_Search/1.00.xxx;MSSQL (http://www.innerprise.net/es-spider.asp) Enterprise Search engine software (64.202.165.xxx) R s. also - ES.NET_Crawler - InnerpriseBot http://www.innerprise.net -id_a_f_230706_1 envolk/1.7 (+http://www.envolk.com/envolkspiderinfo.php) Envolk Web Search robot R 70.169.191.x http://www.envolk.com/ -id_a_f_294 envolk[ITS]spider/1.6(+http://www.envolk.com/envolkspider.html) Envolk Web Search robot R 70.169.191.x http://www.envolk.com/ -id_a_f_295 EroCrawler EroCrawler adult search robot R http://www.erocrawler.com -id_a_f_296 ES.NET_Crawler/2.0 (http://search.innerprise.net/) Enterprise Search engine software (64.202.165.xxx) R s. also - Enterprise_Search - InnerpriseBot http://search.innerprise.net -id_a_f_297 eseek-larbin_2.6.2 (crawler@exactseek.com) ExactSEEK (Jayde Online) robot R see also ExactSeek Crawler / eseek-larbin / exactseek.com http://www.exactseek.com -id_a_f_298 ESISmartSpider ESI Smart-Spider toolkit R http://www.smart-spider.com/ -id_a_f_299 eStyleSearch 4 (compatible; MSIE 6.0; Windows NT 5.0) e-Style ISP search (Russia) robot (217.174.103.xxx) R http://www.e-styleisp.ru/ -id_a_f_300 ESurf15a 15 Some site scanning tool via diff. IPs S s. also DSurf - PBrowse ... -id_a_f_301 EuripBot/0.x (+http://www.eurip.com) GetFile Eurip.com - European Internet Portal robot R http://www.eurip.com -id_a_f_302 EuripBot/0.x (+http://www.eurip.com) GetRobots Eurip.com - European Internet Portal robot R http://www.eurip.com -id_a_f_303 EuripBot/0.x (+http://www.eurip.com) PreCheck Eurip.com - European Internet Portal robot R http://www.eurip.com -id_a_f_220508_3 Eurobot/1.0 (http://www.ayell.eu) Ayell Euronet business directory robot R http://www.ayell.eu/ -id_a_f_030206_4 EvaalSE - bot@evaal.com Evaal Search Engine robot R based on Nutch http://www.evaal.com/ http://search.evaal.com/en/about.html -id_a_f_304 eventax/1.3 (eventax; http://www.eventax.de/; info@eventax.de) Eventax event search (Germany) R http://www.eventax.de -id_a_f_291205_1 Everest-Vulcan Inc./0.1 (R&D project; host=e-1-24; http://everest.vulcan.com/crawlerhelp) Vulcan Inc. Everest crawler (in development) R http://www.vulcan.com/ -id_a_f_305 Everest-Vulcan Inc./0.1 (R&D project; http://everest.vulcan.com/crawlerhelp) Vulcan Inc. Everest crawler (in development) R http://www.vulcan.com/ -id_a_f_050406_2 Exabot-Images/1.0 Exalead Websearch image crawler (193.47.80.xx) R Exabot-Images only requests robots.txt - image crawling under UA NG/4.0.1229 http://www.exalead.com/search -id_a_f_211206_1 Exabot-Test/1.0 Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_a_f_190106_1 Exabot/2.0 Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_a_f_211206_2 Exabot/3.0 Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_a_f_306 ExactSearch eXact Search Bar for IE B http://www.exactsearchbar.com/exact04 -id_a_f_307 ExactSeek Crawler/0.1 ExactSEEK (Jayde Online) robot R see also eseek-larbin / exactseek.com http://www.exactseek.com -id_a_f_308 exactseek-crawler-2.63 (crawler@exactseek.com) ExactSEEK (Jayde Online) robot R see also eseek-larbin / exactseek.com http://www.exactseek.com -id_a_f_309 exactseek-pagereaper-2.63 (crawler@exactseek.com) ExactSEEK (Jayde Online) robot R see also eseek-larbin / exactseek.com http://www.exactseek.com -id_a_f_050606_2 exactseek.com ExactSEEK (Jayde Online) robot (69.9.181.1xx) R see also eseek-larbin http://www.exactseek.com -id_a_f_310 Exalead NG/MimeLive Client (convert/http/0.120) Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and NG/1.0 http://www.exabot.com -id_a_f_311 Excalibur Internet Spider V6.5.4 Excalibur (now Convera) spider software R http://www.excalib.com -id_a_f_191206_1 Execrawl/1.0 (Execrawl; http://www.execrawl.com/; bot@execrawl.com) Execrawl software search using nutch R 72.36.179.1xx http://www.execrawl.com/ -id_a_f_060608_1 exooba crawler/exooba crawler (crawler for exooba.com; http://www.exooba.com/; info at exooba dot com) exooba crawler for exooba search pre-alpha development R 216.195.184.xx http://www.exooba.com/ -id_a_f_060608_2 exooba/exooba crawler (exooba; exooba) exooba crawler for exooba search pre-alpha development R 216.195.184.xx http://www.exooba.com/ -id_a_f_312 ExperimentalHenrytheMiragoRobot Mirago UK Robot R http://www.mirago.co.uk -id_a_f_313 Expired Domain Sleuth Expired Domain Sleuth domain name tool R C http://expireddomainsleuth.com/ -id_a_f_314 Express WebPictures (www.express-soft.com) Express Web Pictures image browser B D http://www.express-soft.com/ -id_a_f_315 ExtractorPro Extractor Pro e-mail collector S http://www.extractorpro.com -id_a_f_170106_1 Extreme Picture Finder Exisoftware image grabber and downloading tool D http://www.exisoftware.com/picture_finder/ -id_a_f_316 EyeCatcher (Download-tipp.de)/1.0 Download-Tipp Germany robot R http://download-tipp.de -id_a_f_091006_1 Factbot 1.09 (see http://www.factbites.com/webmasters.php) Factbites search robot R 70.86.159.1xx http://www.factbites.com/ -id_a_f_220906_1 factbot : http://www.factbites.com/robots Factbites search robot R 70.86.159.1xx http://www.factbites.com/ -id_a_f_221006_1 FaEdit/2.0.x FaEdit Professional - Japanese bookmark manager C https://sw.vector.co.jp/swreg/step1.reserve?srno=SR040433&site=y -id_a_f_317 FairAd Client FairAd user P http://www.fairad.de -id_a_f_051206_1 FANGCrawl/0.01 Safe-t.net web filtering service P 63.167.160.1xx http://www.safe-t.net/ -id_a_f_210206_1 FARK.com link verifier Drew Curtis' FARK.com link checking C http://www.fark.com/ -id_a_f_318 Fast Crawler Gold Edition Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_319 FAST Enterprise Crawler 6 (Experimental) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_040206_1 FAST Enterprise Crawler 6 / Scirus scirus-crawler@fast.no; http://www.scirus.com/srsapp/contactus/ Fast Enterprise Crawler (66.151.181.xx) for Scirus scienctific information search R http://www.scirus.com/srsapp/ http://www.alltheweb.com -id_a_f_320 FAST Enterprise Crawler 6 used by Cobra Development (admin@fastsearch.com) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_070507_1 FAST Enterprise Crawler 6 used by Comperio AS (sts@comperio.no) Comperio Web Miner based on Fast ESP R http://www.comperio.no/index.php?option=com_content&task=blogcategory&id=7&Itemid=27 -id_a_f_321 FAST Enterprise Crawler 6 used by FAST (FAST) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_161106_1 FAST Enterprise Crawler 6 used by Pages Jaunes (pvincent@pagesjaunes.fr) Pages Jaunes business search (France) robot using Fast Enterprise Crawler R 193.252.242.xx http://www.pagesjaunes.fr/ -id_a_f_322 FAST Enterprise Crawler 6 used by Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au) Fast/Alltheweb crawler for Sensis.com.au Australian search (66.151.181.xx) R http://www.sensis.com.au/ http://www.alltheweb.com -id_a_f_251007_2 FAST Enterprise Crawler 6 used by Singapore Press Holdings (crawler@sphsearch.sg) SPH Search - Singapore related search using Fast crawler R 202.176.220.xx http://www.sphsearch.sg/ -id_a_f_280606_2 FAST Enterprise Crawler 6 used by WWU (wardi@uni-muenster.de) FAST Enterprise Crawler used by WWU (University of Muenster - Germany) C 128.176.188.2xx http://www.uni-muenster.de/en/index.html http://www.alltheweb.com -id_a_f_323 FAST Enterprise Crawler/6 (www.fastsearch.com) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_324 FAST Enterprise Crawler/6.4 (helpdesk at fast.no) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_325 FAST FirstPage retriever (compatible; MSIE 5.5; Mozilla/4.0) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_326 FAST MetaWeb Crawler (helpdesk at fastsearch dot com) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_327 Fast PartnerSite Crawler Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_328 FAST-WebCrawler/2.2.10 (Multimedia Search) (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html) Fast/Alltheweb multimedia crawler R see also Yahoo-MMCrawler/3.x http://www.alltheweb.com -id_a_f_329 FAST-WebCrawler/2.2.6 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_330 FAST-WebCrawler/2.2.7 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_331 FAST-WebCrawler/2.2.8 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_332 FAST-WebCrawler/3.2 test Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_333 FAST-WebCrawler/3.3 (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_334 FAST-WebCrawler/3.4/Nirvana (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_335 FAST-WebCrawler/3.4/PartnerSite (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_336 FAST-WebCrawler/3.5 (atw-crawler at fast dot no; http://fast.no/support.php?c=faqs/crawler) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_337 FAST-WebCrawler/3.6 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_338 FAST-WebCrawler/3.6/FirstPage (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_339 FAST-WebCrawler/3.7 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_340 FAST-WebCrawler/3.7/FirstPage (atw-crawler at fast dot no;http://fast.no/support/crawler.asp) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_341 FAST-WebCrawler/3.8 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_342 FAST-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp) Fast/Alltheweb crawler R http://www.alltheweb.com -id_a_f_343 FAST-WebCrawler/3.x Multimedia Fast/Alltheweb multimedia crawler R see also Yahoo-MMCrawler/3.x http://www.alltheweb.com -id_a_f_344 FAST-WebCrawler/3.x Multimedia (mm dash crawler at fast dot no) Fast/Alltheweb multimedia crawler R see also Yahoo-MMCrawler/3.x http://www.alltheweb.com -id_a_f_121205_2 fastbot crawler beta 2.0 (+http://www.fastbot.de) Fastbot search Germany crawler (80.252.104.1xx) R http://www.fastbot.de/ -id_a_f_345 FastBug http://www.ay-up.com Ay-Up geo sync search robot R http://www.ay-up.com -id_a_f_346 FastCrawler 3.0.1 (crawler@1klik.dk) Fast/Alltheweb crawler (66.151.181.xx) R http://www.alltheweb.com -id_a_f_347 FastSearch Web Crawler for Verizon SuperPages (kevin.watters@fastsearch.com) Fast/Alltheweb crawler used by SuperPages.com R http://www.superpages.com http://www.alltheweb.com -id_a_f_170408_3 Favcollector/2.0 (info@favcollector.com http://www.favcollector.com/) Favcollector Favicon collecting robot R 66.207.217.13x http://www.favcollector.com/ -id_a_f_161006_1 FavIconizer FavIconizer - IE favorites icons refreshing tool D http://www.codeproject.com/tools/faviconizer.asp -id_a_f_151206_1 favo.eu crawler/0.6 (http://www.favo.eu) favo.eu (Germany) search robot R 84.19.186.1xx http://www.favo.eu/ -id_a_f_348 FavOrg ZD's FavOrg favourites managing program C http://www.pcmag.com/article2/0,4149,108438,00.asp -id_a_f_260108_1 Favorites Checking (http://campulka.net) Campulka.net Favorites checking tool C http://campulka.net/?dir=Utility -id_a_f_349 Favorites Sweeper v.2.03 Favorites Sweeper bookmark checker C http://www.manitoolssoftware.cjb.net -id_a_f_350 Faxobot/1.0 FaXo Search robot (69.152.89.xx) R http://www.faxo.com -id_a_f_351 FDM 1.x Free Download Manager (FDM) download accelerator D http://www.freedownloadmanager.org -id_a_f_180207_1 FDM 2.x Free Download Manager (FDM) download accelerator D http://www.freedownloadmanager.org -id_a_f_352 Feed Seeker Bot (RSS Feed Seeker http://www.MyNewFavoriteThing.com/fsb.php) RSS Feed Seeker bot (68.225.95.2xx) R http://www.MyNewFavoriteThing.com -id_a_f_241206_1 Feed24.com Feed24 news feed and blog search R 194.105.139.2xx http://www.feed24.com/ -id_a_f_050306_1 Feed::Find/0.0x Feed::Find - Syndication feed (RSS/Atom) auto-discovery D http://search.cpan.org/~btrott/Feed-Find-0.06/lib/Feed/Find.pm -id_a_f_250707_1 Feedable/0.1 (compatible; MSIE 6.0; Windows NT 5.1) Feedable beta web based RSS service B 64.27.19.25x http://reader.feedable.com/ -id_a_f_230406_2 FeedChecker/0.01 Unknown robot from the University of Tokyo (157.82.157.xx) R reads robots.txt http://www.u-tokyo.ac.jp/index_e.html -id_a_f_140608_2 FeedDemon/2.7 (http://www.newsgator.com/; Microsoft Windows XP) FeedDemon RSS reader B http://www.newsgator.com/individuals/feeddemon/ -id_a_f_160308_2 Feedfetcher-Google-iGoogleGadgets; (+http://www.google.com/feedfetcher.html) Google news feed feetcher for iGoogle gadgets C 72.14.[1-2]xx.[X]xx http://www.google.com/feedfetcher.html -id_a_f_010906_1 Feedfetcher-Google; (+http://www.google.com/feedfetcher.html) Google Feedfetcher - RSS and Atom feed crawler R 72.14.199.x[xx] http://www.google.com/feedfetcher.html -id_a_f_010307_1 FeedForAll rss2html.php v2 FeedForAll RSS feed robot C 216.92.192.1xx http://www.feedforall.com/ -id_a_f_010308_1 FeedHub FeedDiscovery/1.0 (http://www.feedhub.com) FeedHub news feed personalization engine powered by mSpoke R 216.134.194.xx http://www.feedhub.com/ http://www.mspoke.com/ -id_a_f_060608_3 FeedHub MetaDataFetcher/1.0 (http://www.feedhub.com) FeedHub news feed personalization engine powered by mSpoke R 216.134.194.xx http://www.feedhub.com/ http://www.mspoke.com/ -id_a_f_260608_3 Feedjit Favicon Crawler 1.0 Feedjit news feed service favicon crawler R 69.46.36.x http://feedjit.com/ -id_a_f_150108_1 Feedreader 3.xx (Powered by Newsbrain) Newsbrain Feedreader3 B http://www.feedreader.com/ -id_a_f_281106_3 Feedshow/x.0 (http://www.feedshow.com; 1 subscriber) FeedShow online RSS feed reader B http://www.feedshow.com/ -id_a_f_051206_2 FeedshowOnline (http://www.feedshow.com) FeedShow online RSS feed reader B http://www.feedshow.com/ -id_a_f_040207_1 FeedZcollector v1.x (Platinum) http://www.feeds4all.com/feedzcollector FeedZcollector - Feed (RSS, ATOM and RDF) capturing software B http://www.feeds4all.com/feedzcollector/ -id_a_f_353 Felix - Mixcat Crawler (+http://mixcat.com) MixCat robot R s. also Morris http://mixcat.com -id_a_f_354 fetch libfetch/2.0 FreeBSD download tool D -id_a_f_355 FFC Trap Door Spider Frequent Finders spider via Sitefusion.com R http://www.frequentfinders.com -id_a_f_356 Filangy/0.01-beta (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com) Filangy search and bookmark service R C http://www.filangy.com -id_a_f_357 Filangy/1.0x (Filangy; http://www.filangy.com/filangyinfo.jsp?inc=robots.jsp; filangy-agent@filangy.com) Filangy search and bookmark service R C http://www.filangy.com -id_a_f_358 Filangy/1.0x (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com) Filangy search and bookmark service R C http://www.filangy.com -id_a_f_359 fileboost.net/1.0 (+http://www.fileboost.net) File Boost Network link checking R C http://www.fileboost.net -id_a_f_360 FileHound x.x FileHound download manager D http://www.allabout.com -id_a_f_180208_1 Filtrbox/1.0 filtrbox media content (news) monitoring R 72.47.203.8x http://www.filtrbox.com/ -id_a_f_361 FindAnISP.com_ISP_Finder_v99a Find An ISP robot R C site is down http://www.findanisp.com/ -id_a_f_141205_2 Findexa Crawler (http://www.findexa.no/gulesider/article26548.ece) Yelo.no business search (Norway) via Findexa R http://www.findexa.no/english/article27709.ece -id_a_f_362 findlinks/x.xxx (+http://wortschatz.uni-leipzig.de/findlinks/) NextLinks - German vocabulary and hyperlink search R http://wortschatz.uni-leipzig.de/nextlinks/findlinks.html -id_a_f_363 FineBot Finesearch robot R http://www.finesearch.com -id_a_f_080306_1 Finjan-prefetch Finjan Vital Security Web Appliance security solution P http://www.finjan.com/ -id_a_f_364 Firefly/1.0 Fireball.de robot R http://www.fireball.de -id_a_f_365 Firefly/1.0 (compatible; Mozilla 4.0; MSIE 5.5) Fireball.de robot R http://www.fireball.de -id_a_f_210906_1 Firefox (kastaneta03@hotmail.com) Unknown robot from Czech Technical University Prague (147.32.141.xx) R reads robots.txt http://www.cvut.cz/ -id_a_f_190306_2 Firefox_1.0.6 (kasparek@naparek.cz) Unknown robot from Czech Technical University Prague (147.32.141.xx) R reads robots.txt http://www.cvut.cz/ -id_a_f_366 FirstGov.gov Search - POC:firstgov.webmasters@gsa.gov AT&T/Fast Search robot for FirstGov (U.S.Government) portal R http://www.firstgov.gov -id_a_f_367 firstsbot Firstsfind Germany robot / link checking R http://www.firstsfind.de -id_a_f_020906_1 Flapbot/0.7.2 (Flaptor Crawler; http://www.flaptor.com; crawler at flaptor period com) Flaptor information retrieval solutions robot R http://www.flaptor.com/index.htm -id_a_f_368 FlashGet JetCar/FlashGet download manager D http://www.amazesoft.com -id_a_f_161205_1 FLATARTS_FAVICO FlatArts Favorites Icon Tool C D http://flatarts.jp/contents/software/information.php?name=rico -id_a_f_100308_1 Flexum spider Flexum.ru search service R 81.176.76.93 http://www.flexum.ru/ -id_a_f_280508_2 Flexum/2.0 Flexum.ru search service R 81.176.76.93 http://www.flexum.ru/ -id_a_f_369 FlickBot 2.0 RPT-HTTPClient/0.3-3 DivX.com Movie Find robot R http://www.divx.com -id_a_f_370 flunky Metacarta / Cogent robot R http://www.metacarta.com -id_a_f_371 fly/6.01 libwww/4.0D unknown -id_a_f_110107_1 flyindex.net 1.0/http://www.flyindex.net FLY Index Metasearch link checking C 62.141.52.2xx http://www.flyindex.net/ -id_a_f_021108_1 FnooleBot/2.5.2 (+http://www.fnoole.com/addurl.html) Fnoole news crawler R 209.205.65.9x http://www.fnoole.com/ -id_a_f_372 FocusedSampler/1.0 IBM's Almaden Research robot R s. also: - - WFARC http://www.almaden.ibm.com -id_a_f_080108_1 Folkd.com Spider/0.1 beta 1 (www.folkd.com) folkd.com social search robot R 212.227.95.3x http://www.folkd.com/ -id_a_f_070209_4 FollowSite Bot ( http://www.followsite.com/bot.html ) FollowSite robot - website monitoring C 77.232.77.13x http://www.followsite.com/bot.html -id_a_f_140209_1 FollowSite.com ( http://www.followsite.com/b.html ) FollowSite robot - website monitoring C 77.232.77.13x http://www.followsite.com/bot.html -id_a_f_141105_1 Fooky.com/ScorpionBot/ScoutOut; http://www.fooky.com/scorpionbots Fooky search Scorpionbots robot (65.12.170.xxx) R http://www.fooky.com/ -id_a_f_373 Francis/1.0 (francis@neomo.de http://www.neomo.de/) Neomo Search (Germany) robot (85.10.197.1xx) R http://www.neomo.de -id_a_f_374 Franklin Locator 1.8 Some spam bot S -id_a_f_110506_1 free-downloads.net download-link validator /0.1 Free Downloads shareware directory link checking C http://www.free-downloads.net/ -id_a_f_375 FreeFind.com-SiteSearchEngine/1.0 (http://freefind.com; spiderinfo@freefind.com) FreeFind.com robot R http://freefind.com -id_a_f_221008_2 Frelicbot/1.0 +http://www.frelic.com/ Frelics backlink checking bot (beta) C http://www.frelic.com/ -id_a_f_376 FreshDownload/x.xx Fresh Download download manager D http://www.freshdevices.com -id_a_f_230306_2 FreshNotes crawler< report problems to crawler-at-freshnotes-dot-com FreshNotes - music related artist search (72.3.225.xx) R http://freshnotes.com/fn/ -id_a_f_377 FSurf15a 01 Some site scanning tool via diff. IPs S s. also DSurf - PBrowse ... -id_a_f_070209_5 FTB-Bot http://www.findthebest.co.uk/ Find the Best search robot R 83.105.71.16x http://www.findthebest.co.uk/ -id_a_f_378 Full Web Bot 0416B Some site scanning tool from diff. IPs i.e.: - 66.28.240.xx (cogentco.com) - 68.5.174.xx (cox.net) S -id_a_f_379 Full Web Bot 0516B Some site scanning tool i.e. from - 68.154.96.xx (bellsouth.net) S appears also as MFC Foundation Class Library & Demo Bot Z 16b - 66.118.1xx.xxx (sagonet.com) - s. also Educate Search VxB - Industry Program 1.0.5 -id_a_f_380 Full Web Bot 2816B Some site scanning tool from 66.255.6.xxx (uslec.com) S -id_a_f_190807_1 FuseBulb.Com FuseBulb search R 208.109.126.1xx http://www.fusebulb.com/ -id_a_f_381 FyberSpider (+http://www.fybersearch.com/fyberspider.php) FyberSearch FyberSpider robot R http://www.fybersearch.com -id_g_m_382 Gagglebot Some user from bbnplanet.net (4.63.218.2xx) using an Innerprise robot tool R C ? http://www.innerprise.net -id_g_m_383 GAIS Robot/1.0B2 Seed Search robot R http://www.seed.net.tw -id_g_m_384 Gaisbot/3.0 (indexer@gais.cs.ccu.edu.tw; http://gais.cs.ccu.edu.tw/robot.php) Gaislab Taiwan robot R 140.123.100.x http://gais.cs.ccu.edu.tw -id_g_m_160706_1 Gaisbot/3.0+(robot06@gais.cs.ccu.edu.tw;+http://gais.cs.ccu.edu.tw/robot.php) Gaislab Taiwan robot R 140.123.100.x http://gais.cs.ccu.edu.tw -id_g_m_385 GalaxyBot/1.0 (http://www.galaxy.com/galaxybot.html) Galaxy robot (63.121.41.xxx) R s. also Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com....) http://www.galaxy.com -id_g_m_130407_2 Gallent Search Spider v1.4 Robot 2 (http://robot.GallentSearch.com) Gallent Search directory (UK) R 88.208.223.xx http://www.gallent.co.uk/ http://robot.gallentsearch.com/ -id_g_m_010107_1 gamekitbot/1.0 (+http://www.uchoose.de/crawler/gamekitbot/) Gamekit game search engine - Germany R 80.65.45.xx http://www.gamekit.de/ -id_g_m_386 Gamespy_Arcade GameSpyHTTP/1.0 D GameSpy Arcade download manager (FilePlanet) http://www.gamespyarcade.com/features/ -id_g_m_387 GammaSpider/1.0 GammaWare GammaSpider R http://www.gammasite.com -id_g_m_388 gazz/x.x (gazz@nttrd.com) nttrd.com / Infobee.ne.jp robot R -id_g_m_389 geckobot Geckobot user robot no active website http://www.geckobot.com/ -id_g_m_280406_1 Generic Mobile Phone (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html) Google Mobile Search crawler R P 66.249.72.1xx http://www.google.com/mobile/formats.html -id_g_m_390 generic_crawler/01.0217/ Unknown robot from Carnegie Mellon University (128.2.211.xxx) R http://www.cmu.edu -id_g_m_100109_2 GenesisBrowser (HTTP 1.1; 0.9; XP SP2; .NET CLR 2.0.50727) Lunascape Genesis browser B http://www.lunascape.tv/ -id_g_m_231205_1 genieBot (http://64.5.245.11/faq/faq.html) GenieKnows.com search R s. also: - larbin_2.6.3 (wgao@genieknows.com) http://www.genieknows.com/ -id_g_m_391 geniebot wgao@genieknows.com GenieKnows.com search R s. also: - larbin_2.6.3 (wgao@genieknows.com) http://www.genieknows.com/ -id_g_m_050606_3 GeoBot/1.0 Unknown robot from wavepath.com (65.254.33.1xx) no active website -id_g_m_392 GeonaBot 1.x; http://www.geona.com/ Geona Search robot / link checking R http://www.geona.com -id_g_m_160206_3 geourl/2.0b2 GeoURL ICBM Address Server - a location-to-URL reverse directory C http://geourl.org/ -id_g_m_160206_2 GeoURLBot 1.0 (http://geourl.org) GeoURL ICBM Address Server - a location-to-URL reverse directory C http://geourl.org/ -id_g_m_393 GetBot Getbot web downloading tool / site grabber D http://www.getbot.com -id_g_m_394 GetRight/3.x.x GetRight download manager D http://www.getright.com -id_g_m_395 GetRight/4.5xx GetRight download manager D http://www.getright.com -id_g_m_396 GetRight/4.x GetRight download manager D http://www.getright.com -id_g_m_397 GetRight/4.x[a-e] GetRight download manager D http://www.getright.com -id_g_m_260807_1 GetRight/6.1 (Pro) GetRight download manager D http://www.getright.com -id_g_m_398 GetRightPro/6.0beta2 GetRight download manager D http://www.getright.com -id_g_m_170706_3 GetWeb/0.1 libwww-perl/5.16 GetWeb - web page to email service D 216.204.133.xxx http://www.healthnet.org/getweb.php -id_g_m_399 GhostRouteHunter/20021130 (https://www.sixxs.net/tools/grh/; info@sixxs.net) Sixxs Ghost Route Hunter C http://www.sixxs.net/tools/grh/ -id_g_m_400 gigabaz/3.1x (baz@gigabaz.com; http://gigabaz.com/gigabaz/) GigaBaz Brainbot (Germany) robot R s. also - MicroBaz http://gigabaz.com -id_g_m_401 Gigabot/2.0 (gigablast.com) Gigablast robot (64.62.168.xx) R http://www.gigablast.com -id_g_m_140106_1 Gigabot/2.0/gigablast.com/spider.html Gigablast robot R comes from 64.62.168.xx AND 66.154.102.xx http://www.gigablast.com -id_g_m_170506_1 Gigabot/2.0; http://www.gigablast.com/spider.html Gigablast robot R comes from 64.62.168.xx AND 66.154.102.xx http://www.gigablast.com -id_g_m_190507_1 Gigabot/2.0att Gigablast robot R 66.231.188.1xx http://www.gigablast.com -id_g_m_230508_1 Gigabot/3.0 (http://www.gigablast.com/spider.html) Gigablast robot R 66.231.18x.[x]xx http://www.gigablast.com -id_g_m_402 Gigabot/x.0 Gigablast robot (64.62.168.xx) R http://www.gigablast.com -id_g_m_403 GigabotSiteSearch/2.0 (sitesearch.gigablast.com) Gigablast robot (64.62.168.xx) R http://www.gigablast.com -id_g_m_404 GNODSPIDER (www.gnod.net) www.gnod.net spider R http://www.gnod.net -id_g_m_406 Go!Zilla 3.x (www.gozilla.com) Go!Zilla download manager D http://www.gozilla.com -id_g_m_407 Go!Zilla/4.x.x.xx Go!Zilla download manager D http://www.gozilla.com -id_g_m_405 Go-Ahead-Got-It/1.1 GotIt web accelerator (discontinued) P D -id_g_m_408 Goblin/0.9 (http://www.goguides.org/) GoGuides.Org (195.226.137.xx) robot R http://www.goguides.org/goblin-info.html -id_g_m_409 Goblin/0.9.x (http://www.goguides.org/goblin-info.html) GoGuides.Org (195.226.137.xx) robot R http://www.goguides.org/goblin-info.html -id_g_m_410 GoForIt.com GoForIt Search robot R 208.109.236.xx http://www.goforit.com -id_g_m_411 GOFORITBOT ( http://www.goforit.com/about/ ) GoForIt Search robot R 208.109.236.xx http://www.goforit.com -id_g_m_020306_1 GoGuides.Org Link Check GoGuides.org directory & search link checking C http://www.goguides.org/ -id_g_m_230207_2 GoldenFeed Spider 1.0 (http://www.goldenfeed.com) GoldenFeed.com - RSS search engine C 74.52.41.1xx http://www.goldenfeed.com/ -id_g_m_412 Goldfire Server Invention Machines Goldfire Server P http://www.invention-machine.com/custsupport/GFR_install.cfm -id_g_m_041006_1 gonzo1[P] +http://www.suchen.de/popups/faq.jsp suchen.de German local search robot R 212.34.185.xx http://www.suchen.de/ -id_g_m_130108_2 gonzo2[P] +http://www.suchen.de/faq.html suchen.de German local search robot R 212.34.185.xx http://www.suchen.de/ -id_g_m_413 Goofer/0.2 Some private robot (Wanadoo.fr client) R -id_g_m_300606_1 Google Talk Google instant messenger B http://www.google.com/talk/ -id_g_m_414 googlebot (larbin2.6.0@unspecified.mail) Packard Bell Net user robot (*not* Google) -id_g_m_050106_1 Googlebot-Image/1.0 Google image crawler (66.249.72.xxx) R http://www.google.com -id_g_m_415 Googlebot-Image/1.0 ( http://www.googlebot.com/bot.html) Google image crawler (66.249.72.xxx) R http://www.google.com -id_g_m_416 Googlebot/2.1 ( http://www.google.com/bot.html) Google robot 66.249.64.XXX R s. also: - Mozilla/4.0 (MobilePhone SCP ... - Mozilla/5.0 (compatible; Googlebot/2.1... http://www.google.com -id_g_m_417 Googlebot/2.1 ( http://www.googlebot.com/bot.html) Google robot 66.249.64.XXX R http://www.google.com -id_g_m_418 Googlebot/Test ( http://www.googlebot.com/bot.html) Google robot 66.249.64.XXX R http://www.google.com -id_g_m_280209_2 Gordon's Spider/Nutch-0.9 (http://www.sharethis.com; gordon@sharethis.com) ShareThis social networking service via Amazon Web Services C 174.129.242.x http://sharethis.com/ http://www.amazonaws.com/ -id_g_m_419 GrapeFX/0.3 libwww/5.4.0 Grapeshot web search system API R http://www.grapeshot.co.uk/html/Index.html -id_g_m_300907_4 great-plains-web-spider/flatlandbot (Flatland Industries Web Spider; http://www.flatlandindustries.com/flatlandbot.php; jason@flatlandindustries.com) Flatland Industries vertical search solution R 74.62.161.xx http://www.flatlandindustries.com/ http://www.flatlandindustries.com/flatlandbot.php -id_g_m_250707_2 GreatNews/1.0 GreatNews 1.0 Beta RSS reader B http://www.curiostudio.com/ -id_g_m_170207_2 GreenBrowser GreenBrowser - IE based browser (China) B http://www.morequick.com/indexen.htm -id_g_m_100307_2 gridwell (http://search.gridwell.com) search gridwell favicon display D 212.227.127.xx http://search.gridwell.com/ -id_g_m_420 GrigorBot 0.8 (http://www.grigor.biz/bot.html) Grigor Search bot R http://www.grigor.biz -id_g_m_161206_1 Gromit/1.0 Australasian Legal Information Institute (AustLII) robot R http://www.austlii.edu.au/ http://www2.austlii.edu.au/~dan/gromit/ -id_g_m_421 grub crawler(http://www.grub.org) Grub open source crawler R http://www.grub.org -id_g_m_422 grub-client Grub open source crawler R http://www.grub.org -id_g_m_423 gsa-crawler (Enterprise; GID-01422; jplastiras@google.com) Google Search Appliance robot (216.239.xx.xx) R http://www.google.com/enterprise/gsa/ -id_g_m_424 gsa-crawler (Enterprise; GID-01742;gsatesting@rediffmail.com) Google Search Appliance robot (216.239.xx.xx) R http://www.google.com/enterprise/gsa/ -id_g_m_060506_1 gsa-crawler (Enterprise; GIX-02057; dm@enhesa.com) Google Enterprise Search Appliance used by Enhesa (212.35.100.1xx) R http://www.enhesa.com/enhesa/en/default.asp http://www.google.com/enterprise/gsa/ -id_g_m_311205_1 gsa-crawler (Enterprise; GIX-03519; cknuetter@stubhub.com) Google Enterprise Search Appliance used by IBM (129.41.20.1xx) R http://www.google.com/enterprise/gsa/ -id_g_m_425 gsa-crawler (Enterprise; GIX-0xxxx; enterprise-training@google.com) Google Search Appliance robot (216.239.xx.xx) R http://www.google.com/enterprise/gsa/ -id_g_m_081006_1 GSiteCrawler/v1.xx rev. xxx (http://gsitecrawler.com/) GSiteCrawler - Google sitemap generator for Windows C http://gsitecrawler.com/ -id_g_m_260207_1 Guestbook Auto Submitter Guestbook spamming tool S -id_g_m_426 Gulliver/1.3 Northernlight robot R http://www.northernlight.com -id_g_m_427 Gulper Web Bot 0.2.4 (www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot) Yuntis Collaborative Web Resource Categorization and Ranking Project robot R http://www.ecsl.cs.sunysb.edu/yuntis/ -id_g_m_140907_1 Gungho/0.08004 (http://code.google.com/p/gungho-crawler/wiki/Index) Gungho - Extensible web crawler written in Perl by Google Code R http://code.google.com/p/gungho-crawler/wiki/Index -id_g_m_211106_1 GurujiBot/1.0 (+http://www.guruji.com/WebmasterFAQ.html) guruji : the Indian search engine robot R 209.128.80.1xx / 72.20.109.xx http://www.guruji.com/ -id_g_m_100508_2 GurujiImageBot/1.0 (+http://www.guruji.com/en/WebmasterFAQ.html) guruji : the Indian search engine picture crawler R 72.20.109.xx http://www.guruji.com/ -id_g_m_291108_3 Haier-T10C/1.0 iPanel/2.0 WAP2.0 (compatible; UP.Browser/6.2.2.4; UPG1; UP/4.0; Embedded) Openwave Mobile Browser on Haier T10C mobile B http://www.openwave.com -id_g_m_171105_5 HappyFunBot/1.1 Happy Fun Search robot R http://www.happyfunsearch.com/bot.html -id_g_m_428 Harvest-NG/1.0.2 Harvest-NG web crawler used by search.yahoo.com R see also Exalead NG and NG/1.0 http://search.yahoo.com -id_g_m_429 Haste/0.12 (HOME: http://haste.kytoon.com/) Haste - web mapping and monitoring system R C site is closed http://haste.kytoon.com -id_g_m_430 Hatena Antenna/0.4 (http://a.hatena.ne.jp/help#robot) Hatena::Antenna Japan robot R 221.186.146.xx http://a.hatena.ne.jp -id_g_m_110606_2 Hatena Mobile Gateway/1.0 Hatena Japan proxy for handheld/mobile clients P 221.186.146.xx http://www.hatena.ne.jp/ -id_g_m_431 Hatena Pagetitle Agent/1.0 Hatena Japan robot R 221.186.146.xx http://www.hatena.ne.jp -id_g_m_240207_1 Hatena RSS/0.3 (http://r.hatena.ne.jp) Hatena Japan RSS feed robot R 221.186.146.xx http://www.hatena.ne.jp -id_g_m_110606_1 HatenaScreenshot/1.0 (checker) Hatena::Diary (Japan) web page screenshot robot R D 221.186.146.xx http://www.hatena.ne.jp/ -id_g_m_120108_1 hbtronix.spider.2 -- http://hbtronix.de/spider.php hbtronix.spider - Domain name spider (Germany) R 89.110.157.* http://hbtronix.de/spider.php -id_g_m_432 HeinrichderMiragoRobot Mirago Germany robot R http://www.mirago.de/ -id_g_m_433 HeinrichderMiragoRobot (http://www.miragorobot.com/scripts/deinfo.asp) Mirago Germany robot R http://www.mirago.de/ -id_g_m_434 Helix/1.x ( http://www.sitesearch.ca/helix/) Helix - The SiteSearch (Canada) web crawler R http://www.sitesearch.ca -id_g_m_080206_3 HenriLeRobotMirago (http://www.miragorobot.com/scripts/frinfo.asp) Mirago France robot R http://www.mirago.fr/ -id_g_m_435 HenrytheMiragoRobot Mirago search (UK) robot R 217.154.245.2xx http://www.mirago.co.uk -id_g_m_060806_3 HenryTheMiragoRobot (http://www.miragorobot.com/scripts/mrinfo.asp) Mirago search (UK) robot R 217.154.245.2xx http://www.mirago.co.uk -id_g_m_436 hgrepurl/1.0 O'Reilly's Perl LWP example client program from Web Client Programming with Perl -id_g_m_437 Hi! I'm CsCrawler my homepage: http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html RPT-HTTPClient/0.3-3 University of Kassel Germany CsCrawler using the HTTPClient library R http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html http://www.innovation.ch/java/HTTPClient/ -id_g_m_438 HiDownload HiDownload download manager D http://www.streamingstar.com/hidownload.htm -id_g_m_439 Hippias/0.9 Beta Hippias robot R site is offline http://hippias.evansville.edu -id_g_m_440 HitList Pilot Hitlist web analytics solution R http://www.pilotsoftware.com/products_solutions/hitlist.html -id_g_m_441 Hitwise Spider v1.0 http://www.hitwise.com Hitwise spider R http://www.hitwise.com -id_g_m_442 HLoader diff. IPs / unknown services i.e.: - 204.95.207.xxx user agent ? - 66.27.113.xx link checking ? -id_g_m_040907_1 holmes/3.11 (http://morfeo.centrum.cz/bot) Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx R http://morfeo.centrum.cz/ -id_g_m_220906_2 holmes/3.9 (onet.pl) Onet.pl (Poland) search robot R 213.180.137.xx http://szukaj.onet.pl/ -id_g_m_181006_1 holmes/3.xx (OnetSzukaj/5.0; +http://szukaj.onet.pl) Onet.pl (Poland) search robot R 213.180.137.xx http://szukaj.onet.pl/ -id_g_m_443 holmes/x.x Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx R http://morfeo.centrum.cz/ -id_g_m_021108_2 HolmesBot (http://holmes.ge) Holes search robot (Georgia) R 77.92.229.3x http://holmes.ge/ -id_g_m_444 HomePageSearch(hpsearch.uni-trier.de) HomePageSearch robot R http://hpsearch.uni-trier.de/ -id_g_m_445 Homerbot: www.homerweb.com Homerweb search robot R http://www.homerweb.com -id_g_m_220606_1 Honda-Search/0.7.2 (Nutch; http://lucene.apache.org/nutch/bot.html; search@honda-search.com) Honda-Search.com - Honda cars related search robot R 69.16.227.1xx http://www.honda-search.com/ -id_g_m_090206_1 HooWWWer/2.1.3 (debugging run) (+http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-infohiit.fi) HooWWer - Next Generation Information Retrieval robot R http://cosco.hiit.fi -id_g_m_446 HooWWWer/2.1.x ( http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-infohiit.fi) HooWWer - Next Generation Information Retrieval robot (128.214.112.xx) R http://cosco.hiit.fi/ -id_g_m_447 HotJava/1.0.1/JRE1.1.x HotJava browser plus HTML Component 1.1.x B -id_g_m_448 Hotzonu/x.0 Hotzuno - Japanese BBS reader client B http://hotzonu.hp.infoseek.co.jp/ -id_g_m_040507_1 HPL/Nutch-0.9 - Unknown robot from HP Labs R 15.203.249.12x http://hpl.hp.com/ -id_g_m_449 htdig/3.1.6 (http://computerorgs.com) COMPUTERorgs.com robot (205.134.190.xxx) using htdig R http://www.computerorgs.com/ http://www.htdig.org -id_g_m_210106_1 htdig/3.1.6 (unconfigured@htdig.searchengine.maintainer) htdig used by the Academie de Toulouse R reads robots.txt http://www.ac-toulouse.fr/html/_.php http://www.htdig.org -id_g_m_450 htdig/3.1.x (root@localhost) htdig search tool R http://www.htdig.org -id_g_m_451 Html Link Validator (www.lithopssoft.com) Lithops Software link validation tool C http://www.lithopssoft.com -id_g_m_110506_3 HTML2JPG Blackbox, http://www.html2jpg.com HTML2JPG webpage to image converter D http://www.html2jpg.com -id_g_m_452 HTML2JPG Enterprise HTML2JPG webpage to image converter D http://www.html2jpg.com -id_g_m_101205_1 HTMLParser/1.x HTML Parser Java library to parse HTML D http://sourceforge.net/projects/htmlparser -id_g_m_071006_1 HTTP Retriever PHP HTTP client to access Web servers D http://code.blitzaffe.com/pages/home/ -id_g_m_240306_1 http://Anonymouse.org/ (Unix) Anonymous web proxy service P http://anonymouse.org/ -id_g_m_453 http://Ask.24x.Info/ (http://narres.it/) Ask 24x Info (Germany) DMOZ related robot R http://narres.it -id_g_m_070209_6 http://hilfe.acont.de/bot.html ACONTBOT ACONTBOT - Acont search Germany robot R 82.149.246.2x http://acont.de/ http://hilfe.acont.de/bot.htm -id_g_m_230408_1 http://OzySoftware.com/Index.html OzySoftware.com software directory link checking C 202.173.141.x http://ozysoftware.com/index.html -id_g_m_454 http://www.almaden.ibm.com/cs/crawler IBM's Almaden Research robot R s. also: - FocusedSampler - WFARC http://www.almaden.ibm.com -id_g_m_455 http://www.almaden.ibm.com/cs/crawler [rc1.wf.ibm.com] IBM's Almaden Research robot R http://www.almaden.ibm.com -id_g_m_456 http://www.almaden.ibm.com/cs/crawler [wf216] IBM's Almaden Research robot R http://www.almaden.ibm.com -id_g_m_271105_4 http://www.istarthere.com_spider@istarthere.com Istarthere.com search robot R http://www.istarthere.com/ -id_g_m_070106_1 http://www.monogol.de Monogol - German open source search engine project (195.226.167.1xx) R http://www.monogol.de/ -id_g_m_060806_4 http://www.trendtech.dk/spider.asp) TrendTech Search Engine (Denmark) robot R 87.104.18.xx http://www.trendtech.dk/ -id_g_m_290106_1 HTTP::Lite/2.x.x HTTP::Lite - Standalone Perl module for retreiving HTTP documents D http://www.toybox.ca/http-lite/ -id_g_m_050108_1 HTTPEyes HTTPEyes - Web proxy cache P http://bachue.com/httpeyes/ -id_g_m_457 HTTPResume v. 1.x HTTPResume Amiga download manager D http://tesla.rcub.bg.ac.yu/%7Eantony/HTTPResume/ -id_g_m_031107_2 httpunit/1.5 HttpUnit - Java test code for emulating browser behaviour B http://httpunit.sourceforge.net/ -id_g_m_090306_1 httpunit/1.x HttpUnit - Java browser behavior simulation tool B http://httpunit.sourceforge.net/ -id_g_m_010807_1 Hybrid/1.2 [en] (OS Independent) Hybrid Share mono C#/Gtk# application for file sharing http://hybrid-share.sourceforge.net/index.php -id_g_m_300507_1 HyperEstraier/1.x.xx Hyper Estraier full-text search system D http://hyperestraier.sourceforge.net/ -id_g_m_170906_1 i1searchbot/2.0 (i1search web crawler; http://www.i1search.com; crawler@i1search.com) i1search robot R 65.111.164.1xx http://www.i1search.com/ -id_g_m_461 IAArchiver-1.0 Alexa / The Internet Archive (209.237.238.1xx) R http://www.alexa.com -id_g_m_091205_2 iaskspider Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx) Not from iask.com.cn - s. also Mozilla/5.0 (compatible; iaskspider/1.0 .. -id_g_m_111106_1 iaskspider2 (iask@staff.sina.com.cn) Iask search / Sina portal robot (China) R 202.106.184.xxx http://iask.com/ http://english.sina.com/index.html -id_g_m_458 ia_archiver Alexa / The Internet Archive (209.237.238.1xx) R http://www.alexa.com -id_g_m_459 ia_archiver-web.archive.org Alexa / The Internet Archive (209.237.238.1xx) R http://www.alexa.com -id_g_m_460 ia_archiver/1.6 Alexa / The Internet Archive (209.237.238.1xx) R http://www.alexa.com -id_g_m_462 IBrowse/2.2 (AmigaOS 3.5) IOSpirit iBrowse Amiga Browser B was Hisoft (http://www.hisoft.co.uk) http://amiga.iospirit.de/ -id_g_m_463 IBrowse/2.2 (Windows 3.1) IOSpirit iBrowse Amiga Browser B was Hisoft (http://www.hisoft.co.uk) http://amiga.iospirit.de/ -id_g_m_464 iCab/2.5.2 (Macintosh; I; PPC) iCab MAC Web browser B http://www.icab.de -id_g_m_110207_2 ICC-Crawler(Mozilla-compatible; http://kc.nict.go.jp/icc/crawl.html; icc-crawl(at)ml(dot)nict(dot)go(dot)jp) Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan) R 202.180.34.1xx http://kc.nict.go.jp/icc/crawl.html -id_g_m_250607_1 ICC-Crawler(Mozilla-compatible;http://kc.nict.go.jp/icc/crawl.html;icc-crawl-contact(at)ml(dot)nict(dot)go(dot)jp) Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan) R 202.180.34.1xx http://kc.nict.go.jp/icc/crawl.html -id_g_m_465 iCCrawler (http://www.iccenter.net) ICJobs - Intelligence Competence Center (Germany) robot R 212.227.76.xx http://www.iccenter.net -id_g_m_121006_1 ICCrawler - ICjobs (http://www.icjobs.de/bot.htm) ICJobs - Intelligence Competence Center (Germany) robot R 212.227.76.xx http://www.iccenter.net -id_g_m_466 ICE Browser/5.05 (Java 1.4.0; Windows 2000 5.0 x86) ICE Java browser B http://www.ii.uib.no/~alexey/jb/ -id_g_m_040206_2 ichiro/x.0 (http://help.goo.ne.jp/door/crawler.html) Goo Japan / Inktomi robot (210.173.179.xx) R s. also moget / mogimogi http://www.goo.ne.jp -id_g_m_468 ichiro/x.0 (ichiro@nttr.co.jp) Goo Japan / Inktomi robot (210.173.179.xx) R s. also moget / mogimogi http://www.goo.ne.jp -id_g_m_469 IconSurf/2.0 favicon finder (see http://iconsurf.com/robot.html) Iconsurf.com - Visual Surf Engine / favicon finder R http://iconsurf.com -id_g_m_470 IconSurf/2.0 favicon monitor (see http://iconsurf.com/robot.html) Iconsurf.com - Visual Surf Engine / favicon finder R http://iconsurf.com -id_g_m_471 ICOO Loader v.x.x.x icooLoader download manager D http://www.icoonet.com -id_g_m_472 ICRA_label_spider/x.0 ICRA (Internet Content Rating Association) label spider R http://www.icra.org -id_g_m_473 icsbot-0.1 ICS Robot Search Engine (International Christian school of Seoul) R http://icseoul.org/ -id_g_m_260306_1 IDA Internet Download Accelerator D http://www.westbyte.com/ida/ -id_g_m_474 ideare - SignSite/1.x Janas (Ideare.com / Tiscali.it) robot R -id_g_m_200806_1 iearthworm/1.0, iearthworm@yahoo.com.cn Unknown UA from Yahoo China 202.165.105.x -id_g_m_475 IEFav172Free Some bookmark manager C possibly Visit URL ?? http://www.lodz.pdi.net/%7Eeristic/free/index.html -id_g_m_060608_4 iFeed.jp/2.0 (www.psychedelix.com/agents/agents.rss; 0 subscribers) iFeed.jp - online rss aggregator (in development) R 67.15.2[3-4][X].xxx http://www.ifeed.jp/ -id_g_m_281207_1 igdeSpyder (compatible; igde.ru; +http://igde.ru/doc/tech.html) Igde search (Russia) robot R 87.118.118.12x http://igde.ru/ -id_g_m_476 iGetter/1.x (Macintosh;G;PPC) iGetter download manager D http://www.igetter.net -id_g_m_477 iGetter/2 (Macintosh; U; PPC Mac OS X; en) iGetter download manager D http://www.igetter.net -id_g_m_120507_1 IIITBOT/1.1 (Indian Language Web Search Engine; http://webkhoj.iiit.net; pvvpr at iiit dot ac dot in) Webkhoj - Indian language search engine R 196.12.53.xx http://webkhoj.iiit.net/ -id_g_m_040607_2 ilial/Nutch-0.9 (Ilial, Inc. is a Los Angeles based Internet startup company. For more information please visit http://www.ilial.com/crawler; http://www.ilial.com/crawler; crawl@ilial.com) Ilial Knowledge Search robot R 72.44.58.2xx http://www.ilial.com/crawler/ -id_g_m_290906_1 ilial/Nutch-0.9-dev Unknown robot from UCLA using Nutch R 164.67.195.xx http://www.ucla.edu/ http://lucene.apache.org/nutch/ -id_g_m_270806_1 IlseBot/1.x Ilse Netherlands robot (62.69.178.xx) R s. also INGRID/3.0 .. / Mozilla/3.0 (INGRID/3.0 .. http://www.ilse.nl/ -id_g_m_478 IlTrovatore-Setaccio ( http://www.iltrovatore.it) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_479 Iltrovatore-Setaccio/0.3-dev (Indexing; http://www.iltrovatore.it/bot.html; info@iltrovatore.it) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_480 IlTrovatore-Setaccio/1.2 ( http://www.iltrovatore.it/aiuto/faq.html) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_481 Iltrovatore-Setaccio/1.2 (It-bot; http://www.iltrovatore.it/bot.html; info@iltrovatore.it) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_482 iltrovatore-setaccio/1.2-dev (spidering; http://www.iltrovatore.it/aiuto/.....) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_040506_1 IlTrovatore/1.2 (IlTrovatore; http://www.iltrovatore.it/bot.html; bot@iltrovatore.it) Il Trovatore - Italian search engine robot R 213.215.201.2xx http://www.iltrovatore.it -id_g_m_060107_2 ImageVisu/v4.x.x ImageVisu image and graphics viewer - display files from the Web (HTTP and ECWP) B http://geovisu.free.fr/imagvisu/english/ -id_g_m_080907_1 ImageWalker/2.0 (www.bdbrandprotect.com) BD-Brandprotect copyright infringement crawler R 72.14.164.1xx http://www.bdbrandprotect.com/ http://www.bdbrandprotect.com/solutions_5.html -id_g_m_110306_1 Incutio HttpClient v0.x HttpClient - a PHP Web Client Class http://scripts.incutio.com/httpclient/index.php -id_g_m_483 IncyWincy data gatherer(webmaster@loopimprovements.com IncyWincy search engine using DMOZ Open Directory database R http://www.loopimprovements.com -id_g_m_484 IncyWincy page crawler(webmaster@loopimprovements.com IncyWincy search engine using DMOZ Open Directory database R http://www.loopimprovements.com -id_g_m_485 IncyWincy(http://www.look.com) Look.com robot using IncyWincy search engine R http://www.loopimprovements.com -id_g_m_486 IncyWincy(http://www.loopimprovements.com/robot.html) IncyWincy search engine using DMOZ Open Directory database R http://www.loopimprovements.com -id_g_m_487 IncyWincy/2.1(loopimprovements.com/robot.html) IncyWincy search engine using DMOZ Open Directory database R http://www.loopimprovements.com -id_g_m_488 IndexTheWeb.com Crawler7 Index the Web (69.57.134.xx) crawler R http://www.indextheweb.com/ -id_g_m_489 Industry Program 1.0.x Spam bot from diff. IPs S see also Educate Search VxB - Full Web Bot -id_g_m_490 Inet library Inet Library Resource Center robot R http://www.inetlibrary.com -id_g_m_491 InetURL/1.0 InetURL IVM (phone software) plugin for web server access ? http://www.nch.com.au/ivm/plugins.html -id_g_m_270607_1 info@pubblisito.com- (http://www.pubblisito.com) il Sud dei Motori di Ricerca Pubblisito.com search - Italia R 88.149.164.2xx http://www.pubblisito.com/search/ -id_g_m_211208_2 Infoaxe./Nutch-0.9 Infoaxe - search history and bookmark service C 75.126.48.17x http://www.infoaxe.com/ -id_g_m_492 infoConveraCrawler/0.8 ( http://www.authoritativeweb.com/crawl) Converas RetrievalWare Internet Spider (63.241.61.x) R S ? s.also - Convera... Maybe does guestbook / forum spamming s. here http://www.webmasterworld.com/forum11/2871.htm http://www.convera.com/Products/ -id_g_m_493 InfoFly/1.0 (http://www.versions-project.org/) Versions-project.org Ingelin spider R http://www.versions-project.org/ -id_g_m_494 InfoLink/1.x InfoLink link checking tool C http://www.biggbyte.com/biggbyte3/index.html -id_g_m_495 INFOMINE/8.0 Adders INFOMINE Scholary Internet Resource Collection crawler R http://infomine.ucr.edu -id_g_m_496 INFOMINE/8.0 RemoteServices INFOMINE Scholary Internet Resource Collection crawler R http://infomine.ucr.edu -id_g_m_497 INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents) INFOMINE Scholary Internet Resource Collection crawler R http://infomine.ucr.edu -id_g_m_498 InfoNaviRobot(F107) 164.71.1.1xx jp.co.fujitsu.t2 Robot R -id_g_m_499 InfoSeek Sidewinder/0.9 Infoseek robot R http://www.infoseek.com -id_g_m_500 InfoSeek Sidewinder/1.0A Infoseek robot R http://www.infoseek.com -id_g_m_501 InfoSeek Sidewinder/1.1A Infoseek robot R http://www.infoseek.com -id_g_m_502 Infoseek SideWinder/1.45 (Compatible; MSIE 10.0; UNIX) Infoseek robot R http://www.infoseek.com -id_g_m_503 Infoseek SideWinder/2.0B (Linux 2.4 i686) Infoseek Japan robot R 210.148.160.1xx http://www.infoseek.com -id_g_m_504 INGRID/3.0 MT (webcrawler@NOSPAMexperimental.net; http://webmaster.ilse.nl/jsp/webmaster.jsp) Ilse Netherlands robot (62.69.178.xx) R s.also - Mozilla/3.0 (INGRID/3.0 .. / IlseBot/1.0 .. http://www.ilse.nl/ -id_g_m_505 Inktomi Search Inktomi (Hotbot-Lycos NBCi etc.) robot R http://www.inktomi.com/ -id_g_m_506 InnerpriseBot/1.0 (http://www.innerprise.com/) Enterprise Search engine software (64.202.165.xxx) R s. also - Enterprise_Search - ES.NET_Crawler http://www.innerprise.net -id_g_m_111205_4 Insitor.com search and find world wide! Insitor Search robot (80.67.20.1xx) R s. also Insitornaut http://www.insitor.com/ -id_g_m_121205_3 Insitornaut Insitor Search robot (80.67.20.1xx) R s. also Insitor.com http://www.insitor.com/ -id_g_m_507 InstallShield DigitalWizard download manager D -id_g_m_200308_1 integrity/1.6 Integrity - website broken link checker for MAC OSx C http://peacockmedia.co.uk/index.php/products/7-products/4-integrity -id_g_m_010907_1 Intelix/0.x (cs; http://www.microton.cz/intelix/; microton@@microton.cz) Microton Intelix robot for Eurotran translation software ? D http://www.microton.cz/intelix/ -id_g_m_508 Interarchy/x.x.x (InterarchyCrawler) Interarchy file transfer software - SFTP/FTP client for Mac OS X D http://www.interarchy.com -id_g_m_509 Internet Ninja x.0 Dream Train (Japan) Internet search robot R http://www.dti.ne.jp -id_g_m_510 InternetArchive/0.8-dev(Nutch;http://lucene.apache.org/nutch/bot.html;nutch-agent@lucene.apache Heritrix - The Internet Archive's open-source crawler based on Nutch (207.241.225.2xx) R s.also - archive.org_bot - Mozilla/5.0 (compatible;archive.org_bot/... http://www.archive.org/ http://lucene.apache.org -id_g_m_511 InternetLinkAgent/3.1 Internet Link Agent - link checking tool C http://www.osk.3web.ne.jp/~goronyan/winprg/sub.shtml -id_g_m_512 InternetSeer.com Internetseer Web site monitoring / Claymont robot R http://www.internetseer.com -id_g_m_513 intraVnews/1.x intraVNews - Feed reader & RSS aggregator for Outlook B http://www.intravnews.com -id_g_m_061208_1 IOI/2.0 (ISC Open Index crawler; http://index.isc.org/; bot@index.isc.org) Internet Open Index crawler using Nutch R 149.20.54.1xx http://index.isc.org/ http://www.nutch.org -id_g_m_514 IP*Works! V5 HTTP/S Component - by /n software - www.nsoftware.com IP*Works! HTTP Component http://www.nsoftware.com/products/controls/?ctl=HTTP -id_g_m_515 http://www.ip2location.com IP2Location - Reverse lookup geographical data and ISP by IP R C http://www.ip2location.com -id_g_m_270106_1 IP2MapBot/1.1 http://www.ip2map.com IP2Map - geographical IP mapping R C http://www.ip2map.com/ -id_g_m_516 IPiumBot laurion(dot)com Laurions Ipium robot R http://www.laurion.com -id_g_m_517 IpselonBot/0.xx-beta (Ipselon; http://www.ipselon.com; ipselonbot@ipselon.com) Ipselon Web Search robot R http://www.ipselon.com -id_g_m_518 Iria/1.xxa Iria download manager D http://www5.tok2.com/home/koteturamu/soft/iria.htm -id_g_m_519 IRLbot/1.0 ( http://irl.cs.tamu.edu/crawler) IRL-crawler - Texas A&M University research project crawler R 128.194.135.xx http://irl.cs.tamu.edu -id_g_m_240308_4 IRLbot/3.0 (compatible; MSIE 6.0; http://irl.cs.tamu.edu/crawler/) IRL-crawler - Texas A&M University research project crawler R 128.194.135.xx http://irl.cs.tamu.edu -id_g_m_520 IrssiUrlLog/0.2 url_log - Irssi Perl url grabber http://www.irssi.org/scripts/html/url_log.pl.html -id_g_m_521 Irvine/1.x.x Irvine downloading tool D http://hp.vector.co.jp/authors/VA024591/ -id_g_m_140506_1 ISC Systems iRc Search 2.1 Unknown spambot / harvester from diff. IPs S http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1 -id_g_m_030106_1 iSiloX/4.xx Windows/32 iSiloX document converter for iSilo reader B http://www.isilox.com/ -id_g_m_522 isurf (tszhu@canada.com) Unknown University of Alberta link-checking ? C http://www.ualberta.ca -id_g_m_150408_5 iTunes/x.x.x iTunes UA name for access and decrypt the iTunes music store pages B http://www.apple.com/itunes/ -id_g_m_523 IUPUI Research Bot v 1.9a Some spam bot from 66.139.78.xx(x) S -id_g_m_280906_1 iVia Page Fetcher (http://ivia.ucr.edu/useragents.shtml) iVia robot - Open source Internet portal & virtual library system software D http://ivia.ucr.edu/ -id_g_m_524 iVia/4.0 CanonizeUrl (http://infomine.ucr.edu/iVia/useragents.shtml iVia robot - Open source Internet portal & virtual library system software D http://ivia.ucr.edu/ -id_g_m_180707_1 IWAgent/ 1.0 - www.brandprotect.com BD BrandProtect - brand, company or trademarks online monitoring R 72.14.164.1xx http://www.brandprotect.com/ -id_g_m_525 J-PHONE/3.0/J-SH07 Proxy message from jp-q.ne.jp P -id_g_m_526 Jabot/6.x (http://odin.ingrid.org/) ODIN Directory Japan robot (163.138.95.xx) R http://www.ingrid.org -id_g_m_527 Jabot/7.x.x (http://odin.ingrid.org/) ODIN Directory Japan robot (163.138.95.xx) R http://www.ingrid.org -id_g_m_528 Jack German Domanova (offline since Feb.02) robot R -id_g_m_529 Jakarta Commons-HttpClient/2.0xxx Jakarta Commons (Java based) HTTP client B http://jakarta.apache.org/commons/httpclient/ -id_g_m_530 Jakarta Commons-HttpClient/3.0-rcx Jakarta Commons (Java based) HTTP client B http://jakarta.apache.org/commons/httpclient/ -id_g_m_240306_3 Jambot/0.1.x (Jambot; http://www.jambot.com/blog; crawler@jambot.com) JamBot search robot (70.146.82.xx) R http://www.jambot.com/ -id_g_m_130108_1 Jambot/0.2.1 (Jambot; http://www.jambot.com/blog/static.php?page=webmaster-robot; crawler@jambot.com) JamBot search robot R 70.146.82.xx http://www.jambot.com/ -id_g_m_531 Java 1.1 Java VM http://java.sun.com/ -id_g_m_532 Java/1.4.1_01 Java VM R B D used as robot from 194.203.40.xx http://java.sun.com/ -id_g_m_533 Java1.0.21.0 Java VM B http://java.sun.com/ -id_g_m_534 Java1.1.xx.x Java VM http://java.sun.com/ -id_g_m_535 Java1.3.0rc1 Java VM http://java.sun.com/ -id_g_m_536 Java1.3.x Java VM http://java.sun.com/ -id_g_m_537 Java1.4.0 Java VM R B D used by diff. IPs for various purposes i.e.: - Dortmund University Java based robot - Roadrunner.net (66.108.xxx.xxx) user robot in conjunction w. RPT-HTTPClient/0.3-3 http://java.sun.com/ http://www.informatik.uni-dortmund.DE -id_g_m_538 Jayde Crawler. http://www.jayde.com Jayde B2B Search robot (66.28.139.xx) R http://www.jayde.com -id_g_m_539 JBH Agent 2.0 some site downloading tool ? via 61.77.51.xxx D -id_g_m_540 jBrowser/J2ME Profile/MIDP-1.0 Configuration/CLDC-1.0 (Google WAP Proxy/1.0) WAP 2.0 / jBrowser for handhelds B http://www.jataayusoft.com/DbWAPHH.htm -id_g_m_541 JCheckLinks/0.1 RPT-HTTPClient/0.3-1 JCheckLinks Java hyperlink validator C http://web.purplefrog.com/%7Ethoth/jchecklinks/ -id_g_m_542 JDK/1.1 Java Development Kit http://developers.sun.com/index.html -id_g_m_543 Jeode/1.x.x Insignias Jeode (PDA) Java platform B http://www.insignia.com/content/products/jvmProducts.shtml -id_g_m_544 Jetbot/1.0 JetEye Search robot (64.62.142.xxx / 64.71.144.xxx) R http://www.jeteye.com -id_g_m_545 JetBrains Omea Reader 1.0.x (http://www.jetbrains.com/omea_reader/) Omea RSS - Atom - newsgroups web page reader B http://www.jetbrains.com/omea_reader/ -id_g_m_546 JetBrains Omea Reader 2.0 Release Candidate 1 (http://www.jetbrains.com/omea_reader/) Omea RSS - Atom - newsgroups web page reader B http://www.jetbrains.com/omea_reader/ -id_g_m_547 JetCar JetCar / Flashget download manager D http://www.amazesoft.com -id_g_m_548 Jigsaw/2.2.x W3C_CSS_Validator_JFouffa/2.0 Jigsaw - W3C's CSS Validator Server C http://jigsaw.w3.org/css-validator/validator-uri.html -id_g_m_550 JoBo/1.x (http://www.matuschek.net/jobo.html) Jobo website downloading program D B http://www.matuschek.net/software/jobo/index.html -id_g_m_549 JoBo/@JOBO_VERSION@(http://www.matuschek.net/jobo.html) Jobo website downloading program D B http://www.matuschek.net/software/jobo/index.html -id_g_m_551 JobSpider_BA/1.1 Finacialbot.com - German (213.61.218.xx) job search JobRoboter R http://www.finbot.com/jr1.html -id_g_m_552 JOC Web Spider Jocsoft Web Spider - website downloading tool D B http://www.jocsoft.com/jws/index.htm -id_g_m_051206_5 JordoMedia/1.0 RSS File Reader (http://www.jordomedia.com) Jordo Media RSS / Atom feed directory link checking C 216.227.208.1xx http://www.jordomedia.com/ -id_g_m_090206_2 Journster [alpha] (http://journster.com/) Journster.com RSS/Atom aggregator C http://beta.journster.com/ -id_g_m_090206_3 Journster.com RSS/Atom aggregator 0.5 (http://www.journster.com/bot.phtml) Journster.com RSS/Atom aggregator C http://beta.journster.com/ -id_g_m_553 JRTS Check Favorites Utility Check Favorites bookmark checking C http://www.jrtwine.com/Products/CheckFavs/ -id_g_m_554 JRTwine Software Check Favorites Utility Check Favorites bookmark checking C http://www.jrtwine.com/Products/CheckFavs/ -id_g_m_555 Jyxobot/x Jyxo search (Czech Republic) robot (212.71.128.xx) R http://jyxo.cz/ -id_g_m_556 K-Meleon/0.6 (Windows; U; Windows NT 5.1; en-US; rv:0.9.5) Gecko/20011011 K-meleon browser - Windows 2000 B http://kmeleon.sourceforge.net/ -id_g_m_557 k2spider Verity K2 Spider ( Network search software) R http://www.verity.com/products/pdf/MK0368a_K2_Spider.pdf -id_g_m_010108_3 KAIST AITrc Crawler Unknown robot from AITrc (Advanced Information Technology Research Center) - Korea R 143.248.134.22x http://aitrc.kaist.ac.kr/english/ -id_g_m_010506_1 KakleBot - www.kakle.com/0.1 (KakleBot - www.kakle.com; http:// www.kakle.com/bot.html; support@kakle.com) Kakle ranked metasearch robot R 216.139.221.1xx http://www.kakle.com/ -id_g_m_250408_3 kalooga/kalooga-4.0-dev-datahouse (Kalooga; http://www.kalooga.com; info@kalooga.com) Kalooga image crawler R 195.210.57.1xx http://www.kalooga.com/ -id_g_m_011108_3 kalooga/KaloogaBot (Kalooga; http://www.kalooga.com/info.html?page=crawler; crawler@kalooga.com) Kalooga image crawler R 195.210.57.1xx http://www.kalooga.com/ -id_g_m_558 Kapere (http://www.kapere.com) Kapere site grapper / web downloader D http://www.kapere.com -id_g_m_090807_1 Kazehakase/0.x.x.[x] Kazehakase - Gecko based browser (Japan) B http://kazehakase.sourceforge.jp/ -id_g_m_559 KDDI-SN22 UP.Browser/6.0.7 (GUI) MMP/1.1 (Google WAP Proxy/1.0) Openwave UP.Browser for mobiles via Google WAP Proxy (216.239.33.x) P http://www.openwave.com -id_g_m_561 Kenjin Spider Kenjin Spider search agent R http://www.kenjin.ne.jp -id_g_m_562 Kevin http://dznet.com/kevin/ Dznet.com Kevin crawler (link checking ?) via 68.39.148.xx (nj.comcast.net) R http://www.dznet.com -id_g_m_563 Kevin http://websitealert.net/kevin/ Website AlertsKevin crawler (website monitoring) via 68.39.148.xx (nj.comcast.net) R http://www.websitealert.net -id_g_m_560 KE_1.0/2.0 libwww/5.2.8 Voila.fr robot R http://www.voila.fr -id_g_m_301105_5 KFSW-Bot (Version: 1.01 powered by KFSW www.kfsw.de) Some Perl search script from KFSW (Germany) R http://www.kfsw.de/ -id_g_m_100206_4 kinja-imagebot (http://www.kinja.com/) kinja weblog search robot R http://www.kinja.com/ -id_g_m_100206_3 kinjabot (http://www.kinja.com) kinja weblog search robot R http://www.kinja.com/ -id_g_m_564 KIT-Fireball/2.0 Fireball search (Germany) robot R http://www.fireball.de -id_g_m_565 KIT-Fireball/2.0 (compatible; Mozilla 4.0; MSIE 5.5) Fireball search (Germany) robot R http://www.fireball.de -id_g_m_566 Klondike/1.50 (WSP Win32) (Google WAP Proxy/1.0) Klondike WAP Browser B http://www.apachesoftware.com -id_g_m_567 KnowItAll(knowitall@cs.washington.edu) University of Washington KnowItAll - web information extraction R http://www.cs.washington.edu -id_g_m_568 Knowledge.com/0.x The knowledge.com (ODP) directory robot R http://www.knowledge.com -id_g_m_569 Kontiki Client x.xx Kontiki Client download manager D http://www.kontiki.com/client/userhelp_f.shtml -id_g_m_280406_2 Krugle/Krugle,Nutch/0.8+ (Krugle web crawler; http://www.krugle.com/crawler/info.html; webcrawler@krugle.com) Krugle source code search engine for developers (64.71.164.1xx) R powered by Nutch http://www.krugle.com/ -id_g_m_180606_2 KSbot/1.0 (KnowledgeStorm crawler; http://www.knowledgestorm.com/resources/content/crawler/index.html; crawleradmin@knowledgestorm.com) KnowledgeStorm technology industry crawler for Findtech.com R 12.129.110.xx http://www.findtech.com/ http://www.knowledgestorm.com/resources/content/crawler/index.html -id_g_m_570 kuloko-bot/0.x Kuloko contextual search robot R http://www.kuloko.com/ -id_g_m_571 kulokobot www.kuloko.com kuloko@backweave.com Kuloko contextual search robot R http://www.kuloko.com -id_g_m_572 kulturarw3/0.1 National Library of Sweden Heritage Project robot R http://www.kb.se/ENG/kbstart.htm -id_g_m_301105_2 KummHttp/1.1 (compatible; KummClient; Linux rulez) Link or server checking from Sanoma Budapest (195.70.35.xxx) C R Sanoma also runs some web-portals i.e. http://www.startlap.com/ http://sanomabp.hu/ -id_g_m_280209_3 KWC-KX9/1109 UP.Browser/6.2.3.9.g.1.107 (GUI) MMP/2.0 UP.Link/6.3.0.0.0 UP.Browser for mobiles on Kyocera KWC-KX9 cellphone B http://www.openwave.com -id_g_m_211208_3 Labrador/0.2; http://ir.dcs.gla.ac.uk/labrador; craigm@dcs.gla.ac.uk TREC Blog Track - Blog and news feed crawler 130.209.241.2xx http://ir.dcs.gla.ac.uk/wiki/TREC-Blog -id_g_m_573 Lachesis Intels Lachesis web site response time monitoring tool C ftp://ftp.imag.fr/pub/labo-LSR/DRAKKAR/internet-performance/lachesis/ -id_g_m_140406_1 lanshanbot/1.0 Unknown robot from Easten Network China (202.96.51.1xx) reads robots.txt -id_g_m_021206_2 lanshanbot/1.0 (+http://search.msn.com/msnbot.htm) Unknown robot from Easten Network China (202.96.51.1xx) reads robots.txt -id_g_m_271105_1 LapozzBot/1.4 ( http://robot.lapozz.com) Lapozz search (Hungary) robot (82.131.195.xx) R http://www.lapozz.com/ -id_g_m_280508_3 LapozzBot/1.5 (+http://robot.lapozz.hu) Lapozz search (Hungary) robot (82.131.195.xx) R http://www.lapozz.com/ -id_g_m_574 larbin (samualt9@bigfoot.com) Larbin indexer used as Metacarta.com (66.28.xx.xxx) robot R http://www.metacarta.com/ http://larbin.sourceforge.net/index-eng.html -id_g_m_592 LARBIN-EXPERIMENTAL (efp@gmx.net) Unknown robot from 66.230.140.xx (argon.oxeo.com) S maybe an e-mail collector - see also Mozilla/4.0 efp@gmx.net -id_g_m_575 larbin_2.1.1 larbin2.1.1@somewhere.com Larbin indexer used by Mitsubishi Electric Research Labs R http://www.merl.com http://larbin.sourceforge.net/index-eng.html -id_g_m_576 larbin_2.2.0 (crawl@compete.com) Larbin indexer used as Compete.com crawler R http://www.compete.com http://larbin.sourceforge.net/index-eng.html -id_g_m_577 larbin_2.2.1_de_Viennot (Laurent.Viennot@inria.fr) Larbin indexer used as Inria robot R http://www.inria.fr/index.en.html http://larbin.sourceforge.net/index-eng.html -id_g_m_578 larbin_2.2.2 (sugayama@lab7.kuis.kyoto-u.ac.jp) Larbin indexer used as Kyoto University robot R http://www.kyoto-u.ac.jp/ http://larbin.sourceforge.net/index-eng.html -id_g_m_579 larbin_2.2.2_guillaume (guillaume@liafa.jussieu.fr) Larbin indexer used as Inria robot R http://www.inria.fr/index.en.html http://larbin.sourceforge.net/index-eng.html -id_g_m_581 larbin_2.6.0 (larbin2.6.0@unspecified.mail) Larbin indexer used by an unknown dsl.net client R http://larbin.sourceforge.net/index-eng.html -id_g_m_582 larbin_2.6.1 (larbin2.6.1@unspecified.mail) Larbin indexer used by diff. IPs / services R ie.: -Central Host Inc. (client) robot ? - Colt Net France robot http://www.centralhost.com http://larbin.sourceforge.net/index-eng.html -id_g_m_583 larbin_2.6.2 (hamasaki@grad.nii.ac.jp) Larbin indexer used by National Institut of Informatics (NII/Japan) R http://www.nii.ac.jp http://larbin.sourceforge.net/index-eng.html -id_g_m_584 larbin_2.6.2 (larbin2.6.2@unspecified.mail) Larbin indexer used by diff. IPs R http://larbin.sourceforge.net/index-eng.html -id_g_m_585 larbin_2.6.2 (listonATccDOTgatechDOTedu) Larbin indexer used as robot by Georgia Institute of Technology http://www.gatech.edu/ R http://www.gatech.edu http://larbin.sourceforge.net/index-eng.html -id_g_m_586 larbin_2.6.2 (pimenas@systems.tuc.gr) Larbin indexer used by Technical University of Crete R http://www.systems.tuc.gr http://larbin.sourceforge.net/index-eng.html -id_g_m_587 larbin_2.6.2 (tom@lemurconsulting.com) Larbin indexer used as Lemur Consulting robot R http://www.lemurconsulting.com http://larbin.sourceforge.net/index-eng.html -id_g_m_588 larbin_2.6.2 (vitalbox1@hotmail.com) Larbin indexer used as robot via cloud9.net (168.100.192.xxx) R http://larbin.sourceforge.net/index-eng.html -id_g_m_261205_1 larbin_2.6.3 (ltaa_web_crawler@groupes.epfl.ch) Unknown robot from EPFL Lausanne Switzerland (128.178.155.1xx) R reads robots.txt http://www.epfl.ch/Eindex.html -id_g_m_589 larbin_2.6.3 (wgao@genieknows.com) Larbin indexer used by GenieKnows.com search R s. also: - geniebot wgao@genieknows.com http://www.genieknows.com http://larbin.sourceforge.net/index-eng.html -id_g_m_590 larbin_2.6.3_for_(http://cosco.hiit.fi/search/) tsilande@hiit.fi Larbin indexer used by Next Generation Information Retrieval (NGIR) R http://cosco.hiit.fi http://larbin.sourceforge.net/index-eng.html -id_g_m_580 larbin_2.6_basileocaml (basile.starynkevitch@cea.fr) Larbin indexer used by CEA / DCom Rechercher R http://www.cea.fr http://larbin.sourceforge.net/index-eng.html -id_g_m_591 larbin_devel (http://pauillac.inria.fr/~ailleret/prog/larbin/) Larbin indexer used as Inria robot R http://pauillac.inria.fr http://larbin.sourceforge.net/index-eng.html -id_g_m_160807_2 lawinfo-crawler/Nutch-0.9-dev (Crawler for lawinfo.com pages; http://www.lawinfo.com; webmaster@lawinfo.com) LawInfo - Lawyer and attorney directory R 216.86.137.xx http://www.lawinfo.com/ -id_g_m_020506_3 lc/$ROADS::Version libwww-perl/5.00 ROADS - Perl web based subject based gateway tool http://roads.opensource.ac.uk/ -id_g_m_593 lcabotAccept: */* unknown robot via MTT.ca / Aliant.ca 142.177.168.xxx -id_g_m_140408_1 LeapTag/0.8.1.beta081.r3750 (compatible; Mozilla 4.0; MSIE 5.5; robot@yoriwa.com) LeapTag news reader and content discovery tool B http://www.leaptag.com/ -id_g_m_594 LECodeChecker/3.0 libgetdoc/1.0 Linkexchange crawler R http://www.linkexchange.com -id_g_m_595 LeechGet 200x (www.leechget.de) Leechget download manager D http://www.leechget.de -id_g_m_596 LEIA/2.90 Gseek.com (site is offline) robot R -id_g_m_597 LEIA/3.01pr (LEIAcrawler; [SNIP]) Gseek.com (site is offline) robot R -id_g_m_210106_2 LetsCrawl.com/1.0 +http://letscrawl.com/ Maybe logfile spamming for Lets crawl! search (Germany) S website has no function http://letscrawl.com/ -id_g_m_598 LexiBot/1.00 Lexibot (exMataHari) search software R http://www.lexibot.com/index.asp -id_g_m_140209_2 LG-LX260 POLARIS-LX260/2.0 MMP/2.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 Polaris mobile browser on LG LX 260 Sprint Rumor phone B http://www.infraware.co.kr/eng/01_product/product10.asp -id_g_m_599 LG/U8138/v1.0 LG 8138 Mobile Phone browser B -id_g_m_600 Libby_1.1/libwww-perl/5.47 About.com robot R http://www.about.com/ -id_g_m_100306_1 libcurl-agent/1.0 libcurl's (multiprotocol file transfer library) standard user-agent name D http://curl.haxx.se/libcurl/ -id_g_m_080507_1 LibertyW (+http://www.lw01.com) LibertyW search for mobile (France) R 213.251.135.2xx http://www.lw01.com/en/ -id_g_m_601 libWeb/clsHTTP -- hiongun@kt.co.kr Korea Telecom Search robot R http://www.kt.co.kr/kt_home/eng/index.jsp -id_g_m_602 libwww-perl/5.41 CMP United Media robot R http://www.cmpnet.com -id_g_m_603 libwww-perl/5.45 SplatSearch robot (207.44.142.xx) R http://www.splatsearch.com -id_g_m_604 libwww-perl/5.48 Alexa robot R http://www.alexa.com -id_g_m_605 libwww-perl/5.50 diff. IPs / services R C P ie.: - secure-netz.de link checking (in conjunction w. LWP::Simple/5.50) -N2H2 Internet filtering http://www.n2h2.com -id_g_m_606 libwww-perl/5.52 FP/2.1 Fast Search robot R http://www.alltheweb.com -id_g_m_607 libwww-perl/5.52 FP/4.0 Fast Search robot R http://www.alltheweb.com -id_g_m_608 libwww-perl/5.53 diff. IPs / services R C P ie.: -iPrism Web filtering software - softclub.net link checking http://www.stbernard.com/default.asp -id_g_m_609 libwww-perl/5.63 Profile for You internet profiling (?) R C http://www.profile4u.com -id_g_m_610 libwww-perl/5.64 unknown link checking from Wanadoo.fr (193.253.33.xxx) R C -id_g_m_611 libwww-perl/5.65 Amidalla search engine robot (62.241.33.xx) R s. also amibot http://www.amidalla.com -id_g_m_612 libwww-perl/5.800 SplatSearch robot (72.36.210.xx) R http://www.splatsearch.com/ -id_g_m_613 libwww/5.3.2 Mediater Rechercher robot R http://www.mediater.net -id_g_m_160206_1 Liferea/0.x.x (Linux; en_US.UTF-8; http://liferea.sf.net/) Liferea - Linux feed reader B http://liferea.sourceforge.net/ -id_g_m_140508_4 Liferea/1.x.x (Linux; es_ES.UTF-8; http://liferea.sf.net/) Liferea (Linux Feed Reader) news aggregator for Unix and Linux B http://liferea.sourceforge.net/ -id_g_m_614 LightningDownload/1.0beta2 Lightning Download manager D http://www.lightningdownload.com -id_g_m_615 LightningDownload/1.x.x Lightning Download manager D http://www.lightningdownload.com -id_g_m_616 LightningDownload/1.x.x [Accelerated x] Lightning Download manager D http://www.lightningdownload.com -id_g_m_131207_1 LijitSpider/Nutch-0.9 (Reports crawler; http://www.lijit.com/; info(a)lijit(d)com) Lijit blog search spider R 216.24.131.1xx http://www.lijit.com/ -id_g_m_617 Lincoln State Web Browser Some spam bot S s. this Guestbook http://www.donotenter.com/guestbook/gbook.html http://www.donotenter.com/guestbook/gbook.html -id_g_m_618 Link Valet Online 1.x Link Valet online link checking C http://www.htmlhelp.com -id_g_m_620 LinkAlarm/2.x Linkalarm link validation C http://www.linkalarm.com -id_g_m_621 Linkbot Linkbot Pro link checking software C http://www.watchfire.com -id_g_m_622 linkbot Rpsoft 2000 Site-Crawler R http://www.rpsoft2000.com/rps-site-crawler.htm -id_g_m_623 Linkbot x.0 Linkbot Pro link checking software C http://www.watchfire.com -id_g_m_624 LinkCheck (linkcheck@inter7.com http://www.inter7.com/linkcheck) Linkcheck - linkchecking tool for Unix/Linux C http://www.inter7.com -id_g_m_625 LinkLint-checkonly/2.x.x Linklint - Perl html link checker C http://www.linklint.org -id_g_m_626 LinkLint-spider/2.x.x Linklint - Perl html link checker C http://www.linklint.org -id_g_m_627 linknzbot Linknz - The Kiwi Search Engine (New Zealand) R http://www.linknz.co.nz -id_g_m_280606_1 LinkPimpin v1.0 Link-Pimp web directory link checking C 216.89.111.x http://www.link-pimp.com/ -id_g_m_628 LinkProver 2.1 TafWeb link checking program C http://www.tafweb.com -id_g_m_630 Links (0.9x; Linux 2.4.7-10 i686) Links text browser for Unix & OS/2 B http://artax.karlin.mff.cuni.cz/%7Emikulas/links/ -id_g_m_631 Links (0.9xpre12; Linux 2.2.14-5.0 i686; 80x24) Links text browser for Unix & OS/2 B http://artax.karlin.mff.cuni.cz/%7Emikulas/links/ -id_g_m_632 Links (2.xpre7; Linux 2.4.18 i586; x) Links text browser for Unix & OS/2 B http://artax.karlin.mff.cuni.cz/%7Emikulas/links/ -id_g_m_629 Links - http://gossamer-threads.com/scripts/links/ Links SQL directory management program C http://gossamer-threads.com/scripts/links/ -id_g_m_633 Links 2.0 (http://gossamer-threads.com/scripts/links/) Links SQL directory management program R http://gossamer-threads.com/scripts/links/ -id_g_m_634 Links SQL (http://gossamer-threads.com/scripts/links-sql/) Links SQL directory management program R http://gossamer-threads.com/scripts/links-sql/ -id_g_m_280406_3 Links4US-Crawler, (+http://links4us.com/) Links4us ODP based directory link checking C 209.190.5.2xx http://links4us.com/ -id_g_m_635 LinkScan/11.0beta2 UnixShareware robot from Elsop.com (used by Indiafocus/Indiainfo) Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others) R http://www.elsop.com http://indiafocus.indiainfo.com/ -id_g_m_636 LinkScan/9.0g Unix Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others) R http://www.elsop.com http://indiafocus.indiainfo.com/ -id_g_m_637 LinkScan/x.x Unix Shareware robot from Elsop.com R http://www.elsop.com -id_g_m_638 LinksManager.com (http://linksmanager.com/linkchecker.html) Linksmanager bookmark checking C s.also Mozilla/5.0 (compatible; LinksManager.com_bot... http://linksmanager.com/linkchecker.html -id_g_m_639 LinkSonar/1.35 LinkSonar (Japan) link checking tool C http://hp.vector.co.jp/authors/VA014575/chicchi/linksonar/readme.html -id_g_m_640 LinkSweeper/1.x Left Side Software's LinkSweeper (ceased) bookmark utility C http://www.lss.com.au/lss/lss_main.htm -id_g_m_641 LinkWalker Seventwentyfour link checking robot C http://www.seventwentyfour.com -id_g_m_619 link_check3.plx libwww-perl/5.65 link check 3 - Perl HTML link checker (from Perl for Web Site Management) C http://www.elanus.net/cgi/examples.cgi/view/ex_1102.txt -id_g_m_642 ListBidBot (freelance job spider http://listbid.com)Freelance Listbid.com / Directnic.com link checking ? R C http://listbid.com -id_g_m_031107_3 LiveTrans/Nutch-0.9 (maintainer: cobain at iis dot sinica dot edu dot tw; http://wkd.iis.sinica.edu.tw/LiveTrans/) WKD Lab: LiveTrans - Online query and terminology translation service R 140.109.19.1xx http://wkd.iis.sinica.edu.tw/LiveTrans/ -id_g_m_643 Llaut/1.0 (http://mnm.uib.es/~gallir/llaut/bot.html) llaut robot - Universitat de les Illes Balears (Spain) R http://mnm.uib.es -id_g_m_200307_2 LMQueueBot/0.2 E-Mail harvesting robot - same as ContactBot S 64.124.152.xx -id_g_m_644 lmspider (lmspider@scansoft.com) lmspider from Scansoft (192.133.61.xx) - Web text collector R see here http://www.kahunaburger.com/blog/archives/000117.html -id_g_m_645 LNSpiderguy Lexis-Nexis robot R http://www.lexis-nexis.com/ -id_g_m_300106_4 LocalBot/1.0 ( http://www.localbot.co.uk/) LocalBot company information collector R http://www.localbot.co.uk/ -id_g_m_646 LocalcomBot/1.2.x ( http://www.local.com/bot.htm) Local.com local search robot (216.52.252.xxx) R http://www.local.com/ -id_g_m_647 Lockstep Spider/1.0 Lockstep (website content protection tool) user agent R http://www.lockstep.com -id_g_m_648 Look.com GlobalQueue spider (64.40.105.xxx) R http://www.multi-mode.com/ -id_g_m_649 Lotus-Notes/4.5 ( Windows-NT ) Lotus Notes browser B -id_g_m_650 LotusDiscovery/x.0 (compatible; Mozilla 4.0; MSIE 4.01; Windows NT) IBM Lotus Discovery Server http://www-142.ibm.com/software/sw-lotus/products/product3.nsf/wdocs/644012e0434859b585256ec9006d37b8 -id_g_m_051207_1 Lovel as 1.0 ( +http://www.everatom.com) Everatom.com song lyrics search R 80.91.191.2xx http://www.everatom.com -id_g_m_100308_2 LTI/LemurProject Nutch Spider/Nutch-1.0-dev (lti crawler for CMU; http://www.lti.cs.cmu.edu; changkuk at cmu dot edu) LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo R 68.180.139.12x http://www.lemurproject.org/ http://www.yahoo.com/ -id_g_m_050208_3 LTI/LemurProject Nutch Spider/Nutch-1.0-dev (Research spider using Nutch; http://www.lemurproject.org; mhoy@cs.cmu.edu) LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo R 68.180.139.12x http://www.lemurproject.org/ http://www.yahoo.com/ -id_g_m_651 luchs.at URL checker Luchs.at (Linux Wiki) link checking C http://web.luchs.at/information/linkchecker.php -id_g_m_090106_1 Lunascape Lunascape IE based browser (Japan) B s. also Mozilla/4.0 (... Lunascape ...) http://www2.lunascape.jp/index.aspx -id_g_m_652 lwp-trivial/1.32 Ultimate Search / Smartdesk (no website) robot R -id_g_m_653 lwp-trivial/1.34 Search4free robot R http://www.search4free.com -id_g_m_654 lwp-trivial/1.34 Search4free robot R http://www.search4free.com -id_g_m_656 lwp-trivial/1.35 Expert HTML online source viewer B http://www.expert-html.com/ -id_g_m_655 lwp-trivial/1.35 Expert HTML online source viewer B http://www.expert-html.com/ -id_g_m_657 LWP::Simple/5.22 Perl LWP:Collective module R http://www.thatrobotsite.com -id_g_m_658 LWP::Simple/5.36 Perl LWP:Collective module R http://www.thatrobotsite.com -id_g_m_659 LWP::Simple/5.48 Perl LWP:Collective module - Linkomatic robot R http://www.linkomatic.com/ http://www.thatrobotsite.com -id_g_m_660 LWP::Simple/5.50 Perl LWP:Collective module - secure-netz.de link checking (in conjunction w. libwww-perl/5.50) R http://www.secure-netz.de http://www.thatrobotsite.com -id_g_m_661 LWP::Simple/5.51 Perl LWP:Collective module - Inktomi (62.253.64.x) robot R http://www.inktomi.com/ http://www.thatrobotsite.com -id_g_m_662 LWP::Simple/5.53 Perl LWP:Collective module - Only.com R in conjunction w. Spida/0.1 http://www.only.com http://www.thatrobotsite.com -id_g_m_663 LWP::Simple/5.63 Perl LWP:Collective module R http://www.thatrobotsite.com -id_g_m_291105_3 LWP::Simple/5.803 ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx S appears also as Poirot - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) http://spamhuntress.com/wiki/Manila_Industries -id_g_m_664 Lycos_Spider_(modspider) Lycos spider R http://www.lycos.com -id_g_m_665 Lycos_Spider_(T-Rex) Lycos spider R http://www.lycos.com -id_g_m_200308_2 Lynx/2-4-2 (Bobcat/0.5 [DOS] Jp Beta04) Bobcat - Text and Lynx based DOS browser B http://www.fdisk.com/doslynx/bobcat.htm -id_g_m_666 Lynx/2.6 libwww-FM/2.14 Lynx 2.x text mode browser B http://lynx.browser.org/ -id_g_m_180108_1 Lynx/2.8 (;http://seebot.org) seebot.org online service - uses lynx browser for crawlers view of web pages B 208.113.176.x[xx] http://seebot.org/ -id_g_m_667 Lynx/2.8.3dev.9 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6 Lynx 2.x text mode browser B http://lynx.browser.org/ -id_g_m_668 Lynx/2.8.4rel.1 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6c (human-guided@lerly.net) Lynx 2.x text mode browser used as robot via cogentco.com R -id_g_m_669 Mac Finder 1.0.xx Some spam bot S http://www.kloth.net/internet/badbots.php -id_g_m_670 Mackster( http://www.ukwizz.com ) UKWizz search robot R s. also UKWizz/Nutch http://www.ukwizz.com -id_g_m_671 Mag-Net Wind.it client user-agent ? -id_g_m_180606_3 MagicWML/1.0 (forcewml) All Magic/Wap wml service for mobile devices P http://allmagic3.com/wap/ -id_g_m_061206_1 MagpieRSS/0.7x (+http://magpierss.sf.net) Magpie RSS - PHP RSS Parser B http://magpierss.sourceforge.net/ -id_g_m_030308_1 Mahiti.Com/Mahiti Crawler-1.0 (Mahiti.Com; http://mahiti.com ; mahiti.com) Mahiti.com India search crawler R 72.167.143.1x http://mahiti.com/ -id_g_m_020707_2 Mail.Ru/1.0 Mail.ru search R 194.186.55.2xx http://www.mail.ru/ -id_g_m_672 mailto:webcraft@bea.com Unknown Bea robot R http://www.beasys.com -id_g_m_673 mammoth/1.0 ( http://www.sli-systems.com/) SLI Systems mammoth robot R s. also Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1 http://www.sli-systems.com/ http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M -id_g_m_674 MantraAgent Looksmart robot R http://www.looksmart.com -id_g_m_675 MapoftheInternet.com ( http://MapoftheInternet.com) Map of the Internet visual search engine index robot R http://MapoftheInternet.com -id_g_m_676 Mariner/5.1b [de] (Win95; I ;Kolibri gncwebbot) Kolibri.de robot R http://www.kolibri.de -id_g_m_677 Marketwave Hit List Pilot Hitlist web site analysis R http://www.marketwave.com/products_solutions/hitlist.html -id_g_m_678 Martini Looksmart directory page analysis R http://www.looksmart.com -id_g_m_679 MARTINI Looksmart directory page analysis R http://www.looksmart.com -id_g_m_680 Marvin v0.3 Marvin Medhunt robot R http://www.hon.ch/MedHunt/Marvin.html -id_g_m_270606_1 MaSagool/1.0 (MaSagool; http://sagool.jp/; info@sagool.jp) Sagool search Japan robot R 124.32.246.xx http://sagool.jp/ -id_g_m_681 Mass Downloader 2.x Mass Downloader download manager D http://www.metaproducts.com -id_g_m_682 MasterSeek Masterseek (Scandinavia) Beta business search ? R http://www.masterseek.com -id_g_m_683 Mata Hari/2.00 Lexibot (exMataHari) search software R http://www.lexibot.com -id_g_m_684 Matrix S.p.A. - FAST Enterprise Crawler 6 (Unknown admin e-mail address) Virgilio Italy robot (212.48.11.xxx) using Fast Enterprise Search R http://www.virgilio.it -id_g_m_685 maxomobot/dev-20051201 (maxomo; http://67.102.134.34:4047/MAXOMO/MAXOMObot.html; maxomobot@maxomo.com) Maxomo multimedia search robot R http://www.maxomo.com -id_g_m_686 McBot/5.001 (windows; U; NT4.0; en-us) Unknown robot from McAfee Austria (80.123.144.xx) -id_g_m_290108_1 MDbot/1.0 (+http://www.megadownload.net/bot.html) MegaDownload files search robot R 91.121.83.19x http://www.megadownload.net/ http://www.megadownload.net/bot.html -id_g_m_170306_1 Media Player Classic Substitute for Windows Media Player B http://sourceforge.net/projects/guliverkli/ -id_g_m_687 MediaCrawler-1.0 (Experimental) Media Find crawler R http://www.mediacrawler.de -id_g_m_688 Mediapartners-Google/2.1 ( http://www.googlebot.com/bot.html) Google AdSense robot R http://www.google.com/ads/ -id_g_m_689 MediaSearch/0.1 WWW.fi Media Search R http://www.fi/haku/ -id_g_m_690 MegaSheep v1.0 (www.searchuk.com internet sheep) Search UK robot R http://www.searchuk.com -id_g_m_131107_1 Megite2.0 (http://www.megite.com) Megite web2.0 RSS and news service software R http://www.megite.com/ -id_g_m_691 Mercator-1.x Mercator crawler software (used by Altavista) R http://www.research.compaq.com -id_g_m_692 Mercator-2.0 Mercator crawler software (used by Altavista) R http://www.research.compaq.com -id_g_m_693 Mercator-Scrub-1.1 Mercator crawler software (used by Altavista) R http://www.research.compaq.com -id_g_m_070207_1 Metaeuro Web Crawler/0.2 (MetaEuro Web Search Clustering Engine; http://www.metaeuro.com; crawler at metaeuro dot com) MetaEuro.com Clustering Web Search Engine crawler R 83.97.31.1xx http://www.metaeuro.com/ -id_g_m_694 MetaGer-LinkChecker MetaGer search robot (Germany) R 130.75.2.xx http://www.metager.de/ -id_g_m_270706_1 MetagerBot/0.8-dev (MetagerBot; http://metager.de; ) MetaGer search robot (Germany) R 130.75.2.xx http://www.metager.de/ -id_g_m_060307_1 MetaGer_PreChecker0.1 MetaGer search robot (Germany) R 130.75.2.xx http://www.metager.de/ -id_g_m_695 MetaProducts Download Express/1.x Download Express download manager D http://www.metaproducts.com -id_g_m_696 Metaspinner/0.01 (Metaspinner; http://www.meta-spinner.de/; support@meta-spinner.de/) Metaspinner search robot - Germany R http://www.meta-spinner.de/ -id_g_m_300407_1 metatagsdir/0.7 (+http://metatagsdir.com/directory/) Metatagsdir.com directory index spider R 206.196.111.2xx http://metatagsdir.com/directory/ -id_g_m_697 MFC Foundation Class Library 4.0 Microsoft Foundation Class Library - i.e. used for e-mail harvesting from 68.154.96.xx (bellsouth.net) S appears also as Full Web Bot 0516B or Demo Bot Z 16b -id_g_m_698 MFC_Tear_Sample Microsoft.com user agent -id_g_m_699 MFHttpScan Advanced Site Crawler web site ripper and extractor D http://www.innovative.go.ro/sitecrawler/index.htm -id_g_m_700 MicroBaz GigaBaz Brainbot (Germany) robot (213.139.152.xx) R s. also - gigabaz/3.1x ... http://brainbot.com//site3 -id_g_m_701 Microsoft Data Access Internet Publishing Provider Cache Manager MS Office 2000 acting as WebDAV client B P -id_g_m_702 Microsoft Data Access Internet Publishing Provider DAV MS Office 2000 acting as WebDAV client B -id_g_m_704 Microsoft Data Access Internet Publishing Provider Protocol Discovery Server probe for data access operations using MS Frontpage with OPTION header B C -id_g_m_703 Microsoft Data Access Internet Publishing Provider Protocol Discovery MS Office 2000 acting as WebDAV client B C -id_g_m_190807_2 Microsoft Log Parser 2.2 Microsoft Log Parser text query tool D http://www.microsoft.com/technet/scriptcenter/tools/logparser/default.mspx -id_g_m_180306_1 Microsoft Small Business Indexer MS Small Business Server content indexer R Indexing from Microsoft: 204.71.191.xx http://www.microsoft.com/windowsserver2003/sbs/default.mspx -id_g_m_705 Microsoft URL Control - 6.00.8xxx user agent looks for form-mail components (spam-bot) S -id_g_m_707 MicrosoftPrototypeCrawler (How's my crawling? mailto:newbiecrawler@hotmail.com) Unknown robot from Microsoft.com (131.107.163.xx) R -id_g_m_706 Microsoft_Internet_Explorer_5.00.438 (fjones@isd.net) Secure Computing SmartFilterWhere / Bess web filter (192.55.214.xx) P http://www.securecomputing.com/index.cfm?skey=22 -id_g_m_708 MIIxpc/4.2 xpc-mii.net HTTP server message P -id_g_m_130807_2 Mindjet MindManager The Mindjet blog MindManager category D 80.229.1xx http://blog.mindjet.com/category/mindjet/mindmanager/ -id_g_m_709 minibot unknown robot via Korea Telecom (211.218.xxx.xxx) -id_g_m_110506_2 miniRank/1.6 (Website ranking; www.minirank.com; robot) mini- Rank website popularity tool C 64.230.71.2xx http://www.minirank.com/ -id_g_m_710 MiracleAlphaTest unknown robot via nec.co.jp Telecom (210.143.35.xx) -id_g_m_711 Missauga Locate 1.0.0 Some spam bot S http://www.neilgunton.com/spambot_trap/appendix/ -id_g_m_712 Missigua Locator 1.9 Some spam bot S http://www.neilgunton.com/spambot_trap/appendix/ -id_g_m_713 Missouri College Browse Some spam bot S -id_g_m_714 Mister Pix II 2.02a Mister PiX picture finding software D R http://www.mister-pix.com/ -id_g_m_715 Mister PiX version.dll Mister PiX picture finding software D R http://www.mister-pix.com/ -id_g_m_110206_3 Misterbot-Nutch/0.7.1 (Misterbot-Nutch; http://www.misterbot.fr; admin@misterbot.fr) Misterbot search France robot R http://www.misterbot.fr/ -id_g_m_716 Miva (AlgoFeedback@miva.com) Miva / ex Findwhat.com search robot (66.150.55.2xx) R http://www.miva.com/ -id_g_m_141105_2 Mizzu Labs 2.2 Some spam bot from Jasmine Internet - Bangkok (203.147.0.xx) S s. link http://www.projecthoneypot.org/ip_inspector.php?iph=7bc2eae614063a45b0e1d0786dbe6a2e -id_g_m_080706_3 MJ12bot/vx.x.x (http://majestic12.co.uk/bot.php?+) Majestic-12 DSearch MJ12bot (Experimental distributed crawler) R http://www.majestic12.co.uk/projects/dsearch/ -id_g_m_717 MJ12bot/vx.x.x (http://www.majestic12.co.uk/projects/dsearch/mj12bot.php) Majestic-12 DSearch MJ12bot (Experimental distributed crawler) R http://www.majestic12.co.uk/projects/dsearch/mj12bot.php -id_g_m_200108_1 MJBot (SEO assessment) MJB SEO Club MJBot R 217.8.248.19x http://www.mjbdata.com/information/ -id_g_m_030308_2 MLBot (www.metadatalabs.com) MLBot - metadata labs web crawler for building a media index (beta) R http://www.metadatalabs.com/ -id_g_m_718 MnogoSearch/3.2.xx mnoGoSearch (ex UdmSearch) software robot R http://mnogosearch.org/ -id_g_m_260306_3 Mo College 1.9 Unknown bad bot - maybe guestbook spamming or email harvesting S see link: http://www.kloth.net/internet/badbots.php -id_g_m_719 moget/x.x (moget@goo.ne.jp) Goo Japan / Inktomi robot (210.173.179.xx) R s. also ichiro http://www.goo.ne.jp -id_g_m_720 mogimogi/1.0 Goo Japan / Inktomi robot (210.173.179.xx) R s. also ichiro http://www.goo.ne.jp -id_g_m_721 moiNAG 0.02 moiNag - net.art generator R D http://soundwarez.org/generator/moiNAG/ -id_g_m_722 MojeekBot/0.x (archi; http://www.mojeek.com/bot.html) Mojeek Search Preview robot (217.155.205.xx) R s.also Mozilla/5.0 (compatible; MojeekBot/2.0 ... http://www.mojeek.com -id_g_m_150407_1 monkeyagent Greasemonkey Firefox extension D http://www.greasespot.net/ http://diveintogreasemonkey.org/install/what-is-greasemonkey.html -id_g_m_090106_2 MoonBrowser (version 0.41 Beta4) Moonbrowser - IE based browser (Japan) B http://www.geocities.co.jp/SiliconValley-Cupertino/8986/ -id_g_m_010307_2 Moreoverbot/x.00 (+http://www.moreover.com) Moreover / FeedDirect RSS feed robot C 72.13.32.x http://w.moreover.com/ http://www.feeddirect.com/ -id_g_m_723 Morris - Mixcat Crawler ( http://mixcat.com) MixCat robot s. also Felix R http://mixcat.com -id_g_m_100206_2 Motoricerca-Robots.txt-Checker/1.0 (http://tool.motoricerca.info/robots-checker.phtml) Robots.txt online checker C http://tool.motoricerca.info/robots-checker.phtml -id_g_m_240108_1 Motorola-V3m Obigo Obigo WAP browser for mobiles on Motorola V3 B http://www.obigo.com/ http://en.wikipedia.org/wiki/Obigo_Browser -id_g_m_724 Mouse-House/7.4 (spider_monkey spider info at www.mobrien.com/sm.shtml) MPRM Group Ltd. Spider Monkey robot R http://www.spidermonkey.ca/sm.shtml -id_g_m_725 MovableType/x.x Movable Type web-based personal publishing system B http://www.movabletype.org -id_g_m_726 mozDex/0.xx-dev (mozDex; http://www.mozdex.com/en/bot.html; spider@mozdex.com) Mozdex Open search engine spider (65.98.100.2xx) R http://www.mozdex.com/ -id_g_m_727 Mozi! Bell Nexxia / Sympatico Canada user robot & spoofed referer from diff. IPs -id_moz_728 Mozilla Unknown robots from diff. IPs -id_moz_100109_3 Mozilla (libwhisker/2.4) libwhisker - HTTP client and utility - Perl library http://www.wiretrip.net/rfp/lw.asp -id_moz_729 Mozilla (Mozilla@somewhere.com) http://www.somewhere.com robot R http://www.somewhere.com -id_moz_041007_1 Mozilla 4.0(compatible; BotSeer/1.0; +http://botseer.ist.psu.edu) BotSeer search engine for robots.txt R 130.203.154.2xx http://botseer.ist.psu.edu/ http://botseer.ist.psu.edu/about.html -id_moz_731 Mozilla/1.1 (compatible; MSPIE 2.0; Windows CE) PDA Pocket IE 2.x Windows CE B -id_moz_732 Mozilla/1.10 [en] (Compatible; RISC OS 3.70; Oregano 1.10) Oregano browser for RISC OS B http://www.crashnet.org.uk -id_moz_730 Mozilla/1.22 (compatible; MSIE 2.0d; Windows NT) IE 2.x WinNT B -id_moz_733 Mozilla/1.22 (compatible; MSIE 5.01; PalmOS 3.0) EudoraWeb 2 EudoraWeb 2.0 browser (Eudora Internet Suite) for PalmOS B http://www.eudora.com/products/unsupported/internetsuite/ -id_moz_1552 Mozilla/2.0 Dummy user agent - i.e. used by Namo Web Editor B http://www.namo.com/ -id_moz_734 Mozilla/2.0 (compatible; AOL 3.0; Mac_PowerPC) AOL Mac B -id_moz_735 Mozilla/2.0 (Compatible; AOL-IWENG 3.0; Win16) AOL Win 3.x B -id_moz_736 Mozilla/2.0 (compatible; Ask Jeeves) Ask Jeeves /Teoma robot R 65.214.45.[x]xx http://sp.ask.com -id_moz_040707_2 Mozilla/2.0 (compatible; Ask Jeeves/Teoma) Ask Jeeves /Teoma robot R 65.214.45.[x]xx http://sp.ask.com -id_moz_160506_3 Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) Ask Jeeves /Teoma robot R 65.214.45.[x]xx http://sp.ask.com -id_moz_737 Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://sp.ask.com/docs/about/tech_crawling.html) Ask Jeeves /Teoma robot R 65.214.45.[x]xx http://sp.ask.com -id_moz_738 Mozilla/2.0 (compatible; EZResult -- Internet Search Engine) Direct Hit Robot R http://www.directhit.com -id_moz_739 Mozilla/2.0 (compatible; MS FrontPage x.0) MS Frontpage x.x web editor B -id_moz_740 Mozilla/2.0 (compatible; MSIE 2.1; Mac_PowerPC) IE 2.x Mac Power PC B -id_moz_743 Mozilla/2.0 (compatible; MSIE 3.02; Update a; AK; Windows NT) IE 3.x WinNT B -id_moz_744 Mozilla/2.0 (compatible; MSIE 3.02; Update a; AOL 3.0; Windows 95) IE 3.x AOL Win95 B -id_moz_741 Mozilla/2.0 (compatible; MSIE 3.0; AK; Windows 95) IE 3.x Win95 B -id_moz_742 Mozilla/2.0 (compatible; MSIE 3.0; Windows 3.1) IE 3.x Win 3.1 B -id_moz_745 Mozilla/2.0 (compatible; MSIE 3.0B; Win32) IE 3.x WinXP B -id_moz_746 Mozilla/2.0 (compatible; NEWT ActiveX; Win32) Borland Delphi .OCX component used by WebCollector email harverster S -id_moz_747 Mozilla/2.0 (compatible; T-H-U-N-D-E-R-S-T-O-N-E) Thunderstone's Webinator Web indexing program R http://www.thunderstone.com/texis/site/pages/Products.html -id_moz_748 Mozilla/2.0 compatible; Check&Get 1.1x (Windows 98) Check&Get bookmark and link checking tool C http://www.activeurls.com -id_moz_749 Mozilla/2.01 (Win16; I) Netscape 2.x Win3.x International B -id_moz_750 Mozilla/2.02Gold (Win95; I) Netscape 2.x Gold Win95 B -id_moz_771 Mozilla/3.0 (compatible) Faked user agent for diff. purposes i.e.: - some download manager - E-mail harvesting S D -id_moz_751 Mozilla/3.0 (compatible; AvantGo 3.2) AvantGo PDA browser B http://avantgo.com/products/solutions/sfa.html -id_moz_752 Mozilla/3.0 (compatible; Fluffy the spider; http://www.searchhippo.com/; info@searchhippo.com) Searchhippo robot R http://www.searchhippo.com -id_moz_753 Mozilla/3.0 (compatible; HP Web PrintSmart 04b0 1.0.1.34) HP Web PrintSmart (discontinued) - web page printing software B D -id_moz_754 Mozilla/3.0 (compatible; Indy Library) Internet Direct Library for Borland (often used as e-mail address collector and mass mailing tool) S http://forge.novell.com/modules/xfmod/project/?indy-net http://www.indyproject.org/ -id_moz_755 Mozilla/3.0 (compatible; Linkman) Outertechs Linkman bookmark tool C http://www.outertech.com -id_moz_757 Mozilla/3.0 (compatible; MuscatFerret/1.5.4; claude@euroferret.com) Euroferret robot R http://www.euroferret.com -id_moz_756 Mozilla/3.0 (compatible; MuscatFerret/1.5; olly@muscat.co.uk) Euroferret robot R http://www.euroferret.com -id_moz_758 Mozilla/3.0 (compatible; MuscatFerret/1.6.x; claude@euroferret.com) Euroferret robot R http://www.euroferret.com -id_moz_759 Mozilla/3.0 (compatible; netart generator/1.0; libwww-perl/5.64) Netart Generator - script generated random websites R D http://www.obn.org/generator/ -id_moz_760 Mozilla/3.0 (compatible; NetPositive/2.2) NetPositive BEOS browser B http://www.tunetrackersystems.com/bedocs/documentation/User's%20Guide/03_network/Network07_NetPositive.html -id_moz_761 Mozilla/3.0 (compatible; Opera/3.0; Windows 3.1) v3.1 Opera 3.x Win3.x B -id_moz_762 Mozilla/3.0 (compatible; Opera/3.0; Windows 95/NT4) 3.2 Opera 3.x Win95/NT B -id_moz_763 Mozilla/3.0 (compatible; PerMan Surfer 3.0; Win95) Perman Surfer bookmark tool C http://www.bug.co.jp/nami-nori/ -id_moz_764 Mozilla/3.0 (compatible; REL Software Web Link Validator 2.x) Web Link Validator link validation software C http://www.relsoftware.com -id_moz_765 Mozilla/3.0 (compatible; scan4mail (advanced version) http://www.peterspages.net/?scan4mail) Scan4Mail online mail extraction service S http://www.peterspages.net -id_moz_220606_2 Mozilla/3.0 (compatible; ScollSpider; http://www.webwobot.com) WebWobot UK search engine robot (82.43.129.2xx) R s. also ScollSpider http://www.webwobot.com/ -id_moz_766 Mozilla/3.0 (compatible; Web Link Validator 2.x)Web Link Validator http://www.relsoftware.com/ link validation software Web Link Validator link validation software C http://www.relsoftware.com -id_moz_767 Mozilla/3.0 (compatible; WebCapture x.x; Auto; Windows) Xelios Web Capture (now Wysigot) website downloading tool (Discontinued) D http://www.xelios.com/ http://www.wysigot.com/int/about.html -id_moz_768 Mozilla/3.0 (compatible; Webinator-DEV01.home.iprospect.com/2.56) Iprospect search engine positioning using Thunderstone's Webinator R http://www.iprospect.com http://www.thunderstone.com/texis/site/pages/Products.html -id_moz_769 Mozilla/3.0 (compatible; Webinator-indexer.cyberalert.com/2.56) CyberAlert's Media Monitor using Thunderstone's Webinator R http://www.cyberalert.com http://www.thunderstone.com/texis/site/pages/Products.html -id_moz_770 Mozilla/3.0 (Compatible;Viking/1.8) Viking server user/client P http://www.robtex.com -id_moz_772 Mozilla/3.0 (DreamPassport/3.0) One of DC-Sakuras download manager user-agent names D http://www.dc-sakura.com -id_moz_773 Mozilla/3.0 (INGRID/3.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints) Ilse Netherlands robot (62.69.178.xx) R s. also - INGRID/3.0 .. / IlseBot/1.0 .. http://www.ilse.nl/ -id_moz_774 Mozilla/3.0 (Liberate DTV 1.1) Liberate DTV server suite / TV-emulator B P http://www.liberate.com -id_moz_775 Mozilla/3.0 (Planetweb/2.100 JS SSL US; Dreamcast US) Planetweb 2.1 Browser (discontinued) for Dreamcast B http://www.planetweb.com -id_moz_776 Mozilla/3.0 (Slurp.so/Goo; slurp@inktomi.com; http://www.inktomi.com/slurp.html) http://www.goo.ne.jp /Inktomi robot R http://www.goo.ne.jp -id_moz_777 Mozilla/3.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x) R s. also Slurpy Verifier ... http://www.inktomi.com/ -id_moz_778 Mozilla/3.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x) R s. also Slurpy Verifier ... http://www.inktomi.com/ -id_moz_779 Mozilla/3.0 (Vagabondo/1.1 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/) WiseGuys robot Netherland - 82.94.216.2 R s. also Vagabondo http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_780 Mozilla/3.0 (Vagabondo/1.x MT; webagent@wise-guys.nl; http://webagent.wise-guys.nl/) WiseGuys robot Netherland - 82.94.216.2 R s. also Vagabondo http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_781 Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints) Ilse Netherlands robot R http://www.ilse.nl -id_moz_782 Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/) WiseGuys robot Netherland - 82.94.216.2 R s. also Vagabondo http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_783 Mozilla/3.0 (Win16; I) Netscape 3.x Win3.x B -id_moz_784 Mozilla/3.0 (Win95; I) Netscape 3.x Win95 B -id_moz_785 Mozilla/3.0 (WinNT; I) Netscape 3.x WinNT B -id_moz_786 Mozilla/3.0 (WorldGate Gazelle 3.5.1 build 11; FreeBSD2.2.8-STABLE) Netscape 3.x FreeBSD B -id_moz_787 Mozilla/3.0 (X11; I; OSF1 V4.0 alpha) Netscape 3.x OSF1 V4.0 alpha B -id_moz_788 Mozilla/3.0 NAVIO_AOLTV (11; 13; Philips; PH200; 1; R2.0C36_AOL.0110OPTIK; R2.0.0139d_OPTIK) AOL Web TV B -id_moz_789 Mozilla/3.0 WebTV/1.2 (compatible; MSIE 2.0) WebTV B -id_moz_790 Mozilla/3.01 (compatible; AmigaVoyager/2.95; AmigaOS/MC680x0) Amiga Voyager Browser Amiga B -id_moz_791 Mozilla/3.01 (Compatible; Links2Go Similarity Engine) Links2Go robot R http://www.links2go.com -id_moz_792 Mozilla/3.01 (compatible; Netbox/3.5 R92; Linux 2.2) Netgem Netbox cable modem TV Box Linux B http://www.netgem.com -id_moz_793 Mozilla/3.01-C-MACOS8 (Macintosh; I; PPC) Netscape 3.x Mac B -id_moz_794 Mozilla/3.01Gold (X11; I; Linux 2.0.32 i486) Netscape 3.x Linux B -id_moz_795 Mozilla/3.01Gold (X11; I; SunOS 5.5.1 sun4m) Netscape 3.x SunOS B -id_moz_796 Mozilla/3.01SGoldC-SGI (X11; I; IRIX 6.3 IP32) Netscape 3.x Irix B -id_moz_797 Mozilla/3.04 (compatible; ANTFresco/2.13; RISC OS 4.02) ANT Fresco Browser Risc OS B http://www.antlimited.com -id_moz_798 Mozilla/3.04 (compatible; NCBrowser/2.35; ANTFresco/2.17; RISC OS-NC 5.13 Laz1UK1309) NCBrowser ANT Fresco Browser Risc OS B http://www.antlimited.com -id_moz_281106_1 Mozilla/3.04 (compatible;QNX Voyager 2.03B ;Photon) QNX OS Voyager embedded browser B http://www.qnx.com/products/browsers/ -id_moz_799 Mozilla/3.x (I-Opener 1.1; Netpliance) I-Opener (was www.netpliance.com/) web PC B -id_moz_100406_3 Mozilla/4.0 Yahoo Mindset: Intent-driven Search (66.228.182.1xx) R s. also Yahoo! Mindset http://mindset.research.yahoo.com/ -id_moz_800 Mozilla/4.0 (agadine3.0) www.agada.de Agada search (Germany) robot R s. also agadine/1.x.x http://www.agada.de -id_moz_290406_1 Mozilla/4.0 (Compatible); URLBase 6 URLBase 6 bookmark manager C s. also URLBase/6.x http://www.terriadev.com/products/urlbase/ -id_moz_895 Mozilla/4.0 (compatible: AstraSpider V.2.1 : astrafind.com) Astrafind! adult search robot (66.98.252.xx) R http://www.astrafind.com -id_moz_021205_1 Mozilla/4.0 (compatible; Vagabondo/2.2; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/) WiseGuys robot Netherland - 82.94.216.2 R s.also - Mozilla/3.0 (Vagabondo... - Vagabondo.. http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_240906_1 Mozilla/4.0 (compatible; Vagabondo/4.0Beta; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/) WiseGuys robot Netherland - 82.94.216.2 R s.also - Mozilla/3.0 (Vagabondo... - Vagabondo.. http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_100208_1 Mozilla/4.0 (compatible; ReGet Deluxe 5.1; Windows NT 5.1) ReGet Deluxe! download manager D http://deluxe.reget.com/en/ -id_moz_801 Mozilla/4.0 (compatible; Advanced Email Extractor v2.xx) Advanced Email Extractor e-mail collector (spam bot) S http://www.mailutilities.com -id_moz_802 Mozilla/4.0 (compatible; Arachmo) Arachmo Spider - web site file extraction tool D http://bbbearchan.hp.infoseek.co.jp/ -id_moz_804 Mozilla/4.0 (compatible; BorderManager 3.0) Novell Border Manager security suite P -id_moz_090807_3 Mozilla/4.0 (compatible; BOTW Spider; +http://botw.org) Best of the Web directory link checking C 209.11.177.1xx http://botw.org/ -id_moz_803 Mozilla/4.0 (compatible; B_L_I_T_Z_B_O_T) Blitzsuche Germany robot R s. BlitzBOT@tricus.net http://blitzsuche.rp-online.de/ -id_moz_805 Mozilla/4.0 (compatible; Cerberian Drtrs Version-3.2-Build-0) Content Control from Blue Coat P http://www.cerberian.com -id_moz_080706_1 Mozilla/4.0 (compatible; Check&Get 3.0; Windows NT) Check&Get bookmark manager, web change monitor and archiver C http://activeurls.com/en/ -id_moz_806 Mozilla/4.0 (compatible; ChristCrawler.com ChristCrawler@ChristCENTRAL.com) Christcentral.com Christcrawler (was www.christcrawler.com) R s.also ChristCRAWLER -id_moz_301105_4 Mozilla/4.0 (compatible; crawlx, crawler@trd.overture.com) Yahoo Search Marketing crawler (68.142.211.1xx) R http://www.content.overture.com/d/ -id_moz_011207_1 Mozilla/4.0 (compatible; DAUMOA-video; +http://ws.daum.net/aboutkr.html) DAUMOA - Daum search Korea robot (211.115.109.xxx) R s. also RaBot http://www.daum.net/ http://ws.daum.net/abouten.html -id_moz_131206_1 Mozilla/4.0 (compatible; DepSpid/5.0x; +http://about.depspid.net) DepSpid distributed web crawler for link dependencies C http://depspid.net/ http://about.depspid.net/ -id_moz_807 Mozilla/4.0 (compatible; DnloadMage 1.0) Download Mage download manager D http://www.dlmage.com -id_moz_808 Mozilla/4.0 (compatible; FastCrawler3 support-fastcrawler3@fast.no) Fast/Alltheweb crawler R http://www.alltheweb.com -id_moz_809 Mozilla/4.0 (compatible; FDSE robot) Fluid Dynamics Search Engine (FDSE) robot used by Abadoor.de R http://www.xav.com/scripts/search/ http://www.abadoor.de/ -id_moz_161105_2 Mozilla/4.0 (compatible; GPU p2p crawler http://gpu.sourceforge.net/search_engine.php) GPU Distributed Search Engine crawler R http://gpu.sourceforge.net/search_engine.php -id_moz_810 Mozilla/4.0 (compatible; grub-client-0.2.x; Crawl your stuff with http://grub.org) Grub open source crawler R http://www.grub.org -id_moz_811 Mozilla/4.0 (compatible; grub-client-0.3.x; Crawl your own stuff with http://grub.org) Grub open source crawler R http://www.grub.org -id_moz_812 Mozilla/4.0 (compatible; grub-client-2.x) Grub open source crawler used by Looksmart ( 64.241.242.xx) R http://www.grub.org -id_moz_261205_2 Mozilla/4.0 (compatible; ibisBrowser) ibisBrowser Japanese mobile browser B http://www.ibis.ne.jp/products/ibisBrowser/index.html -id_moz_813 Mozilla/4.0 (compatible; ICS 1.2.xxx) Novell iChain Cool Solutions caching P http://www.novell.com -id_moz_220206_1 Mozilla/4.0 (compatible; IE-Favorites-Check-0.5) IE Favorites Check - Bookmark manager C http://secure.sintraweb.net/public/soft/iefc/ -id_moz_814 Mozilla/4.0 (compatible; Iplexx Spider/1.0 http://www.iplexx.at) Iplexx Austria (webhosting company) logfile spamming bot S http://www.iplexx.at -id_moz_020208_1 Mozilla/4.0 (compatible; KeepNI web site monitor) KeepNi Monitors - Web site monitoring / link checking tool C http://www.keepni.com/ -id_moz_815 Mozilla/4.0 (compatible; Link Utility; http://net-promoter.com) NetPromoter Link Utility link checking tool C s. also - Mozilla/4.0 (compatible; NetPromoter Spider ... http://www.net-promoter.com/ -id_moz_816 Mozilla/4.0 (compatible; Lotus-Notes/5.0; Windows-NT) Lotus Notes 5.0 browser B http://www-10.lotus.com/ldd/whatisnotes#Release%205.0%3A%20Web%20integration%20by%20d -id_moz_819 Mozilla/4.0 (compatible; MSIE 4.01; AOL 4.0; Windows 98) IE 4.x AOL Win98 B -id_moz_820 Mozilla/4.0 (compatible; MSIE 4.01; Mac_PowerPC) IE 4.x Mac Power PC B -id_moz_821 Mozilla/4.0 (compatible; MSIE 4.01; MSIECrawler; Windows 95) Internet Explorer 4.0 URL check B C -id_moz_090506_1 Mozilla/4.0 (compatible; MSIE 4.01; Vonna.com b o t) Vonna search robot R http://www.vonna.com/ -id_moz_822 Mozilla/4.0 (compatible; MSIE 4.01; Windows 95) IE 4.x Win95 B -id_moz_823 Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; MSN Companion 2.0; 800x600; Compaq) IE PDA Browser Windows CE B -id_moz_100109_4 Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPC; 240x320; SPV M700; OpVer 19.123.2.733) OrangeBot-Mobile 2008.0 (mobilesearch.support@orange-ftgroup.com) Orange France robot for mobiles R 81.52.143.xx http://www.orange.com/en_EN/ -id_moz_010308_2 Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPS; 240x320) IE for Windows CE on a PocketPC (HP iPAQ) B http://www.hp.com/ -id_moz_824 Mozilla/4.0 (compatible; MSIE 4.01; Windows NT Windows CE) IE PDA Browser Windows CE B -id_moz_826 Mozilla/4.0 (compatible; MSIE 4.01; Windows NT) IE 4.x WinNT B -id_moz_825 Mozilla/4.0 (compatible; MSIE 4.01; Windows NT; MS Search 4.0 Robot) Microsoft diff. IPs / services i.e.: - Microsoft server information robot (see link) - Okanagan Internet Junction web filter (robot) http://www.webmasterworld.com/forum11/841.htm http://www.junction.net/ -id_moz_010406_3 Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) ACR Unknown robot from American College of Radiology (ACR) running MS Site Server R C 208.236.180.xx http://www.acr.org/s_acr/index.asp http://www.microsoft.com/commerceserver/default.mspx -id_moz_817 Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) Indonesia Interactive Indonesia Interactive Web-portal robot on MS Site Server R http://www.i-2.co.id/ http://www.microsoft.com/commerceserver/default.mspx -id_moz_818 Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) WebQuest Designs Webquestdesigns hosting http://www.webquestdesigns.com -id_moz_841 Mozilla/4.0 (compatible; MSIE 5.01; Windows 95) via Avirt Gateway Server v4.0 Avirt Gateway proxy server P http://www.avirt.com/products/gateway.html -id_moz_843 Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0) (samualt9@bigfoot.com) Metacarta.com (66.28.xx.xxx) robot R s. Larbin.... http://www.metacarta.com/ -id_moz_842 Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0; NetCaptor 6.5.0RC1) NetCaptor IE browser addon B http://www.netcaptor.com -id_moz_827 Mozilla/4.0 (compatible; MSIE 5.0; AOL 5.0; Windows 95; DigExt; Gateway2000; sureseeker.com) IE 5.x AOL Win95 Sureseeker search plugin B http://www.sureseeker.com -id_moz_828 Mozilla/4.0 (compatible; MSIE 5.0; Mac_PowerPC; AtHome021) IE 5.x Mac PowerPC AtHome user B -id_moz_829 Mozilla/4.0 (compatible; MSIE 5.0; NetNose-Crawler 2.0; A New Search Experience: http://www.netnose.com) www.netnose.com crawler R parked domain http://www.netnose.com/ -id_moz_830 Mozilla/4.0 (compatible; MSIE 5.0; Win32) via proxy gateway CERN-HTTPD/3.0 libwww/2.17 WinXP via CERN httpd proxy server P http://www.w3.org -id_moz_831 Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) TrueRobot; 1.5 Echo.com robot R http://www.echo.com -id_moz_832 Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot BETA 1.2 (http://www.voila.com/) Voila.fr robot R http://www.voila.fr -id_moz_833 Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot; 1.6 Voila.fr robot R http://www.voila.fr -id_moz_835 Mozilla/4.0 (compatible; MSIE 5.0; Windows ME) Opera 5.11 [en] WinME Opera 5.x B -id_moz_834 Mozilla/4.0 (compatible; MSIE 5.0; Windows ME; Link Checker 2.x.xx http://www.kyosoft.com) Kyosoft's Link Checker C http://www.kyosoft.com -id_moz_836 Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; DigExt; DTS Agent Beijing Express Email Address Extractor via DHCP Data Transport Services (DTS) S site is closed http://www.zstools.com http://esupport.ca.com/index.html?/public/dto_transportit/infodocs/dto1013.asp -id_moz_837 Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; Girafabot; girafabot at girafa dot com; http://www.girafa.com) Girafa (browser plug-in) robot B R http://www.girafa.com -id_moz_838 Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com) Galaxy robot (63.121.41.xxx) R s. also GalaxyBot.. http://www.galaxy.com/ -id_moz_839 Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com/; http://www.galaxy.com/info/crawler.html) Galaxy robot (63.121.41.xxx) R s. also GalaxyBot.. http://www.galaxy.com/ -id_moz_840 Mozilla/4.0 (compatible; MSIE 5.0; YANDEX) Yandex Search Russia link checking (213.180.206.2xx) R s. also Yandex/1... http://www.yandex.ru -id_moz_844 Mozilla/4.0 (compatible; MSIE 5.5; AOL 4.0; Windows 98; GoBeez (www.gobeez.com)) Gobeez starting page plugin C site is offline http://www.gobeez.com/ -id_moz_845 Mozilla/4.0 (compatible; MSIE 5.5; Windows 95; Transmission Segment; Hotbar 2.0) IE 5.5 Win95 Hotbar plug-in http://hotbar.com/install/firstvisit.asp -id_moz_846 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Crazy Browser 1.x.x) Crazy Browser - IE based tabbed Browser B http://www.crazybrowser.com -id_moz_847 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; KITV4.7 Wanadoo) Wanadoo Internet services B -id_moz_848 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SAFEXPLORER TL) Safexplorer (safexplorer.com - site is offline) kids browser B -id_moz_849 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SYMPA; Katiesoft 7; SimulBrowse 3.0) Katiesoft Scroll (ex www.katiesoft.com now discarded) & SimulBrowse (ex www.simulbrowse.com now dead) IE browser plugins B -id_moz_850 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; BTinternet V8.1) Windows ME BTOpenworld Internet services B -id_moz_851 Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; MSIECrawler) Windows ME Internet Explorer URL check B C -id_moz_852 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; obot) Cobion Germany Brand Protection Services robot R http://www.cobion.com -id_moz_853 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; QXW03018) Cobion Germany Brand Protection Services robot R http://www.cobion.com -id_moz_858 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Active Cache Request IE 5.5 Win2000 / user agent B -id_moz_859 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Fetch API Request Maybe: - MS Internet Security & Acceleration Server (ISA) cache refreshing request (see link) or - IE 5.5 Win2000 probably with some (website) API request component (see 2nd link) - suspected as email-harvester / site scanning tool (see http://www.byte.com/documents/s=493/byt20010208s0001/index.htm P S ? http://groups.google.com/groups?hl=en&lr=&ie=UTF-8&safe=off&threadm=uGoenyodBHA.1472%40tkmsftngp07&rnum=1&prev=/groups%3Fq%3DFetch%2BAPI%26hl%3Den%26lr%3D%26ie%3DUTF-8%26safe%3Doff%26selm%3DuGoenyodBHA.1472%2540tkmsftngp07%26rnum%3D1 http://groups.google.de/groups?q=%22fetch+api+request%22&hl=de&lr=&ie=UTF-8&oe=UTF-8&selm=3CAD577B.C29BA3B2%40execpc.com&rnum=2 -id_moz_854 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; .NET CLR 1.0.3705) IE 5.5 Win2000 with MS.NET SDK B -id_moz_855 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AIRF) IE 5.5 Win2000 / user agent w. AI RoboForm (AIRF) password manager B http://www.roboform.com -id_moz_856 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AspTear 1.5) AspTear URL fetching program component / Download32.com spider R D http://www.alphasierrapapa.com/IisDev/Components/AspTear/ http://www.download32.com -id_moz_857 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; N_o_k_i_a) Nokia.com network B -id_moz_051102_1 Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; T312461) RPT-HTTPClient/0.3-3E Unknown Object Sciences Corp. robot using the HTTPClient http://www.objectsciences.com http://www.innovation.ch/java/HTTPClient/ -id_moz_060406_2 Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler v4; +http://www.singingfish.com/help/spider.html; webmaster@singingfish.com); SpiderThread Revision: 3.10 Singingfish media spider (64.12.186.2xx) via AOL search R s. also asterias/2.0 http://search.singingfish.com/sfw/home.jsp -id_moz_200108_2 Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows 98; .NET CLR 1.1.4322; MEGAUPLOAD 2.0) Megaupload Mega Manager - Download manager toolbar for IE D http://www.megaupload.com/manager/de/ -id_moz_010106_1 Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows NT 5.1; SV1; HbTools 4.7.2) Hotbar IE graphical skin B Adware / Spyware component http://hotbar.com/Installation/Browsing/WhatIs/Hotbar.htm -id_moz_860 Mozilla/4.0 (compatible; MSIE 6.0; MSIE 5.5; Windows NT 5.1) Skampy/0.9.x [en] Skaffe.com directory link checker R s. also Skampy http://www.skaffe.com -id_moz_100606_1 Mozilla/4.0 (compatible; MSIE 6.0; TargetSeek/1.0; +http://www.targetgroups.net/TargetSeek.html) TargetSeek Crawler concerning electronics industry product announcements R 71.161.205.2xx http://www.targetgroups.net/TargetSeek.html -id_moz_861 Mozilla/4.0 (compatible; MSIE 6.0; Win32) WebWasher 3.0 IE 6.0 WebWasher ad filter B P http://www.webwasher.com -id_moz_864 Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) REL Software Web Link Validator 2.x) Web Link Validator link validation software C http://www.relsoftware.com -id_moz_865 Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) Web Link Validator 2.x) Web Link Validator link validation software C http://www.relsoftware.com -id_moz_862 Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Net M@nager V3.02 - www.vinn.com.au) IE 6.0 Netmanager IE add-on B http://www.vinn.com.au -id_moz_290306_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com; http://www.illumit.com/Products/weblight/) WebLight web analyzer & link checker C s. also WebLight/4.x.x ... http://www.illumit.com/Products/weblight/ -id_moz_863 Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Win 9x 4.90; http://www.Abolimba.de) Abolimba Multibrowser - IE based browser C http://www.autag.com -id_moz_866 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; .NET CLR 1.1.4322; Lunascape 2.1.3) Lunascape IE based browser (Japan) B s. also Lunascape http://www2.lunascape.jp/index.aspx -id_moz_290708_4 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; Google Wireless Transcoder;) Google wireless transcoder (GWT) proxy for rewriting websites for mobiles P 209.85.136.xxx http://www.google.com/gwt/n -id_moz_150906_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP entries t_st; http://tuezilla.de/t_st-odp-entries-agent.html) Tüzilla (Germany) - ODP link checking using Robozilla R 81.169.154.xx http://tuezilla.de http://dmoz.org/profiles/robozilla.html -id_moz_867 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP links test; http://tuezilla.de/test-odp-links-agent.html) Tüzilla (Germany) - ODP link checking using Robozilla R 81.169.154.xx http://tuezilla.de http://dmoz.org/profiles/robozilla.html -id_moz_080606_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ZoomSpider.net bot; .NET CLR 1.1.4322) ZoomSpider.Net indexing robot for several directorys R 70.94.232.2xx http://www.zoomspider.net/ -id_moz_882 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) (dns_admin@c-a-s-h.com) unknown robot from 64.246.44.xx -id_moz_280408_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Covac UPPS Cathan 1.2.5;) Covac Software UPPS (Universal PHP Proxy Server) - free public proxy server P http://www.covac-software.com/proxy/ -id_moz_160406_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Crayon Crawler; snprtz|T04056566514940; (R1 1.5)) GetNetWise Crayon Crawler web filter P http://kids.getnetwise.org/tools/tool_info.php?tool_id=931919301.7202 -id_moz_868 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Deepnet Explorer) Deepnet Explorer - IE based browser B http://deepnetexplorer.com/ -id_moz_869 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; heritrix/1.3.0 http://www.cs.washington.edu/research/networking/websys/) Heritrix Internet Archive's open-source web project used by Analysis Projects at UW R http://crawler.archive.org/ http://www.cs.washington.edu/research/networking/websys/ -id_moz_870 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Hotbar 3.0) IE 6x WinXP Hotbar plug-in B http://hotbar.com/install/firstvisit.asp -id_moz_871 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iOpus-I-M) IE 6x WinXP iOpus Internet Macros - Internet-based macro recorder B http://www.iopus.com -id_moz_872 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iRider 2.21.1108; FDM) iRider - IE based browser / Free Download Manager (FDM) D http://www.irider.com/irider/index.htm http://www.freedownloadmanager.org/ -id_moz_873 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; KKman3.0) KKman http://www.kkman.com/ - Japanese IE based browser B http://www.kkman.com -id_moz_874 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MathPlayer2.0) IE 6x WinXP MathPlayer mathematical notation plugin B http://www.mathtype.com/en/products/mathplayer/ -id_moz_875 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Maxthon) Maxton (ex MyIE2) - IE based browser B http://www.maxthon.com -id_moz_876 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; PeoplePal 3.0; MSIECrawler) IE 6x WinXP peoplepc online PeoplePal IE toolbar B http://home.vfw-online.com/peoplepal/default.asp -id_moz_877 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Q312461; IOpener Release 1.1.04) IE 6x WinXP / I-Opener (was www.netpliance.com/) web PC B -id_moz_050307_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; QihooBot 1.0 qihoobot@qihoo.net) Qihoo search (China) robot R 220.181.34.1xx http://www.qihoo.com/ -id_moz_070306_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SIMBAR Enabled; InfoPath.1) SimBar IE toolbar for accessing The Sims sites / Infopath IE form & spreadsheet plugin B http://www.simstools.com/simbar.php http://office.microsoft.com/en-us/fx010857921033.aspx -id_moz_878 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; StumbleUpon.com 1.760; .NET CLR 1.1.4322) IE 6x WinXP Stumble Upon IE toolbar B http://www.stumbleupon.com -id_moz_150807_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; Embedded Web Browser from: http://bsalsa.com/; MSIECrawler) Balsa Productions embedded web browser package for Borland Delphi B http://bsalsa.com/product.html -id_moz_030807_2 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://www.changedetection.com/bot.html ) ChangeDetection robot for web page monitoring C 68.166.223.x http://www.changedetection.com/ http://www.changedetection.com/bot.html -id_moz_879 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322) IE 6x WinXP also used by WebSite Pro HTML editor B http://www.gtpcc.org/gtpcc/websitepro.htm -id_moz_880 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; DX-Browser 5.0.0.0) DX-Browser - German IE based browser B was http://www.dx-soft.net/ (expired) http://www.zdnet.de/downloads/prg/t/p/deDCTP-wc.html -id_moz_271006_1 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; FunWebProducts; ezPeer+ v1.0 Beta (0.4.1.98); ezPeer+ v1.0 (0.5.0.00); .NET CLR 1.1.4322; MSIECrawler) ezPeer+ P2P IE addon B http://web.ezpeer.com/ -id_moz_881 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; IBP; .NET CLR 1.1.4322) Axandra IBP website promotion software ? C B http://www.axandra-web-site-promotion-software-tool.com/index.htm -id_moz_290606_3 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; MRA 4.3 (build 01218)) MRA = Mail.ru Agent - Instant Messenger / VoIP B http://agent.mail.ru/ -id_moz_883 Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search 4.0 Robot) MSN Search robot (207.46.89.xx) R s. also: - MSNBOT -id_moz_170207_3 Mozilla/4.0 (compatible; MSIE 7.0; Win32) Link Commander 4.0 Link Commander bookmark manager C http://www.resortlabs.com/bookmark-manager/linkcommander.php -id_moz_170706_2 Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; bgft) IE 7.0 - WinXP B http://www.microsoft.com/windows/ie/default.mspx -id_moz_080209_1 Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; GTB5; User-agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://bsalsa.com) ; .NET CLR 2.0.50727) GTB = Google Toolbar Internet Explorer add-on B http://toolbar.google.com/T4/index.html -id_moz_080209_2 Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; Tablet PC 2.0) MSIE 7.0 *and* Trident token used by Internet Explorer 8 in compatibility view mode B http://blogs.msdn.com/ie/archive/2009/01/09/the-internet-explorer-8-user-agent-string-updated-edition.aspx -id_moz_080209_3 Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; .NET CLR 2.0.50727; .NET CLR 1.1.4322; .NET CLR 3.0.04506.30; .NET CLR 3.0.04506.648) Internet Explorer 8 B http://www.microsoft.com/windows/internet-explorer/beta/default.aspx -id_moz_150408_4 Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0) IE 8.0 (beta) on Win Vista B http://www.microsoft.com/windows/products/winfamily/ie/ie8/default.mspx -id_moz_030110_1 Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0; Orange 8.0; GTB6.3; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ; Embedded Web Browser from: http://bsalsa.com/; SLCC1; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30618; OfficeLiveConnector.1.3; OfficeLivePatch.1.3) Bsalsa embedded browser B http://bsalsa.com/ -id_moz_010108_4 Mozilla/4.0 (compatible; MSIE enviable; DAUMOA 2.0; DAUM Web Robot; Daum Communications Corp., Korea; +http://ws.daum.net/aboutkr.html) DAUMOA - Daum search Korea robot (211.115.109.xxx) R s. also RaBot http://www.daum.net/ http://ws.daum.net/abouten.html -id_moz_311206_1 Mozilla/4.0 (compatible; MSIE is not me; DAUMOA/1.0.1; DAUM Web Robot; Daum Communications Corp., Korea) DAUMOA - Daum search Korea robot (211.115.109.xxx) R s. also RaBot http://www.daum.net/ -id_moz_281106_2 Mozilla/4.0 (compatible; NaverBot/1.0; http://help.naver.com/delete_main.asp) Naver Search Korea Naverbot R http://www.naver.com/ -id_moz_884 Mozilla/4.0 (compatible; Netcraft Web Server Survey) Netcraft webserver info R C http://www.netcraft.com -id_moz_885 Mozilla/4.0 (compatible; NetPromoter Spider;http://www.net-promoter.com/) NetPromoter Link Utility link checking tool C s. also - Mozilla/4.0 (compatible; Link Utility ... http://www.net-promoter.com/ -id_moz_886 Mozilla/4.0 (compatible; Opera/3.0; Windows 4.10) 3.51 [en] Opera 3.x WinNT B -id_moz_887 Mozilla/4.0 (compatible; Powermarks/3.5; Windows 95/98/2000/NT) Powermarks bookmark manager C http://www.kaylon.com -id_moz_230607_1 Mozilla/4.0 (compatible; RSS Popper) RSS Popper - MS Outlook RSS reader plugin B http://rsspopper.unknown/2004/10/home.html -id_moz_888 Mozilla/4.0 (compatible; SiteKiosk 4.0; MSIE 5.0; Windows 98; SiteCoach 1.0) SiteKiosk public terminal browser B http://www.sitekiosk.com -id_moz_889 Mozilla/4.0 (compatible; SpeedySpider; www.entireweb.com) Entireweb Search Speedyspider (62.13.25.xxx) R s. also Worldlight http://www.entireweb.com -id_moz_890 Mozilla/4.0 (compatible; SPENG) SiteProbe - website status checking R C http://www.siteprobe.com -id_moz_891 Mozilla/4.0 (compatible; SuperCleaner 2.xx; Windows 98) Super Cleaner privacy tool (bookmark checking) C http://www.southbaypc.com/SuperCleaner/ -id_moz_020406_1 Mozilla/4.0 (compatible; Synapse) Synapse - Apache web service for processing XML documents P http://wiki.apache.org/incubator/SynapseProposal -id_moz_150207_1 Mozilla/4.0 (compatible; WebCapture 3.0; Windows) Web2PDF - Adobe Acrobat plugin for site traversal and other services for the Web Capture feature D -id_moz_892 Mozilla/4.0 (compatible; Win32; WinHttp.WinHttpRequest.5) Windows HTTP Services (WinHTTP / XML-parser) -id_moz_170108_1 Mozilla/4.0 (compatible; WSN Links) WSN Links PHP directory software C http://scripts.webmastersite.net/wsnlinks/ -id_moz_111205_6 Mozilla/4.0 (compatible; www.euro-directory.com; urlchecker1.0) Euro Directory (German / Austrian) directory link checking R C http://www.euro-directory.com/ -id_moz_893 Mozilla/4.0 (compatible; www.galaxy.com) Galaxy robot R http://www.galaxy.com -id_moz_894 Mozilla/4.0 (compatible; www.linkguard.com Linkguard Online 1.0; Windows NT) Linkguard.com link validation (service is offline) C -id_moz_240106_1 Mozilla/4.0 (compatible; Y!J; for robot study; keyoshid) Yahoo Search Japan robot (203.141.52.) R s. also Y!J-BSC/1.0... http://www.yahoo.co.jp/ -id_moz_170706_1 Mozilla/4.0 (compatible; Yahoo Japan; for robot study; kasugiya) Yahoo Japan robot (202.93.76.xx) R http://www.yahoo.co.jp/ -id_moz_210207_1 Mozilla/4.0 (compatible;MSIE 6.0; Windows NT 5.0; H010818) Faked IE id string used by DeepTrawl link checking tool C http://deeptrawl.com/ -id_moz_896 Mozilla/4.0 (fantomBrowser) spoofed referer by Fantomaster (Multiblocker) anonymity products P http://fantomaster.com http://multiblocker.com/home.html -id_moz_897 Mozilla/4.0 (fantomCrew Browser) spoofed referer by Fantomaster (Multiblocker) anonymity products P http://fantomaster.com http://multiblocker.com/home.html -id_moz_898 Mozilla/4.0 (hhjhj@yahoo.com) unknown robot from - 64.57.223.40 - 66.28.233.xxx (cogentco.com) -id_moz_899 Mozilla/4.0 (JemmaTheTourist;http://www.activtourist.com) Activtourist Jemma spider R http://www.activtourist.com -id_moz_900 Mozilla/4.0 (MobilePhone PM-8200/US/1.0) NetFront/3.x MMP/2.0 NetFront (v3.x) for Pocket PC (here on Sanyo PM-8200 cell phone) B http://nfppc.access.co.jp/english/ -id_moz_901 Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html) Google robot from 66.249.66.xxx R s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1... http://www.google.com -id_moz_902 Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 FAKE (compatible; Googlebot/2.1; http://www.google.com/bot.html) Google robot from 66.249.66.xxx R s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1... http://www.google.com -id_moz_081106_1 Mozilla/4.0 (Mozilla; http://www.mozilla.org/docs/en/bot.html; master@mozilla.com) Unknown robot from Mozilla.org R 63.209.222.xx http://www.mozilla.org/ -id_moz_903 Mozilla/4.0 (Sleek Spider/1.2) ASI - Any Search Info robot R http://search-info.com/ -id_moz_170406_1 Mozilla/4.0 compatible FurlBot/Furl Search 2.0 (FurlBot; http://www.furl.net; wn.furlbot@looksmart.net) Furl (Looksmart) online bookmark tool robot R 64.242.88.xx http://www.furl.net/ -id_moz_905 Mozilla/4.0 compatible ZyBorg/1.0 (wn.zyborg@looksmart.net; http://www.WISEnutbot.com) Wisenut robot R http://www.wisenut.com/ -id_moz_906 Mozilla/4.0 compatible ZyBorg/1.0 (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com) Wisenut robot R http://www.wisenut.com/ -id_moz_907 Mozilla/4.0 compatible ZyBorg/1.0 Dead Link Checker (wn.zyborg@looksmart.net; http://www.WISEnutbot.com) Wisenut robot R http://www.wisenut.com/ -id_moz_908 Mozilla/4.0 compatible ZyBorg/1.0 for Homepage (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com) Wisenut robot R http://www.wisenut.com/ -id_moz_909 Mozilla/4.0 efp@gmx.net Unknown robot from 66.230.140.xx (argon.oxeo.com) maybe an e-mail collector S see also LARBIN-EXPERIMENTAL -id_moz_910 Mozilla/4.0 WebTV/2.6 (compatible; MSIE 4.0) WebTV B -id_moz_904 Mozilla/4.0 [en] (Ask Jeeves Corporate Spider) Ask / Ask Jeeves robot R http://www.Ask.com -id_moz_913 Mozilla/4.0(compatible; Zealbot 1.0) LookSmart spider R http://www.looksmart.com -id_moz_290807_1 Mozilla/4.01 (compatible; NORAD National Defence Network) HideMe - Web based anonymous proxy server service P http://www.hideme.biz/ http://www.cnn.com/TECH/computing/9901/25/hacktracts.idg/index.html -id_moz_914 Mozilla/4.01 [en](Win95;I) Some download manager spoofing Netscape 4.01 D -id_moz_915 Mozilla/4.02 [en] (X11; I; SunOS 5.6 sun4u) Netscape 4.x SunOS 5.6 B -id_moz_161105_3 Mozilla/4.04 (compatible; Dulance bot; +http://www.dulance.com/bot.jsp) Dulance Bot - Dulance automated price comparison engine R http://www.dulance.com/ -id_moz_916 Mozilla/4.04 [en] (X11; I; HP-UX B.10.20 9000/712) Netscape 4.x HP-Unix B -id_moz_917 Mozilla/4.04 [en] (X11; I; IRIX 5.3 IP22) Netscape 4.x IRIX B -id_moz_918 Mozilla/4.05 (Macintosh; I; 68K Nav) Netscape 4.x Macintosh 68k B -id_moz_919 Mozilla/4.05 (Macintosh; I; PPC Nav) Netscape 4.x Macintosh PowerPC B -id_moz_920 Mozilla/4.05 [en] (X11; I; SunOS 4.1.4 sun4m) Netscape 4.x SunOS 4.1.4 B -id_moz_921 Mozilla/4.08 [en] (Win98; U ;Nav) Version 4.08 [en]-98306 Someone copied the help function in the referrer field ? -id_moz_922 Mozilla/4.08 [en] (WinNT; U) Netscape 4.x WinNT B -id_moz_911 Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_TrueRobot/1.4 libwww/5.2.8 Echo.com robot R http://www.echo.com -id_moz_912 Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_VoilaBot/1.6 libwww/5.3.2 Voila.fr robot R http://www.voila.fr -id_moz_923 Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98) HTTrack Offline Browser B D http://www.httrack.com/ -id_moz_924 Mozilla/4.5 (compatible; iCab 2.5.3; Macintosh; I; PPC) iCab MAC Web browser MAC Power PC B http://www.icab.de -id_moz_925 Mozilla/4.5 (compatible; OmniWeb/4.0.5; Mac_PowerPC) OmniWeb 4.x.x Mac browser B http://www.omnigroup.com -id_moz_926 Mozilla/4.5 (compatible; OmniWeb/4.1-beta-1; Mac_PowerPC) OmniWeb 4.x.x Mac browser B http://www.omnigroup.com -id_moz_928 Mozilla/4.5 RPT-HTTPClient/0.3-2 different IPs using the HTTPClient library (mostly link checking) C R http://www.innovation.ch -id_moz_927 Mozilla/4.5 [en]C-CCK-MCD {RuralNet} (Win98; I) RuralNet Internet Services B http://www.ruralnet.net.au -id_moz_929 Mozilla/4.5b1 [en] (X11; I; Linux 2.0.35 i586) Netscape 4.x Linux B -id_moz_301105_3 Mozilla/4.6 [en] (http://www.cnet.com/) Cnet robot for Search.com (216.239.114.xx) R http://www.search.com/ http://www.cnet.com/ -id_moz_930 Mozilla/4.61 [de] (OS/2; I) Netscape 4.x OS/2 B -id_moz_931 Mozilla/4.61 [en] (X11; U; ) - BrowseX (2.0.0 Windows) BrowseX cross-platform browser B http://browsex.com/ -id_moz_932 Mozilla/4.7 Nameprotect (12.148.196.128 - 12.148.196.255) snoopbot R http://www.nameprotect.com -id_moz_933 Mozilla/4.7 (compatible; http://eidetica.com/spider) Eidetica earch and text mining spider R http://eidetica.com/ -id_moz_934 Mozilla/4.7 (compatible; Intelliseek; http://www.intelliseek.com) Intelliseek (64.158.138.xx) robot R http://www.intelliseek.com -id_moz_935 Mozilla/4.7 (compatible; OffByOne; Windows 98) Webster Pro V3.2 OffByOne Browser B http://www.offbyone.com -id_moz_937 Mozilla/4.7 (compatible; Whizbang) WhizBang! Labs information extraction robot R closed since May 2002 http://www.whizbang.com -id_moz_936 Mozilla/4.7 (compatible; WhizBang; http://www.whizbang.com/crawler) WhizBang! Labs information extraction robot R closed since May 2002 http://www.whizbang.com -id_moz_938 Mozilla/4.7 [en](BecomeBot@exava.com) BecomeBot - Becomecom shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_939 Mozilla/4.7 [en](Exabot@exava.com) Exabot - exava shopping search (64.124.85.xx(x)) R http://www.exava.com -id_moz_940 Mozilla/4.7 [en]C-CCK-MCD {Yahoo;YIP052400} (Win95; I) unknown -id_moz_941 Mozilla/4.72 [en] (BACS http://www.ba.be) http://www.ba.be robot R http://www.ba.be -id_moz_942 Mozilla/4.72C-CCK-MCD Caldera Systems OpenLinux [en] (X11; U; Linux 2.2.14 i686) Netscpape 4.7x Caldera Open Linux Pentium III B -id_moz_943 Mozilla/4.75C-ja [ja] (X11; U; OSF1 V5.1 alpha) Netscape 4.7x Japan OSF1 alpha B -id_moz_944 Mozilla/4.76 (Windows 98; U) Opera 5.12 [en] Opera 5.x Win 98 B -id_moz_945 Mozilla/4.76 [en] (X11; U; FreeBSD 4.4-STABLE i386) Netscape 4.7x FreeBSD B -id_moz_946 Mozilla/4.76 [en] (X11; U; SunOS 5.7 sun4u) Netscape 4.7x SunOS B -id_moz_947 Mozilla/4.77C-SGI [en] (X11; U; IRIX 6.5 IP32) IRIX 6.5 B -id_moz_948 Mozilla/5.0 GigaMedia / NTT DoCoMo robot R http://ir.giga.net.tw/products.htm -id_moz_040707_3 Mozilla/5.0 (+http://www.eurekster.com/mammoth) Mammoth/0.1 Eurekster Swicki community search using SLI-Systems site search engine Mammoth R 64.106.253.1xx http://www.eurekster.com/ http://www.sli-systems.com/ -id_moz_240306_2 Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1 SLI Systems mammoth robot R s. also mammoth/1.0 ... http://www.sli-systems.com/ http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M -id_moz_949 Mozilla/5.0 (Clustered-Search-Bot/1.0; support@clush.com; http://www.clush.com/) Clush search robot R http://www.clush.com -id_moz_020807_1 Mozilla/5.0 (compatible) GM RSS Panel X Greasemonkey RSS panel Firefox plugin B http://www.xs4all.nl/~jlpoutre/BoT/Javascript/RSSpanel/ -id_moz_140209_3 Mozilla/5.0 (compatible; +http://www.evri.com/evrinid) Evri search robot R 216.168.43.1xx http://www.evri.com/ -id_moz_250310_1 Mozilla/5.0 (compatible; 008/0.83; http://www.80legs.com/spider.html;) Gecko/2008032620 008 distributed crawler for 80legs R http://www.80legs.com/spider.html -id_moz_140209_4 Mozilla/5.0 (compatible; Abonti/0.8 - http://www.abonti.com) Abonti WebSearch beta robot R 77.233.225.11x http://www.abonti.com/ -id_moz_030110_4 Mozilla/5.0 (compatible; aiHitBot/1.0; +http://www.aihit.com/) HitCompanies Aihit crawler R 195.128.18.xx http://hitcompanies.aihit.com/search.htm -id_moz_300406_1 Mozilla/5.0 (compatible; AnsearchBot/1.x; +http://www.ansearch.com.au/) Ansearch Australian search robot R 203.206.162.x http://www.ansearch.com.au/ -id_moz_011107_1 Mozilla/5.0 (compatible; archive.org_bot/1.10.0 +http://www.loc.gov/minerva/crawl.html) The Library of Congress Minerva crawler R 207.241.232.1xx http://www.loc.gov/minerva/crawl.html -id_moz_230607_2 Mozilla/5.0 (compatible; archive.org_bot/1.13.1x http://crawler.archive.org) Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/... http://www.archive.org/ -id_moz_141105_1 Mozilla/5.0 (compatible; archive.org_bot/1.5.0-200506132127 http://crawler.archive.org) Hurricane Katrina Heritrix - The Internet Archive's open-source crawler R s. also - InternetArchive/0.8-dev... - mozilla/5.0 (compatible; heritrix/... http://www.archive.org/ -id_moz_150207_2 Mozilla/5.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) Ask Jeeves /Teoma robot R 65.214.45.[x]xx http://sp.ask.com -id_moz_291205_2 Mozilla/5.0 (compatible; BanBots/2.0b; Fetch; +http://www.banbots.com) Project BanBots Perl script robot C s. also BanBots/1.2... http://www.banbots.com/ -id_moz_950 Mozilla/5.0 (compatible; BecomeBot/1.23; http://www.become.com/webmasters.html) BecomeBot - Become.com shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_951 Mozilla/5.0 (compatible; BecomeBot/1.xx; MSIE 6.0 compatible; http://www.become.com/webmasters.html) BecomeBot - Become.com shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_952 Mozilla/5.0 (compatible; BecomeBot/2.0beta; http://www.become.com/webmasters.html) BecomeBot - Become.com shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_953 Mozilla/5.0 (compatible; BecomeBot/2.x; MSIE 6.0 compatible; http://www.become.com/site_owners.html) BecomeBot - Become.com shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_090506_2 Mozilla/5.0 (compatible; BecomeJPBot/2.3; MSIE 6.0 compatible; +http://www.become.co.jp/site_owners.html) BecomeBot - Become.com shopping search (64.124.85.xx(x)) R 64.124.85.[x]xx http://www.become.com -id_moz_020907_1 Mozilla/5.0 (compatible; BlogRefsBot/0.1; http://www.blogrefs.com/about/bloggers) BlogRefsBot.com blog robot R 69.90.42.xx http://www.blogrefs.com/ http://www.blogrefs.com/about/bloggers -id_moz_171107_1 Mozilla/5.0 (compatible; Bot; +http://pressemitteilung.ws/spamfilter Pressemitteilungen Webservice RSS / news crawler (Germany) R 87.164.242.1xx http://pressemitteilung.ws/ -id_moz_031206_1 Mozilla/5.0 (compatible; BuzzRankingBot/1.0; +http://www.buzzrankingbot.com/) BuzzRanking internet content analysis R 213.251.187.1xx http://www.buzzrankingbot.com/ -id_moz_310506_1 Mozilla/5.0 (compatible; Charlotte/1.0b; charlotte@betaspider.com) Charlotte indexing spider for Searchme / Wikiseek R 209.249.86.x http://www.searchme.com/ http://www.wikiseek.com/ -id_moz_080307_1 Mozilla/5.0 (compatible; Charlotte/1.0b; http://www.searchme.com/support/) Charlotte indexing spider for Searchme / Wikiseek R 209.249.86.x http://www.searchme.com/ http://www.wikiseek.com/ -id_moz_220106_1 Mozilla/5.0 (compatible; Crawling jpeg; http://www.yama.info.waseda.ac.jp) Unknown graphics crawler or downloading agent from Yamana Laboratory - Waseda Univerity Japan (133.9.238.xx) R doesn't read robots.txt http://www.yama.info.waseda.ac.jp/eng/index.html -id_moz_954 Mozilla/5.0 (compatible; Custo 3 (Netwu.com); Windows NT 5.1) Custo web site spidering tool (link checking) C s. also - Custo x.x (www.netwu.com) http://www.netwu.com -id_moz_071207_1 Mozilla/5.0 (compatible; de/1.13.2 +http://www.de.com) De.com German travel related search via Amazon Web Services R 67.202.29.xx http://www.de.com/start.php?homepage=true http://www.amazon.com/gp/browse.html?node=3435361 -id_moz_170109_1 Mozilla/5.0 (compatible; Diffbot/0.1; +http://www.diffbot.com) Diffbot beta - RSS and news feed crawler R 64.71.190.13x http://www.diffbot.com/ -id_moz_030207_1 Mozilla/5.0 (compatible; DNS-Digger-Explorer/1.0; +http://www.dnsdigger.com) DNS-Digger - DNS server neighbourhood search R 212.214.165.2xx http://www.dnsdigger.com/ -id_moz_100606_2 Mozilla/5.0 (compatible; DNS-Digger/1.0; +http://www.dnsdigger.com) DNS-Digger - DNS server neighbourhood search R 212.214.165.2xx http://www.dnsdigger.com/ -id_moz_020506_1 Mozilla/5.0 (compatible; EARTHCOM.info/2.01; http://www.earthcom.info) Earthcom (Czech Republic) search robot (194.108.39.xx) R s. also EARTHCOM .. http://www.earthcom.info -id_moz_190807_3 Mozilla/5.0 (compatible; EARTHCOM/2.2; +http://enter4u.eu) enter4u / Earthcom.info search (Czech Republic) R http://enter4u.eu/ http://www.earthcom.info -id_moz_050107_1 Mozilla/5.0 (compatible; egothor/8.0g; +http://ego.ms.mff.cuni.cz/) Prague Faculty of Mathematics and Physics using Egothor open source crawler P 195.113.20.125 http://ego.ms.mff.cuni.cz/ http://www.egothor.org/ -id_moz_310507_1 Mozilla/5.0 (compatible; Exabot Test/3.0; +http://www.exabot.com/go/robot) Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_moz_221207_1 Mozilla/5.0 (compatible; FatBot 2.0; http://www.thefind.com/main/CrawlerFAQs.fhtml) TheFind.com - Shopping search robot R 64.124.148.xx[x] http://www.thefind.com/ -id_moz_170109_2 Mozilla/5.0 (compatible; Galbot/1.0; +http://www.galbot.com/bot.html) Galbot tagging robot (beta) - Denmark R http://www.galbot.com/ -id_moz_955 mozilla/5.0 (compatible; genevabot http://www.healthdash.com) Geneva Single-Site Search Engine used by Healthdash health search R http://www.healthdash.com -id_moz_170207_4 Mozilla/5.0 (compatible; Google Desktop) Paros/3.2.12 Paros - a Java based HTTP/HTTPS proxy P http://sourceforge.net/projects/paros -id_moz_956 Mozilla/5.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html) Google robot R s. also: - Googlebot - Mozilla/4.0 (MobilePhone SCP ... http://www.google.com -id_moz_957 mozilla/5.0 (compatible; heritrix/1.0.4 http://innovationblog.com) Unknown robot using Heritrix R http://innovationblog.com http://crawler.archive.org/ -id_moz_280207_1 Mozilla/5.0 (compatible; heritrix/1.10.2 +http://i.stanford.edu/) The Stanford University InfoLab robot using Heritrix R 171.67.73.1x http://i.stanford.edu/ http://www.archive.org/ -id_moz_280108_2 Mozilla/5.0 (compatible; heritrix/1.12.1 +http://newstin.com/) Newstin news feed search using Heritrix R 195.39.35.1xx http://www.newstin.com/ -id_moz_210807_1 Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com) Page-store.com vertical search via Amazon Web Services R 72.44.62.1xx http://www.page-store.com/ http://www.amazonaws.com/ -id_moz_230108_1 Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com) [email:paul@page-store.com] Page-store.com vertical search via Amazon Web Services R 72.44.62.1xx http://www.page-store.com/ http://www.amazonaws.com/ -id_moz_958 mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org) Heritrix Internet Archive's open-source web project R http://archive.crawler.org -id_moz_270106_2 Mozilla/5.0 (compatible; heritrix/1.4.0 +http://www.chepi.net) Chepi Beta search Spain (194.116.240.1xx) using Heritrix R http://www.chepi.net/ http://lucene.apache.org -id_moz_959 Mozilla/5.0 (compatible; heritrix/1.4t http://www.truveo.com/) Truveo data mining robot using Heritrix R http://www.truveo.com/home/ http://crawler.archive.org/ -id_moz_960 Mozilla/5.0 (compatible; heritrix/1.5.0 http://www.l3s.de/~kohlschuetter/projects/crawling/) L3S WebCrawling Project (Germany) using Heritrix R http://www.l3s.de/~kohlschuetter/projects/crawling/ http://crawler.archive.org/ -id_moz_961 Mozilla/5.0 (compatible; heritrix/1.5.0-200506231921 http://pandora.nla.gov.au/crawl.html) Pandora Internet Archive crawler (Australia) using Heritrix R http://pandora.nla.gov.au http://crawler.archive.org/ -id_moz_250706_3 Mozilla/5.0 (compatible; heritrix/1.6.0 http://www.worio.com/) WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler R 137.82.84.xx http://www.worio.com/ http://www.archive.org/ -id_moz_190607_1 Mozilla/5.0 (compatible; heritrix/1.7.0 +http://www.greaterera.com/) greatarea.com website collection project using Heritrix R 63.209.222. http://www.greaterera.com/ -id_moz_230307_1 Mozilla/5.0 (compatible; Heritrix/1.8.0 http://www.hanzoarchives.com) hanzo:web social web archiving service D 216.182.238. http://www.hanzoweb.com/ -id_moz_151106_1 Mozilla/5.0 (compatible; heritrix/1.x.x +http://www.accelobot.com) Accelobot - Accelovation Market Discovery software robot R 72.20.99.xx http://www.accelobot.com/ http://www.accelovation.com/solutions.html -id_moz_030208_1 Mozilla/5.0 (compatible; heritrix/2.0.0-RC1 +http://www.aol.com) Unknown AOL robot using Heritrix R 64.236.128.x http://www.aol.com/ -id_moz_051207_2 Mozilla/5.0 (compatible; Hermit Search. Com; +http://www.hermitsearch.com) Hermits Search.com - Products and service search robot R 72.55.165.11x http://www.hermitsearch.com/ -id_moz_161006_2 Mozilla/5.0 (compatible; http://www.IsMySiteUp.Net/bot/ ) IsMySiteUp? - Online website monitoring service C 142.179.247.xx http://www.ismysiteup.net/ -id_moz_101106_2 Mozilla/5.0 (compatible; http://www.UptimeAuditor.com/bot/ ) UptimeAuditor - real time web monitoring C 142.179.247.xx http://www.uptimeauditor.com/ -id_moz_180508_1 Mozilla/5.0 (compatible; HyperixScoop/1.3; +http://www.hyperix.com) Hyperix vertical search crawler R 64.40.113.[x]xx http://www.hyperix.com/ -id_moz_070406_1 Mozilla/5.0 (compatible; iaskspider/1.0; MSIE 6.0) Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx) Not from iask.com.cn - s. also iaskspider -id_moz_280607_1 Mozilla/5.0 (compatible; IDBot/1.0; +http://www.id-search.org/bot.html) ID-Search.org - Russian search project R 67.159.44.2xx http://id-search.org/bot.html -id_moz_962 Mozilla/5.0 (compatible; InterseekWeb/3.x) Najdi.si (Slovenia) search using Interseek/Web Interseek/API Search Engine R http://www.najdi.si/pomoc/eng/index.jsp -id_moz_130807_4 Mozilla/5.0 (compatible; Jim +http://www.hanzoarchives.com) hanzo:web social web archiving service D 216.182.238. http://www.hanzoweb.com/ -id_moz_963 Mozilla/5.0 (compatible; Konqueror/2.0.1; X11); Supports MD5-Digest; Supports gzip encoding Konqueror 2.0.x X11 B http://www.konqueror.org/ -id_moz_964 Mozilla/5.0 (compatible; Konqueror/2.1.1; X11) Konqueror 2.1.x X11 B http://www.konqueror.org/ -id_moz_966 Mozilla/5.0 (compatible; Konqueror/2.2.2) Konqueror 2.2.x B http://www.konqueror.org/ -id_moz_965 Mozilla/5.0 (compatible; Konqueror/2.2.2; Linux 2.4.14-xfs; X11; i686) Konqueror 2.2.x Linux B http://www.konqueror.org/ -id_moz_050108_2 Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails) Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_moz_967 Mozilla/5.0 (compatible; LemSpider 0.1) Lemur Consulting LemIR spider R http://www.lemurconsulting.com -id_moz_968 Mozilla/5.0 (compatible; LinksManager.com_bot http://linksmanager.com/linkchecker.html) Linksmanager.com online link checking service C s.also LinksManager.com http://www.linksmanager.com -id_moz_140408_2 Mozilla/5.0 (compatible; LinkStash Bookmark Manager; http://www.xrayz.co.uk/) LinkStash Bookmark Manager C http://www.xrayz.co.uk/ -id_moz_060706_2 Mozilla/5.0 (compatible; MojeekBot/2.0; http://www.mojeek.com/bot.html) Mojeek Search Preview robot (217.155.205.xx) R s. also MojeekBot/0.x http://www.mojeek.com -id_moz_290107_1 Mozilla/5.0 (compatible; MOSBookmarks/v2.6-Plus; Link Checker) Joomla!/Mambo component - MosBookmarks (bot) link checking C http://www.tegdesign.ch/ -id_moz_091007_1 Mozilla/5.0 (compatible; MSIE 6.0; Podtech Network; crawler_admin@podtech.net) PodTech entertainment and video network crawler R 71.134.235.xx http://www.podtech.net/home/ -id_moz_969 Mozilla/5.0 (compatible; OnetSzukaj/5.0; http://szukaj.onet.pl) onet.pl Szukaj (Search) robot (213.180.128.1xx) R s. also - Onet.pl SA http://szukaj.onet.pl -id_moz_181207_1 Mozilla/5.0 (compatible; PagestackerBot; http://www.pagestacker.com) Pagestacker online bookmark service C 70.85.129.12x http://www.pagestacker.com/ -id_moz_020307_1 Mozilla/5.0 (compatible; PalmeraBot; http://www.links24h.com/help/palmera) Version 0.001 PalmeraBot - Links24h.com search engine robot R 80.59.111.2xx http://www.links24h.com/ http://www.links24h.com/help/palmera/ -id_moz_130806_1 Mozilla/5.0 (compatible; PEAR HTTP_Request class; http://feed.moo.jp/) FeedMo feed search (Japan) using Pear HTTP C ? 210.188.205.2xx http://feed.moo.jp/ http://pear.php.net/ -id_moz_190607_2 Mozilla/5.0 (compatible; Phonifier; +http://www.phonifier.com) PHONifier mobile access to web content D B http://www.phonifier.com/ -id_moz_240208_2 Mozilla/5.0 (compatible; pmoz.info ODP link checker; +http://pmoz.info/doc/botinfo.htm) pmoz.info ODP link checking bot C 74.208.25.118 / 216.15.74.85 http://pmoz.info/doc/botinfo.htm http://www.dmoz.org/ -id_moz_970 Mozilla/5.0 (compatible; pogodak.ba/3.x) Pogodak search (Slovenia) robot via Interseek R 89.143.229.1xx http://www.pogodak.hr http://www.interseek.com/ -id_moz_100408_2 Mozilla/5.0 (compatible; Pogodak.hr/3.1) Pogodak search (Slovenia) robot via Interseek R 89.143.229.1xx http://www.pogodak.hr http://www.interseek.com/ -id_moz_101107_1 Mozilla/5.0 (compatible; Proximic crawler; +http://www.proximic.com/en/about-us/contact-us.html) Proximic Publisher Widget - RSS and news content generator C http://www.proximic.com/ -id_moz_230907_1 Mozilla/5.0 (compatible; PWeBot/3.1; http://www.programacionweb.net/robot.php) ProgramacionWeb.net PWeBot crawler (Argentina) R 62.149.236.2xx http://www.programacionweb.net/robot-en.php http://www.programacionweb.net/ -id_moz_130507_1 Mozilla/5.0 (compatible; Quantcastbot/1.0; www.quantcast.com) Quantcast - Open Internet Ratings Service R http://www.quantcast.com/ -id_moz_190706_1 Mozilla/5.0 (compatible; robtexbot/1.0; http://www.robtex.com/ ) robtex - Multi-RBL check and AS-numbercheck C http://www.robtex.com/ -id_moz_050408_1 Mozilla/5.0 (compatible; ScoutJet; +http://www.scoutjet.com/) ScoutJet (Blekko) search web crawler R http://www.scoutjet.com/ -id_moz_300106_3 Mozilla/5.0 (compatible; Scrubby/2.2; http://www.scrubtheweb.com/) Scrub the web robot (66.93.156.xx) R s.also Scrubby/2.x http://www.scrubtheweb.com/ -id_moz_031107_4 Mozilla/5.0 (compatible; ShunixBot/1.x.x +http://www.shunix.com/robot.htm) Shunixbot (France) beta / test semantic web indexing robot R http://www.shunix.com/ -id_moz_971 Mozilla/5.0 (compatible; ShunixBot/1.x; http://www.shunix.com/bot.htm) Shunixbot (France) beta / test semantic web indexing robot R http://www.shunix.com/ -id_moz_280607_2 Mozilla/5.0 (compatible; SkreemRBot +http://skreemr.com) Skreemr - Audio search engine R 64.15.69.x http://skreemr.com/ -id_moz_070207_2 Mozilla/5.0 (compatible; SnapPreviewBot; en-US; rv:1.8.0.9) Gecko/20061206 Firefox/1.5.0.9 Snap Firefox Search Plugin B http://www.snap.com/about/spa1A.php -id_moz_972 Mozilla/5.0 (compatible; SpurlBot/0.2) Spurl.net bookmark service & search engine (84.40.30.xxx) R C http://www.spurl.net -id_moz_190108_1 Mozilla/5.0 (compatible; SummizeBot +http://www.summize.com) Summize - Opinion and review search robot R 208.79.17.x[x] http://www.summize.com/ -id_moz_973 Mozilla/5.0 (compatible; SYCLIKControl/LinkChecker;) Syclik Control web content management system R C http://www.syclik.com -id_moz_070607_1 Mozilla/5.0 (compatible; Synoobot/0.9; http://www.synoo.com/search/bot.html) Synoo web directory robot R 212.12.114.2xx http://www.synoo.com/search/bot.html -id_moz_261105_1 Mozilla/5.0 (compatible; Theophrastus/x.x; http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php) Theophrastus Internet Spider for a basic search engine project R http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php -id_moz_030207_2 Mozilla/5.0 (compatible; TridentSpider/3.1) Interseek - Java search engine technology used for Pogodak search R 213.253.92.x http://www.interseek.com/ http://www.pogodak.com/ -id_moz_974 Mozilla/5.0 (compatible; Vagabondo/2.1; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/) WiseGuys robot R s.also - Mozilla/3.0 (Vagabondo... - Vagabondo.. http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_moz_280209_4 Mozilla/5.0 (compatible; Webduniabot/1.0; +http://search.webdunia.com/bot.aspx) Webdunia search (India) robot R http://www.webdunia.com/ -id_moz_151205_1 Mozilla/5.0 (compatible; Windows NT 5.0; phpwebbrainBot/0.1 - http://www.monsterli.ch/phpwebbrain/) phpwebbrain online bookmark service (Germany) C http://www.monsterli.ch/phpwebbrain/ -id_moz_150307_1 Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com) WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler R 137.82.84.xx http://www.worio.com/ http://www.archive.org/ -id_moz_221008_1 Mozilla/5.0 (compatible; WoW Lemmings Kathune/2.0;http://www.wowlemmings.com/kathune.html) Kathune spider for World of Warcraft guild data. Used to power WoW Lemmings R 76.12.83.24x http://www.wowlemmings.com/kathune.html http://www.wowlemmings.com/ -id_moz_260407_1 Mozilla/5.0 (compatible; XTbot/1.0v; +http://www.externaltest.com) eXternalTest - Server and online services monitoring C http://www.externaltest.com/ -id_moz_290606_2 Mozilla/5.0 (compatible; Yahoo! DE Slurp; http://help.yahoo.com/help/us/ysearch/slurp) Yahoo / Inktomi search robot R 66.196.77.1xx / 72.30.98.2xx -id_moz_181105_1 Mozilla/5.0 (compatible; Yahoo! Slurp China; http://misc.yahoo.com.cn/help.html) Inktomi robot (202.160.180.xxx) for Yahoo China R http://www.yahoo.com.cn/ http://www.inktomi.com/ -id_moz_975 Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp) Inktomi robot for Yahoo (via 66.196.xx.xxx) R http://www.inktomi.com -id_moz_061208_2 Mozilla/5.0 (compatible; YesupBot/1.0; +http://www.yesup.net/bot.html) Yesup Seo - Toronto SEO Service C 66.48.78.1xx http://yesupseo.com/ -id_moz_250107_1 Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx) R s. also yoono/1.0 web-crawler - yoofind/yoofind .. http://www.yoono.com/ -id_moz_061208_3 Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; ) Youdao search (China) robot R 202.108.7.1xx http://www.youdao.com/ -id_moz_050807_1 Mozilla/5.0 (compatible; Zenbot/1.3; +http://zen.co.za/webmasters/) Zenbot robot for the Southern African Zen search service R 196.46.116.x[x] / 196.23.180.x[x] http://zen.co.za/ http://zen.co.za/webmasters/ -id_moz_110408_1 Mozilla/5.0 (compatible; zermelo +http://www.powerset.com) [email:paul@page-store.com,crawl@powerset.com] Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services R 67.202.34.xxx http://www.powerset.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_moz_030606_1 Mozilla/5.0 (compatible;archive.org_bot/1.7.1; collectionId=316; Archive-It; +http://www.archive-it.org) Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx) R s.also - InternetArchive/0.8-dev - archive.org_bot http://www.archive.org/ -id_moz_180906_2 Mozilla/5.0 (compatible;archive.org_bot/heritrix-1.9.0-200608171144 +http://pandora.nla.gov.au/crawl.html) Wayback Machine Internet Archive crawler R 207.241.233.2xx http://www.archive.org/index.php -id_moz_180107_1 Mozilla/5.0 (compatible;FindITAnswersbot/1.0;+http://search.it-influentials.com/bot.htm) FindITAnswers - Search engine for software developers B 74.93.15.249 http://www.finditanswers.com/ -id_moz_170906_2 Mozilla/5.0 (compatible;MAINSEEK_BOT) Mainseek search (Poland) robot R 80.190.213.xx http://www.mainseek.com/ -id_moz_290708_1 Mozilla/5.0 (Gecko/20070310 Mozshot/0.0.20070628; http://mozshot.nemui.org/) MozShot - Technical demo to take screenshot of any URL B http://mozshot.nemui.org/ -id_moz_150408_2 Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10.4; en-US; rv:1.9b5) Gecko/2008032619 Firefox/3.0b5 Mozilla Firefox 3.0 beta (Gran Paradiso) for MacOS B http://developer.mozilla.org/en/docs/Firefox_3_for_developers -id_moz_976 Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20021219 Chimera/0.6 Chimera browser (Mozilla/Gecko engine) - now Camino Mac PowerPC B http://www.mozilla.org -id_moz_977 Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20030306 Camino/0.7 Camino browser (Mozilla/Gecko engine) - ex Chimera Mac PowerPC B http://www.mozilla.org -id_moz_978 Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-US) AppleWebKit/xx (KHTML like Gecko) OmniWeb/v5xx.xx OmniWeb 5.x.x Mac OS X browser B http://www.omnigroup.com -id_moz_979 Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-us) AppleWebKit/xxx.x (KHTML like Gecko) Safari/12x.x Safari 1.2x browser (Mozilla/Gecko engine) MAC OS X B http://www.apple.com -id_moz_980 Mozilla/5.0 (Macintosh; U; PPC; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1 Netscape 6.x Mac PowerPC B -id_moz_981 Mozilla/5.0 (research@mediatrec.com) unknown robot from gw.ocg-corp.com -id_moz_260806_1 Mozilla/5.0 (Sage) Sage - RSS and Atom feed reader extension for Mozilla Firefox B http://sage.mozdev.org/ -id_moz_982 Mozilla/5.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos - NBCi etc.) robot R http://www.inktomi.com -id_moz_983 Mozilla/5.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos - NBCi etc.) robot R http://www.inktomi.com -id_moz_984 Mozilla/5.0 (SunOS 5.8 sun4u; U) Opera 5.0 [en] Opera 5.x SunOS B -id_moz_020507_1 Mozilla/5.0 (Twiceler-0.9 http://www.cuill.com/twiceler/robot.html) Twiceler experimental web crawler R 64.62.136.xxx http://www.cuill.com/ -id_moz_070106_2 Mozilla/5.0 (Version: xxxx Type:xx) Some spambot from Romania (82.208.139.1xx & 86.123.65.xx) - Maybe email harvesting S UA sometimes have random letters like: vkfjkgo... -id_moz_985 Mozilla/5.0 (wgao@genieknows.com) GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx) R http://www.genieknows.com/ -id_moz_986 Mozilla/5.0 (Windows; U; Win98; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1 Netscape 6.x Win98 B -id_moz_987 Mozilla/5.0 (Windows; U; Win98; en-US; rv:x.xx) Gecko/20030423 Firebird Browser/0.6 Firebird browser (Mozilla/Gecko engine) - ex Phoenix Win98 B http://www.mozilla.org -id_moz_988 Mozilla/5.0 (Windows; U; Win9x; en; Stable) Gecko/20020911 Beonex/0.8.1-stable Beonex Communicator browser (Mozilla/Gecko engine) B http://www.beonex.com -id_moz_111205_1 Mozilla/5.0 (Windows; U; Windows NT 5.0; en-US; rv:1.7.7) NimbleCrawler 1.11 obeys UserAgent NimbleCrawler For problems contact: crawler_at_dataalchemy.com Healthline health related search robot (72.5.115.xx) R http://www.healthline.com/ -id_moz_171008_2 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US) AppleWebKit/525.19 (KHTML, like Gecko) Chrome/0.2.153.1 Safari/525.19 Google Chrome browser based on WebKit (Safari) B http://www.google.com/chrome -id_moz_170207_1 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.0.5) Gecko/20060731 Firefox/1.5.0.5 Flock/0.7.4.1 Flock web browser built on Mozilla technologies B http://www.flock.com/ -id_moz_190108_3 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.11) Gecko/20071127 Firefox/2.0.0.4/Megaupload x.0 Megaupload Mega Manager - Download manager plugin for Firefox D http://www.megaupload.com/manager/de/ -id_moz_171008_1 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.0.1) Gecko/2008092215 Firefox/3.0.1 Orca/1.1 beta 3 Orca browser - based on Gecko B http://www.orcabrowser.com -id_moz_989 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.x.x) Gecko/20041107 Firefox/x.x Firefox browser (Mozilla/Gecko engine) - ex Firebird WinXP B http://www.mozilla.org -id_moz_990 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xx) Gecko/20030504 Mozilla Firebird/0.6 Firebird browser (Mozilla/Gecko engine) - ex Phoenix WinXP B http://www.mozilla.org -id_moz_991 Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xxx) Gecko/20041027 Mnenhy/0.6.0.104 Mnenhy - enhanced mail & news Mozilla based browser B http://mnenhy.mozdev.org/index-de.html -id_moz_060508_2 Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com) Voila.fr robot R http://www.voila.fr -id_moz_080608_2 Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com) Voila.fr robot R http://www.voila.fr -id_moz_150408_3 Mozilla/5.0 (Windows; U; Windows NT 6.0; en-US; rv:1.9b5) Gecko/2008032620 Firefox/3.0b5 Mozilla Firefox 3.0 beta (Gran Paradiso) for Win B http://developer.mozilla.org/en/docs/Firefox_3_for_developers -id_moz_300407_2 Mozilla/5.0 (Windows; U;XMPP Tiscali Communicator v.10.0.1; Windows NT 5.1; it; rv:1.8.1.3) Gecko/20070309 Firefox/2.0.0.3 Tiscali Communicator - Online services suite B http://im.tiscali.com/index.html -id_moz_300106_1 Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@health Healthline health related search robot (72.5.115.xx) R http://www.healthline.com/ -id_moz_161205_2 Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@healthline.com Healthline health related search robot (72.5.115.xx) R http://www.healthline.com/ -id_moz_090807_2 Mozilla/5.0 (X11; Linux i686; U;rv: 1.7.13) Gecko/20070322 Kazehakase/0.4.4.1 Kazehakase - Gecko based browser (Japan) B http://kazehakase.sourceforge.jp/ -id_moz_992 Mozilla/5.0 (X11; U; Linux 2.4.2-2 i586; en-US; m18) Gecko/20010131 Netscape6/6.01 Netscape 6.x Linux B -id_moz_160306_1 Mozilla/5.0 (X11; U; Linux i686; de-AT; rv:1.8.0.2) Gecko/20060309 SeaMonkey/1.0 SeaMonkey browser suite (ex Mozilla) on Linux B http://www.mozilla.org/projects/seamonkey/ -id_moz_993 Mozilla/5.0 (X11; U; Linux i686; en-GB; rv:1.7.6) Gecko/20050405 Epiphany/1.6.1 (Ubuntu) (Ubuntu package 1.0.2) Epiphany (Mozilla/Gecko engine) browser Linux B http://www.gnome.org/projects/epiphany/ -id_moz_994 Mozilla/5.0 (X11; U; Linux i686; en-US; Nautilus/1.0Final) Gecko/20020408 Nautilus (developed by Eazel.com) 1.x Browser Linux B http://swin05.dyndns.biz/Doc/Docrh7.03us/DocRH7.3us/sunsite.mff.cuni.cz/pub/redhat/linux/7.3/fr/doc/RH-DOCS/rhl-gsg-en-7.3/s1-browsers-nautilus.html -id_moz_995 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:0.9.3) Gecko/20010801 Mozilla (Gecko) 0.9x browser Linux B -id_moz_030110_5 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2.1; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/20021130 Spinn3r social network crawler R 64.34.195.1xx http://spinn3r.com/ -id_moz_996 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2b) Gecko/20021007 Phoenix/0.3 Phoenix 0.3 browser (Mozilla/Gecko engine) - now Firebird Linux B http://www.firebirdsql.org/ -id_moz_997 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.6) Gecko/20040413 Epiphany/1.2.1 Epiphany (Mozilla/Gecko engine) browser Linux B http://www.gnome.org/projects/epiphany/ -id_moz_190107_1 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.0.7) Gecko/20060909 Firefox/1.5.0.7 SnapPreviewBot Snap Firefox Search Plugin B http://www.snap.com/about/spa1A.php -id_moz_240107_2 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1) Gecko/20061129 BonEcho/2.0 Bon Echo Alpha - developer preview of future Firefox browser B http://www.mozilla.org/projects/bonecho/releases/2.0a1.html -id_moz_240207_2 Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.1) Gecko/20061205 Iceweasel/2.0.0.1 (Debian-2.0.0.1+dfsg-2) IceWeasel - the GNU version of the Firefox browser B http://www.gnu.org/software/gnuzilla/ -id_moz_150408_1 Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9a8) Gecko/2007100619 GranParadiso/3.0a8 Mozilla Firefox 3.0 beta (Gran Paradiso) for Linux B http://developer.mozilla.org/en/docs/Firefox_3_for_developers -id_moz_999 Mozilla/5.0 Galeon/1.0.2 (X11; Linux i686; U;) Gecko/20011224 Galeon 1.x Browser Linux B http://galeon.sourceforge.net/ -id_moz_1000 Mozilla/5.0 gURLChecker/0.x.x (Linux) gURLChecker - GNOME link checking tool C http://www.nongnu.org -id_moz_1001 Mozilla/5.0 URL-Spider URL Spider - used by usww.net R http://www.url-spider.com/ -id_moz_1002 Mozilla/5.0 usww.com-Spider-for-w8.net W8net spider R http://www.usww.com -id_moz_1003 Mozilla/5.0 wgao@genieknows.com GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx) R http://www.genieknows.com -id_moz_111205_7 Mozilla/5.0 whoiam [http://www.axxus.de/] axxus.de German business directory R C http://www.axxus.de/ -id_moz_998 Mozilla/5.0 [en] (compatible; Gulper Web Bot 0.2.4 www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot) Yuntis : Collaborative Web Resource Categorization and Ranking Project robot R http://www.ecsl.cs.sunysb.edu/yuntis/ -id_g_m_190606_1 MQbot metaquerier.cs.uiuc.edu/crawler MetaExplorer project's MetaQuerier robot R 192.17.11.xx http://metaquerier.cs.uiuc.edu/ -id_g_m_251006_1 MQBOT/Nutch-0.9-dev (MQBOT Nutch Crawler; http://falcon.cs.uiuc.edu; mqbot@cs.uiuc.edu) MetaExplorer project's MetaQuerier robot R 192.17.11.xx http://metaquerier.cs.uiuc.edu/ -id_g_m_1004 MSFrontPage/4.0 MS Frontpage 4.x B -id_g_m_1005 MSIE 4.0 (Win95) Some faked UA - maybe for a download manager D -id_g_m_1006 MSIE-5.13 (larbin@unspecified.mail) unknown robot from gw.ocg-corp.com (209.126.176.x) see also: - Opera/6.01 (larbin@.....) - WinampMPEG/2.00 larbin@.... -id_g_m_190506_1 msnbot-media/1.0 (+http://search.msn.com/msnbot.htm) MSN media search robot R 65.55.235.1xx http://search.msn.com -id_g_m_290806_1 msnbot-Products/1.0 (+http://search.msn.com/msnbot.htm) Windows Live product search (Beta) robot R 207.68.157.xxx http://products.live.com http://productsearch.spaces.live.com/ -id_g_m_1007 MSNBOT/0.xx (http://search.msn.com/msnbot.htm) MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx R s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search... http://search.msn.com -id_g_m_1008 msnbot/x.xx ( http://search.msn.com/msnbot.htm) MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx R s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search... http://search.msn.com -id_g_m_190108_2 MSNBOT_Mobile MSMOBOT Mozilla/2.0 (compatible; MSIE 4.02; Windows CE; Default) Microsoft search for mobiles R 65.55.241.2xx http://livesearchmobile.com/?mid=1011 -id_g_m_1009 MSNPTC/1.0 MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx R s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search... http://search.msn.com -id_g_m_1010 MSProxy/2.0 Microsoft proxy server P http://www.microsoft.com/isaserver/evaluation/previousversions/default.mspx -id_g_m_181205_3 MSRBOT MacEdition CodeBitch link checking C http://www.macedition.com/cb/cb_20030310.php -id_g_m_270407_1 MSRBOT (http://research.microsoft.com/research/sv/msrbot) Microsoft MSRBot R http://research.microsoft.com/research/sv/msrbot/ -id_g_m_070406_3 Mulder, VCR-1.0 StreamBox VCR user agent D http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm -id_g_m_1011 multiBlocker browser Multiblocker (Fantomaster) anonymity software user P http://multiblocker.com/home.html http://fantomaster.com -id_g_m_030807_1 multicrawler ( http://sw.deri.org/2006/04/multicrawler/robots.html) MultiCrawler for DERI Galway's Semantic Web Search Engine cluster R 140.203.154.1xx http://sw.deri.org/2006/04/multicrawler/robots.html http://sw.deri.ie/ -id_g_m_1012 MultiText/0.1 Virginia Tech Digital Library Research Laboratory robot R http://www.dlib.vt.edu -id_g_m_1013 MusicWalker2.0 ( http://www.somusical.com) SoMusical! musical directory link checking R http://www.somusical.com -id_g_m_270306_1 MVAClient Unknown bad bot from diff. Taiwanese IPs S see this blog: http://www.tenspider.com/business-blog/weblog.php -id_g_m_241105_1 My WinHTTP Connection Windows HTTP Services (WinHTTP) http://msdn.microsoft.com/library/?url=/library/en-us/winhttp/http/about_winhttp.asp -id_g_m_1014 myDaemon unknown user robot (24.124.34.42) -id_g_m_1015 MyGetRight/1.0.0 GetRight download manager D http://www.getright.com -id_g_m_1016 MyGetRight/1.0b GetRight download manager D http://www.getright.com -id_g_m_1017 Mylinea.com Crawler 2.0 Mylinea France web catalogue crawler R http://www.mylinea.com -id_g_m_040906_1 mylinkcheck/1.02 VDOG - SEO webdirecory (Germany) link checking C http://www.vdog.de/ -id_n_s_1018 Naamah 1.0.1/Blogbot (http://blogbot.de/) Blogbot (Germany) robot R http://blogbot.de/ -id_n_s_1019 Naamah 1.0a/Blogbot (http://blogbot.de/) Blogbot (Germany) robot R http://blogbot.de/ -id_n_s_1021 NABOT/5.0 Naver Japan / Korea robot R s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot http://www.naver.co.jp/ -id_n_s_1020 nabot_1.0 Naver Japan / Korea robot R s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot http://www.naver.co.jp/ -id_n_s_180408_4 NameOfAgent (CMS Spider) Badbot searching for Wordpress wp-login.php S -id_n_s_071205_1 naoFavicon4IE/1.xx naoFavicon4IE D http://nao4u.com/software/naoFavicon4IE/ -id_n_s_140506_2 NASA Search 1.0 Unknown spambot / harvester from diff. IPs S http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1 -id_n_s_1022 NationalDirectory-WebSpider/1.3 Nationaldirectory spider R http://www.nationaldirectory.com/ -id_n_s_1023 NationalDirectoryAddURL/1.0 Nationaldirectory spider R http://www.nationaldirectory.com/ -id_n_s_1025 NaverBot-1.0 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com) Naver Japan / Korea robot R s. also Python-urllib/1.15- nabot- cowbot & dloader http://www.naver.co.jp/ -id_n_s_1024 NaverBot_dloader/1.5 Naver Japan / Korea robot R s. also Python-urllib/1.15 - nabot - cowbot & dloader http://www.naver.co.jp/ -id_n_s_181205_1 NavissoBot Navisso closed beta robot (69.41.162.1xx) R http://navisso.com/ -id_n_s_181205_2 NavissoBot/1.7 (+http://navisso.com/) Navisso closed beta robot (69.41.162.1xx) R http://navisso.com/ -id_n_s_1026 NCSA Beta 1 (http://vias.ncsa.uiuc.edu/viasarchivinginformation.html) Vias Information Archival robot R http://vias.ncsa.uiuc.edu/ -id_n_s_250507_1 Nebullabot/2.2 (http://bot.nebulla.info) Nebulla.info distributed crawler (Germany) R 81.169.180.2xx http://www.nebulla.info/ http://bot.nebulla.info/ -id_n_s_1027 NEC Research Agent -- compuman at research.nj.nec.com NEC Researchindex robot - now CiteSeer.IST scientific document index R http://citeseer.ist.psu.edu/ -id_n_s_1028 NEC-Hayek/1.0 rcn.com user agent ? NEC Researchindex robot ? s. NEC Research Agent -id_n_s_291108_4 Net-Seekr Bot/Net-Seekr Bot V1 (http://www.net-seekr.com) Net Seekr search robot R 78.129.201.19x http://www.net-seekr.com/ -id_n_s_1029 NetAnts/1.2x NetAnts download manager D http://www.netants.com/en/index.html -id_n_s_1030 NETCOMplete/x.xx NetComplete IE browser package B http://www.netcom.net.uk/ -id_n_s_010807_2 NetinfoBot/1.0 (http://netinfo.bg/netinfobot.html) Netinfo.bg search (Bulgaria) robot R 194.153.145.x[xx] http://netinfo.bg/ -id_n_s_1031 NetLookout/2.24 Netlookout internet notifier R site is offline http://www.frugalsoft.com -id_n_s_230406_3 Netluchs/0.8-dev ( ; http://www.netluchs.de/; ___don't___spam_me_@netluchs.de) Netluchs (Germany) search (193.164.8.xx) R Same IP-range as Metager search - powered by Nutch http://www.netluchs.de/ -id_n_s_1032 NetMechanic Vx.0 NetMechanic link checker C http://www.netmechanic.com/ -id_n_s_030906_1 NetNewsWire/2.x (Mac OS X; http://ranchero.com/netnewswire/) NewsGator NetNewsWire - Mac RSS feed reader B http://www.newsgator.com/NGOLProduct.aspx?ProdID=NetNewsWire -id_n_s_1033 NetNoseCrawler/v1.0 unknown InCom (216.0.107.xx) robot R http://www.incom.net/ -id_n_s_1034 Netprospector JavaCrawler Netprospector metasearch software R http://www.actaddons.com/products/netprospector.asp -id_n_s_1035 NetPumper/x.xx Netpumper download manager D http://www.netpumper.com/ -id_n_s_1036 NetResearchServer(http://www.look.com) Look.com robot (209.87.232.x) R http://www.look.com/ -id_n_s_1037 NetResearchServer/x.x(loopimprovements.com/robot.html) IncyWincy search engine using DMOZ database R http://www.loopimprovements.com/ -id_n_s_140209_5 NetSeer/Nutch-0.9 (NetSeer Crawler; http://www.netseer.com; crawler@netseer.com) NetSeer search (beta) crawler via Amazon Web Services - see also Teemer R 67.202.26.1xx http://www.netseer.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_n_s_150906_2 NetSprint -- 2.0 Wirtualna Polska / Netsprint search (Poland) robot R 212.77.102.1xx http://www.wp.pl/ http://www.netsprint.pl/serwis/ -id_n_s_190306_1 NetWhatCrawler/0.06-dev (NetWhatCrawler from NetWhat.com; http://www.netwhat.com; support@netwhat.com) NetWhat Search crawler (69.9.167.1xx) R http://www.netwhat.com/ -id_n_s_1038 NetZippy Netzippy robot R site is closed http://www.netzippy.com/ -id_n_s_1039 NeuralBot/0.2 unknown -id_n_s_1040 newsearchengine (ThisUser@unspecified.mail) Unknown (12.238.4.xxx) attbi.com client robot -id_n_s_250707_3 NewsGator FetchLinks extension/0.2.0 (http://graemef.com) FetchLinks plugin for NewsGator RSS reader B http://graemef.com/project/fetchlinks -id_n_s_250707_4 NewsGatorOnline/2.0 (http://www.newsgator.com; 1 subscribers) NewsGator online RSS reader B 64.78.155.1xx http://www.newsgator.com/ -id_n_s_1041 NextGenSearchBot 1 (for information visit http://www.eliyon.com/NextGenSearchBot) Eliyon Crawler for Business People Search R http://www.eliyon.com/NextGenSearchBot -id_n_s_1042 NextopiaBOT (+http://www.nextopia.com) distributed crawler client beta v0.x Nextopia crawler R http://www.nextopia.com/ -id_n_s_060906_1 NG-Search/0.90 (NG-SearchBot; http://www.ng-search.com; ) find your keywords - semantic search (Germany) robot R 84.56.87.1xx http://www.ng-search.com/ -id_n_s_1043 NG/1.0 Exalead (France) search robot (193.47.80.xx) R s. Harvest-NG/1.0.2 and Exalead NG... http://www.exabot.com/ -id_n_s_050406_3 NG/4.0.1229 Exalead Websearch image crawler (193.47.80.xx) R s. also Exabot-Images/1.0 http://www.exalead.com/search -id_n_s_071106_1 nicebot Unknown UA from PlanetLab distributed network 128.8.126.xx http://planetlab2.cs.umd.edu/ -id_n_s_1044 NICO/1.0 NicoZone childsafe search robot R P -site is offline- http://www.nicozone.net/ -id_n_s_291007_2 Nikita the Spider (http://NikitaTheSpider.com/) Nikita the Spider - Online HTML validation , link checking C 69.61.23.11x http://nikitathespider.com/ -id_n_s_1045 NITLE Blog Spider/0.01 Experimental LSI (?) robot from 140.233.69.xx (Middlebury.edu) R http://javelina.cet.middlebury.edu/lsa/out/lsa_intro.htm -id_n_s_1046 Nitro Downloader 1.x (www.klsofttools.com) Download manager D http://www.klsofttools.com -id_n_s_1047 Noago Spider Noago spider R http://www.noago.com/ -id_n_s_1048 Nocilla/1.0 telefonica.es user robot -id_n_s_1049 Nokia-WAPToolkit/1.2 googlebot(at)googlebot.com Google WAP robot R http://www.google.com/ -id_n_s_290708_3 Nokia6300/2.0 (05.50) Profile/MIDP-2.0 Configuration/CLDC-1.1 (botmobi http://find.mobi/bot.html abuse@mtld.mobi) Botmobi crawler for Find.mobi mobile search C http://find.mobi/bot.html http://find.mobi/ -id_n_s_200108_3 Nokia6610/1.0 (3.09) Profile/MIDP-1.0 Configuration/CLDC-1.0 (compatible;YahooSeeker/M1A1-R2D2; http://help.yahoo.com/help/us/ysearch/crawling/crawling-01.html) YahooSeeker/M1A1-R2D2 - Yahoo mobile web crawling robot R 68.180.2xx.[x]xx http://help.yahoo.com/l/us/yahoo/search/mobilecrawler/mobilecrawler-01.html -id_n_s_1050 Nokia7110/1.0 (05.01) (Google WAP Proxy/1.0) Google WAP proxy P http://www.google.com/ -id_n_s_1051 NokodoBot/1.x (+http://nokodo.com/bot.htm) Nokodo public beta search robot (67.18.222.xx) R http://www.nokodo.com/ -id_n_s_1052 Norbert the Spider(Burf.com) Burf.com UK Search Engine robot R http://www.burf.com/ -id_n_s_1053 noxtrumbot/1.0 (crawler@noxtrum.com) noXtrum search robot (Spain) R 194.224.199.xx http://www.noxtrum.com/ -id_n_s_040506_2 noyona_0_1 Noyona job search (preview) R 207.210.106.1xx http://www.noyona.com/index.pl -id_n_s_1054 NP/0.1 (NP; http://www.nameprotect.com; npbot@nameprotect.com) Nameprotect copyright search robot (24.177.134.x) R s. also - aipbot/1.0 (aipbot; http://www.aipbot.com... - NPBot ... http://www.nameprotect.com/ -id_n_s_1553 NPBot (http://www.nameprotect.com/botinfo.html) Nameprotect copyright search robot (24.177.134.x) R http://www.nameprotect.com/ -id_n_s_1552 NPBot-1/2.0 Nameprotect copyright search robot (24.177.134.x) R http://www.nameprotect.com/ -id_n_s_291205_3 Nsauditor/1.x Nsauditor Network Security Auditor S http://www.nsauditor.com/ -id_n_s_1055 NSPlayer/10.0.0.xxxx WMFSDK/10.0 NetShow Media Player = Windows Media Player 10 B -id_n_s_281207_2 nsyght.com/Nutch-1.0-dev (nsyght.com; Nsyght.com) Nsyght social search application R http://search.nsyght.com/ -id_n_s_161007_1 nsyght.com/Nutch-x.x (nsyght.com; search.nsyght.com) Nsyght social search application R http://search.nsyght.com/ -id_n_s_1056 nttdirectory_robot/0.9 (super-robot@super.navi.ocn.ne.jp) NTT Directory robot R http://navi.ocn.ne.jp/ -id_n_s_180206_1 Nucleus SiteList LinkChecker/1.1 Nucleus CMS SiteList link managing plugin C http://wakka.xiffy.nl/sitelist -id_n_s_1058 nuSearch Spider www.nusearch.com (compatible; MSIE 4.01) nuSearch spider (84.9.136.xxx) R http://www.nusearch.com/ -id_n_s_1057 NuSearch Spider (compatible; MSIE 6.0) nuSearch spider (84.9.136.xxx) R http://www.nusearch.com/ -id_n_s_1059 NuSearch Spider www.nusearch.com nuSearch spider (84.9.136.xxx) R http://www.nusearch.com/ -id_n_s_1060 Nutch Nutch open source robot R http://www.nutch.org/docs/bot.html -id_n_s_211107_1 Nutch crawler/Nutch-0.9 (picapage.com; admin@picapage.com) Picapage search for handheld devices using Nutch R http://picapage.biz/ -id_n_s_230408_1 Nutch/Nutch-0.9 (Eurobot; http://www.ayell.eu ) Ayell Euronet business directory robot using Nutch R http://www.ayell.eu/ -id_n_s_120406_1 NutchCVS/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net) Netsweeper content filtering engine (66.207.120.2xx) powered by Nutch P uses also: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.5) Gecko/20041107 Firefox/1.0 http://www.netsweeper.com/ -id_n_s_1061 NutchCVS/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net) Nutch open source robot R http://www.nutch.org/docs/bot.html -id_n_s_010406_1 NutchCVS/0.7.1 (Nutch running at UW; http://www.nutch.org/docs/en/bot.html; sycrawl@cs.washington.edu) Robot from University of Washington Computer Science & Engineering (128.208.6.2xx) R powered by Nutch http://qbert.cs.washington.edu/ -id_n_s_251006_2 NutchEC2Test/Nutch-0.9-dev (Testing Nutch on Amazon EC2.; http://lucene.apache.org/nutch/bot.html; ec2test at lucene.com) Amazon Elastic Compute Cloud (Amazon EC2) robot R 216.182.236.xx http://www.amazon.com/b/ref=sc_fe_l_2/104-6713356-1433533?ie=UTF8&node=201590011&no=3435361&me=A36L942TSJ2AJA -id_n_s_1062 NutchOrg/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net) Nutch open source robot R http://www.nutch.org/docs/bot.html -id_n_s_210108_1 nutchsearch/Nutch-0.9 (Nutch Search 1.0; herceg_novi at yahoo dot com) Unknown robot using Nutch (maybe private crawling) via Cox network (70.187.130.25x) R reads robots.txt http://lucene.apache.org/nutch/ -id_n_s_041106_1 NutchVinegarCrawl/Nutch-0.8.1 (Vinegar; http://www.cs.washington.edu; eytanadar at gmail dot com) Unknown crawler from University of Washington - Computer science R 128.208.3.1xx http://www.cs.washington.edu/ -id_n_s_1063 obidos-bot (just looking for books.) Weblog bookwatch robot R http://www.onfocus.com/bookwatch/ -id_n_s_1064 ObjectsSearch/0.01-dev (ObjectsSearch;http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com) Objects Search robot R http://www.objectssearch.com/ -id_n_s_1065 ObjectsSearch/0.0x (ObjectsSearch; http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com) Objects Search robot R http://www.objectssearch.com/ -id_n_s_1066 oBot ((compatible;Win32)) Cobion Germany Brand Protection Services robot R http://www.cobion.com/ -id_n_s_1067 Ocelli/1.x (http://www.globalspec.com/Ocelli) GlobalSpec Engineering Search robot (66.194.55.xxx) R http://www.globalspec.com/ -id_n_s_1068 Octopus Octopus download manager D http://moskalyuk.com/octopus/ -id_n_s_230306_1 Octora Beta - www.octora.com Octora blog or RSS information crawler - beta (66.228.114.xx) R http://www.octora.com/ -id_n_s_230606_4 Octora Beta Bot - www.octora.com Octora RSS feed search R 66.228.114.xx http://www.octora.com/ -id_n_s_1069 Offline Explorer 1.* Meta Products Offlinebrowser B D http://www.metaproducts.com/ -id_n_s_1070 OliverPerry Claymont robot / Internetseer Web Site Monitoring R C http://www.claymont.com/ -id_n_s_1071 OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Internet CategorizerOmniExplorer http://www.omni-explorer.com/ car & shopping search (64.62.175.xxx) OmniExplorer car & shopping search (64.62.175.xxx) R based on YottaCars... (see there) http://www.omni-explorer.com -id_n_s_1072 OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Job Crawler OmniExplorer car & shopping search (64.62.175.xxx) R based on YottaCars... (see there) http://www.omni-explorer.com -id_n_s_1073 OmniExplorer_Bot/1.1x (+http://www.omni-explorer.com) Torrent Crawler OmniExplorer car & shopping search (64.62.175.xxx) R based on YottaCars... (see there) http://www.omni-explorer.com -id_n_s_1074 OmniExplorer_Bot/x.xx (+http://www.omni-explorer.com) WorldIndexer OmniExplorer car & shopping search (64.62.175.xxx) R based on YottaCars... (see there) http://www.omni-explorer.com -id_n_s_290106_3 onCHECK Linkchecker von www.scientec.de fuer www.onsinn.de onsearch.de German web directory link checking C 85.176.108.2xx http://www.onsearch.de/ -id_n_s_290106_2 onCHECK-Robot, www.onsearch.de onsearch.de German web directory link checking C 85.176.108.2xx http://www.onsearch.de/ -id_n_s_1075 Onet.pl SA- http://szukaj.onet.pl onet.pl Szukaj (Search) robot (213.180.128.1xx) R s. also - Mozilla/5.0 (compatible; OnetSzukaj/5.0.... http://szukaj.onet.pl/ -id_n_s_1076 online link validator (http://www.dead-links.com/) Dead-Links.com link validation spider C http://www.dead-links.com/ -id_n_s_040206_3 Online24-Bot (Version: 1.0x, powered by www.online24.de) Online24 shopping portal (Germany) link checking C http://www.online24.de/ -id_n_s_1077 OntoSpider/1.0 libwww-perl/5.65 OntoSpider - Dutch robot for a research project. (195.11.244.xx) R http://ontospider.i-n.info -id_n_s_030110_6 OOZBOT/0.20 ( http://www.setooz.com/oozbot.html ; agentname at setooz dot_com ) SeetooZ search crawler R 67.215.230.xx http://www.setooz.com/ -id_g_m_280508_4 OpenAcoon v4.0.x (www.openacoon.de) OpenAcoon open source search engine (used by Acoon search) R (80.237.209.xx) http://www.openacoon.de/ http://www.acoon.de/ -id_n_s_1078 Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html) Openfind.com.tw robot R http://www.openfind.com.tw/ -id_n_s_1079 Openfind data gatherer- Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html) Openfind.com.tw robot R http://www.openfind.com.tw/ -id_n_s_1080 Openfind Robot/1.1A2 Openfind.com.tw robot R http://www.openfind.com.tw/ -id_n_s_250107_2 OpenISearch/1.x (www.openisearch.com) open i search robot - search engine in development R 216.182.236.1xx http://www.openisearch.com/ -id_n_s_291105_4 OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm) Opentagger social bookmarking system R http://www.opentagger.com/ -id_n_s_1081 OpenTextSiteCrawler/2.9.2 OpenText crawler R http://www.opentext.net/ -id_n_s_310806_1 OpenWebSpider/0.x.x (http://www.openwebspider.org) OpenWebSpider - Open Source web search engine R http://www.openwebspider.org/ -id_n_s_1082 OpenWebSpider/x OpenWebSpider - Open Source web search engine R http://www.openwebspider.org/ -id_n_s_1083 Opera/5.0 (Linux 2.0.38 i386; U) [en] Opera 5.0 Linux B -id_n_s_1084 Opera/5.11 (Windows ME; U) [ru] Opera 5.11 faked WinME referer B -id_n_s_1085 Opera/5.12 (Windows 98; U) [en] Opera 5.12 Win98 B -id_n_s_1086 Opera/6.01 (larbin@unspecified.mail) unknown robot from gw.ocg-corp.com (209.126.176.x) see also: - MSIE-5.13 (larbin@.....) - WinampMPEG/2.00 larbin@.... -id_n_s_1087 Opera/6.x (Linux 2.4.8-26mdk i686; U) [en] Opera 6.x- Mandrake Linux B -id_n_s_1088 Opera/6.x (Windows NT 4.0; U) [de] Opera 6.x WinNT B -id_n_s_1089 Opera/7.x (Windows NT 5.1; U) [en] Opera 7.x WinXP B -id_n_s_1090 Opera/8.xx (Windows NT 5.1; U; en) Opera 8.x (Beta) WinXP B -id_n_s_141105_2 Opera/9.0 (Windows NT 5.1; U; en) Opera 9 (Beta) Browser B http://snapshot.opera.com/ -id_n_s_250606_1 Opera/9.00 (Windows NT 5.1; U; de) Opera 9 (final) B http://www.opera.com/ -id_n_s_201008_1 Opera/9.60 (Windows NT 5.1; U; de) Presto/2.1.1 Opera browser 9.6x on WinXP (Presto = Operas rendering engine) B http://my.opera.com/ODIN/blog/a-look-under-the-hood-of-opera-9-6 -id_n_s_1091 OpidooBOT (larbin2.6.3@unspecified.mail) Opidoo Search Belgium robot (62.4.83.xxx) R http://www.opidoo.com/ -id_n_s_080208_1 OPWV-SDK UP.Browser/7.0.2.3.119 (GUI) MMP/2.0 Push/PO Open Wave Phone Simulator SDK B http://developer.openwave.com/dvl/tools_and_sdk/phone_simulator/ -id_n_s_190406_2 Oracle Application Server Web Cache 10g Oracle Application Server cache P http://www.oracle.com/appserver/index.html -id_n_s_1092 Oracle iMTCrawler Oracle interMedia Text - Text and web documents indexing D http://www.oracle.com/technology//products/text/index.html -id_n_s_1093 Oracle Ultra Search Oracle Search R http://www.oracle.com/ -id_n_s_220306_1 OrangeSpider Orangeslicer semantic search (Beta) Germany (193.201.52.1xx) R http://www.orangeslicer.com/ -id_n_s_1094 Orbiter/T-2.0 (+http://www.dailyorbit.com/bot.htm) Orbiter - DailyOrbit search spider R http://www.dailyorbit.com/ -id_n_s_150206_1 Orca Browser (http://www.orcabrowser.com) Orca browser - based on Gecko B http://www.orcabrowser.com -id_n_s_251205_1 OSSProxy 1.3.305.321 (Build 305.321 Win32 en-us)(Dec 21 2005 16:30:54) Marketscore (was Netsetter) internet accelerator P Spyware proxy service http://www.marketscore.com/Home.aspx -id_n_s_141105_1 OutfoxBot/0.x (For internet experiments; http://; outfox.agent@gmail.com) Unknown robot from Chinanet (220.181.8.xxx) -id_n_s_221106_1 OutfoxMelonBot/0.5 (for internet experiments; http://; outfoxbot@gmail.com) Unknown robot from Chinanet (60.191.80.1) -id_n_s_1095 Overture-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp) Overture/Fast/Alltheweb crawler (66.77.73.xxx) R http://www.alltheweb.com/ -id_n_s_1096 OWR_Crawler 0.1 Unknown robot from 198.169.127.xx (innovationplace.com) -id_n_s_090906_1 ozelot/2.7.3 (Search engine indexer; www.flying-cat.de/ozelot; ozelot@flying-cat.de) Ozelot - Flying Cat's search engine robot (Germany) R 87.139.106.xx http://www.flying-cat.de/ozelot/ -id_n_s_290108_2 PADLibrary Spider PADLibrary.com - PAD file software robot for FindFiles.com R 72.167.37.20x http://padlibrary.com/ http://www.findfiles.com/ -id_n_s_150207_3 PageBitesHyperBot/600 (http://www.pagebites.com/) Pagebites job search crawler R 208.185.247.xx http://www.pagebites.com/ -id_n_s_111206_1 Pagebull http://www.pagebull.com/ Pagebull visual search engine R 209.9.228.1xx http://www.pagebull.com/ -id_n_s_051207_3 Pagestacker Bot Pagestacker online bookmark service C 70.85.129.12x http://www.pagestacker.com/ -id_n_s_290506_1 page_verifier (http://www.securecomputing.com/goto/pv) Secure Computing SmartFilter Tools - malware crawler R 206.169.110.xx http://www.securecomputing.com/PageVerifier.cfm -id_n_s_1097 PagmIEDownload Downloadmanager ? D -id_n_s_1098 parallelContextFocusCrawler1.1parallelContextFocusCrawler1.1 CFC crawler used by Italian academic and research network (GARR) R http://www.garr.it/ -id_n_s_1099 ParaSite/1.0b (http://www.ianett.com/parasite/) http://www.ianett.com robot R http://www.ianett.com/ -id_n_s_1100 Patwebbot (http://www.herz-power.de/technik.html) Patsearch (Germany) robot R http://www.herz-power.de/ -id_n_s_1101 pavuk/0.9pl29b i686-pc-linux-gnu Pavuk web downloading program for Unix D http://www.idata.sk/%7Eondrej/pavuk/about.html -id_n_s_1102 PBrowse 1.4b Some site scanning tool via diff. IPs- i.e.: - cox.net (68.4.xxx.xxx) S - UA sometimes DSurf15a -id_n_s_1103 pd02_1.0.0 pd02_1.0.0@dzimi@post.sk Post.sk / Eurotel.sk robot R -id_n_s_1104 PEAR HTTP_Request class ( http://pear.php.net/ ) Pear HTTP_Request PHP extension package http://pear.php.net/ -id_n_s_1105 PEERbot www.peerbot.com Peerbot - favicon search robot R http://www.peerbot.com/ -id_n_s_1106 PeopleChat/Search_Engine Unknown robot from 64.5.48.xxx (Plethoric.net) -id_n_s_1107 PEval 1.4b Some site scanning tool via diff. IPs S s. DBrowse- PSurf etc. -id_n_s_1108 PHP/3.x.xx diff. IPs / services -id_n_s_1109 PHP/4.0.4pl1 diff. IPs / services -id_n_s_1110 PHP/4.0.6 diff. IPs / services- i.e.: -NTT/Verio Inc. link checker C in conjunction w. Weblink's Checker UA http://www.verio.com/ -id_n_s_1111 PHP/4.1.1 diff. IPs / services- i.e.: - Phenominet.com link checking C http://www.phenominet.com -id_n_s_1112 PHP/4.1.2 diff. IPs / services- i.e.: - 209.114.200.xx = MyNetCrawler link checking - 216.139.207.xxx = Mixcat crawler Mixcat s. also Felix and Morris http://mynetcrawler.com/ http://mixcat.com -id_n_s_1113 PicoSearch/1.0 Pico Search robot R http://www.picosearch.com/ -id_n_s_010506_3 Piffany_Web_Scraper_v0.x Piffany targeted search web spider R http://www.piffany.com/ http://www.piffany.com/spider.html -id_n_s_010506_2 Piffany_Web_Spider_v0.x Piffany targeted search web spider R http://www.piffany.com/ http://www.piffany.com/spider.html -id_n_s_1114 PigeonBot1.0 BETA Whois Source domain name information robot (66.249.26.xx)- s.also: - SurveyBot R C http://www.whois.sc/ -id_n_s_1115 PingALink Monitoring Services 1.0 PingALink website monitoring R C http://www.pingalink.com/ -id_n_s_1116 PingALink Monitoring Services 1.0 (http://www.pingalink.com) PingALink website monitoring R C http://www.pingalink.com/ -id_n_s_120607_1 Pingdom GIGRIB (http://www.pingdom.com) Pingdom web site monitoring C 66.98.148.xx http://www.pingdom.com/ -id_n_s_1117 pipeLiner/0.3a (PipeLine Spider;http://www.pipeline-search.com/webmaster.html; webmaster'at'pipeline-search.com) pipeline search (DMOZ based) search robot (24.106.39. xxx) R http://www.pipeline-search.com/ -id_n_s_1118 pipeLiner/0.xx (PipeLine Spider; http://www.pipeline-search.com/webmaster.html) pipeline search (DMOZ based) search robot (24.106.39. xxx) R http://www.pipeline-search.com/ -id_n_s_1119 Pita Pita crawler R now WebVac s. there http://www-diglib.stanford.edu/~testbed/doc2/WebBase/webbase-pages.html -id_n_s_1120 Pizilla++ ver 2.45 Private user-agent via Hurricane Electric Internet Services B ? http://www.he.net/ -id_n_s_1121 PJspider/3.0 (pjspider@portaljuice.com; http://www.portaljuice.com) Portaljuice spider R http://www.portaljuice.com/ -id_n_s_121106_1 Plagger/0.x.xx (http://plagger.org/) Plagger - pluggable RSS/Atom feed aggregator written in Perl B http://plagger.org/trac -id_n_s_1122 PlagiarBot/1.0 unknown ucsd.edu robot R -id_n_s_1123 PlantyNet_WebRobot_V1.9 dhkang@plantynet.com Plantynet web filtering services - Blacklist DB robot R P http://www.plantynet.com/ -id_n_s_120106_1 plinki/0.1 (you got plinked! (thats a good thing..); http://www.plinki.com; crawl@plinki.com) Unknown UA from 66.220.23.2xx Doesn't read robots.txt - Plinki.com's website has no content http://www.plinki.com/ -id_n_s_061206_2 PluckFeedCrawler/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://www.pluck.com; 1 subscribers) Pluck RSS feed crawler R 66.179.81.1xx http://www.pluck.com/ -id_n_s_140807_1 Pluggd/Nutch-0.9 (automated crawler http://www.pluggd.com;support at pluggd dot com) Pluggd Podcast search engine R 209.85.62.1xx http://www.pluggd.com/ -id_n_s_1124 Pockey-GetHTML/4.12.0 (Win32; GUI; ix86) Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan D http://www.vector.co.jp/soft/win95/net/se077067.html -id_n_s_1125 Pockey-GetHTML/x.xx Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan D http://www.vector.co.jp/soft/win95/net/se077067.html -id_n_s_1126 Pockey/x.x.x Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan D http://www.vector.co.jp/soft/win95/net/se077067.html -id_n_s_1127 Pockey7.x.x(WIN32GUI) Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan D http://www.vector.co.jp/soft/win95/net/se077067.html -id_n_s_1128 POE-Component-Client-HTTP/0.64 (perl; N; POE; en; rv:0.640000) HTTP user-agent for POE (portable networking framework for Perl ) http://search.cpan.org/dist/POE-Component-Client-HTTP/HTTP.pm -id_n_s_291105_2 Poirot ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx S appears also as LWP::Simple/5.803 - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) http://spamhuntress.com/wiki/Manila_Industries -id_n_s_1129 polybot 1.0 (http://cis.poly.edu/polybot/) Polybot webcrawler R http://cis.poly.edu/polybot/ -id_n_s_1130 Pompos/1.x http://dir.com/pompos.html Dir.com / Iliad French recherche robot R http://www.iliad.fr/ -id_n_s_1131 Pompos/1.x pompos@iliad.fr Iliad / Free French recherche robot R http://www.iliad.fr/ -id_n_s_1132 Popdexter/1.0 Popdex - web site popularity crawler R http://www.popdex.com/ -id_n_s_1133 Port Huron Labs Unknown spam bot / harvester (63.223.10.***) S s. also - Wells Search II -id_n_s_1134 PortalBSpider/2.0 (spider@portalb.com) PortalB (now Alacra search) spider R http://www.portalb.com/alacra/index.htm -id_n_s_080706_2 portalmmm/2.0 S500i(c20;TB) portalmmm IMode mobile browser B -id_n_s_1135 PostFavorites Yahoo (66.94.237.1xx / 216.109.121.xx) favorites tracking robot C -id_n_s_1136 potbot 1.0 Potbot : A simple IRC bot written in Perl R http://sourceforge.net/projects/potbot/ -id_n_s_050408_2 PRCrawler/Nutch-0.9 (data mining development project; crawler@projectrialto.com) Project Rialto - data mining development project R http://projectrialto.com/index.html -id_n_s_1137 PrivacyFinder Cache Bot v1.0 CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements R http://cups.cs.cmu.edu/ http://privacybird.com/ -id_n_s_111205_2 PrivacyFinder/1.1 CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements R http://cups.cs.cmu.edu/ http://privacybird.com/ -id_n_s_1138 Privoxy/3.0 (Anonymous) Privoxy web proxy P s.also (Privoxy/1.0) http://www.privoxy.org/ -id_n_s_1139 Production Bot 0116B Some site scanning tool from diff. IPs- i.e.: - 67.99.33.x (lightningcon.broadwing.net) S -id_n_s_1140 Production Bot 2016B Some site scanning tool from diff. IPs- i.e.: - 216.232.64.xx (telus.net) S -id_n_s_1141 Production Bot DOT 3016B Some site scanning tool from diff. IPs- i.e.: - 141.154.181.xxx (east.verizon.net) S -id_n_s_1142 Program Shareware 1.0.2 Some spam bot S - see here: http://www.kloth.net/internet/badbots-2004.php http://www.kloth.net/internet/badbots-2004.php -id_n_s_1143 Progressive Download unknown -id_n_s_1144 Progressive Download HTTP check unknown -id_n_s_1145 Project XP5 [2.03.07-111203] XP5 robot R http://marty.anstey.ca/projects/robots/index.html -id_n_s_1146 PROve AnswerBot 4.0 Answerchase PROve Answerbot R http://www.answerchase.com/ -id_n_s_1147 ProWebGuide Link Checker (http://www.prowebguide.com) ProWebguide robot R http://www.prowebguide.com/ -id_n_s_1148 psbot/0.1 (+http://www.picsearch.com/bot.html) Picsearch robot (62.119.21.13x) R http://www.picsearch.com/ -id_n_s_1149 PSurf15a 11 Some site scanning tool via diff. IPs- i.e.: QWest Net S -id_n_s_1150 PSurf15a 51 Some site scanning tool via diff. IPs- i.e.: Optonline net (24.191.xxx.xxx) S -id_n_s_1151 PSurf15a VA Some site scanning tool via diff. IPs- i.e.: - choiceone.net (216.153.xxx.xxx) - attbi.com (12.250.xxx.xxx) - optonline.net (24.191.xxx.xxx) S UA sometimes SSurf15a 11 or random letters like RXMYRCJ -id_n_s_160606_1 psycheclone Unknown website grabbing / ripping for unknown purposes from 208.66.195.x - Digitalinfinity.org Russia S no active website -id_n_s_1152 PubCrawl (pubcrawl.stanford.edu) Some robot from Stanford University (171.64.75.xxx = PubCrawl.Stanford.EDU) R -id_n_s_1153 puf/0.91beta6a (Linux 2.2.18; i686) Parallel URL Fetcher downloading tool D http://puf.sourceforge.net/ -id_n_s_1154 puf/0.93.2a (Linux 2.4.18; i686) Parallel URL Fetcher downloading tool D http://puf.sourceforge.net/ -id_n_s_130407_1 pulseBot (pulse Web Miner) WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx) R s. also RufusBot http://www.webaroo.com/index http://www.webaroo.com/company/site-owners -id_n_s_1155 PureSight PureSight Internet content filter P http://www.puresight.com/Products/PureSightHomeDescription.shtml -id_n_s_1156 PuxaRapido v1.0 Puxa Rapido download manager D http://www.puxarapido.com.br/ -id_n_s_230907_2 PWeBot/1.2 Inspector (http://www.programacionweb.net/robot.php) ProgramacionWeb.net PWeBot link checking (Argentina) R 62.149.236.2xx http://www.programacionweb.net/robot-en.php http://www.programacionweb.net/ -id_n_s_1157 PycURL Fast Search robot (using PycURL Python component- s. below) R http://www.fastsearch.net/ http://pycurl.sourceforge.net/ -id_n_s_060107_1 PycURL/7.xx.x PycURL - Python interface to libcurl D http://pycurl.sourceforge.net/ -id_n_s_1158 Python-urllib/1.1x Python URL fetcher - robot used by Naver Japan/Korea R s. also nabot- dloader- NaverBot & Cowbot http://www.indyproject.org/ http://www.python.org/ -id_n_s_1159 Python-urllib/2.0a1 Python URL fetcher - robot used by Google R http://labs.google.com http://www.python.org/ -id_n_s_1160 Qango.com Web Directory (http://www.qango.com/) Qango.com Web Directory robot R http://www.qango.com/ -id_n_s_170408_1 QEAVis Agent/Nutch-0.9 (Quantitative Evaluation of Academic Websites Visibility; http://nlp.uned.es/qeavis QEAVis: Quantitative Evaluation of Academic Websites Visibility using Nutch R 83.33.209.10x http://nlp.uned.es/qeavis/ -id_n_s_1161 QPCreep Test Rig ( We are not indexing- just testing ) Quepasa!com (Latin American search) robot R http://www.quepasa.com/ -id_n_s_1162 QuepasaCreep ( crawler@quepasacorp.com ) Quepasa!com (Latin American search) robot R http://www.quepasa.com/ -id_n_s_1163 QuepasaCreep v0.9.1x Quepasa!com (Latin American search) robot R http://www.quepasa.com/ -id_n_s_1164 QueryN Metasearch QueryN Metasearch robot R http://www.queryn.com/queryn/ -id_n_s_230108_2 Quicksilver (Blacktree,MacOSX) Blacktrees Quicksilver helper application for Mac B http://docs.blacktree.com/quicksilver/what_is_quicksilver -id_n_s_230606_3 QuickTime\xaa.7.0.4 (qtver=7.0.4;cpu=PPC;os=Mac 10.3.9) Quicktime for Macintosh B -id_n_s_060107_4 QweeryBot/3.01 ( http://qweerybot.qweery.nl) Qweerybot for the Qweery search engine (in development) - Netherland R 85.158.204.2xx http://qweerybot.qweery.nl/ -id_n_s_060107_3 Qweery_robot.txt_CheckBot/3.01 (http://qweerybot.qweery.com) Qweerybot for the Qweery search engine (in development) - Netherland R 85.158.204.2xx http://qweerybot.qweery.nl/ -id_n_s_160208_1 R6_CommentReader_(www.radian6.com/crawler) Radian6 RSS feed comment crawler R http://www.radian6.com/cms/index.php http://www.radian6.com/crawler/ -id_n_s_160208_2 R6_FeedFetcher_(www.radian6.com/crawler) Radian6 Rss feed crawler R http://www.radian6.com/cms/index.php http://www.radian6.com/crawler/ -id_n_s_1165 rabaz (rabaz at gigabaz dot com) gigaBaz - the brainbot (Germany) robot R http://brainbot.com//site3 -id_n_s_1166 RaBot/1.0 Agent-admin/phortse@hanmail.net DAUMOA - Daum search Korea robot (211.115.109.xxx) R s. also Mozilla/4.0 (compatible; MSIE is not me; DAUMOA ... http://www.daum.net/ -id_n_s_1167 Rainbot1.1 Bot Provider for the All Womans Bot Service? - site is dead http://bservice.org/bots/ -id_n_s_1168 ramBot xtreme x.x Intersearch.de (was www.intersearch.de) robot (Germany) R -id_n_s_160406_2 RAMPyBot - www.giveRAMP.com/0.1 (RAMPyBot - www.giveRAMP.com; http://www.giveramp.com/bot.html; support@giveRAMP.com) giveRAMP Search Engine robot (64.69.43.1xx) R http://www.giveramp.com/ -id_n_s_260206_1 RAMPyBot/0.8-dev (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) giveRAMP Search Engine robot (64.69.43.1xx) R powered by Nutch http://www.giveramp.com/ http://lucene.apache.org/nutch/ -id_n_s_1169 Rank Exec (rankexec.com) Reciprocal Link Manager 1.x/bot Rank Exec reciprocal link checking C http://www.rankexec.com/ -id_n_s_180408_5 Rankivabot/3.2 (www.rankiva.com; 3.2; vzmxikn) Rankiva website popularity robot R http://www.rankiva.com/ -id_n_s_1170 Rational SiteCheck (Windows NT) Innova/IBM Rational SiteCheck - Rational robot R http://www.rational.com.ar/defaultenglish.html -id_n_s_290708_2 RAYSPIDER/Nutch-0.9 Unknown spider from Raytheon Company - maybe Raytheon High Speed Guard proxy P 199.46.198.xxx http://www.raytheon.com/ -id_n_s_230207_3 ReadABlog Spider (compatible; 1.1; feed update; www.readablog.com) Read A Blog - RSS feed and blog search engine C 70.85.24.xx http://www.readablog.com/ -id_n_s_1171 RealDownload/4.0.0.4x RealDownload download manager D http://service.real.com/help/faq/rdown4/rdownfaqa01.html -id_n_s_100408_3 REAP-crawler Nutch/Nutch-1.0-dev (Reap Project; http://reap.cs.cmu.edu/REAP-crawler/; Reap Project) The REAP Web Crawler for the REAP project C http://reap.cs.cmu.edu/REAP-crawler/ http://reap.cs.cmu.edu/ -id_n_s_1172 Reaper [2.03.10-031204] (http://www.sitesearch.ca/reaper/) Reaper robot for SiteSearch R http://marty.anstey.ca/projects/robots/reaper.html -id_n_s_1173 Reaper/2.0x (+http://www.sitesearch.ca/reaper) Reaper robot for SiteSearch R http://marty.anstey.ca/projects/robots/reaper.html -id_n_s_1174 REBOL Core 2.x.x.x.x REBOL messaging language for distributed Internet apps http://www.rebol.com/ -id_n_s_250307_1 REBOL View 1.x.x.x.x REBOL/View - machine independent internet client application B http://www.rebol.com/prod-view.html -id_n_s_1175 RebusnetBot (+http://www.rebusnet.biz) Rebusnet software site - link / submission checking R C http://www.rebusnet.biz -id_n_s_1176 RebusnetPADBot/1.5x (+http://www.rebusnet.biz) Rebusnet software site - link / submission checking R C http://www.rebusnet.biz -id_n_s_171205_1 reciprocal links checker (http://www.recip-links.com/) Online reciprocal link checker C http://www.recip-links.com/ -id_n_s_110307_2 RedBot/redbot-1.0 (Rediff.com Crawler; redbot at rediff dot com) rediff.com search link checking C 220.226.198.xx http://www.rediff.com/ -id_n_s_130106_1 RedCarpet/1.2 (http://www.redcarpet-inc.com/robots.html) RedCarpet crawler for Pronto price comparison search(66.179.107.1xx) R http://www.redcarpet-inc.com/robots.html http://www.pronto.com/ -id_n_s_171205_2 RedCell/0.1 (InfoSec Search Bot (Coming Soon); http://www.telegenetic.net/bot.html; lhall@telegenetic.net) Der Bot for telegenetic.net's security related search (65.220.67.2xx) R Based on Nutch http://www.telegenetic.net/bot.html -id_n_s_040106_1 RedCell/0.1 (RedCell; telegenetic.net/bot.html; lhall_at_telegenetic.net) Der Bot for telegenetic.net's security related search (65.220.67.2xx) R Based on Nutch http://www.telegenetic.net/bot.html -id_n_s_1177 RedKernel WWW-Spider 2/0 (+http://www-spider.redkernel-softwares.com/) RedKernel Softwares robot R http://www.redkernel-softwares.com/ -id_n_s_1178 REL Link Checker Lite x.x REL Link Checker Lite free version of Web Link Validator C http://www.relsoftware.com/rlc/ -id_n_s_1179 RepoMonkey Bait & Tackle/v1.01 unknown -id_n_s_1180 Rewebber/1.2 libwww-perl/5.41 Rewebber proxy service P http://www.rewebber.com/ -id_n_s_1181 rico/0.1 Applied Semantics Auto-Categorizer for QWestDex Direct R http://www.dotcomdirectory.com -id_n_s_241105_2 RixBot (http://babelserver.org/rix) RixBot Rebol Indexer for the RIX - Rebol related search (195.204.121.xx) R http://babelserver.org/rix -id_n_s_070406_2 RMA/1.0 (compatible; RealMedia) StreamBox VCR user agent D http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm -id_n_s_1182 RMA/1.0 (compatible; RealMedia) Real Media server acting as client B P http://service.real.com/help/library/whitepapers/wpaper.html -id_n_s_061206_4 RoboCrawl (http://www.canadiancontent.net) Canadian Content search crawler R http://www.canadiancontent.net/ -id_n_s_1183 RoboCrawl (www.canadiancontent.net) Canadian Content Search (207.44.220.xx) robot R http://www.canadiancontent.net/ -id_n_s_1184 RoboPal (http://www.findpal.com/) FindPal Australia metasearch robot (61.68.139.xx) R http://www.findpal.com/ -id_n_s_1187 Robot/www.pj-search.com PopJapanSearch robot R http://www.pj-search.com/ -id_n_s_1185 Robot: NutchCrawler- Owner: wdavies@acm.org Experimental robot using Wget via attbi.net R -id_n_s_1186 Robot@SuperSnooper.Com Supersnooper robot R http://www.Supersnooper.com/ -id_n_s_1188 Robozilla/1.0 Netscape Directory / DMOZ Open Directory link crawler R http://directory.mozilla.org/ -id_n_s_220208_1 Rome Client (http://tinyurl.com/64t5n) Ver: 0.9 ROME - Open source Java tools for RSS and Atom feeds B https://rome.dev.java.net/ -id_n_s_1189 Rotondo/3.1 libwww/5.3.1 Qualigo.de robot R http://www.qualigo.de/ -id_n_s_1190 RPT-HTTPClient/0.3-x different IPs using the HTTPClient library (mostly link checking) C Java1.4.0 http://www.innovation.ch/java/HTTPClient/ -id_n_s_1191 RRC (crawler_admin@bigfoot.com) Metacarta.com (66.28.xx.xxx) robot R s. Larbin... http://www.metacarta.com -id_n_s_250707_5 RssBandit/1.5.0.10 (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; http://www.rssbandit.org) (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; ) RSS Bandit RSS/Atom reader for .NET framework B http://www.rssbandit.org/ -id_n_s_230607_3 RSSMicro.com RSS/Atom Feed Robot RSS Micro Search - RSS feed search engine R 209.216.63.xx http://www.rssmicro.com/ -id_n_s_080307_2 RSSOwl/1.2.3 2006-11-26 (Windows; U; zhtw) RSSOwl embedded RSS feed reader B http://www.rssowl.org/ -id_n_s_060108_1 RSSOwl/1.2.4 Preview Release 2007-04-15 (Windows; U; zhtw) RSSOwl embedded RSS feed reader B http://www.rssowl.org/ -id_n_s_181006_3 RssReader/1.0.xx.x (http://www.rssreader.com) Microsoft Windows NT 5.1.2600.0 Ykoon RssReader news feed reader B http://www.rssreader.com/ -id_n_s_1192 RSurf15a 41 Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com S -id_n_s_1193 RSurf15a 51 Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com S -id_n_s_1194 RSurf15a 81 Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com S -id_n_s_080206_2 Rubbot/1.0 (+http://rubhub.com/) rubhub blog spider C based on XFN relationship lookup engine http://rubhub.com/main/ http://gmpg.org/xfn/more -id_n_s_191105_1 RufusBot (Rufus Web Miner; http://64.124.122.252/feedback.html) WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx) R s. also pulseBot http://www.webaroo.com/index http://www.webaroo.com/company/site-owners -id_n_s_020407_1 RufusBot (Rufus Web Miner; http://www.webaroo.com/rooSiteOwners.html) WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx) R s. also pulseBot http://www.webaroo.com/index http://www.webaroo.com/company/site-owners -id_n_s_1195 Rumours-Agent unknown robot from rumours.jp (202.214.69.xxx) -id_n_s_1196 RX Bar RX (Reflexive Search) Bar for IE B http://www.searchenginebar.com/ -id_n_s_160506_1 S&L Spider (http://search.hirners.com/) Search & Links directory spider C 80.108.7.xx http://search.hirners.com/ -id_n_s_1197 S.T.A.L.K.E.R. (http://www.seo-tools.net/en/bot.aspx) SEO-Tools.net link checking ? C http://www.seo-tools.net/ -id_n_s_1198 SafariBookmarkChecker (+http://www.coriolis.ch/) SafariBookmarkChecker for Mac OS X C http://www.coriolis.ch/ -id_n_s_061107_1 sait/Nutch-0.9 (SAIT Research; http://www.samsung.com) sait robot - unknown robot from Samsung International Korea R 202.20.190.xx http://samsungnetworks.co.kr/eng/index.jsp -id_n_s_191105_2 SandCrawler - Compatibility Testing Sandcrawler robot from Microsoft (131.107.0.xx) R -id_n_s_170109_3 SapphireWebCrawler/1.0 (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu) Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute R http://boston.lti.cs.cmu.edu/crawler/ -id_n_s_170109_4 SapphireWebCrawler/Nutch-1.0-dev (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu) Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute R http://boston.lti.cs.cmu.edu/crawler/ -id_n_s_021205_4 savvybot/0.2 WebSavvy Directory robot R http://www.websavvy.cc/bot.php -id_n_s_1199 SBIder/0.7 (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html) SiteSell SBIder Nutch based crawler R http://www.sitesell.com/ -id_n_s_030106_2 SBIder/0.8-dev (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html) SiteSell SBIder Nutch based crawler R http://www.sitesell.com/ -id_n_s_1200 SBL-BOT (http://sbl.net) Softbyte Labs Black Widow web site ripper D B http://sbl.net/ -id_n_s_1201 ScanWeb ScanWeb - regular expression based web page searching tool R http://eserver.host.sk/ -id_n_s_301006_1 ScholarUniverse/0.8 (Nutch;+http://scholaruniverse.com/bot.jsp; fetch-agent@scholaruniverse.com) ScholarUniverse - Scholarly experts search robot R 209.216.243.xx http://www.scholaruniverse.com/index.jsp -id_n_s_1202 schwarzmann.biz-Spider_for_paddel.org+(http://www.innerprise.net/usp-spider.asp) URL Spider Pro (USP) used by German Schwarzmann GmbH R http://www.schwarzmann.biz/ -id_n_s_1203 Science Traveller International 1X/1.0 1X Web Browser B http://www.scitrav.com/ -id_n_s_190407_1 ScollSpider/2.0 (+http://www.webwobot.com/ScollSpider.php) WebWobot UK search engine robot (82.43.129.2xx) R s. also Mozilla/3.0 (compatible; ScollSpider ... http://www.webwobot.com/ -id_n_s_1206 Scooter-3.0.EU Altavista robot R http://www.altavista.com/ -id_n_s_1207 Scooter-3.0.FS Altavista robot R http://www.altavista.com/ -id_n_s_1208 Scooter-3.0.HD Altavista robot R http://www.altavista.com/ -id_n_s_1209 Scooter-3.0.VNS Altavista robot R http://www.altavista.com/ -id_n_s_1210 Scooter-3.0QI Altavista robot R http://www.altavista.com/ -id_n_s_1211 Scooter-3.2 Altavista robot R http://www.altavista.com/ -id_n_s_1212 Scooter-3.2.BT Altavista robot R http://www.altavista.com/ -id_n_s_1213 Scooter-3.2.DIL Altavista robot R http://www.altavista.com/ -id_n_s_1214 Scooter-3.2.EX Altavista robot R http://www.altavista.com/ -id_n_s_1215 Scooter-3.2.JT Altavista robot R http://www.altavista.com/ -id_n_s_1216 Scooter-3.2.NIV Altavista robot R http://www.altavista.com/ -id_n_s_1217 Scooter-3.2.SF0 Altavista robot R http://www.altavista.com/ -id_n_s_1218 Scooter-3.2.snippet Altavista robot R http://www.altavista.com/ -id_n_s_1219 Scooter-3.3dev Altavista robot R http://www.altavista.com/ -id_n_s_1220 Scooter-ARS-1.1 Altavista robot R http://www.altavista.com/ -id_n_s_1221 Scooter-ARS-1.1-ih Altavista robot R http://www.altavista.com/ -id_n_s_1222 scooter-venus-3.0.vns Altavista robot R http://www.altavista.com/ -id_n_s_1223 Scooter-W3-1.0 Altavista robot R http://www.altavista.com/ -id_n_s_1224 Scooter-W3.1.2 Altavista robot R http://www.altavista.com/ -id_n_s_1225 Scooter/1.0 Altavista robot R http://www.altavista.com/ -id_n_s_1226 Scooter/1.0 scooter@pa.dec.com Altavista robot R http://www.altavista.com/ -id_n_s_1227 Scooter/1.1 (custom) Altavista robot R http://www.altavista.com/ -id_n_s_1228 Scooter/2.0 G.R.A.B. V1.1.0 Altavista robot R http://www.altavista.com/ -id_n_s_1229 Scooter/2.0 G.R.A.B. X2.0 Altavista robot R http://www.altavista.com/ -id_n_s_1230 Scooter/3.3 Altavista robot R http://www.altavista.com/ -id_n_s_1232 Scooter/3.3.QA.pczukor Altavista robot R http://www.altavista.com/ -id_n_s_1233 Scooter/3.3.vscooter Altavista robot R http://www.altavista.com/ -id_n_s_1231 Scooter/3.3_SF Altavista robot R http://www.altavista.com/ -id_n_s_1234 Scooter2_Mercator_x-x.0 Altavista using Mercator robot R http://www.altavista.com/ http://www.research.compaq.com/SRC/mercator/ -id_n_s_1204 Scooter_bh0-3.0.3 Altavista robot R http://www.altavista.com/ -id_n_s_1205 Scooter_trk3-3.0.3 Altavista robot R http://www.altavista.com/ -id_n_s_190306_3 Scope (Mars+) Scope Navigator mobile browser (Japan) B http://www.programmer.co.jp/scope.shtml -id_n_s_1235 ScoutAbout Some nec.com robot using Research Republic ScoutAbout Research Tool R http://www.researchrepublic.com/ -id_n_s_051207_4 ScoutAnt/0.1; +http://www.ant.com/what_is_ant.com/ Ant.com search robot R 66.230.171.17x http://www.ant.com/ -id_n_s_271105_3 scoutmaster ScoutMaster information retrieval software R http://www.scoutmaster.de/ -id_n_s_1236 Scrubby/2.x (http://www.scrubtheweb.com/) Scrub the web robot (66.93.156.xx) R s.also Mozilla/5.0 (compatible; Scrubby/2.2 ... http://www.scrubtheweb.com/ -id_n_s_030308_3 Scrubby/3.0 (+http://www.scrubtheweb.com/help/technology.html) Scrub the web robot (66.93.156.xx) R s.also Mozilla/5.0 (compatible; Scrubby/2.2 ... http://www.scrubtheweb.com/ -id_n_s_1240 Search+ URL Search+ search software R http://srchplus.chat.ru/index.htm -id_n_s_110606_3 Search-Engine-Studio Xtreem Search Engine Studio - SE software R http://www.xtreeme.com/search-engine-studio/ -id_n_s_1237 search.ch V1.4 Search.ch robot R http://www.search.ch/ -id_n_s_1238 search.ch V1.4.2 (spiderman@search.ch; http://www.search.ch) Search.ch robot R http://www.search.ch/ -id_n_s_1239 Search/1.0 (http://www.innerprise.net/es-spider.asp) Enterprise Search web indexing / site searching tool R http://www.innerprise.net/es-bi.asp -id_n_s_1241 searchbot admin@google.com Unknown robot / website grabber from Chinatelecom (219.142.78.xxx) S -id_n_s_1242 SearchByUsa/2 (SearchByUsa; http://www.SearchByUsa.com/bot.html; info@SearchByUsa.com) SearchByUSA robot (69.150.7.xxx) R http://www.searchbyusa.com/ -id_n_s_231006_1 SearchdayBot Searchday (Germany) search robot R 85.25.131.1xx http://www.searchday.de/ -id_n_s_1243 SearchExpress Spider0.99 Searchexpress spider R http://www.searchexpress.com/ -id_n_s_1245 SearchGuild/DMOZ/Experiment (searchguild@gmail.com) Searchguild forum & directory robot (81.3.75.xxx) R http://searchguild.com/ -id_n_s_1244 SearchGuild_DMOZ_Experiment (chris@searchguild.com) Searchguild forum & directory robot (81.3.75.xxx) R http://searchguild.com/ -id_n_s_1246 Searchit-Now Robot/2.2 (+http://www.searchit-now.co.uk) Searchit robot (69.93.107.xx) R http://www.searchit-now.co.uk -id_n_s_220906_3 Searchmee! Spider v0.98a Searchmee! Search Engine (prototype) robot by findanisp.com R 64.202.100. http://www.searchmee.com/ -id_n_s_100506_1 SearchSight/2.0 (http://SearchSight.com/) SearchSight search robot R http://searchsight.com/ -id_n_s_1247 SearchSpider.com/1.1 SearchSpider robot R http://www.searchspider.com/ -id_n_s_1248 Searchspider/1.2 (SearchSpider; http://www.searchspider.com; webmaster@searchspider.com) SearchSpider robot R http://www.searchspider.com/ -id_n_s_1249 SearchTone2.0 - IDEARE Janas (Ideare.com / Tiscali.it) robot R http://www.ideare.com/ http://www.tiscali.it -id_n_s_1250 Seekbot/1.0 (http://www.seekbot.net/bot.html) HTTPFetcher/0.3 seekport. beta search (Germany) robot R 195.27.215.xx http://www.seekbot.net/ -id_n_s_1251 Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.0 (XDF) seekport. beta search (Germany) robot R 195.27.215.xx http://www.seekbot.net/ -id_n_s_1252 Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.2 seekport. beta search (Germany) robot R 195.27.215.xx http://www.seekbot.net/ -id_n_s_1253 Seeker.lookseek.com Lookseek search robot / link checking R 12.199.64.xx http://www.lookseek.com/ -id_n_s_011006_3 semaforo.net semaforo.net web filtering software P http://www.semaforo.net/en/default.htm -id_n_s_020807_2 Semager/1.1 (http://www.semager.de/blog/semager-bots/) Semager.de (was NG-Search) semantic search - Germany R 212.114.209.2xx http://www.semager.de/ http://www.semager.de/blog/semager-bots/ -id_n_s_230507_2 Semager/1.x (http://www.semager.de) Semager.de (was NG-Search) semantic search - Germany R 212.114.209.2xx http://www.semager.de/ http://www.semager.de/blog/semager-bots/ -id_n_s_1254 semanticdiscovery/0.x Semantic Discovery domain checking tool R C http://www.semanticdiscovery.com/products.html -id_n_s_1255 Sensis Web Crawler (search_comments\at\sensis\dot\com\dot\au) Sensis Australia search robot R http://www.sensis.com.au/ -id_n_s_1256 Sensis.com.au Web Crawler (search_comments\at\sensis\dot\com\dot\au) Sensis Australia search robot R http://www.sensis.com.au/ -id_n_s_1257 SeznamBot/1.0 Seznam Search (Czech Republic) robot R 212.80.76.xx http://www.seznam.cz/ -id_n_s_1258 SeznamBot/1.0 (+http://fulltext.seznam.cz/) Seznam Search (Czech Republic) robot R 212.80.76.xx http://www.seznam.cz/ -id_n_s_080907_2 SeznamBot/2.0-test (+http://fulltext.sblog.cz/) Seznam Search (Czech Republic) robot R 212.80.76.xx http://www.seznam.cz/ -id_n_s_280208_2 ShablastBot 1.0 Unknown robot from Shablast.com - Website has no content - Ignores robots.txt S 67.228.100.1xx / 67.228.102.2xx http://shablast.com/ -id_n_s_1259 Shareaza v1.x.x.xx Shareaza P2P peer-to-peer download client D B http://www.shareaza.com/ -id_n_s_1260 SharewarePlazaFileCheckBot/1.0+(+http://www.SharewarePlaza.com) SharewarePlaza File Check Bot - link checking R C http://www.sharewareplaza.com/ -id_n_s_1261 Shim Crawler Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx) R s. also Shim-Crawler ... http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html http://www.kototoi.org/index.html -id_n_s_240106_2 Shim-Crawler(Mozilla-compatible; http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp) Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx) R s. also Shim Crawler http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html http://www.kototoi.org/index.html -id_n_s_131205_1 ShopWiki/1.0 ( +http://www.shopwiki.com/) ShopWiki shopping search based on LittleWiki search R 4.78.166.1xx http://www.shopwiki.com/ http://dev.littlewiki.com/wiki/Home -id_n_s_250706_1 ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot) ShopWiki shopping search based on LittleWiki search R 4.78.166.1xx http://www.shopwiki.com/ http://dev.littlewiki.com/wiki/Home -id_n_s_1262 Shoula.com Crawler 2.0 Shoula Search Engine crawler R http://www.shoula.com/ -id_n_s_230107_1 SietsCrawler/1.1 (+http://www.siets.biz) Siets Crawler - Web based site crawling application R http://www.siets.biz/products/crawler/ -id_n_s_070308_1 Sigram/Nutch-1.0-dev (Test agent for Nutch development; http://www.sigram.com/bot.html; bot at sigram dot com) Sigram's Nutch robot - crawler testing R http://www.sigram.com/bot.html -id_n_s_050906_1 Siigle Orumcex v.001 Turkey (http://www.siigle.com) Siigle search (Turkey) robot R 62.68.196.xx http://www.siigle.com/ -id_n_s_171006_1 silk/1.0 Slider Search directory robot (194.213.194.2xx) R s. also Slider_Search... http://www.slider.com/index.html -id_n_s_281205_1 silk/1.0 (+http://www.slider.com/silk.htm)/3.7 Slider Search directory robot (194.213.194.2xx) R s. also Slider_Search... http://www.slider.com/index.html -id_n_s_131206_2 SimpleFavPanel/1.2 SimpleFavPanel - IE newsfeed panel plugin B http://www.egrath.net/index.php?ExplorerBarPlus%2F%A5%D1%A5%CD%A5%EB%B0%EC%CD%F7%2FSimpleFavPanel -id_n_s_1263 Simpy 1.x; http://www.simpy.com/ Simpy bookmarking and personal search engine R C s. also Argus http://www.simpy.com/ -id_n_s_1264 Simpy/1.x (Simpy; http://www.simpy.com/?ref=bot; feedback at simpy dot com) Simpy bookmarking and personal search engine R C s. also Argus http://www.simpy.com/ -id_n_s_180707_2 Sirketcebot/v.01 (http://www.sirketce.com/bot.html) Sirketçe search - Turkey R 88.255.173.xx http://www.sirketce.com/ -id_n_s_070207_3 SiteBar/3.x.x (Bookmark Server; http://sitebar.org/) SiteBar online bookmark manager C http://sitebar.org/ -id_n_s_1265 SiteBar/x.x SiteBar bookmark server C http://sitebar.sourceforge.net/ -id_n_s_1266 SiteBar/x.x.x (Bookmark Server; http://sitebar.org/) SiteBar bookmark server C http://sitebar.sourceforge.net/ -id_n_s_1267 sitecheck.internetseer.com Internetseer Web Site Monitoring / Claymont robot R C http://www.internetseer.com/ http://www.claymont.com/ -id_n_s_1268 sitecheck.internetseer.com (For more info see: http://sitecheck.internetseer.com) Internetseer Web Site Monitoring R C http://www.internetseer.com/ -id_n_s_1269 SiteRecon+(xx) SiteRecon website monitoring spider at xx minute intervals R C http://www.siterecon.com/ -id_n_s_1270 SiteSnagger PC Magazin web site downloadmanager D http://www.zdnet.com/pcmag/pctech/content/17/04/ut1704.001.html -id_n_s_1271 SiteSpider +(http://www.SiteSpider.com/) Site Spider robot (66.249.17.xx) R http://www.SiteSpider.com/ -id_n_s_021205_3 SiteSucker/1.x.x SiteSucker Mac website downloading tool D http://www.sitesucker.us/ -id_n_s_140306_2 SiteTaggerBot (http://www.sitetagger.com/bot.htm) SiteTagger.com bookmark organizer C http://www.sitetagger.com/ -id_n_s_030407_1 SiteTruth.com site rating system SiteTruth - Automatic site legitimacy rating system R 69.64.67.xx http://www.sitetruth.com/ -id_n_s_1272 SiteWinder Webwasher.com (217.146.159.xx) internet filter B P http://www.webwasher.com/ -id_n_s_1273 SiteXpert Xtreeme SiteXpert sitemap & search engine builder R http://www.xtreeme.com/sitexpert/index.php -id_n_s_1274 Skampy/0.9.x (http://www.skaffe.com/skampy-info.html) Skaffe.com directory link checker R http://www.skaffe.com/ -id_n_s_1275 Skimpy/0.x (http://www.skaffe.com/skampy-info.html) Skaffe.com directory link checker R http://www.skaffe.com/ -id_n_s_090706_1 Skywalker/0.1 (Skywalker; anonymous; anonymous) Visvo distributed website crawler based on Nutch R 63.133.162.xx http://www.visvo.com/bot.html -id_n_s_1276 Slarp/0.1 Only.com robot R http://www.only.com/ -id_n_s_1277 Sleipnir Sleipnir - Japanese Explorer based browser & search bar B http://www20.pos.to/~sleipnir/software/sleipnir/index.html -id_n_s_1278 Sleipnir Version 1.xx Sleipnir - Japanese Explorer based browser & search bar B http://www20.pos.to/~sleipnir/software/sleipnir/index.html -id_n_s_170207_5 Sleipnir Version2.x Sleipnir - Japanese Explorer based browser & search bar B http://www20.pos.to/~sleipnir/software/sleipnir/index.html -id_n_s_260706_1 Sleipnir/2.xx Sleipnir - Japanese Explorer based browser & search bar B http://www20.pos.to/~sleipnir/software/sleipnir/index.html -id_n_s_1279 Slider_Search_v1-de Slider Search directory robot (194.213.194.2xx) R s. also silk/1.0... http://www.slider.com/index.html -id_n_s_1280 SlimBrowser Slim Browser (IE based browser) - uses this user agent for favicon.ico only B http://www.flashpeak.com/sbrowser/ -id_n_s_1281 Slurp/2.0 (slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot R http://www.inktomi.com/slurp.html -id_n_s_1282 Slurp/2.0-KiteWeekly (slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot R http://www.inktomi.com/slurp.html -id_n_s_1283 Slurp/si (slurp@inktomi.com; http://www.inktomi.com/slurp.html) Inktomi (Hotbot-Lycos-NBCi) robot R http://www.inktomi.com/slurp.html -id_n_s_240806_1 Slurpy Verifier/1.0 Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x) R s. also Mozilla/3.0 (Slurp/..... http://www.inktomi.com/ -id_n_s_1284 SlySearch (slysearch@slysearch.com) Slysearch robot (now Turnitin robot) R http://www.slysearch.com/ -id_n_s_1285 SlySearch/1.0 http://www.plagiarism.org/crawler/robotinfo.html Slysearch robot (now Turnitin robot) R http://www.slysearch.com/ -id_n_s_1286 SlySearch/1.x http://www.slysearch.com Slysearch robot (now Turnitin robot) R http://www.slysearch.com/ -id_n_s_1287 SmartDownload/1.2.67 (Win32; Jan 12 1999) Netzip/Smartdownload download manager D http://www.netzip.com/ -id_n_s_1288 SmartDownload/1.2.77 (Win32; Feb 1 2000) Netzip/Smartdownload download manager D http://www.netzip.com/ -id_n_s_1289 SmartDownload/1.2.77 (Win32; Jun 19 2001) Netzip/Smartdownload download manager D http://www.netzip.com/ -id_n_s_1290 smartwit.com Loop Improvements NRS Enterprise search (69.44.155.xx[x]) R http://www.loopimprovements.com/ http://demo.loopimprovements.com/demo/ -id_n_s_020307_2 SmiffyDCMetaSpider/1.0 SmiffyDCMetaSpider - Robot to check the retro-adding of Dublin Core metadata R 64.71.152.xx http://www.smiffysplace.com http://www.smiffysplace.com/smiffydcmetaspider -id_n_s_1291 sna-0.0.1 (mikemuzio@msn.com) Snoopy PHP-client see Snoopy http://sourceforge.net/projects/snoopy/ -id_n_s_1292 sna-0.0.1 mikeelliott@hotmail.com Snoopy PHP-client see Snoopy http://sourceforge.net/projects/snoopy/ -id_n_s_080106_1 snap.com beta crawler v0 Unknown bot from bb2.net (66.234.139.xxx) also as Snapbot/1.0 S Gets only the robots.txt - Not from Snap.com / Idealab (63.251.211.xxx) http://www.kloth.net/internet/badbots.php -id_n_s_250506_1 Snapbot/1.0 Unknown bot from bb2.net (66.234.139.xxx) - also as snap.com S Not from Snap.com / Idealab (63.251.211.xxx) http://www.kloth.net/internet/badbots.php -id_n_s_250408_1 Snapbot/1.0 (Snap Shots, +http://www.snap.com) Unknown bot from Psinet / Cogentco - not from Snap.com S 38.98.19.6x -id_n_s_270906_2 Snappy/1.1 ( http://www.urltrends.com/ ) My UrlTrends online web ranking service C 205.138.199.1xx / 209.85.36.x http://www.urltrends.com/ -id_n_s_100707_1 Snarfer/0.x.x (http://www.snarfware.com/) Snarfer RSS reader B http://www.snarfware.com/ -id_n_s_1293 SnoopRob/x.x Unknown robot from 217.229.156.xx (T-Online Germany) -id_n_s_1294 Snoopy v1.xx Snoopy PHP-client s. also sna-x.x.x http://sourceforge.net/projects/snoopy/ -id_n_s_1295 Snoopy v1.xx- : User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MyIE2) Snoopy PHP-client s. also sna-x.x.x http://sourceforge.net/projects/snoopy/ -id_n_s_1296 Snoopy_v0.xx Snoopy PHP-client s. also sna-x.x.x http://sourceforge.net/projects/snoopy/ -id_n_s_1297 SnykeBot/0.6 (http://www.snyke.com) Snyke.com France robot R http://www.snyke.com/ -id_n_s_250706_2 SocSciBot () Link crawler for the social sciences R http://socscibot.wlv.ac.uk/ -id_n_s_170407_1 SoftBank/1.0/812SH/SHJ001 Browser/NetFront/3.3 Profile/MIDP-2.0 Configuration/CLDC-1.1 NetFront browser on Softbank mobile phone B http://www.access-company.com/products/netfrontmobile/browser/index.html http://mb.softbank.jp/mb/en/product/ -id_n_s_1298 SoftHypermarketFileCheckBot/1.0+(+http://www.softhypermaket.com) Soft Hypermarket link checking R http://www.softhypermarket.com/ -id_n_s_1299 Softizerbot (http://www.softizer.com) Softizer.com software directory link checking C 72.9.97.xx http://www.softizer.com/ -id_n_s_090208_1 sogou develop spider Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot S s. also sohu agent & Sogou web spider -id_n_s_011207_2 Sogou Orion spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07) Unknown UA from Chinanet (220.181.18.xx) faking Sogou search robot S s. also sohu agent , Sogou web spider & sogou develop spider -id_n_s_150106_1 sogou spider Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot S s. also sohu agent , Sogou web spider & sogou develop spider -id_n_s_280407_1 Sogou web spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07) Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot S s. also sohu agent , sogou spider & sogou develop spider -id_n_s_291105_1 sohu agent Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot S s. also sogou spider , sogou spider & sogou develop spider -id_n_s_1300 sohu-search Sohu (Search Fox) search robot China (61.135.131.xxx) R this UA also comes from 220.181.26.xxx (not Sohus IP range) as spam bot - s.also sohu agent http://www.sohu.com/ -id_n_s_160308_3 Sosospider+(+http://help.soso.com/webspider.htm) SOSO search (China) spider R http://www.soso.com/ http://help.soso.com/webspider.htm -id_n_s_1301 Space Bison/0.02 [fu] (Win67; X; SK) Default Proxomitron (discontinued) filtering proxy user agent identifier P B http://duke.usask.ca/~macphed/prox/ -id_n_s_1302 SpeedDownload/1.x Speed Download (Mac) download manager D http://www.yazsoft.com/ -id_n_s_1303 speedfind ramBot xtreme 8.1 Speedfind.de robot R http://www.speedfind.de/ -id_n_s_1304 Speedy Spider (Beta/x.x; speedy@entireweb.com) Entireweb search robot R 62.13.25.2xx http://www.entireweb.com/ -id_n_s_070906_1 Speedy Spider (Entireweb; Beta/1.0; http://www.entireweb.com/about/search_tech/speedyspider/) Entireweb search spider R 62.13.25.2xx http://www.entireweb.com/ -id_n_s_1305 Speedy_Spider (http://www.entireweb.com) Entireweb search robot R 62.13.25.2xx http://www.entireweb.com/ -id_n_s_050208_4 Sphere Scout&v4.0 - scout at sphere dot com Sphere blog and news search robot R 64.40.11[7-8].[x]xx http://www.sphere.com/ -id_n_s_040106_3 Sphider Sphider - a lightweight search engine in PHP R http://www.cs.ioc.ee/~ando/sphider/ -id_n_s_1306 Spida/0.1 Only.com robot R in conjunction with LWP::Simple/5.53 http://www.only.com/ -id_n_s_1307 Spider-Sleek/2.0 (+http://search-info.com/linktous.html) Search-Info ODP/DMOZ spider R http://search-info.com/ -id_n_s_1308 spider.batsch.com Batsch robot R - site unreachable http://www.batsch.com -id_n_s_110206_4 Spider.TerraNautic.net - v:1.04 TerraNautic spider for Schnellsuchen touristic search (Germany) C http://www.terranautic.net/ http://www.schnellsuchen.com/ -id_n_s_1309 spider.yellopet.com - www.yellopet.com Yellopet spider R http://www.yellopet.com/ -id_n_s_1310 Spider/maxbot.com admin@maxbot.com Maxbot .gov .mil .edu indexing robot R http://www.maxbot.com/ -id_n_s_1311 SpiderKU/0.x Unknown robot from CPE at Kasetsart University (158.108.35.xxx) R http://www.cpe.ku.ac.th/ -id_n_s_1312 SpiderMan Yahoo Search user agent or spider (202.165.102.xxx) R http://search.yahoo.com/ -id_n_s_1313 SpiderMonkey/7.0x (SpiderMonkey.ca info at http://spidermonkey.ca/sm.shtml) SpiderMonkey Canada robot R http://spidermonkey.ca/ -id_n_s_1314 Spinne/2.0 Spider.de robot R http://www.spider.de/ -id_n_s_1315 Spinne/2.0 med Medkatalog (medical catalogue) Austria robot R http://www.medkatalog.com/ -id_n_s_1316 Spinne/2.0 med_AH Medkatalog (medical catalogue) Austria robot R http://www.medkatalog.com/ -id_n_s_180707_3 Spock Crawler (http://www.spock.com/crawler) Spock - people search application - via Amazon web services R 72.44.62.1xx http://www.spock.com/crawler http://www.amazon.com/gp/browse.html?node=3435361 -id_n_s_1317 sportsuchmaschine.de-Robot (Version: 1.02- powered by www.sportsuchmaschine.de) Sportsuchmaschine (German sports related search) link checking / robot R http://www.sportsuchmaschine.de/ -id_n_s_040306_1 sproose/0.1-alpha (sproose crawler; http://www.sproose.com/bot.html; crawler@sproose.com) Sproose personalized search (38.100.225.xx) R powered by Nutch http://www.sproose.com/ http://lucene.apache.org/nutch/ -id_n_s_1318 SQ Webscanner SQ Webscanner Mac download manager D product is discontinued http://macinsearch.com/users/webscanner/ -id_n_s_1319 Squid-Prefetch Simple page-prefetch for Squid web proxy P http://packages.debian.org/stable/web/squid-prefetch -id_n_s_171105_2 squidclam Squidclam is a replacement for SquidClamAV-Redirector P s.also SquidClamAV_Redirector 1.x.x http://sourceforge.net/projects/squidclam -id_n_s_1320 SquidClamAV_Redirector 1.x.x SCAVR - Squid helper script for scanning download URLs for viruses P s.also squidclam http://www.jackal-net.at/tiki-read_article.php?articleId=1 -id_n_s_1321 Sqworm/2.9.81-BETA (beta_release; 20011102-760; i686-pc-linux-gnu) AOL Search / Pacific Internet Exchange robot R http://www.aol.com/ -id_n_s_1322 Sqworm/2.9.85-BETA (beta_release; 20011115-775; i686-pc-linux-gnu) diff. IPs / services i.e.: - Inria.fr robot - Websense (Internet filtering) robot R http://www.inria.fr/ http://www.websense.com/ -id_n_s_1323 Sqworm/2.9.89-BETA (beta_release; 20020130-839; i686-pc-linux-gnu) Time Warner Telecom user robot ? -id_n_s_1324 SSurf15a 11 Some site scanning tool via diff. IPs i.e.: - choiceone.net (216.153.xxx.xxx) - epix.net (216.108.198.xx) S see also - PSurf15a VA or random letters like - AWSCBA - URVUSLNAM -id_n_s_1325 StackRambler/x.x Rambler search (Russia) robot (81.19.6x.xx) R http://www.rambler.ru -id_n_s_1326 Stamina/1.4 Stamina download manager D http://www.wildbits.com/stamina/ -id_n_s_1327 Star Downloader Star Downloader download manager D http://www.stardownloader.com/ -id_n_s_140106_3 StarDownloader/1.xx Star Downloader download manager D http://www.stardownloader.com/ -id_n_s_1328 stat statcrawler@gmail.com Experimental search engine spider from 66.92.186.xxx R 66.92.186.xxx -id_n_s_1329 Steeler/1.x (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/) Steeler crawler R http://www.tkl.iis.u-tokyo.ac.jp/~crawler/ -id_n_s_031107_5 Steeler/3.3 (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/) Steeler - University of Tokyo web crawler R 157.82.156.xx[x] http://www.tkl.iis.u-tokyo.ac.jp/~crawler/crawler.html.en -id_n_s_060106_1 Strategic Board Bot (+http://www.strategicboard.com) Strategic Board blog & news search robot R http://www.strategicboard.com/ -id_n_s_140906_2 Strategic Board Bot (+http://www.strategicboard.com) Strategic Board blogs and news aggregator robot R 62.0.99.2xx http://www.strategicboard.com/ -id_n_s_1330 Submission Spider at surfsafely.com Surfsafely submission verifier R http://www.surfsafely.com/ -id_n_s_210106_4 suchbaer.de Suchbaer.de (Germany) search robot R http://www.suchbaer.de/ -id_n_s_010206_3 suchbaer.de (CrawlerAgent v0.103) Suchbaer.de (Germany) search robot R http://www.suchbaer.de/ -id_n_s_1331 suchbot Suchbot Germany robot R http://www.suchbot.de/ -id_n_s_1332 Suchknecht.at-Robot Suchknecht Austria robot R http://www.suchknecht.at/ -id_n_s_120206_1 suchpadbot/1.0 (+http://www.suchpad.de) suchpad search Germany robot (213.239.194.xx) R http://www.suchpad.de/ -id_n_s_160107_2 Sunrise XP/2.x Sunrise XP handheld news / website reader and converter B http://sourceforge.net/projects/sunrisexp -id_n_s_230406_4 Sunrise/0.42g (Windows XP) Sunrise XP web sites and newsfeeds converter and handheld reader B http://www.sunrisexp.com/ -id_n_s_1333 SuperBot/x.x (Win32) SuperBot website copier D http://www.sparkleware.com/superbot/index.html -id_n_s_260108_2 SuperBot/x.x.x.xx (Windows XP) SuperBot website copier D http://www.sparkleware.com/superbot/index.html -id_n_s_1334 Superdownloads Spiderman Ubbi Superdownloads (Brazil) link checking C http://superdownloads.ubbi.com.br/ -id_n_s_1335 SURF SurfControl Web Filtering P http://www.surfcontrol.com/ -id_n_s_1336 SurferF3 1/0 Wanadoo Rechereche robot R http://www.wanadoo.fr/qqo/ -id_n_s_1337 SurfMaster Maskbit Surfmaster bookmark tool C http://www.maskbit.com/surfmaster.htm -id_n_s_1338 SurveyBot/2.2 Whois Source Whois Source domain name information robot (66.249.26.xx) R C s.also: PigeonBot http://www.whois.sc/ -id_n_s_1339 SurveyBot/2.3 (Whois Source) Whois Source domain name information robot (66.249.26.xx) R C s.also: PigeonBot http://www.whois.sc/ -id_n_s_1340 suzuran Yokogao Search Engine robot (Kanazawa University) R http://web.kanazawa-u.ac.jp/esearch.html -id_n_s_1341 SWB/V1.4 (HP) HP Secure Web Browser for OpenVMS B http://h71000.www7.hp.com/openvms/products/ips/cswb/cswb.html -id_n_s_1342 swbot/0.9c libwww/5.3.1 unknown -id_n_s_1343 Swooglebot/2.0. (+http://swoogle.umbc.edu/swooglebot.htm) Swooglebot Swoogle's semantic web crawler R http://swoogle.umbc.edu -id_n_s_060106_2 SWSBot-Images/1.2 http://www.smartwaresoft.com/swsbot12.html SWSBot - SmartWareSoft (85.186.255.xx) software search engine created for Playfuls.com R http://www.smartwaresoft.com/swsbot12.html http://www.playfuls.com/ -id_n_s_300106_2 SygolBot http://www.sygol.net Sygol Search (Italy) robot R s.also http://www.sygol.com/ -id_n_s_1344 Sylera/1.2.x Sylera browser (Japan) B http://tabbrowser.ktplan.jp/valinor/sylera.html -id_n_s_1345 SyncBot Mindspring.com user robot http://www.mindspring.com/ -id_n_s_1346 SyncIT/x.x SyncIT link validation C http://www.bookmarksync.com/ -id_n_s_140906_1 Syndirella/0.91pre Syndirella desktop information aggregator (beta) B http://www.yole.ru/projects/syndirella/ -id_n_s_1347 SynoBot Synomia (France) robot R http://www.synomia.fr/ -id_n_s_150406_1 Syntryx ANT Scout Chassis Pheromone; Mozilla/4.0 compatible crawler Syntryx Solution Suite - domain / keyword crawler (216.7.179.xx) R http://www.syntryx.com/ -id_n_s_1348 Szukacz/1.x Szukacz.pl (Polish search) robot R http://www.szukacz.pl/ -id_n_s_1349 Szukacz/1.x (robot; www.szukacz.pl/jakdzialarobot.html; szukacz@proszynski.pl) Szukacz.pl (Polish search) robot R http://www.szukacz.pl/ -id_t_z_220106_2 T-Online Browser German T-Online browser & internet suite B http://service.t-online.de/c/06/52/67/652672.html -id_t_z_070807_1 tags2dir.com/0.8 (+http://tags2dir.com/directory/) tags2dir.com directory index R 74.115.102.1xx http://tags2dir.com/directory/ -id_t_z_1350 Tagword (http://tagword.com/dmoz_survey.php) TAGword DMOZ survey - ODP link checking robot R http://tagword.com/dmoz_survey.php -id_t_z_271105_2 Tagyu Agent/1.0 Tagyu - del.icio.us bookmark collection online tag generator http://www.tagyu.com/ http://del.icio.us/ -id_t_z_1351 Talkro Web-Shot/1.0 (E-mail: webshot@daumsoft.com- Home: http://222.122.15.190/webshot) Daumsoft Talkro IR robot R http://www.daumsoft.com/ -id_t_z_1352 TAMU_CS_IRL_CRAWLER/1.0 Texas A&M University - Dept. of Computer Science crawler (server or link checking ?) R C http://www.cs.tamu.edu/ -id_t_z_1353 targetblaster.com/0.9k Targetblaster user link validation ? R C http://www.targetblaster.com/ -id_t_z_230706_2 TargetYourNews.com bot Target Your News - user submitted links C 72.36.160.xxx http://targetyournews.com/ -id_t_z_201006_1 TCDBOT/Nutch-0.8 (PhD student research;http://www.tcd.ie; mcgettrs at t c d dot IE) Trinity College Dublin (Ireland) TCDBOT R 134.226.1.xx http://www.tcd.ie/ -id_t_z_1354 TE HTTP header for transfer encoding used as user agent name ? -id_t_z_1355 TeamSoft WinInet Component WinInet Internet client app. http://www.winsoft.sk/wininet.htm -id_t_z_1356 TECOMAC-Crawler/0.x Tecomac Gmbh (Germany) crawler software - now Arexera Information Technologies R http://www.arexera.de/ -id_t_z_1357 Tecomi Bot (http://www.tecomi.com/bot.htm) Tecomi (Germany) beta / test robot (84.201.65.xxx) R http://www.tecomi.com/Suchmaschine -id_t_z_101107_2 Teemer (NetSeer, Inc. is a Los Angeles based Internet startup company.; http://www.netseer.com/crawler.html; crawler@netseer.com) Teemer crawler for NetSeer search (beta) via Amazon Web Services - see also NetSeer/Nutch R 67.202.26.1xx http://www.netseer.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_t_z_1358 Teleport Pro/1.2x(.1xxx) Teleport (website) downloading tool D http://www.tenmax.com/teleport/pro/home.htm -id_t_z_1359 Teoma MP Teoma crawler (65.214.36.xx[x]) R http://www.teoma.com/ -id_t_z_1361 teomaagent crawler-admin@teoma.com Teoma crawler (65.214.36.xx[x]) R http://www.teoma.com/ -id_t_z_1362 teomaagent1 [crawler-admin@teoma.com] Teoma crawler (65.214.36.xx[x]) R http://www.teoma.com/ -id_t_z_1360 teoma_agent1 Teoma crawler (65.214.36.xx[x]) R http://www.teoma.com/ -id_t_z_1363 Teradex Mapper; mapper@teradex.com; http://www.teradex.com Teradex Directory robot R http://directory.teradex.com/ -id_t_z_010406_4 TeragramCrawler Teragram multilingual text & data processing software D ? http://www.teragram.com/ -id_t_z_150807_2 terraminds-bot/1.0 (support@terraminds.de) Terraminds blog search (Germany) R 88.198.44.2xx http://www.terraminds.de/ -id_t_z_220406_1 TerrawizBot/1.0 (+http://www.terrawiz.com/bot.html) Terrawiz Indian Search Engine robot R 209.128.80.1xx http://www.terrawiz.com/ -id_t_z_1364 Test spider Noceans Information Portfolio Manager (66.35.69.x) R http://www.noceans.com/ -id_t_z_160507_1 TestCrawler/Nutch-0.9 (Testing Crawler for Research ; http://balihoo.com/index.aspx; tgautier at balihoo dot com) Balihoo - Search Engine for Advertising Media R 204.228.230.xx http://balihoo.com/ -id_t_z_1365 The Expert HTML Source Viewer (http://www.expert-html.com) Expert HTML online source viewer D B in conjunction with lwp-trivial/1.35 http://www.expert-html.net - site is offline -id_t_z_281207_3 TheRarestParser/0.2a (http://therarestwords.com/) The Rarest Words - Linguistic experiment crawler via Amazon Web Services R 67.202.27.19x http://therarestwords.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_t_z_1366 TheSuBot/0.1 (www.thesubot.de) TheSuBot robot (Germany) for an unknown theme based search engine R http://www.thesubot.de/ -id_t_z_171106_1 thumbshots-de-Bot (Version: 1.02, powered by www.thumbshots.de) ThumbShots website thumbnail service (Germany) robot D 212.112.238.xx http://www.thumbshots.de/ -id_t_z_1367 thumbshots-de-Bot (Version: 1.02- powered by www.thumbshots.de) ThumbShots.de (Germany) robot R http://www.thumbshots.de/ -id_t_z_250206_1 timboBot/0.9 http://www.breakingblogs.com/timbo_bot.html Breaking Blogs timbo bot blog robot R http://www.breakingblogs.com/ -id_t_z_140106_4 http://www.timelyweb.com/ TimelyWeb web page monitoring tool C s. also EldoS ... http://www.eldos.org/timelyweb/timelyweb.html -id_t_z_180408_6 TinEye/1.1 (http://tineye.com/crawler.html) TinEye crawler for an open image search project R http://tineye.com/crawler.html -id_t_z_1368 tivraSpider/1.0 (crawler@tivra.com) Tivra spider from AT&T Labs Research R see this document: http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps -id_t_z_1369 TJG/Spider Tjgroup spider R http://www.tjgroup.com/ -id_t_z_1370 TJvMultiHttpGrabber Component TJvHttpGrabber (JEDI Visual Component Library) Possibly used by Bit Torrent Search http://homepages.borland.com/jedi/jedihelp/item.php?Id=22015 http://www.btsearch.net/ -id_t_z_1371 Tkensaku/x.x(http://www.tkensaku.com/q.html) Tkensaku Search (Japan) robot from 210.239.46.xxx (www.tken.com) R http://www.tkensaku.com/q.html -id_t_z_1372 toCrawl/UrlDispatcher Unknown robot from 195.68.98.xx (coltfrance.com) -id_t_z_200207_1 Topodia/1.2-dev (Topodia - Crawler for HTTP content indexing; http://www.topodia.com/; support@topodia.com) Topodia search engine and personal information assistant (in development) R 88.153.148.xx http://www.topodia.com/ -id_t_z_160506_2 TOPOS robot/1.1 (http://www.topos.com.ua/) Topos search (Russia) robot C 193.17.73.1xx http://www.topos.com.ua/ -id_t_z_050806_2 traazibot/testengine (+http://www.traazi.de) Traazi! search (Germany) robot R 87.230.5.2xx http://www.traazi.de/ -id_t_z_041007_2 Trailfire-bot/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) Trailfire web collection and annotating system C http://www.trailfire.com/ -id_t_z_081207_2 Trailfire-bot/0.7.1 (Trailfire page content analyzer; http://trailfire.com; info@trailfire.com) Trailfire web collection and annotating system C http://www.trailfire.com/ -id_t_z_260807_2 Trailfire/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org) Trailfire web collection and annotating system C http://www.trailfire.com/ -id_t_z_1376 Trampelpfad-Spider Trampelpfad Webkatalog spider R http://www2.trampelpfad.de/ -id_t_z_1377 Trampelpfad-Spider-v0.1 Trampelpfad Webkatalog spider R http://www2.trampelpfad.de/ -id_t_z_1378 tricosMetaCheck 1.2216-08-1999 (http://www.tricos.com/metacheck) Tricos meta tag validation C http://www.tricos.us/metaone.php -id_t_z_1379 TSurf15a 11 some bad user agent S - s. DBrowse- Dsurf etc. -id_t_z_1380 TulipChain/5.x (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://java.sun.com/) Linux/2.4.17 Tulip Chain browser / link checker for Dmoz.org directory B C R http://ostermiller.org/tulipchain/ -id_t_z_1381 TulipChain/5.xx (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://apple.com/) Mac_OS_X/10.2.8 Tulip Chain browser / link checker for Dmoz.org directory B C R http://ostermiller.org/tulipchain/ -id_t_z_101107_3 Tumblr/1.0 RSS syndication (+http://www.tumblr.com/) (support@tumblr.com) Tumblr Tumblelogs RSS and news syndication crawler R 72.32.6.15x http://www.tumblr.com/ -id_t_z_1382 TurnitinBot/x.x (http://www.turnitin.com/robot/crawlerinfo.html) Turnitin (ex SlySearch) robot for helping educational institutions prevent plagiarism R 64.140.49.xx http://www.turnitin.com/robot/crawlerinfo.html -id_t_z_1383 Turnpike Emporium LinkChecker/0.1 TurnPike Emporium Directory (207.67.198.x) link checking R http://www.turnpike.net/directory.phtml -id_t_z_1384 TutorGig/1.5 (+http://www.tutorgig.com/crawler) TutorGig tutorial search robot R http://www.tutorgig.com/crawler/ -id_t_z_1385 Tutorial Crawler 1.4 (http://www.tutorgig.com/crawler) TutorGig tutorial search robot R http://www.tutorgig.com/crawler/ -id_t_z_1386 Twiceler www.cuill.com/robots.html Twiceler experimental web crawler R 64.62.136.xxx http://www.cuill.com/ -id_t_z_290407_1 Twiceler-0.9 http://www.cuill.com/twiceler/robot.html Twiceler experimental web crawler R 64.62.136.xxx http://www.cuill.com/ -id_t_z_291105_5 Twisted PageGetter File downloading component from Twisted Python D http://twistedmatrix.com/ -id_t_z_140508_5 Twitturly / v0.x Twitt(url)y URL tracking service for Twitter via Amazon Web Services C 75.101.135.[x]xx http://twitturly.com/ http://twitter.com/ -id_t_z_1387 Twotrees Reactive Filter V2.0 Twotrees content filter P http://www.twotrees.com/ -id_t_z_221207_2 Tycoon Agent/Nutch-1.0-dev Tycoon - Hewlett-Packards distributed cluster solution robot R 204.123.46.xx[x] http://tycoon.hpl.hp.com/ -id_t_z_1388 TygoBot Tygo Search robot R http://www.tygo.com/ -id_t_z_1389 TygoProwler Tygo Search robot R http://www.tygo.com/ -id_t_z_1390 UCmore UCMore - IE navigation and search plugin B http://www.ucmore.com/ -id_t_z_1391 UCMore Crawler App UCMore - IE navigation and search plugin B http://www.ucmore.com/ -id_t_z_290208_1 UCWEB5.1 Ucweb mobile browser B http://www.ucweb.com/English/product.shtml -id_t_z_1392 UDM user agent - maybe UdmSearch (see UdmSearch) ? -id_t_z_1393 UdmSearch/3.1.x UdmSearch / MySearch (now mnoGoSeach) offline browser/search client R B http://mnogosearch.org/ -id_t_z_1394 UIowaCrawler/1.0 University of Iowa Crawler- possibly MySpiders R http://myspiders.biz.uiowa.edu/ -id_t_z_231106_1 UKWizz/Nutch-0.8.1 (UKWizz Nutch crawler; http://www.ukwizz.com/) UKWizz search robot R s. also Mackster http://www.ukwizz.com -id_t_z_1395 Ultraseek Infoseek robot R http://www.infoseek.com/ -id_t_z_1396 Under the Rainbow 2.2 Unknown mail harvester/spambot from 80.58.13.xxx (proxycache.rima-tde.net) S http://www.honeypot.be/ -id_a_f_140308_1 unknownght.com Web Server IIS vs Apache Survey. See Results at www.DNSRight.com DNS Right - Online DNS tools C 203.161.71.17x http://www.dnsright.com/ -id_t_z_1397 UofTDB_experiment (leehyun@cs.toronto.edu) Unknown robot from University of Toronto (128.100.5.1xx) R -id_t_z_1398 UP.Browser/3.01-IG01 UP.Link/3.2.3.4 Mobile phone browser B -id_t_z_050806_1 updated/0.1-alpha (updated crawler; http://www.updated.com; crawler@updated.com) Updated! search robot R 38.119.96.1xx http://www.updated.com/ -id_t_z_1399 updated/0.1beta (updated.com; http://www.updated.com; crawler@updated.om) Updated! search robot R 38.119.96.1xx http://www.updated.com/ -id_t_z_1400 UPG1 UP/4.0 (compatible; Blazer 1.0) Handspring (PalmOS powered cellphone) Treo Blazer browser B -id_t_z_1401 Uptimebot UptimeBot.com online link popularity check R http://www.uptimebot.com/ -id_t_z_1402 UptimeBot(www.uptimebot.com) UptimeBot.com online link popularity check R http://www.uptimebot.com/ -id_t_z_160706_2 URI::Fetch/0.06 URI::Fetch - client for fetching HTTP pages and syndication feeds (RSS Atom) D http://search.cpan.org/dist/URI-Fetch/ -id_t_z_1403 URL Spider Pro/x.xx (innerprise.net) Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool R http://www.innerprise.net/ -id_t_z_121106_2 URLBase/6.x URLBase - Internet shortcut manager C s. also Mozilla/4.0 (Compatible); URLBase 6 http://www.terriadev.com/products/urlbase/ -id_t_z_1406 URLBlaze URLBlaze file sharing link toolkit C http://www.urlblaze.net/ -id_t_z_011108_4 urlfan-bot/1.0; +http://www.urlfan.com/site/bot/350.html ://URLFAN news crawler R 70.165.48.16x http://www.urlfan.com/ -id_t_z_1407 URLGetFile URLGetFile downloading tool D http://shazron.com/freeware/java-utils/ -id_t_z_1404 URL_Spider_Pro/x.x Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool R http://www.innerprise.net/ -id_t_z_1405 URL_Spider_Pro/x.x+(http://www.innerprise.net/usp-spider.asp) Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool R http://www.innerprise.net/ -id_t_z_291006_1 User-Agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com BoardReader search favicon fetcher D 208.65.71.xx http://www.boardreader.com/ http://www.internetadsales.com/modules/news/article.php?storyid=4050 -id_t_z_081206_1 User-Agent: BoardReader Image Fetcher /1.0 info@boardreader.com BoardReader search image fetcher D 208.65.71.xx http://www.boardreader.com/ http://www.internetadsales.com/modules/news/article.php?storyid=4050 -id_t_z_060206_2 User-Agent: LjSEEK Picture-Bot /1.0 contact@ljseek.com ljpic.com - LiveJournal picture feed search C http://www.ljpic.com/ -id_t_z_1408 User-Agent: FileHeap! file downloader (http://www.fileheap.com) FileHeap download manager D http://www.fileheap.com -id_t_z_270306_2 User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) Malformed UA header from some guestbook/forum spammer S -id_t_z_1409 User-Agent: Mozilla/4.0 (SKIZZLE! Distributed Internet Spider v1.0 - www.SKIZZLE.com) Skizzle search robot R http://www.skizzle.com/ -id_t_z_1410 user-agent=Mozilla/3.01Gold unknown robot (reads robots.txt) or sitegrabber. From different IPs- ie.: 62.98.8.xx (wind.it) R D ? -id_t_z_1411 USyd-NLP-Spider (http://www.it.usyd.edu.au/~vinci/bot.html) University of Sydney NLP Spider for research in Natural Language Processing R http://www.it.usyd.edu.au/~vinci/bot.html -id_t_z_1412 UtilMind HTTPGet Web Thief Site Grabber D http://www.utilmind.com/scripts/webthief.html -id_t_z_1413 Utopia WebWasher 3.0 WebWasher ad filter P B http://www.webwasher.com/ -id_t_z_100406_1 uTorrent/1500 uTorrent BitTorrent client D http://www.utorrent.com/ -id_t_z_060108_2 VadixBot Unknown bad behaving bot via Road Runner - see link S 67.78.34.1[6-7][0-9] - 70.112.211.2x http://mikesblog.americasdebate.com/2007/06/06/vadixbot-look-out/ -id_t_z_050406_4 Vagabondo-WAP/2.0 (webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)/1.0 Profile WiseGuys WAP pages robot R http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_1414 Vagabondo/1.x MT (webagent@wise-guys.nl) WiseGuys robot Netherland - 82.94.216.2 R s. also Mozilla/3.0 (Vagabondo... http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_1415 Vagabondo/2.0 MT WiseGuys robot Netherland - 82.94.216.2 R s. also Mozilla/3.0 (Vagabondo... http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_1416 Vagabondo/2.0 MT (webagent at wise-guys dot nl) WiseGuys robot Netherland - 82.94.216.2 R s. also Mozilla/3.0 (Vagabondo... http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_1417 Vagabondo/2.0 MT (webagent@NOSPAMwise-guys.nl) WiseGuys robot Netherland - 82.94.216.2 R s. also Mozilla/3.0 (Vagabondo... http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_021205_2 Vagabondo/3.0 (webagent at wise-guys dot nl) WiseGuys robot Netherland - 82.94.216.2 R s.also - Mozilla/3.0 (Vagabondo... http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk -id_t_z_1418 Vakes/0.01 (Vakes; http://www.vakes.com/; search@vakes.com) Open Directory link checking from Vakes R http://www.vakes.com/ -id_t_z_1420 VayalaCreep-v0.0.1 (haploid@haploid.com) unknown level3.net (63.214.172.xxx) robot -id_t_z_1419 Vayala|Creep-v0.0.1 (codepoet@wildties.com) unknown level3.net (63.214.172.xxx) robot -id_t_z_1421 vb wininet iNet Grabber - Internet content grabber D http://www.aldostools.com/igrabber.html -id_t_z_1422 versus 0.2 (+http://versus.integis.ch) Versus Project robot - Comparing methods for near-uniform URL sampling R http://versus.integis.ch/ -id_t_z_1423 versus crawler eda.baykan@epfl.ch Unknown robot from EPFL University Switzerland (128.178.155.xxx) R http://www.epfl.ch/Eindex.html -id_t_z_120408_1 Verticrawlbot Verticrawl - Semantic search engine solution (French) C http://www.verticrawl.com/fr/homepage.php -id_t_z_1424 VeryGoodSearch.com.DaddyLongLegs VeryGoodSearch.com link submission checking R http://www.verygoodsearch.com/ -id_t_z_1425 verzamelgids.nl - Networking4all Bot/x.x Verzamelgids NL link checking robot R 213.247.50.xx http://www.verzamelgids.nl/ -id_t_z_181006_2 Verzamelgids/2.2 (http://www.verzamelgids.nl) Verzamelgids NL link checking robot R 213.247.50.xx http://www.verzamelgids.nl/ -id_t_z_030406_1 Vespa Crawler Unknown robot from Yahoo Norway R 217.144.236.x http://no.yahoo.com/ -id_t_z_190206_1 virus_detector (virus_harvester@securecomputing.com) Sidewinder G2 anti-virus and anti-spyware protection D http://www.securecomputing.com/sg2_antivirus.cfm?menu=solutions -id_t_z_140407_1 VisBot/2.0 (Visvo.com Crawler; http://www.visvo.com/bot.html; bot@visvo.com) Visbot crawler for a search software under development R 63.133.162..xx http://www.visvo.com/bot.html -id_t_z_1426 Visicom Toolbar Some IE toolbar made with Visicom Media Dynamic Toolbar software B http://www.dynamictoolbar.com/en/products/toolbar/ -id_t_z_1427 Vision Research Lab image spider at vision.ece.ucsb.edu Vision research lab's Cortina - content based image retrieval (128.111.60.xx) R http://vision.ece.ucsb.edu/multimedia/cortina.html -id_t_z_160906_1 VLC media player - version 0.8.5 Janus - (c) 1996-2006 the VideoLAN team VLC - Cross-platform media player and streaming server B http://www.videolan.org/vlc/ -id_t_z_140806_1 VMBot/0.x.x (VMBot; http://www.VerticalMatch.com/; vmbot@tradedot.com) VM - Vertical Search Engine (China) R 202.83.221.2xx http://www.verticalmatch.com/ -id_t_z_020106_1 Vortex/2.2 (+http://marty.anstey.ca/robots/vortex/) Vortex Web Indexing Robot for a study on internet link distribution R http://marty.anstey.ca/projects/robots/vortex/ -id_t_z_041207_1 voyager-hc/1.0 Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx) R s. also - cfetch/1.x - carleson/1.x http://www.kosmix.com/ -id_t_z_231105_1 voyager/1.0 Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx) R s. also - cfetch/1.x - carleson/1.x http://www.kosmix.com/ -id_t_z_301108_3 voyager/2.0 (http://www.kosmix.com/html/crawler.html) Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx) R s. also - cfetch/1.x - carleson/1.x http://www.kosmix.com/ -id_t_z_171105_3 VSE/1.0 (testcrawler@hotmail.com) Vivisimo search crawler (206.210.89.xxx) R http://www.vivisimo.com/ -id_t_z_171105_4 VSE/1.0 (testcrawler@vivisimo.com) Vivisimo search crawler (206.210.89.xxx) R http://www.vivisimo.com/ -id_t_z_1428 vspider Verity vspider indexing software R http://www.verity.com/ -id_t_z_1429 vspider/3.x Verity vspider indexing software R http://www.verity.com/ -id_t_z_130707_1 VWBOT/Nutch-0.9-dev (VWBOT Nutch Crawler; http://vwbot.cs.uiuc.edu;+vwbot@cs.uiuc.edu VWBot - MetaQuerier Crawler for the MetaQuerier project at the University of Illinois R 192.17.240.xx http://vwbot.cs.uiuc.edu/ http://metaquerier.cs.uiuc.edu/ -id_t_z_1431 W3C-checklink/3.x.x.x libwww-perl/5.xx W3C Link Checker C http://validator.w3.org/checklink -id_t_z_1432 W3C-checklink/4.x [4.xx] libwww-perl/5.xxx W3C Link Checker C http://validator.w3.org/checklink -id_t_z_080806_1 W3C-WebCon/5.x.x libwww/5.x.x WebCon - the Libwww command line tool D http://www.w3.org/ComLine/ -id_t_z_1433 W3CLineMode/5.4.0 libwww/5.x.x W3C Line Mode (character based Web browser) B http://www.w3.org/LineMode/ -id_t_z_1434 W3CRobot/5.4.0 libwww/5.4.0 Unknown link checking using Libwww via Korea Telecom (221.148.44.xxx) C http://www.w3.org/Library/ -id_t_z_1430 W3C_Validator/1.xxx libwww-perl/5.xx W3C HTML-Code Validator C http://validator.w3.org/ -id_t_z_1435 w3m/0.x.xx w3m Linux pager / text-based browser B http://w3m.sourceforge.net/ -id_t_z_1436 W3SiteSearch Crawler_v1.1 http://www.w3sitesearch.de W3 Site Search (Germany) search engine solution R http://www.w3sitesearch.de/ -id_t_z_061206_3 wadaino.jp-crawler 0.2 (http://wadaino.jp/) Wadain (Japan) Blog / RSS search crawler R 202.51.14.1xx http://wadaino.jp/ -id_t_z_1437 WannaBe (Macintosh; PPC) Wanna-Be text mode browser B http://mindstory.com/wb2/ -id_t_z_270906_1 WapOnWindows 1.0 WapOnWindows WAP browser for PCs B Site is dead http://www.waponwindows.com/ -id_t_z_250206_2 Watchfire WebXM 1.0 Watchfire WebXM intranet solution P http://www.watchfire.com/products/webxm/default.aspx -id_t_z_200706_1 WAVcheck 1.0.x (http://www.webbanalys.se/apps/WAVcheck/) WAVcheck - Simple Vendor Discovery Tool for detecting client-side tags from web analytics vendors C http://www.webbanalys.se/apps/WAVcheck/ -id_t_z_110106_1 Wavefire/0.8-dev (Wavefire; http://www.wavefire.com; info@wavefire.com) Wavefire local search community engine (64.141.15.1xx) R http://www.wavefire.com/ -id_t_z_110206_5 Waypath development crawler - info at waypath dot com Waypath blog discovery engine robot R http://www.waypath.com/ -id_t_z_110206_6 Waypath Scout v2.x - info at waypath dot com Waypath blog discovery engine robot R http://www.waypath.com/ -id_t_z_1438 WDG_Validator/1.1 WDG HTML-code validator C http://www.htmlhelp.tne.co.uk/tools/validator/ -id_t_z_1439 Web Image Collector Datafire.com's Web Image Collector (graphics downloading tool) D http://www.datafire.com/ -id_t_z_1440 Web Link Validator 1.5 Relsoft link checking software C http://www.relsoftware.com/ -id_t_z_1441 Web Snooper RankMeter ranking software R http://www.searchutilities.com/ -id_t_z_010206_2 web-bekannt (Version: 1.02, powered by www.internetservice-franken.de) Web-bekannt German web directory link checking C http://www.web-bekannt.de/ -id_t_z_010206_1 web-bekannt (Version: 1.02, powered by www.web-bekannt.de) Web-bekannt German web directory link checking C http://www.web-bekannt.de/ -id_t_z_1442 Web-Bot V1.03 Unkown link or server checking from Würzburg University Germany (132.187.10.xx) R C http://informatik.uni-wuerzburg.de/ -id_t_z_1443 Web-Robot/5.0 (en-US; web-robot.com/policy.html) Web-Robot Crawler/2.0.3 Unknown robot from 69.50.233.x (nectartech.com) no active website -id_t_z_010107_2 web2express.org/Nutch-0.9-dev (leveled playing field; http://web2express.org/; info at web2express.org) Web2Express / Web2x - Open data searching tool R http://search.web2express.org/search/search.html -id_t_z_050206_1 WebAlta Crawler/1.2.1 (http://www.webalta.ru/bot.html) WebAlta search Russia crawler (85.21.201.xx) R http://www.webalta.ru/ -id_t_z_250806_1 WebarooBot (Webaroo Bot; http://64.124.122.252/feedback.html) WebarooBot / RufusBot from webaroo offline search service R 64.124.122.2xx http://www.webaroo.com/ http://www.webaroo.com/company/site-owners -id_t_z_210407_1 WebarooBot (Webaroo Bot; http://www.webaroo.com/rooSiteOwners.html) WebarooBot / RufusBot from webaroo offline search service R 64.124.122.2xx http://www.webaroo.com/ http://www.webaroo.com/company/site-owners -id_t_z_1444 WebAuto/3.4xxx (WinNT; I) Yanasoft WebAuto website copier / downloading tool D http://www.yanasoft.co.jp/webauto.html -id_t_z_1445 webbandit/4.xx.0 Web Bandit personal search software R http://softwaresolutions.net/webbandit/ -id_t_z_140106_2 WebBug/5.x Amansoft WebBug web server protocol test C http://www.cyberspyder.com/webbug.html -id_t_z_1446 Webclipping.com WebClipping.com - online news monitoring service R http://www.webclipping.com -id_t_z_1447 webcollage/1.xx WebCollage Syndicator graphics crawler/collector R D s. also collage.cgi/1.xx http://www.webcollage.com/ -id_t_z_1448 WebCompass 2.0 Quarterdecks WebCompass search tool R -id_t_z_1449 WebCopier vx.x WebCopier offline browser D B http://www.maximumsoft.com/ -id_t_z_1450 WebCopier vx.xa WebCopier offline browser D B http://www.maximumsoft.com/ -id_t_z_210506_1 WebCorp/1.0 WebCorp linguistic search engine (UK) R 193.60.130.xx http://webcorp.uce.ac.uk/ -id_t_z_1451 webcrawl.net Webcrawl Search robot (64.40.105.xxx) R http://www.webcrawl.net/ -id_t_z_1452 WebDownloader for X x.xx Unix/Linux Web Downloader D http://www.krasu.ru/soft/chuchelo/ -id_t_z_1453 Webdup/0.9 Unknown robot from china-netcom.com -id_t_z_1454 WebFetch WingFlyer WebFetch website downloading tool D B http://www.wingflyer.com/ -id_t_z_1455 webfetch/5.x.x webfetch - command line tool to fetch files via HTTP D http://tony.aiu.to/sa/webfetch/ -id_t_z_310806_2 WebFilter Robot 1.0 Verso NetSpective WebFilter P http://www.verso.com/enterprise/netspective/webfilter.asp -id_t_z_1456 WebFilter Robot 1.x Telemate.net NetSpective WebFilter P http://www.telemate.net/ -id_t_z_1457 WebFindBot(http://www.web-find.com) Webfind search robot R http://www.web-find.com/ -id_t_z_1458 Webglimpse 2.xx.x (http://webglimpse.net) Webglimpse search engine software R http://www.webglimpse.net/ -id_t_z_150306_2 webGobbler/1.x.x webGobbler - Online random image generator R D http://sebsauvage.net/webgobbler/ -id_t_z_1459 webhack fake ? -id_t_z_290807_2 WebImages 0.3 ( http://herbert.groot.jebbink.nl/?app=WebImages ) herbert.groot.jebbink.nl Web Images collage generator D 212.204.217.1xx http://herbert.groot.jebbink.nl/ -id_t_z_280306_2 WebLight/4.x.x (support@illumit.com; http://www.illumit.com/Products/weblight/) WebLight web analyzer & link checker C s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com... http://www.illumit.com/Products/weblight/ -id_t_z_1460 Weblink's checker/ WebLink's link management system for HTTP- FTP and Mail hyperlinks C sometimes in conjunction w. PHP/4.0.6 http://www.harlequin.ch/technologien/tools/weblinks.php -id_t_z_140307_1 Weblog Attitude Diffusion 1.0 Los Alamos National Laboratoy weblog research project R http://www.user-agents.org/agents/weblogattitude.shtml http://www.lanl.gov/ -id_t_z_230606_1 webmeasurement-bot, http://rvs.informatik.uni-leipzig.de Unknown robot from Leipzig University (Germany) faculty for computer science R 139.18.38.1xx http://rvs.informatik.uni-leipzig.de/ -id_t_z_1461 WebMiner/x.x [en] (Win98; I) WebMiner bulk file downloader D http://tribolic.com/webminer/ -id_t_z_1462 WeBoX/0.xx WeBoX (Japan) - Browser and web collector B D http://www-nishio.ise.eng.osaka-u.ac.jp/~nakamura/webox/ -id_t_z_1463 WebPix 1.0 (www.netwu.com) WebPix - picture downloading tool D http://www.netwu.com/webpix/ -id_t_z_1464 WebQL Caesius WebQL - Custom robot/agent generator / web extraction software B D http://www.caesius.com/ -id_t_z_1465 WebRACE/1.1 (University of Cyprus- Distributed Crawler) WebRACE - HTTP retrieval- annotation and caching engine P http://www.cs.ucy.ac.cy/Projects/eRACE/webrace.html -id_t_z_130907_1 WebRankSpider/1.37 (+http://ulm191.server4you.de/crawler/) WebRankSpider experimental web crawler R 62.75.202.1xx http://ulm191.server4you.de/crawler/ -id_t_z_1468 WebReaper vx.x - www.webreaper.net Webreaper download manager D http://www.webreaper.net/ -id_t_z_1466 WebReaper [info@webreaper.net] Webreaper download manager D http://www.webreaper.net/ -id_t_z_1467 WebReaper [webreaper@webreaper.net] Webreaper download manager D http://www.webreaper.net/ -id_t_z_1469 WebSearch.COM.AU/3.0.1 (The Australian Search Engine; http://WebSearch.COM.AU; Search@WebSearch.COM.AU) Websearch Australia robot R http://WebSearch.COM.AU/ -id_t_z_1470 WebSearchBench WebCrawler v0.1(Experimental) Dortmund University WebSearchBench - Open source search software R http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de -id_t_z_1471 WebSearchBench WebCrawler V1.0 (Beta)- Prof. Dr.-Ing. Christoph Lindemann- Universität Dortmund- cl@cs.uni-dortmund.de- http://websearchbench.cs.uni-dortmund.de/ Dortmund University WebSearchBench - Open source search software R http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de -id_t_z_260806_2 Website Explorer/0.9.x.x Web site downloading tool and offline browser (Japan) D http://www.umechando.com/webex/ -id_t_z_1472 Website eXtractor Website eXtractor web site downloading tool D http://www.asona.org/ http://www.internet-soft.com/ -id_t_z_090606_1 WebsiteWorth v1.0 Sootle web directory Website Worth ranking tool R 216.89.111.x http://directory.sootle.com/website-worth/ -id_t_z_1473 Webspinne/1.0 webmaster@webspinne.de Webspinne.de robot R http://www.webspinne.de/ -id_t_z_1474 Websquash.com (Add url robot) Websquash.com Search Engine robot / link checking R http://www.websquash.com/ -id_t_z_1475 WebStat/1.0 (Unix; beta; 20040314) WebStat - Java statistical computing environment for the web R http://www.math.psu.edu/babcock/webstat/version1.0/ -id_t_z_091006_2 Webster v0.3 ( http://webster.healeys.net/ ) Webster - Rev. Healeys web crawler R 24.99.22.xx http://webster.healeys.net/ http://webster.healeys.net/search.php -id_t_z_1476 webster-internet.de pad browser Websters Webmaster Archive (Germany) submission / pad checking C B http://webster.de/ -id_t_z_1477 WebStripper/2.xx WebStripper download manager D http://webstripper.net/index.html http://www.netidea.it -id_t_z_1478 WebTrafficExpress/x.0 WebTrafficExpress IBM server software P -id_t_z_1479 WebTrends/3.0 (WinNT) Web Trends link analyzer C http://www.netiq.com/webtrends/default.asp -id_t_z_1480 WebVac (webmaster@pita.stanford.edu) The Stanford WebBase Project crawler R ex Pita- s. there http://www-diglib.stanford.edu/~testbed/doc2/WebBase/ -id_t_z_1481 WebVal/1.0 webval - Python link checking tool C http://www.alcyone.com/pyos/webval/ -id_t_z_171205_3 Webverzeichnis.de - Telefon: 01908 / 26005 Webverzeichnis.de (Germany) directory robot R http://www.webverzeichnis.de/ -id_t_z_060306_1 WebVulnCrawl.unknown/1.0 libwww-perl/5.803 Web Vulnerability Crawler S Looking for excluded directories in robots.txt http://webvulncrawl.blogspot.com/2005/12/what-am-i-doing.html -id_t_z_1482 WebWatcherMonitor/2.01 Studio Net.Idea's Web Watcher Monitor robot R C http://www.web-watcher.com/web-watcher-monitor.html -id_t_z_1483 WebZIP/x.x (http://www.spidersoft.com) WebZip offline browser B D http://www.spidersoft.com/ -id_t_z_1484 Wells Search II Unknown spam bot / harvester (62.163.**.** / 62.194.**.*) S s.also - Port Huron Labs -id_t_z_1485 WEP Search 00 Some spam bot- see link S http://www.kloth.net/internet/badbots-2004.php -id_t_z_230606_2 West Wind Internet Protocols 4.xx wwIPStuff - Internet client tools for Visual FoxPro B D http://www.west-wind.com/wwipstuff.asp -id_t_z_1486 WFARC IBM's Almaden Research robot (Clever search project) R s. also: - http://www.almaden.ibm.com/cs/crawler - FocusedSampler http://www.almaden.ibm.com/cs/k53/clever.html -id_t_z_1488 Wget/1.x(.x)GNU wget http://www.gnu.org/software/wget/wget.html - file downloader GNU wget - file downloader D http://www.gnu.org/software/wget/wget.html -id_t_z_1489 Wget/1.x+cvs-stable (Red Hat modified) GNU wget - file downloader D http://www.gnu.org/software/wget/wget.html -id_t_z_1487 Wget/1.x.x+cvs GNU wget - file downloader D http://www.gnu.org/software/wget/wget.html -id_t_z_1490 Whatsup/x.x Whatsup Gold network monitor C http://www.ipswitch.com/products/network-management.html -id_t_z_1491 whatUseek_winona/3.0 WhatUSeek / Chubba robot R 166.90.205.x http://www.whatuseek.com/ -id_t_z_1492 WhizBang! Lab WhizBang! Labs (closed since May 2002) information extraction robot R -id_t_z_1493 Wildsoft Surfer some download agent D - in conjunction w. dlman -id_t_z_1494 Willow Internet Crawler by Twotrees V2.1 Twotrees crawler R http://www.twotrees.com/ -id_t_z_1495 WinampMPEG/2.00 (larbin@unspecified.mail) unknown robot from gw.ocg-corp.com (209.126.176.x) see also: - Opera/6.01 (larbin@.....) - MSIE-5.13 larbin@.... -id_t_z_1496 WincerSong Agent v1.0 Super Affiliate Tracker agent by Wincer Song http://www.superaffiliatetracker.com/index.htm -id_t_z_191105_3 Windows-Media-Player/10.00.00.xxxx Windows Media Player 10 B -id_t_z_160107_1 WinGet 1.1 Nicksoft WinGet download manager D Domain is for sale -id_t_z_060406_1 WinHTTP Example/1.0 Example code for a WinHTTP C++ library crawler R http://www.codeguru.com/cpp/i-n/internet/http/article.php/c6237/ http://www.microsoft.com/msdownload/platformsdk/sdkupdate/update.htm -id_t_z_260506_1 WinkBot/0.06 (Wink.com search engine web crawler; http://www.wink.com/Wink:WinkBot; winkbot@wink.com) Wink beta search robot (64.13.136.x) R http://www.wink.com/ -id_t_z_010607_1 WinPodder (http://winpodder.com) WinPodder - Podcast player and RSS reader B http://winpodder.com/ -id_t_z_251105_1 WinWAP/3.x (3.x.x.xx; Win32) (Google WAP Proxy/1.0) WinWap - Windows PC WAP browser B http://www.winwap.com/products_2_1.php -id_t_z_111206_2 Wir sind die Borg (Version: 1.03, Sie wurden Assimiliert +http://www.yammba.com/suchmaschine/bot.html) Yammba web directory (Germany) link checking C http://www.yammba.com/ -id_t_z_130506_2 WIRE/0.11 (Linux; i686; Bot,Robot,Spider,Crawler,aromano@cli.di.unipi.it) WIRE crawler used by the University of Pisa - Italy R 146.48.82.xx http://www.cwr.cl/projects/WIRE/ http://www.unipi.it/english/index.htm -id_t_z_1497 WIRE/0.x (Linux; i686; Bot,Robot,Spider,Crawler) WIRE - Web information retrieval environment crawler R Used by different IPs for different purposes http://www.cwr.cl/projects/WIRE/ -id_t_z_1498 WISEbot/1.0 (WISEbot@koreawisenut.com; http://wisebot.koreawisenut.com) Korea Wisenut robot R http://www.koreawisenut.com/ -id_t_z_1499 WiseWire-Spider2 Wisewire domain checker (Discontinued) R C http://www.wisewire.com/ -id_t_z_110107_2 wish-project (http://wish.slis.tsukuba.ac.jp/) WISH academic research project for link checking C 133.51.22.xx http://wish.slis.tsukuba.ac.jp/ -id_t_z_1500 WordChampBot Wordchamp web page vocabulary / translation robot B D http://www.wordchamp.com/ -id_t_z_301105_1 WordPress/x.x.x.x PHP/4.x.xx WordPress personal Blog publishing platform B http://wordpress.org/ -id_t_z_100207_1 worio heritrix bot (+http://worio.com/) WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler R 137.82.84.xx http://www.worio.com/ http://www.archive.org/ -id_t_z_291007_1 woriobot ( http://www.worio.com/) WORIO (beta) search for computer scientists and programmers via Amazon Web Services R 67.202.45.2xx http://www.worio.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_t_z_1501 WorldLight Entireweb Search robot (62.13.25.xxx) R s. also Mozilla/4.0 (compatible; SpeedySpider .... http://www.entireweb.com/ -id_t_z_1502 WorQmada/1.0 unknown link checking (from 4.18.57.126) ? C -id_t_z_1503 Wotbox/alpha0.6 (bot@wotbox.com; http://www.wotbox.com) Wotbox spider R http://www.wotbox.com/ -id_t_z_1504 Wotbox/alpha0.x.x (bot@wotbox.com; http://www.wotbox.com) Java/1.4.1_02 Wotbox spider R http://www.wotbox.com/ -id_t_z_1505 WSB WebCrawler V1.0 (Beta)- cl@cs.uni-dortmund.de WebSearchBench crawler from Dortmund University- Germany R http://websearchbench.cs.uni-dortmund.de/ -id_t_z_1506 WSB, http://websearchbench.cs.uni-dortmund.de WebSearchBench crawler from Dortmund University- Germany R http://websearchbench.cs.uni-dortmund.de/ -id_t_z_1507 wume_crawler/1.1 (http://wume.cse.lehigh.edu/~xiq204/crawler/) WUME Lab's web crawler (128.180.121.xxx) R http://wume.cse.lehigh.edu/~xiq204/crawler/ -id_t_z_1508 Wusage/x.0@boutell.com Wusage log-file analysis R C http://www.boutell.com/wusage/ -id_t_z_120106_2 Wwlib/Linux WWLib - Wolverhampton Univerity Web Library for classifying web documents R http://www.scit.wlv.ac.uk/wwlib/ -id_t_z_1509 WWSBOT 1.x [--- http://www.analyzer.nu ---] WWSBOT web server version checker C http://www.analyzer.nu/Perl/WWSBOT.html -id_t_z_170506_2 WWW-Mechanize/1.1x Perl web page fetching module D http://search.cpan.org/dist/WWW-Mechanize/ -id_t_z_1510 www.arianna.it Arianna robot R http://arianna.libero.it/ -id_t_z_1511 www.business-socket.com registry verify/1.x Business-Socket.com link checking ? C http://www.business-socket.com -id_t_z_221006_2 www.doweb.co.uk crawler The DoWeb UK Business directory link checking C 85.13.252.x http://www.doweb.co.uk/action_home+page.htm -id_t_z_1512 www4mail/2.x libwww-FM/2.14 (Unix; I) www4mail - web navigation & database search by e-mail http://www4mail.org/ -id_t_z_1513 WWWC/1.0x WWWC Updating check of Web pages. (Japanese only) C http://www.nakka.com/soft/index_eng.html -id_t_z_1514 WWWeasel Robot v1.00 (http://wwweasel.de) World Wide Weasel Germany robot R http://wwweasel.de/ -id_t_z_1515 WWWOFFLE/2.x WWWoffle download manager D http://www.gedanken.demon.co.uk/wwwoffle/ -id_t_z_1516 wwwster/1.x (Beta- mailto:gue@cis.uni-muenchen.de) Unknown robot from CIS at Munich University R 129.187.254.xxx http://www.cis.uni-muenchen.de/ -id_t_z_050208_5 wxDownload Fast wxDownload Fast (wxDFast) open source download manager D http://dfast.sourceforge.net/index.html -id_t_z_1517 X-Crawler Arexera (Germany) crawler software R http://www.arexera.de/de/products/crawler.php -id_t_z_1518 Xaldon WebSpider Xaldon WebSpider offline browser B D http://www.xaldon.de/produkte_webspider.html -id_t_z_1519 Xenu Link Sleuth 1.xx Xenu link checker C http://home.snafu.de/tilman/xenulink.html -id_t_z_1520 Xenu's Link Sleuth 1.x[a-z] Xenu link checker C http://home.snafu.de/tilman/xenulink.html -id_t_z_270706_2 Xerka WebBot v1.0.0 [UPVOpenDir] XerKa text mining and information retrieval software D http://www.diana-teknologia.com/www1/english/xerka.htm -id_t_z_250106_2 xine/1.0 xine - free Linux / OS/2 multimedia player B http://xinehq.de/ -id_t_z_141205_3 xirq/0.1-beta (xirq; http://www.xirq.com; xirq@xirq.com) XIRQ search (beta) robot (70.86.206.1xx) R http://www.xirq.com/ -id_t_z_160806_1 XMLSlurp/0.1 libwww-perl/5.805 GPath / XMLSlurp - Expression language for tree structured data http://groovy.codehaus.org/GPath -id_t_z_070506_1 XRL/2.00b1 (Linux; i686; en-us) (+http://metamark.net/about) Metamark URL Shorten Service P http://metamark.net/ -id_t_z_200308_3 Xylix Xylix Retrieval System software C http://www.xylixsoftware.ch/retrievalsystem.php -id_t_z_1521 xyro_(xcrawler@cosmos.inria.fr) Inria Crawler R http://www.inria.fr/ -id_t_z_081205_1 Y!J-BSC/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html) Yahoo Search Japan robot (211.14.8.2xx) R s. also Mozilla/4.0 (compatible; Y!J... http://www.yahoo.co.jp/ -id_t_z_271006_2 Y!J-SRD/1.0 Yahoo Search Japan robot (203.216.197.xxx) R s. also DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0 ... http://www.yahoo.co.jp/ -id_t_z_240106_3 Y!J/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html) Yahoo Search Japan robot (211.14.8.2xx) R s. also Mozilla/4.0 (compatible; Y!J... http://www.yahoo.co.jp/ -id_t_z_220206_2 Y!OASIS/TEST no-ad Mozilla/4.08 [en] (X11; I; FreeBSD 2.2.8-STABLE i386) Yahoo picture service for mobiles P 217.12.4.xx -id_t_z_1522 Y!TunnelPro Y!TunnelPro - Yahoo! Messenger companion user agent B s. YTunnelPro http://www.ytunnelpro.com/ -id_t_z_121205_1 yacy (www.yacy.net; v20040602; i386 Linux 2.4.26-gentoo-r13; java 1.4.2_06; MET/en) Yacy distributed P2P web search engine robot R http://www.yacy.net/ -id_t_z_260306_4 yacybot (x86 Windows XP 5.1; java 1.5.0_06; Europe/de) yacy.net Yacy distributed P2P web search engine robot R http://www.yacy.net/ -id_t_z_300707_2 Yahoo Pipes 1.0 (Yahoo) Pipes interactive data aggregator robot R http://pipes.yahoo.com/pipes/ -id_t_z_100406_2 Yahoo! Mindset Yahoo Mindset: Intent-driven Search (66.228.182.1xx) R s. also Mozilla/4.0 http://mindset.research.yahoo.com/ -id_t_z_040106_2 Yahoo-Blogs/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html ) Yahoo blog indexing robot (209.191.83.1xx) R http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html -id_t_z_1523 Yahoo-MMAudVid/1.0 (mms dash mmaudvidcrawler dash support at yahoo dash inc dot com) Yahoo multimedia crawler (206.190.43.xx) R -id_t_z_080108_2 Yahoo-MMAudVid/2.0(mms dash mm aud vid crawler dash support at yahoo dash inc.com ;Mozilla 4.0 compatible; MSIE 7.0;Windows NT 5.0; .NET CLR 2.0) Yahoo multimedia crawler R -id_t_z_1524 Yahoo-MMCrawler/3.x (mm dash crawler at trd dot overture dot com) Yahoo multimedia crawler via Fastsearch.net (66.77.73.xx) R see also FAST-WebCrawler/3.x Multimedia... -id_t_z_110806_1 Yahoo-Test/4.0 Yahoo Search robot R 216.145.49.xx -id_t_z_1525 Yahoo-VerticalCrawler-FormerWebCrawler/3.9 crawler at trd dot overture dot com; http://www.alltheweb.com/help/webmaster/crawler Yahoo crawler via Overture (66.77.73.3x) R -id_t_z_010906_2 YahooFeedSeeker/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://publisher.yahoo.com/rssguide) Yahoo Publisher Network RSS crawler R http://publisher.yahoo.com/rssguide -id_t_z_1526 YahooSeeker-Testing/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/) Yahoo Product Search crawler ( 68.142.195..x) R -id_t_z_1527 YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/) Yahoo Product Search crawler ( 66.196.93.x) R -id_t_z_1528 YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/yahooseeker.html) Yahoo Product Search crawler ( 66.196.93.x) R -id_t_z_1529 YahooSeeker/1.1 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/) Yahoo Product Search crawler ( 66.196.93.x) R -id_t_z_1530 YahooSeeker/bsv3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html ) Yahoo Product Search crawler ( 68.142.195..x) R -id_t_z_1531 YahooSeeker/CafeKelsa-dev (compatible; Konqueror/3.2; FreeBSD ;cafekelsa-dev-webmaster@yahoo-inc.com ) Yahoo robot R 64.157.137.xxx -id_t_z_231106_2 Yandex/1.01.001 (compatible; Win16; I) Yandex Search Russia link checking (213.180.206.2xx) R s. also Mozilla/4.0 (compatible; MSIE 5.0; YANDEX) http://www.yandex.ru -id_t_z_301108_2 Yanga WorldSearch Bot v1.1/beta (http://www.yanga.co.uk/) Yanga search robot by Gigabase (Russian Federation) R 91.205.124.x http://www.yanga.co.uk/ -id_t_z_1532 yarienavoir.net/0.2 Yarienavoir search (Belgium) robot R 217.71.121.xx http://www.yarienavoir.net/ -id_t_z_300506_1 Yeti 1noon.com search Korea robot (222.231.21.xxx) R uses also a blank UA field http://www.1noon.com/ -id_t_z_040407_1 Yeti/0.01 (nhn/1noon, yetibot@naver.com, check robots.txt daily and follows it) 1noon.com search Korea robot (222.231.21.xxx) R uses also a blank UA field http://www.1noon.com/ -id_t_z_301108_1 Yeti/1.0 (NHN Corp.; http://help.naver.com/robots/) Naver search (Korea) robot R 61.247.222.xx http://www.naver.com/ -id_t_z_290407_2 yggdrasil/Nutch-0.9 (yggdrasil biorelated search engine; www dot biotec dot tu minus dresden do de slash schroeder; heiko dot dietze at biotec dot tu minus dresden dot de) yggdrasil spider for GoPubMed biorelated search engine R 141.30.193.x[x] http://www.biotec.tu-dresden.de/schroeder http://gopubmed.biotec.tu-dresden.de/ -id_t_z_211206_3 YodaoBot/1.0 (http://www.yodao.com/help/webmaster/spider/; ) Yodao search (China) R 60.191.80.xx http://www.yodao.com/ -id_t_z_110308_1 yoofind/yoofind-0.1-dev (yoono webcrawler; http://www.yoono.com ; MyEmail) Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx) R s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoono/1.0 web-crawler .. http://www.yoono.com/ -id_t_z_210106_3 yoogliFetchAgent/0.1 Yoogli search (under development) agent R http://www.yoogli.com/ -id_t_z_120606_1 yoono/1.0 web-crawler/1.0 Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx) R s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoofind/yoofind .. http://www.yoono.com/ -id_t_z_1533 YottaCars_Bot/4.12 (+http://www.yottacars.com) Car Search Engine YottaCars bot - YottaCar car search engine ( 64.62.175.xxx) R s. also OmniExplorer_Bot http://www.yottacars.com/ -id_t_z_1534 YottaShopping_Bot/4.12 (+http://www.yottashopping.com) Shopping Search Engine YottaShopping bot - YottaShopping search engine ( 64.62.175.xxx) R s. also OmniExplorer_Bot http://www.yottashopping.com/ -id_t_z_1535 YTunnelPro Y!TunnelPro - Yahoo! Messenger companion user agent B s. Y!TunnelPro http://www.ytunnelpro.com/ -id_t_z_1536 Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/) Z-Add online link checker C http://w3.z-add.co.uk/linkcheck/ -id_t_z_1537 Zao-Crawler Zao crawler for Kototoi Project R http://www.kototoi.org/zao/ -id_t_z_1538 Zao-Crawler 0.2b Zao crawler for Kototoi Project R http://www.kototoi.org/zao/ -id_t_z_1539 Zao/0.1 (http://www.kototoi.org/zao/) Zao crawler for Kototoi Project R http://www.kototoi.org/zao/ -id_t_z_1540 ZBot/1.00 (icaulfield@zeus.com) Zeus Internet Marketing Robot based on Webster Pro component R http://cyber-robotics.com/ http://www.homepagesw.com/ -id_t_z_111205_5 Zearchit Zearchit German search / directory R 212.227.109.1xx http://www.zearchit.de/ -id_t_z_130106_2 ZeBot_lseek.net (bot@ze.bz) Ze.bz Moteur de Recherche robot R 213.251.135.xx http://www.ze.bz/ -id_t_z_1541 ZeBot_www.ze.bz (ze.bz@hotmail.com) Ze.bz Moteur de Recherche robot R 213.251.135.xx http://www.ze.bz/ -id_t_z_130806_2 zedzo.digest/0.1 (http://www.zedzo.com/) ZedZo Search (beta) robot R 24.62.50.1xx http://www.zedzo.com/ -id_t_z_210807_2 Zend_Http_Client Zend PHP frameworks Zend_Http_Client component D http://framework.zend.com/manual/en/zend.http.html -id_t_z_290208_2 zermelo Mozilla/5.0 compatible; heritrix/1.12.1 (+http://www.powerset.com) [email:crawl@powerset.com,email:paul@page-store.com] Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services R 67.202.34.xxx http://www.powerset.com/ http://www.amazon.com/gp/browse.html?node=3435361 -id_t_z_1542 zerxbot/Version 0.6 libwww-perl/5.79 Zerx search robot ? R 138.88.147.xxx http://www.zerx.com/ -id_t_z_1543 Zeus ThemeSite Viewer Webster Pro V2.9 Win32 Zeus Internet Marketing Robot (based on Webster Pro) R http://cyber-robotics.com/ -id_t_z_1544 Zeus xxxxx Webster Pro V2.9 Win32 Zeus Internet Marketing Robot (based on Webster Pro) R http://cyber-robotics.com/ -id_t_z_281105_1 Zeusbot/0.07 (Ulysseek's web-crawling robot; http://www.zeusbot.com; agent@zeusbot.com) Zeusbot robot for building the Ulsysseek.com index R powered by Nutch http://www.zeusbot.com/ http://www.ulysseek.com/ -id_t_z_1545 Ziggy -- The Clown From Hell!! Unknown agent (server- or link checking ?) from 198.173.158.xx C -id_t_z_1546 ZipppBot/0.xx (ZipppBot; http://www.zippp.net; webmaster@zippp.net) Zipp.net web search robot R http://www.zippp.net/ -id_t_z_1547 ZIPPPCVS/0.xx (ZipppBot/.xx;http://www.zippp.net; webmaster@zippp.net) Zipp.net web search robot R http://www.zippp.net/ -id_t_z_1548 Zippy v2.0 - Zippyfinder.com Zippyfinder robot R http://www.zippyfinder.com/ -id_t_z_1549 Zoo Tycoon 2 Client -- http://www.zootycoon.com Microsoft Zoo Tycoon 2 game client B http://www.zootycoon.com -id_t_z_1550 ZoomSpider - wrensoft.com Zoom Search Engine software spider R http://www.wrensoft.com/ -id_t_z_160110_1 Zscho.de Crawler/Nutch-1.0-Zscho.de-semantic_patch (Zscho.de Crawler collecting for machine learning; http://zscho.de/ ) Zscho search crawler (Germany) R 141.65.161.xx http://www.zscho.de/ -id_t_z_280306_1 zspider/0.9-dev http://feedback.redkolibri.com/ zspider robot for a new search engine R http://feedback.redkolibri.com/ -id_t_z_1551 ZyBorg/1.0 (ZyBorg@WISEnut.com; http://www.WISEnut.com) Wisenut robot R http://www.wisenutbot.com/ -id_new_190610_1 Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (FM Scene 4.6.1) FM Scene soccer fan pages plugin L http://www.fmscene.de -id_new_190610_2 Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (.NET CLR 3.5.30729) (Prevx 3.0.5) PrevX security plugin http://www.prevx.com \ No newline at end of file diff --git a/share/db/useragent.sql b/share/db/useragent.sql deleted file mode 100644 index 613eee2c..00000000 --- a/share/db/useragent.sql +++ /dev/null @@ -1,64 +0,0 @@ -CREATE TEMPORARY TABLE _useragent ( - id INT PRIMARY KEY, - string VARCHAR(500), - description VARCHAR(2000), - type VARCHAR(20), - comment VARCHAR(100), - link1 VARCHAR(1000), - link2 VARCHAR(1000) -); - --- NB 07.12.17 DROP TABLE IF EXISTS useragent; --- NB 07.12.17 CREATE TABLE IF NOT EXISTS useragent ( --- NB 07.12.17 id VARCHAR(32) PRIMARY KEY, --- NB 07.12.17 string VARCHAR(500), --- NB 07.12.17 description VARCHAR(2000), --- NB 07.12.17 type VARCHAR(20), --- NB 07.12.17 comment VARCHAR(100), --- NB 07.12.17 link1 VARCHAR(1000), --- NB 07.12.17 link2 VARCHAR(1000) --- NB 07.12.17 ); - -DROP TABLE IF EXISTS useragent; -CREATE TABLE IF NOT EXISTS useragent ( - string VARCHAR(500), - description VARCHAR(2000), - comment VARCHAR(100), - link VARCHAR(1000), - is_browser BOOLEAN, - is_link BOOLEAN, - is_download BOOLEAN, - is_proxy BOOLEAN, - is_robot BOOLEAN, - is_spam BOOLEAN -); - -CREATE INDEX useragent_string_idx ON `useragent` (string); -CREATE INDEX useragent_comment_idx ON `useragent` (comment); -CREATE INDEX useragent_is_browser_idx ON `useragent` (is_browser); -CREATE INDEX useragent_is_link_idx ON `useragent` (is_link); -CREATE INDEX useragent_is_download_idx ON `useragent` (is_download); -CREATE INDEX useragent_is_proxy_idx ON `useragent` (is_proxy); -CREATE INDEX useragent_is_robot_idx ON `useragent` (is_robot); -CREATE INDEX useragent_is_spam_idx ON `useragent` (is_spam); - -BEGIN TRANSACTION; -.separator \t -.import "useragent.csv" _useragent --- NB 07.12.17 .import "useragent.csv" useragent --- Type: --- B = Browser --- C = Link-, bookmark-, server- checking --- D = Downloading tool --- P = Proxy server, web filtering --- R = Robot, crawler, spider --- S = Spam or bad bot -INSERT INTO useragent SELECT string,description,comment,link1 - ,CASE WHEN type LIKE '%B%' THEN 1 ELSE 0 END - ,CASE WHEN type LIKE '%C%' THEN 1 ELSE 0 END - ,CASE WHEN type LIKE '%D%' THEN 1 ELSE 0 END - ,CASE WHEN type LIKE '%P%' THEN 1 ELSE 0 END - ,CASE WHEN type LIKE '%R%' THEN 1 ELSE 0 END - ,CASE WHEN type LIKE '%S%' THEN 1 ELSE 0 END -FROM _useragent; -COMMIT; diff --git a/www/dbq/html/default.min.css b/www/dbq/html/default.min.css index 7bf7755e..53841e87 100644 --- a/www/dbq/html/default.min.css +++ b/www/dbq/html/default.min.css @@ -1 +1 @@ -html{font:90% 'Trebuchet MS',sans-serif;background-color:#eee}body{display:table;margin-left:auto;margin-right:auto;padding-left:1em;padding-right:1em;color:#444}@keyframes spin{0%{transform:rotate(0)}100%{transform:rotate(360deg)}}.loader{border:16px solid #fff;border-radius:50%;border-top:16px solid #000;padding:0;margin:0 auto 0 auto;width:8em;height:8em;animation:spin 2s linear infinite;display:block}body.loader{margin-top:8em}.loader *{display:none!important}h1{margin:0 0 .2em 0;font-size:180%;padding-bottom:.3em;margin-bottom:.5em;border-bottom:dashed 1px #444}a{color:inherit}div>a,li a,p a,td a{color:#3572b0}a,a:visited{text-decoration:none}.button:hover,a:hover{opacity:.8}ul{padding:0;margin:0}li{list-style:none;padding:0 0 0 .3em}table{border-collapse:collapse}td,th{padding:.2em .7em}th a.sort{float:left;margin-right:.1em}input:not([type]),input[type=''],input[type=date],input[type=email],input[type=password],input[type=text],input[type=url],select,textarea{border-radius:3px;border:solid 1px #ddd;padding:.3em .4em;box-shadow:0 1px 1px #eee}input[size]{max-width:70%}div.row div label:after,form label:after{content:':'}form input,form label,form select{vertical-align:middle;margin:.2em .4em .2em 0}.rows{padding:0}.rows form{display:inline-block}.block,.menu,div.row,form.edit,iframe,pre,table.rows,ul.row{border-radius:4px;border-spacing:0;padding:.5em .2em;margin-bottom:.5em;border:solid 1px #ddd;background-color:#fafafa;box-shadow:0 1px 2px #eee}table.rows{border-style:hidden;border-collapse:collapse;box-shadow:0 0 0 1px #ddd;table-layout:fixed}table.rows tr:nth-child(even) td{background-color:#fefefe}div.row div,table.rows td,table.rows th,ul.row li{border-bottom:solid 1px #ddd}div.row div,table.rows tr:last-child td,ul.row li{border-bottom:none}table.rows td,table.rows th{border-right:dashed 1px #ddd}.rows .count{text-align:right}table.rows th{text-align:left}table.rows td{padding:.3em .3em}table.rows.fixed{width:100%}div.row div label,table.rows.fixed td,table.rows.fixed th{white-space:nowrap;text-overflow:ellipsis;overflow:hidden}table.rows.fixed th{white-space:normal}table.rows td.delete,table.rows td.view{width:1%;white-space:nowrap}table.rows.fixed th.view{width:2em}table.rows.fixed th.delete{width:2.7em}div.rows{clear:both}div.row{float:left;margin-right:4px;min-width:24%}.nofloat{float:none}div.row div{margin:0;padding:.1em .2em;border-bottom:solid 1px #fff}div.row div.view .button{margin-bottom:5px}div.row div.delete .button{margin-top:5px}div.row div:last-child{border-bottom:none;padding-bottom:0}div.row div.delete label,div.row div.view label{display:none}div.row div.delete,div.row div.view{text-align:center}div.row div label,ul.row li label{padding:.1em .5em .1em 0;min-width:20%;display:inline-block}.button{font:inherit;display:inline-block;text-decoration:none;line-height:1.6em;cursor:pointer;white-space:nowrap;box-sizing:border-box;margin:0 .1em 0 0;padding:0 .3em;border-radius:4px;border:none;color:#3572b0;background-color:#eee;background:linear-gradient(to bottom right,#eee,#ddd);box-shadow:0 1px 1px #bbb}.bottom,.center,.menu,.nav,.rows{clear:both;display:table}.bottom,.buttons,.center,.menu,.nav,.rows,td.button{margin-left:auto;margin-right:auto}div.buttons{text-align:center;margin-top:.5em}form.menu{padding:.5em;background-color:#fafafa;max-width:1024px}form.menu .button.add{float:right;margin-top:.2em}form.menu .criterias{border-top:dashed 1px #ddd;margin-top:.3em;padding-top:.3em;clear:both}form.menu .criterias span.label{border-right:solid 1px #fff;border-radius:3px;margin:0 .2em;white-space:nowrap;float:left}form.menu .criterias span.label:last-child{border-right:none}form.menu select:focus{max-width:auto}form.menu select{max-width:20%}form.menu .criterias input[type=text]{width:4em}div.row label,form.edit .fields label{width:25%;text-align:right;display:inline-block;margin-right:1em;vertical-align:top}div.row .label span,form.edit .fields .label span{width:54%;display:inline-block;text-align:left;vertical-align:middle;margin-top:.2em}form.edit .fields input[size],form.edit .fields select,form.edit .fields textarea{width:65%} +table,table.rows{border-collapse:collapse}.button,a,a:visited{text-decoration:none}html{font:90% 'Trebuchet MS',sans-serif;background-color:#EEE}body{display:table;margin-left:auto;margin-right:auto;padding-left:1em;padding-right:1em;color:#444}@keyframes spin{0%{transform:rotate(0)}100%{transform:rotate(360deg)}}.loader{border:16px solid #FFF;border-radius:50%;border-top:16px solid #000;padding:0;margin:0 auto;width:8em;height:8em;animation:spin 2s linear infinite;display:block}body.loader{margin-top:8em}.loader *{display:none!important}h1{margin:0 0 .5em;font-size:180%;padding-bottom:.3em;border-bottom:dashed 1px #444}a{color:inherit}.button,div>a,li a,p a,td a{color:#3572B0}.button:hover,a:hover{opacity:.8}ul{padding:0;margin:0}li{list-style:none;padding:0 0 0 .3em}td,th{padding:.2em .7em}th a.sort{float:left;margin-right:.1em}input:not([type]),input[type=text],input[type=password],input[type=date],input[type=email],input[type=url],input[type=''],select,textarea{border-radius:3px;border:1px solid #DDD;padding:.3em .4em;box-shadow:0 1px 1px #EEE}input[size]{max-width:70%}div.row div label:after,form label:after{content:':'}form input,form label,form select{vertical-align:middle;margin:.2em .4em .2em 0}.rows{padding:0}.rows form{display:inline-block}.block,.menu,div.row,form.edit,iframe,pre,table.rows,ul.row{border-radius:4px;border-spacing:0;padding:.5em .2em;margin-bottom:.5em;border:1px solid #DDD;background-color:#FAFAFA;box-shadow:0 1px 2px #EEE}table.rows{border-style:hidden;box-shadow:0 0 0 1px #DDD;table-layout:fixed}table.rows tr:nth-child(even) td{background-color:#FEFEFE}div.row div,table.rows td,table.rows th,ul.row li{border-bottom:solid 1px #DDD}div.row div,table.rows tr:last-child td,ul.row li{border-bottom:none}table.rows td,table.rows th{border-right:dashed 1px #DDD}.rows .count{text-align:right}table.rows th{text-align:left}div.buttons,div.row div.delete,div.row div.view{text-align:center}table.rows td{padding:.3em}table.rows.fixed{width:100%}div.row div label,table.rows.fixed td,table.rows.fixed th{white-space:nowrap;text-overflow:ellipsis;overflow:hidden}table.rows.fixed th{white-space:normal}table.rows td.delete,table.rows td.view{width:1%;white-space:nowrap}table.rows.fixed th.view{width:2em}table.rows.fixed th.delete{width:2.7em}div.rows{clear:both}div.row{float:left;margin-right:4px;min-width:24%}.nofloat{float:none}div.row div{margin:0;padding:.1em .2em;border-bottom:solid 1px #fff}div.row div.view .button{margin-bottom:5px}div.row div.delete .button{margin-top:5px}div.row div:last-child{border-bottom:none;padding-bottom:0}div.row div.delete label,div.row div.view label{display:none}div.row div label,ul.row li label{padding:.1em .5em .1em 0;min-width:20%;display:inline-block}.button{font:inherit;display:inline-block;line-height:1.6em;cursor:pointer;white-space:nowrap;box-sizing:border-box;margin:0 .1em 0 0;padding:0 .3em;border-radius:4px;border:none;background-color:#EEE;background:linear-gradient(to bottom right,#EEE,#DDD);box-shadow:0 1px 1px #BBB}.bottom,.center,.menu,.nav,.rows{clear:both;display:table}.bottom,.buttons,.center,.menu,.nav,.rows,td.button{margin-left:auto;margin-right:auto}div.buttons{margin-top:.5em}form.menu{padding:.5em;background-color:#FAFAFA;max-width:1024px}form.menu .button.add{float:right;margin-top:.2em}form.menu .criterias{border-top:dashed 1px #DDD;margin-top:.3em;padding-top:.3em;clear:both}form.menu .criterias span.label{border-right:solid 1px #fff;border-radius:3px;margin:0 .2em;white-space:nowrap;float:left}form.menu .criterias span.label:last-child{border-right:none}form.menu select:focus{max-width:auto}form.menu select{max-width:20%}form.menu .criterias input[type=text]{width:4em}div.row label,form.edit .fields label{width:25%;text-align:right;display:inline-block;margin-right:1em;vertical-align:top}div.row .label span,form.edit .fields .label span{width:54%;display:inline-block;text-align:left;vertical-align:middle;margin-top:.2em}form.edit .fields input[size],form.edit .fields select,form.edit .fields textarea{width:65%} -- 2.47.3