defmodule UserAgent.Data do
# Auto generated, do not edit
def all_agents() do
[
%{
comment: "",
description: "Sync2It bookmark management & clustering engine",
id: "id_a_f_3",
link1: "http://www.sync2it.com",
link2: "",
name: "!Susie (http://www.sync2it.com/susie)",
type: "C R"
},
%{
comment: "Site is dead",
description: "UnCHAOS search robot",
id: "id_a_f_6",
link1: "http://www.unchaos.com/",
link2: "",
name:
"<a href='http://www.unchaos.com/'> UnChaos </a> From Chaos To Order Hybrid Web Search Engine.(vadim_gonchar@unchaos.com)",
type: "R"
},
%{
comment: "Site is dead",
description: "UnCHAOS search robot",
id: "id_a_f_7",
link1: "http://www.unchaos.com/",
link2: "",
name:
"<a href='http://www.unchaos.com/'> UnChaos Bot Hybrid Web Search Engine. </a> (vadim_gonchar@unchaos.com)",
type: "R"
},
%{
comment: "Site is dead",
description: "UnCHAOS search robot",
id: "id_a_f_8",
link1: "http://www.unchaos.com/",
link2: "",
name:
"<b> UnChaosBot From Chaos To Order UnChaos Hybrid Web Search Engine at www.unchaos.com </b> (info@unchaos.com)",
type: "R"
},
%{
comment: "s.also SygolBot",
description: "Sygol Search (Italy) robot",
id: "id_a_f_9",
link1: "http://www.sygol.com/",
link2: "",
name: "<http://www.sygol.com/> http://www.sygol.com",
type: "R"
},
%{
comment: "Services is no more available",
description: "SearchEngineWorld's robots.txt validator",
id: "id_a_f_4",
link1: "http://www.searchengineworld.com/cgi-bin/robotcheck.cgi",
link2: "",
name: "( Robots.txt Validator http://www.searchengineworld.com/cgi-bin/robotcheck.cgi )",
type: "C"
},
%{
comment: "",
description: "DreamCast DreamPassport browser",
id: "id_a_f_171105_1",
link1: "http://www.dricas.com/dp/",
link2: "",
name: "(DreamPassport/3.0; isao/MyDiGiRabi)",
type: "B"
},
%{
comment: "s.also Privoxy/3.0 (Anonymous)",
description: "Privoxy web proxy",
id: "id_a_f_290606_1",
link1: "http://www.privoxy.org/",
link2: "",
name: "(Privoxy/1.0)",
type: "P"
},
%{
comment: "123.113.184.2xx",
description: "Unknown Yahoo robot",
id: "id_a_f_230507_1",
link1: "http://www.yahoo.com",
link2: "",
name: "*/Nutch-0.9-dev",
type: "R"
},
%{
comment: "",
description: "SitiDi.net search (Germany) robot",
id: "id_a_f_5",
link1: "http://www.sitidi.net/",
link2: "",
name: "+SitiDi.net/SitiDiBot/1.0 (+Have Good Day)",
type: "R"
},
%{
comment: "",
description: "Die Kraehe Meta-Search-Engine (Germany) link checking",
id: "id_a_f_1",
link1: "http://www.die-kraehe.de",
link2: "",
name: "-DIE-KRAEHE- META-SEARCH-ENGINE/1.1 http://www.die-kraehe.de",
type: "R"
},
%{
comment: "",
description: "123spider.de (Germany) web directory link checking",
id: "id_a_f_060206_1",
link1: "http://www.123spider.de/",
link2: "",
name: "123spider-Bot (Version: 1.02, powered by www.123spider.de",
type: "C"
},
%{
comment: "217.160.75.2xx",
description: "192.com - UK web directory",
id: "id_a_f_180806_1",
link1: "http://www.192.com/",
link2: "",
name: "192.comAgent",
type: "R"
},
%{
comment: "",
description: "1st ZipCommander Net - IE based browser",
id: "id_a_f_060606_1",
link1: "http://www.zipcommander.com/",
link2: "",
name: "1st ZipCommander (Net) - http://www.zipcommander.com/",
type: "B"
},
%{
comment: "",
description: "2Bone online link checker",
id: "id_a_f_10",
link1: "http://www.2bone.com/links/linkchecker.shtml",
link2: "",
name: "2Bone_LinkChecker/1.0 libwww-perl/5.64",
type: "C"
},
%{
comment: "",
description: "4Anything robot",
id: "id_a_f_11",
link1: "http://www.4anything.com",
link2: "",
name: "4anything.com LinkChecker v2.0",
type: "R"
},
%{
comment: "s. various honey pot sites",
description: "Unknown guestbook spamming or harvesting tool from diff. IPs",
id: "id_a_f_110207_1",
link1:
"http://www.projecthoneypot.org/bsh_X19tb2RlPWdsb2JhbCZfX2J5PWMmY3RyeT11cyZ1YWc9ODQ4NCtCb3N0b24rUHJvamVjdCt2KzEuMA..",
link2: "",
name: "8484 Boston Project v 1.0",
type: "S"
},
%{
comment: "",
description: "neofonie search robot Germany",
id: "id_a_f_2",
link1: "http://www.neofonie.de/loesungen/search/",
link2: "",
name:
":robot/1.0 (linux) ( admin e-mail: undefined http://www.neofonie.de/loesungen/search/robot.html )",
type: "R"
},
%{
comment: "",
description: "A-Online.at robot - now Jet2Web Search",
id: "id_a_f_12",
link1: "http://www.jet2web.net/portal",
link2: "",
name: "A-Online Search",
type: "R"
},
%{
comment: "",
description: "A1 Keyword Research - search engine and keyword optimization software",
id: "id_a_f_090707_1",
link1: "http://www.micro-sys.dk/products/keyword-research/",
link2: "",
name:
"A1 Keyword Research/1.0.2 (+http://www.micro-sys.dk/products/keyword-research/) miggibot/2007.03.27",
type: "C"
},
%{
comment: "",
description: "MiggiBot website crawler engine - A1 Sitemap Generator",
id: "id_a_f_100906_1",
link1: "http://www.micro-sys.dk/products/sitemap-generator/",
link2: "http://www.micro-sys.dk/developer/miggibot/",
name:
"A1 Sitemap Generator/1.0 (+http://www.micro-sys.dk/products/sitemap-generator/) miggibot/2006.01.24",
type: "R"
},
%{
comment: "192.9.71.7x",
description: "Aardvark web crawler for Sun's Blog recommendations",
id: "id_a_f_250408_2",
link1: "http://blogs.sun.com/plamere/",
link2: "",
name: "aardvark-crawler",
type: "R"
},
%{
comment: "",
description: "Abacho / Crawler.de robot",
id: "id_a_f_13",
link1: "http://www.abacho.com",
link2: "",
name: "AbachoBOT",
type: "R"
},
%{
comment: "",
description: "Abacho / Crawler.de robot",
id: "id_a_f_14",
link1: "http://www.abacho.com",
link2: "",
name: "AbachoBOT (Mozilla compatible)",
type: "R"
},
%{
comment: "",
description: "ABCdatos - Castilian program & tutorial directory",
id: "id_a_f_15",
link1: "http://www.abcdatos.com",
link2: "",
name: "ABCdatos BotLink/5.xx.xxx#BBL",
type: "R"
},
%{
comment: "",
description: "Aberja Hybridsuchmaschine (Germany) link checking",
id: "id_a_f_16",
link1: "http://www.aberja.de",
link2: "",
name: "Aberja Checkomat",
type: "R"
},
%{
comment:
"s. also - np/0.1_(np;_http://www.nameprotect.com... - aipbot/1.0 (aipbot; http://www.aipbot.com...",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_a_f_17",
link1: "http://www.nameprotect.com/",
link2: "",
name: "abot/0.1 (abot; http://www.abot.com; abot@abot.com)",
type: "R"
},
%{
comment: "",
description: "About robot",
id: "id_a_f_18",
link1: "http://www.about.com",
link2: "",
name: "About/0.1libwww-perl/5.47",
type: "R"
},
%{
comment: "125.100.242.2xx",
description: "Accela Technology RSS feed crawler",
id: "id_a_f_051206_3",
link1: "http://www.accelatech.com/",
link2: "",
name: "Accelatech RSSCrawler/0.4",
type: "R"
},
%{
comment: "65.17.255.xx",
description: "Accoona Search robot",
id: "id_a_f_19",
link1: "http://www.accoona.com",
link2: "",
name: "accoona",
type: "R"
},
%{
comment: "65.17.255.xx",
description: "Accoona Search robot",
id: "id_a_f_20",
link1: "http://www.accoona.com",
link2: "",
name: "Accoona-AI-Agent/1.1.1 (crawler at accoona dot com)",
type: "R"
},
%{
comment: "65.17.255.xx",
description: "Accoona Search robot",
id: "id_a_f_140906_3",
link1: "http://www.accoona.com",
link2: "",
name: "Accoona-AI-Agent/1.1.2 (aicrawler at accoonabot dot com)",
type: "R"
},
%{
comment: "",
description: "Ace Explorer - IE based browser",
id: "id_a_f_21",
link1: "http://www.aceexplorer.com",
link2: "",
name: "Ace Explorer",
type: "B"
},
%{
comment: "64.74.153.xx",
description: "Ackerm search robot",
id: "id_a_f_280806_1",
link1: "http://www.ackerm.com/",
link2: "",
name: "Ack (http://www.ackerm.com/)",
type: "R"
},
%{
comment: "",
description: "Acoi picture finder robot",
id: "id_a_f_22",
link1: "http://monetdb.cwi.nl/acoi/projects.html",
link2: "",
name: "AcoiRobot",
type: "R"
},
%{
comment: "80.237.153.10x",
description: "Acoon.de search (Germany) robot",
id: "id_a_f_23",
link1: "http://www.acoon.de",
link2: "",
name: "Acoon Robot v1.50.001",
type: "R"
},
%{
comment: "80.237.153.10x",
description: "Acoon.de search (Germany) robot",
id: "id_a_f_24",
link1: "http://www.acoon.de",
link2: "",
name: "Acoon Robot v1.52 (http://www.acoon.de)",
type: "R"
},
%{
comment: "80.237.209.xx",
description: "Acoon.de search (Germany) robot",
id: "id_a_f_100508_1",
link1: "http://www.acoon.de",
link2: "",
name: "Acoon-Robot 4.0.x.[xx] (http://www.acoon.de)",
type: "R"
},
%{
comment: "80.237.153.10x",
description: "Acoon.de search (Germany) robot",
id: "id_a_f_010108_1",
link1: "http://www.acoon.de",
link2: "",
name: "Acoon-Robot v3.xx (http://www.acoon.de and http://www.acoon.com)",
type: "R"
},
%{
comment: "124.157.145.1xx",
description: "Acorn Search Project",
id: "id_a_f_110507_1",
link1: "http://acorn.no-ip.org/",
link2: "",
name:
"Acorn/Nutch-0.9 (Non-Profit Search Engine; acorn.isara.org; acorn at isara dot org)",
type: "R"
},
%{
comment: "",
description: "LibMaster.com Active Bookmark HTML page creator",
id: "id_a_f_25",
link1: "http://www.libmaster.com/software.php",
link2: "",
name: "ActiveBookmark 1.x",
type: "C B"
},
%{
comment: "",
description: "Activeworlds 3D homepage browser",
id: "id_a_f_060806_2",
link1: "http://www.activeworlds.com",
link2: "",
name: "Activeworlds",
type: "B"
},
%{
comment: "",
description: "Activeworlds 3D homepage browser",
id: "id_a_f_26",
link1: "http://www.activeworlds.com",
link2: "",
name: "ActiveWorlds/3.xx (xxx)",
type: "B"
},
%{
comment: "",
description: "Ad Muncher - banner killer",
id: "id_a_f_27",
link1: "http://www.admuncher.com/",
link2: "",
name: "Ad Muncher v4.xx.x",
type: "P"
},
%{
comment: "",
description: "Ad Muncher - banner killer",
id: "id_a_f_28",
link1: "http://www.admuncher.com/",
link2: "",
name: "Ad Muncher v4x Build xxxxx",
type: "P"
},
%{
comment: "85.10.199.xx",
description: "website directory adaxas link checking",
id: "id_a_f_061006_1",
link1: "http://www.adaxas.net/",
link2: "",
name: "Adaxas Spider (http://www.adaxas.net/)",
type: "C"
},
%{
comment: "",
description: "Avant Browser - IE based browser",
id: "id_a_f_29",
link1: "http://www.avantbrowser.com",
link2: "",
name: "Advanced Browser (http://www.avantbrowser.com)",
type: "B"
},
%{
comment: "",
description: "Aesop robot",
id: "id_a_f_30",
link1: "http://www.aesop.com",
link2: "",
name: "AESOP_com_SpiderMan",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (agadine3.0)",
description: "Agada search (Germany) robot",
id: "id_a_f_31",
link1: "http://www.agada.de",
link2: "",
name: "agadine/1.x.x (+http://www.agada.de)",
type: "R"
},
%{
comment: "",
description: "SharewarePlaza link checking",
id: "id_a_f_32",
link1: "http://www.sharewareplaza.com",
link2: "",
name: "Agent-SharewarePlazaFileCheckBot/2.0+(+http://www.SharewarePlaza.com)",
type: "R"
},
%{
comment: "",
description: "Linkomatic submission verifier",
id: "id_a_f_33",
link1: "http://www.linkomatic.com/",
link2: "",
name: "AgentName/0.1 libwww-perl/5.48",
type: "R"
},
%{
comment: "",
description: "21seek.com (China) robot (218.17.90.xxx)",
id: "id_a_f_34",
link1: "http://www.21seek.com",
link2: "",
name: "AIBOT/2.1 By +(www.21seek.com A Real artificial intelligence search engine China)",
type: "R"
},
%{
comment: "72.44.35.2xx",
description: "AideRss - Postrank RSS and Blog filtering",
id: "id_a_f_130807_1",
link1: "http://www.aiderss.com/",
link2: "",
name: "AideRSS/1.0 (aiderss.com)",
type: "C"
},
%{
comment:
"s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_a_f_35",
link1: "http://www.nameprotect.com/",
link2: "",
name: "aipbot/1.0 (aipbot; http://www.aipbot.com; aipbot@aipbot.com)",
type: "R"
},
%{
comment:
"s. also - np/0.1_(np;_http://www.nameprotect.com... - abot/0.1 (abot; http://www.abot.com...",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_a_f_36",
link1: "http://www.nameprotect.com/",
link2: "",
name: "aipbot/2-beta (aipbot dev; http://aipbot.com; aipbot@aipbot.com)",
type: "R"
},
%{
comment: "",
description: "Akregator news feed reader for KDE",
id: "id_a_f_291108_1",
link1: "http://akregator.kde.org/",
link2: "",
name: "Akregator/1.2.9; librss/remnants",
type: "B"
},
%{
comment: "",
description: "Aladin robot",
id: "id_a_f_37",
link1: "http://www.aladin.de",
link2: "",
name: "Aladin/3.324",
type: "R"
},
%{
comment: "",
description: "Phone.com UP.Browser for mobiles on Alcatel cellphone",
id: "id_a_f_180408_1",
link1: "http://www.openwave.com",
link2: "",
name: "Alcatel-BG3/1.0 UP.Browser/5.0.3.1.2",
type: "B"
},
%{
comment: "",
description: "Aleksika Danmark - Search engine optimization spider",
id: "id_a_f_38",
link1: "http://www.aleksika.com",
link2: "",
name: "Aleksika Spider/1.0 (+http://www.aleksika.com/)",
type: "R"
},
%{
comment: "",
description: "Alertinfo - French version of Feedreader 3.xx ",
id: "id_a_f_291108_2",
link1: "http://www.feedreader.com/",
link2: "http://www.geste.fr/alertinfo/home.html",
name: "AlertInfo 2.0 (Powered by Newsbrain)",
type: "B"
},
%{
comment: "",
description: "Vestris robot",
id: "id_a_f_39",
link1: "http://alkaline.vestris.com/",
link2: "",
name: "AlkalineBOT/1.3",
type: "R"
},
%{
comment: "",
description: "Vestris robot",
id: "id_a_f_40",
link1: "http://alkaline.vestris.com/",
link2: "",
name: "AlkalineBOT/1.4 (1.4.0326.0 RTM)",
type: "R"
},
%{
comment: "",
description: "Allesklar.de robot",
id: "id_a_f_41",
link1: "http://www.allesklar.de",
link2: "",
name: "Allesklar/0.1 libwww-perl/5.46",
type: "R"
},
%{
comment: "",
description: "Alligator download manager",
id: "id_a_f_42",
link1: "http://www.nearsoftware.com",
link2: "",
name: "Alligator 1.31 (www.nearsoftware.com)",
type: "D"
},
%{
comment: "67.205.96.xxx/67.205.104.xx",
description: "Unknown robot from Allrati.com",
id: "id_a_f_011108_1",
link1: "http://www.allrati.com/",
link2: "",
name: "Allrati/1.1 (+)",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_a_f_43",
link1: "http://www.altavista.com",
link2: "",
name: "AltaVista Intranet V2.0 AVS EVAL search@freeit.com",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_a_f_44",
link1: "http://www.altavista.com",
link2: "",
name: "AltaVista Intranet V2.0 Compaq Altavista Eval sveand@altavista.net",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_a_f_45",
link1: "http://www.altavista.com",
link2: "",
name: "AltaVista Intranet V2.0 evreka.com crawler@evreka.com",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_a_f_46",
link1: "http://www.altavista.com",
link2: "",
name: "AltaVista V2.0B crawler@evreka.com",
type: "R"
},
%{
comment: "",
description: "Amaya - W3C's Editor/Browser",
id: "id_a_f_280209_1",
link1: "http://www.w3.org/Amaya/",
link2: "",
name: "amaya/x.xx libwww/x.x.x",
type: "B"
},
%{
comment: "64.111.217.9x",
description: "Amfibi Search robot",
id: "id_a_f_47",
link1: "http://www.amfibi.com/",
link2: "",
name: "AmfibiBOT",
type: "R"
},
%{
comment: "64.111.217.9x",
description: "Amfibi Search robot",
id: "id_a_f_48",
link1: "http://www.amfibi.com/",
link2: "",
name: "Amfibibot/0.06 (Amfibi Web Search; http://www.amfibi.com; agent@amfibi.com)",
type: "R"
},
%{
comment: "64.111.217.9x",
description: "Amfibi Search robot",
id: "id_a_f_141105_2",
link1: "http://www.amfibi.com/",
link2: "",
name: "Amfibibot/0.07 (Amfibi Robot; http://www.amfibi.com; agent@amfibi.com)",
type: "R"
},
%{
comment: "s. also libwww-perl/5.65",
description: "amibot - Amidalla search engine robot (62.241.33.xx)",
id: "id_a_f_49",
link1: "http://www.amidalla.com/",
link2: "",
name: "amibot",
type: "R"
},
%{
comment: "",
description: "AWeb Amiga browser",
id: "id_a_f_50",
link1: "http://www.amitrix.com/aweb.html",
link2: "",
name: "Amiga-AWeb/3.4.167SE",
type: "B"
},
%{
comment: "",
description: "Voyager - Amiga browser",
id: "id_a_f_51",
link1: "http://www.vapor.com/voyager/",
link2: "",
name: "AmigaVoyager/3.4.4 (MorphOS/PPC native)",
type: "B"
},
%{
comment: "",
description: "Amiga Miami TCP Stack",
id: "id_a_f_091205_1",
link1: "http://home.ptd.net/~strdustr/amirc/Netware.html",
link2: "",
name: "AmiTCP Miami (AmigaOS 2.04)",
type: ""
},
%{
comment: "",
description: "NF embedded browser on Amois Skypephone",
id: "id_a_f_210608_1",
link1: "http://3skypephone.com/",
link2: "",
name: "Amoi 8512/R21.0 NF-Browser/3.3",
type: "B"
},
%{
comment: "s. also aranhabot",
description: "Amazon.com robot for checking their affiliate sites",
id: "id_a_f_190206_3",
link1: "",
link2: "",
name: "amzn_assoc",
type: "C"
},
%{
comment: "",
description: "Annomille Italian historical oriented robot",
id: "id_a_f_52",
link1: "http://www.annomille.it",
link2: "",
name: "AnnoMille spider 0.1 alpha - http://www.annomille.it",
type: "R"
},
%{
comment: "",
description: "annotate Google - Firefox extension for annotating Google search results",
id: "id_a_f_53",
link1: "http://ponderer.org/annotate_google",
link2: "",
name: "annotate_google; http://ponderer.org/download/annotate_google.user.js",
type: "B"
},
%{
comment: "",
description: "Megaproxy user",
id: "id_a_f_54",
link1: "http://www.megaproxy.com",
link2: "",
name: "Anonymized by ProxyOS: http://www.megaproxy.com",
type: "P"
},
%{
comment: "",
description: "faked user agent",
id: "id_a_f_55",
link1: "",
link2: "",
name: "Anonymizer/1.1",
type: ""
},
%{
comment: "",
description: "AnswerBus natural language search using COLLATE technology",
id: "id_a_f_56",
link1: "http://www.answerbus.com",
link2: "http://collate.dfki.de/kurzdarstellung.html",
name: "AnswerBus (http://www.answerbus.com/)",
type: "R"
},
%{
comment: "",
description: "AnswerChase search tool",
id: "id_a_f_57",
link1: "http://www.answerchase.com",
link2: "",
name: "AnswerChase PROve x.0",
type: ""
},
%{
comment: "",
description: "AnswerChase search tool",
id: "id_a_f_58",
link1: "http://www.answerchase.com",
link2: "",
name: "AnswerChase x.0",
type: ""
},
%{
comment: "s. also Mozilla/x.xx (compatible; ANTFresco....)",
description: "ANT Fresco Browser",
id: "id_a_f_59",
link1: "http://www.antlimited.com/products/fresco.htm",
link2: "",
name: "ANTFresco/x.xx",
type: "B"
},
%{
comment: "",
description: "Antibot (discontinued) robot",
id: "id_a_f_60",
link1: "http://www.antidot.net",
link2: "",
name: "antibot-V1.1.5/i586-linux-2.2",
type: "R"
},
%{
comment: "",
description: "Anzwers (Yahoo) Australia robot",
id: "id_a_f_61",
link1: "http://au.anzwers.yahoo.com/",
link2: "",
name: "AnzwersCrawl/2.0 (anzwerscrawl@anzwers.com.au;Engine)",
type: "R"
},
%{
comment: "216.240.143.xx",
description: "Apexoo Search spider",
id: "id_a_f_030206_1",
link1: "http://www.apexoo.com/",
link2: "",
name: "Apexoo Spider 1.x",
type: "R"
},
%{
comment: "",
description: "JavaOS app. for SEGA Saturn Internet and Sanyo Internet-TV",
id: "id_a_f_62",
link1: "",
link2: "",
name: "Aplix HTTP/1.0.1",
type: "B"
},
%{
comment: "",
description: "JavaOS app. for Sanyo Internet-TV",
id: "id_a_f_63",
link1: "",
link2: "",
name: "Aplix_SANYO_browser/1.x (Japanese)",
type: "B"
},
%{
comment: "",
description: "JavaOS app. for SEGA Saturn Internet",
id: "id_a_f_64",
link1: "",
link2: "",
name: "Aplix_SEGASATURN_browser/1.x (Japanese)",
type: "B"
},
%{
comment: "",
description: "Aport robot",
id: "id_a_f_65",
link1: "http://www.aport.ru",
link2: "",
name: "Aport",
type: "R"
},
%{
comment: "",
description: "Walhello Internet Search robot",
id: "id_a_f_66",
link1: "http://www.walhello.com",
link2: "",
name: "appie 1.1 (www.walhello.com)",
type: "R"
},
%{
comment: "",
description: "CoreMedia player on Apple iPhone",
id: "id_a_f_140608_1",
link1: "http://www.apple.com/iphone/",
link2: "",
name: "Apple iPhone v1.1.4 CoreMedia v1.0.0.4A102",
type: "B"
},
%{
comment: "",
description:
"PubSub - Mac OS X utility for managing RSS/Atom subscriptions via the PubSub framework",
id: "id_a_f_070209_1",
link1:
"http://developer.apple.com/documentation/Darwin/Reference/ManPages/man1/pubsub.1.html",
link2: "",
name: "Apple-PubSub/65.1.1",
type: "B"
},
%{
comment: "209.85.31.2xx",
description: "Araby search - Arabia",
id: "id_a_f_120707_1",
link1: "http://www.araby.com/",
link2: "",
name:
"ArabyBot (compatible; Mozilla/5.0; GoogleBot; FAST Crawler 6.4; http://www.araby.com;)",
type: "R"
},
%{
comment: "s.also Covac TexAs Arachbot",
description: "Covac Arachnid Web Crawler",
id: "id_a_f_260608_1",
link1: "http://www.covac-software.com/",
link2: "",
name: "ArachBot",
type: "R"
},
%{
comment: "",
description: "Euroseek spider",
id: "id_a_f_67",
link1: "http://www.euroseek.com",
link2: "",
name: "Arachnoidea (arachnoidea@euroseek.com)",
type: "R"
},
%{
comment: "s. also amzn_assoc",
description: "Amazon.com robot for checking their affiliate sites",
id: "id_a_f_190206_2",
link1: "",
link2: "",
name: "aranhabot",
type: "C"
},
%{
comment: "",
description: "Excite spider",
id: "id_a_f_68",
link1: "http://www.excite.com",
link2: "",
name: "ArchitextSpider",
type: "R"
},
%{
comment: "s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...",
description: "Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)",
id: "id_a_f_69",
link1: "http://www.archive.org/",
link2: "",
name: "archive.org_bot",
type: "R"
},
%{
comment: "s. also Simpy",
description: "Simpy Bookmarklet crawler (69.55.233.xx)",
id: "id_a_f_70",
link1: "http://www.simpy.com/",
link2: "",
name: "Argus/1.1 (Nutch; http://www.simpy.com/bot.html; feedback at simpy dot com)",
type: "C"
},
%{
comment: "",
description: "Arikus inContext search engine software",
id: "id_a_f_031205_1",
link1: "http://www.arikus.com/inContext-enterprise.html",
link2: "",
name: "Arikus_Spider",
type: "R"
},
%{
comment: "193.136.192.xx",
description: "Tomba project: the Portuguese web archive",
id: "id_a_f_210208_1",
link1: "http://arquivo-web.fccn.pt/",
link2: "http://arquivo-web.fccn.pt/crawler?set_language=en",
name: "Arquivo-web-crawler (compatible; heritrix/1.12.1 +http://arquivo-web.fccn.pt)",
type: "R"
},
%{
comment: "62.68.194.2xx",
description: "Asaha search robot (Turkey)",
id: "id_a_f_251007_1",
link1: "http://www.asaha.com/",
link2: "",
name: "ASAHA Search Engine Turkey V.001 (http://www.asaha.com/)",
type: "R"
},
%{
comment: "",
description: "ASAHINA Antenna information detecting agent",
id: "id_a_f_71",
link1: "http://masshy.fastwave.gr.jp/hina/release/",
link2: "",
name: "Asahina-Antenna/1.x",
type: "R"
},
%{
comment: "",
description: "ASAHINA Antenna information detecting agent",
id: "id_a_f_72",
link1: "http://masshy.fastwave.gr.jp/hina/release/",
link2: "",
name: "Asahina-Antenna/1.x (libhina.pl/x.x ; libtime.pl/x.x)",
type: "R"
},
%{
comment: "",
description: "Ask 24x Info robot",
id: "id_a_f_73",
link1: "http://ask.24x.info/",
link2: "",
name: "ask.24x.info",
type: "R"
},
%{
comment: "",
description: "Ask About Oil - Petroleum related search (24.227.212.xxx) using Nutch",
id: "id_a_f_74",
link1: "http://askaboutoil.com/search.jsp",
link2: "http://www.nutch.org",
name:
"AskAboutOil/0.06-rcp (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@askaboutoil.com)",
type: "R"
},
%{
comment: "131.112.125.1xx",
description: "askEd! / Inferret search (Japan) robot using Nutch",
id: "id_a_f_120806_1",
link1: "http://asked.jp/",
link2: "",
name: "asked/Nutch-0.8 (web crawler; http://asked.jp; epicurus at gmail dot com)",
type: "R"
},
%{
comment: "",
description: "ASPSeek search engine software -Yahoo-Inc. / Telecom Canada robot ",
id: "id_a_f_75",
link1: "http://www.aspseek.org",
link2: "",
name: "ASPSeek/1.2.5",
type: "R"
},
%{
comment: "",
description: "Swsoft.net robot using Aspseek",
id: "id_a_f_76",
link1: "http://www.aspseek.com",
link2: "",
name: "ASPseek/1.2.9d",
type: "R"
},
%{
comment: "",
description: "ASPSeek search engine software",
id: "id_a_f_77",
link1: "http://www.aspseek.org",
link2: "",
name: "ASPSeek/1.2.x",
type: "R"
},
%{
comment: "",
description: "ASPSeek search engine software",
id: "id_a_f_78",
link1: "http://www.aspseek.org",
link2: "",
name: "ASPSeek/1.2.xa",
type: "R"
},
%{
comment: "",
description: "ASPSeek search engine software",
id: "id_a_f_79",
link1: "http://www.aspseek.org",
link2: "",
name: "ASPseek/1.2.xx",
type: "R"
},
%{
comment: "",
description: "ASPSeek search engine software",
id: "id_a_f_80",
link1: "http://www.aspseek.org",
link2: "",
name: "ASPSeek/1.2.xxpre",
type: "R"
},
%{
comment: "site is down",
description: "Associative Sort robot",
id: "id_a_f_81",
link1: "http://pcmath126.unice.fr/assort-robot.html",
link2: "",
name: "ASSORT/0.10",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler ...",
description: "Singingfish media spider (64.12.186.2xx) via AOL search",
id: "id_a_f_82",
link1: "http://search.singingfish.com/sfw/home.jsp",
link2: "",
name: "asterias/2.0",
type: "R"
},
%{
comment: "",
description: "Atlocal local business search robot",
id: "id_a_f_83",
link1: "http://www.atlocal.com/",
link2: "",
name: "AtlocalBot/1.1 +(http://www.atlocal.com/local-web-site-owner.html)",
type: "R"
},
%{
comment: "",
description: "Atomic Email Hunter email extracing and harvesting",
id: "id_a_f_041207_2",
link1: "",
link2: "",
name: "Atomic_Email_Hunter/4.0",
type: "S"
},
%{
comment: "",
description: "Atomz robot",
id: "id_a_f_84",
link1: "http://www.atomz.com",
link2: "",
name: "Atomz/1.0",
type: "R"
},
%{
comment: "",
description: "atSpider (ceased) email harvester / spambot",
id: "id_a_f_85",
link1: "",
link2: "",
name: "atSpider/1.0",
type: "S"
},
%{
comment: "85.88.35.xx",
description: "Attentio social media monitoring and analysing ",
id: "id_a_f_060707_1",
link1: "http://www.attentio.com/",
link2: "",
name:
"Attentio/Nutch-0.9-dev (Attentio's beta blog crawler; www.attentio.com; info@attentio.com)",
type: "R"
},
%{
comment: "",
description: "Samsung SPH-A660 phone with Sprint software",
id: "id_a_f_231105_2",
link1: "http://www1.sprintpcs.com/explore/showcase/Showcase.jsp?scTopic=pcsVision",
link2: "",
name: "AU-MIC/2.0 MMP/2.0",
type: "B"
},
%{
comment: "",
description: "Audiovox SMT5600 (AT&T) Smartphone mobile phone browser",
id: "id_a_f_240208_1",
link1: "http://www.audiovox.com/",
link2: "http://www.audiovox.com/manuals/owners/SMT%205600%20QSG%209-7%20FINAL.pdf",
name: "AUDIOVOX-SMT5600",
type: "B"
},
%{
comment: "",
description: "Augurnet Swiss (was www.augurnet.ch) search robot",
id: "id_a_f_86",
link1: "",
link2: "",
name: "augurfind",
type: "R"
},
%{
comment: "",
description: "Augurnet Swiss (was www.augurnet.ch) search robot",
id: "id_a_f_87",
link1: "",
link2: "",
name: "augurnfind V-1.x",
type: "R"
},
%{
comment: "was http://autoemailspider.com - site is dead",
description: "Auto Email Pro Email harvester",
id: "id_a_f_88",
link1: "",
link2: "",
name: "autoemailspider",
type: "S"
},
%{
comment: "s. Linkscan/x ?",
description: "Linkscan tool from Elsop",
id: "id_a_f_89",
link1: "http://www.elsop.com/linkscan/",
link2: "",
name: "autohttp",
type: "C"
},
%{
comment: "84.104.43.x",
description: "Autowebdir - The Automatically Generated Web Directory",
id: "id_a_f_050208_1",
link1: "http://www.autowebdir.com/",
link2: "",
name: "autowebdir 1.1 (www.autowebdir.com)",
type: "R"
},
%{
comment: "",
description: "Altavista robot ??",
id: "id_a_f_90",
link1: "http://www.altavista.com/",
link2: "",
name: "AV Fetch 1.0",
type: "R"
},
%{
comment: "",
description: "Avant Browser - IE based browser",
id: "id_a_f_91",
link1: "http://www.avantbrowser.com",
link2: "",
name: "Avant Browser (http://www.avantbrowser.com)",
type: "B"
},
%{
comment: "",
description: "National Research Council Canada robot",
id: "id_a_f_92",
link1: "http://www.nrc-cnrc.gc.ca/main_e.html",
link2: "",
name: "AVSearch-1.0(peter.turney@nrc.ca)",
type: "R"
},
%{
comment: "",
description: "Unknown robot from 205.203.108.xx (telerate.com)",
id: "id_a_f_93",
link1: "",
link2: "",
name: "AVSearch-2.0-fusionIdx-14-CompetitorWebSites",
type: ""
},
%{
comment: "",
description: "Altavista robot",
id: "id_a_f_94",
link1: "http://www.altavista.com/",
link2: "",
name: "AVSearch-3.0(AltaVista/AVC)",
type: "R"
},
%{
comment: "",
description: "AWeb Amiga browser",
id: "id_a_f_95",
link1: "http://aweb.sunsite.dk/",
link2: "",
name: "AWeb",
type: "B"
},
%{
comment: "",
description: "Axada search Germany robot",
id: "id_a_f_96",
link1: "http://www.axada.de",
link2: "",
name: "axadine/ (Axadine Crawler; http://www.axada.de/; )",
type: "R"
},
%{
comment: "",
description: "Axmo search robot",
id: "id_a_f_97",
link1: "http://www.axmo.com",
link2: "",
name: "AxmoRobot - Crawling your site for better indexing on www.axmo.com search engine.",
type: "R"
},
%{
comment: "",
description: "Azureus Java BitTorrent Client",
id: "id_a_f_250306_1",
link1: "http://azureus.sourceforge.net/",
link2: "",
name: "Azureus 2.x.x.x",
type: "D"
},
%{
comment: "84.255.237.2xx",
description: "Babaloo search robot (Slovenia)",
id: "id_a_f_131208_1",
link1: "http://www.babaloo.si/",
link2: "",
name: "BabalooSpider/1.3 (BabalooSpider; http://www.babaloo.si; spider@babaloo.si)",
type: "R"
},
%{
comment: "",
description: "BaBoom Web Portal (ODP) robot (66.98.254.xx)",
id: "id_a_f_98",
link1: "http://www.baboom.us",
link2: "",
name: "BaboomBot/1.x.x (+http://www.baboom.us)",
type: "R"
},
%{
comment: "",
description: "BackStreet Browser - Offline browser / website downloader",
id: "id_a_f_050406_1",
link1: "http://www.spadixbd.com/backstreet/",
link2: "",
name: "BackStreet Browser 3.x",
type: "D"
},
%{
comment: "119.63.193.94.[x]xx",
description: "Baidu search (Japan) image crawler",
id: "id_a_f_140508_1",
link1: "http://www.baidu.jp/",
link2: "",
name: "BaiduImagespider+(+http://www.baidu.jp/search/s308.html)",
type: "R"
},
%{
comment: "",
description: "Baidu spidering engine - used by diff. IPs",
id: "id_a_f_99",
link1: "http://www.baidu.com",
link2: "",
name: "BaiDuSpider",
type: "R"
},
%{
comment: "",
description: "Baidu spidering engine - used by diff. IPs",
id: "id_a_f_080608_1",
link1: "http://www.baidu.com",
link2: "",
name: "Baiduspider+(+http://help.baidu.jp/system/05.html)",
type: "R"
},
%{
comment: "",
description: "Baidu spidering engine - used by diff. IPs",
id: "id_a_f_100",
link1: "http://www.baidu.com",
link2: "",
name: "Baiduspider+(+http://www.baidu.com/search/spider.htm)",
type: "R"
},
%{
comment: "119.63.193.[x]xx",
description: "Baidu search (Japan) crawler",
id: "id_a_f_080407_1",
link1: "http://www.baidu.jp",
link2: "",
name: "Baiduspider+(+http://www.baidu.com/search/spider_jp.html)",
type: "R"
},
%{
comment: "",
description: "Balihoo - Vertical search engine crawler (beta)",
id: "id_a_f_031107_1",
link1: "http://www.balihoo.com/",
link2: "http://www.balihoo.com/pdfs/BalihooFactSheet.pdf",
name:
"Balihoo/Nutch-1.0-dev (Crawler for Balihoo.com search engine - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com)",
type: "R"
},
%{
comment: "s. also Mozilla/5.0 (compatible; BanBots/2.0b..",
description: "Project BanBots Perl script robot",
id: "id_a_f_101",
link1: "http://www.banbots.com/",
link2: "",
name: "BanBots/1.2 (spider@banbots.com)",
type: "C"
},
%{
comment: "",
description: "Barca Pro email & PIM software",
id: "id_a_f_140506_3",
link1:
"http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54",
link2: "",
name: "Barca/2.0.xxxx",
type: "B"
},
%{
comment: "",
description: "Barca Pro email & PIM software",
id: "id_a_f_120206_2",
link1:
"http://www.pocosystems.com/home/index.php?option=com_content&task=view&id=105&Itemid=54",
link2: "",
name: "BarcaPro/1.4.xxxx",
type: "B"
},
%{
comment: "64.246.56.xx",
description: "Barrahome crawler",
id: "id_a_f_102",
link1: "http://www.barrahome.org",
link2: "",
name: "BarraHomeCrawler (albertof@barrahome.org)",
type: "R"
},
%{
comment: "204.71.191.1xx",
description: "Unknown user agent from Microsoft",
id: "id_a_f_011006_1",
link1: "",
link2: "",
name: "bCentral Billing Post-Process",
type: ""
},
%{
comment: "208.144.233.xxx",
description: "Business.com robot",
id: "id_a_f_103",
link1: "http://www.business.com",
link2: "",
name: "bdcindexer_2.6.2 (research@bdc)",
type: "R"
},
%{
comment: "",
description: "Brandimensions Brand Protection robot",
id: "id_a_f_104",
link1: "http://www.brandimensions.com/",
link2: "",
name: "BDFetch",
type: "R"
},
%{
comment: "",
description: "Bdncentral Sitesearch robot",
id: "id_a_f_105",
link1: "http://www.bdncentral.com",
link2: "",
name:
"BDNcentral Crawler v2.3 [en] (http://www.bdncentral.com/robot.html) (X11; I; Linux 2.0.44 i686)",
type: "R"
},
%{
comment: "",
description: "beammachine web directory (Germany) link checking",
id: "id_a_f_111205_3",
link1: "http://www.beammachine.net/de/",
link2: "",
name: "BeamMachine/0.5 (dead link remover of www.beammachine.net)",
type: "R C"
},
%{
comment: "",
description: "Beauty robot for Cosmoty - German beauty and wellness search",
id: "id_a_f_106",
link1: "http://www.cosmoty.de",
link2: "http://www.uchoose.de/Projekte/Lifestyle/beauty/",
name: "beautybot/1.0 (+http://www.uchoose.de/crawler/beautybot/)",
type: "R"
},
%{
comment: "68.6.204.2xx",
description: "A Passion for Jazz music related search robot",
id: "id_a_f_230406_1",
link1: "http://www.apassion4jazz.net/",
link2: "",
name: "BebopBot/2.5.1 ( crawler http://www.apassion4jazz.net/bebopbot.html )",
type: "R"
},
%{
comment: "",
description: "LinkcheckerBeepware (site is down) web directory link checking",
id: "id_a_f_107",
link1: "http://directory.beebware.co.uk",
link2: "",
name: "BeebwareDirectory/v0.01",
type: "C"
},
%{
comment: "",
description: "Big Brother link checking tool",
id: "id_a_f_108",
link1: "http://pauillac.inria.fr",
link2: "",
name: "Big Brother (http://pauillac.inria.fr/~fpottier/)",
type: "C"
},
%{
comment: "216.89.111.x",
description: "GoonGee.com link popularity checking",
id: "id_a_f_130606_1",
link1: "http://www.goongee.com/big-fish/",
link2: "",
name: "Big Fish v1.0",
type: "C"
},
%{
comment: "",
description: "BB4 network monitoring",
id: "id_a_f_109",
link1: "http://www.bb4.com",
link2: "",
name: "BigBrother/1.6e",
type: "C"
},
%{
comment: "",
description: "BigClique Search robot",
id: "id_a_f_110",
link1: "http://www.bigclique.com",
link2: "",
name: "BigCliqueBOT/1.03-dev (bigclicbot; http://www.bigclique.com; bot@bigclique.com)",
type: "R"
},
%{
comment: "",
description: "Biglotron search (France) robot",
id: "id_a_f_080206_4",
link1: "http://www.biglotron.com/",
link2: "",
name: "BIGLOTRON (Beta 2;GNU/Linux)",
type: "R"
},
%{
comment: "72.0.207.1xx",
description: "Bigsearch.ca search robot",
id: "id_a_f_171106_2",
link1: "http://www.bigsearch.ca/",
link2: "",
name:
"Bigsearch.ca/Nutch-x.x-dev (Bigsearch.ca Internet Spider; http://www.bigsearch.ca/; info@enhancededge.com)",
type: "R"
},
%{
comment: "",
description: "Bilbo - web frontend for the Nessus Security Scanner",
id: "id_a_f_111",
link1:
"http://home.broadpark.no/%7Etnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html",
link2: "",
name: "Bilbo/2.3b-UNIX",
type: "C"
},
%{
comment: "212.156.230.2xx",
description: "Bilgi.com (Beta) search robot - Turkey",
id: "id_a_f_170806_1",
link1: "http://www.bilgi.com/",
link2: "",
name:
"BilgiBetaBot/0.8-dev (bilgi.com (Beta) ; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
type: "R"
},
%{
comment: "212.156.230.2xx",
description: "Bilgi.com (Beta) search robot - Turkey",
id: "id_a_f_080607_1",
link1: "http://www.bilgi.com/",
link2: "",
name: "BilgiBot/1.0(beta) (http://www.bilgi.com/; bilgi at bilgi dot com)",
type: "R"
},
%{
comment: "",
description: "Carnegie Mellon School robot/link checking ?",
id: "id_a_f_112",
link1: "http://www.cs.cmu.edu",
link2: "",
name: "billbot wjj@cs.cmu.edu",
type: "C"
},
%{
comment: "",
description: "Bitacle Blog Search Archive robot",
id: "id_a_f_050206_3",
link1: "http://bitacle.org/",
link2: "",
name: "Bitacle bot/1.1",
type: "R"
},
%{
comment: "",
description: "Bitacle Blog Search Archive robot",
id: "id_a_f_050206_2",
link1: "http://bitacle.org/",
link2: "",
name: "Bitacle Robot (V:1.0;) (http://www.bitacle.com)",
type: "R"
},
%{
comment: "",
description: "Biyubi Navigator - Mexican browser for Fenix OS",
id: "id_a_f_113",
link1: "http://www.biyubi.com",
link2: "",
name: "Biyubi/x.x (Sistema Fenix; G11; Familia Toledo; es-mx)",
type: "B"
},
%{
comment: "",
description: "Blackberry Wireless Internet browser via Google WAP Proxy",
id: "id_a_f_114",
link1: "http://www.blackberry.com/products/service/web.shtml",
link2: "http://www.openwave.com",
name:
"BlackBerry7520/4.0.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/5.0.3.3 UP.Link/5.1.2.12 (Google WAP Proxy/1.0)",
type: "B P"
},
%{
comment: "",
description: "FS Consulting (was www.fsconsult.net) Black Widow web crawler",
id: "id_a_f_115",
link1: "",
link2: "",
name: "BlackWidow",
type: "R"
},
%{
comment: "",
description: "BlackWidow web site scanner / downloading tool",
id: "id_a_f_010306_1",
link1: "http://www.softbytelabs.com/BlackWidow",
link2: "",
name: "BlackWidow",
type: "D"
},
%{
comment: "203.87.123.1xx",
description: "Blaiz Enterprises RawGrunt search",
id: "id_a_f_116",
link1: "http://www.rawgrunt.com/",
link2: "http://www.blaiz.net",
name: "Blaiz-Bee/1.0 (+http://www.blaiz.net)",
type: "R"
},
%{
comment: "203.87.123.1xx",
description: "Blaiz Enterprises RawGrunt search",
id: "id_a_f_160307_1",
link1: "http://www.rawgrunt.com/",
link2: "http://www.blaiz.net",
name: "Blaiz-Bee/2.00.8222 (BE Internet Search Engine http://www.rawgrunt.com)",
type: "R"
},
%{
comment: "203.87.123.1xx",
description: "Blaiz Enterprises RawGrunt search",
id: "id_a_f_240706_1",
link1: "http://www.rawgrunt.com/",
link2: "http://www.blaiz.net",
name: "Blaiz-Bee/2.00.xxxx (+http://www.blaiz.net)",
type: "R"
},
%{
comment: "",
description: "Blitzsuche Germany robot",
id: "id_a_f_117",
link1: "http://blitzsuche.rp-online.de/",
link2: "",
name: "BlitzBOT@tricus.net",
type: "R"
},
%{
comment: "",
description: "Blitzsuche Germany robot",
id: "id_a_f_118",
link1: "http://blitzsuche.rp-online.de/",
link2: "",
name: "BlitzBOT@tricus.net (Mozilla compatible)",
type: "R"
},
%{
comment: "",
description: "BlockNote web page editor",
id: "id_a_f_090307_1",
link1: "http://blocknote.net/",
link2: "",
name: "BlockNote.Net",
type: "B"
},
%{
comment: "",
description: "blogdex robot from MIT.edu",
id: "id_a_f_119",
link1: "http://blogdex.media.mit.edu/",
link2: "",
name: "BlogBot/1.x",
type: "R"
},
%{
comment: "",
description: "BlogBridge RSS reader",
id: "id_a_f_071206_1",
link1: "http://www.blogbridge.com/",
link2: "",
name: "BlogBridge 2.13 (http://www.blogbridge.com/)",
type: "B"
},
%{
comment: "65.214.44.xx",
description: "Bloglines article search",
id: "id_a_f_120",
link1: "http://www.bloglines.com",
link2: "",
name: "Bloglines Title Fetch/1.0 (http://www.bloglines.com)",
type: "R"
},
%{
comment: "65.214.44.xx",
description: "Bloglines graphics crawler",
id: "id_a_f_250907_1",
link1: "http://www.bloglines.com",
link2: "",
name: "Bloglines-Images/0.1 (http://www.bloglines.com)",
type: "R"
},
%{
comment: "65.214.44.xx",
description: "Bloglines news crawler",
id: "id_a_f_011108_2",
link1: "http://www.bloglines.com",
link2: "",
name: "Bloglines/3.1 (http://www.bloglines.com)",
type: "R"
},
%{
comment: "",
description: "FeedMap / BlogMap geo coding service",
id: "id_a_f_071206_2",
link1: "http://www.feedmap.net/BlogMap/",
link2: "",
name: "BlogMap (http://www.feedmap.net)",
type: "C"
},
%{
comment: "64.158.138.xx",
description: "Intelliseek's BlogPulse blog search",
id: "id_a_f_121",
link1: "http://www.blogpulse.com",
link2: "",
name: "Blogpulse (info@blogpulse.com)",
type: "R"
},
%{
comment: "64.158.138.xx",
description: "Intelliseek's BlogPulse blog search",
id: "id_a_f_050208_2",
link1: "http://www.blogpulse.com",
link2: "",
name: "BlogPulseLive (support@blogpulse.com)",
type: "R"
},
%{
comment: "s. also BlogzIce ...",
description: "IceRocket Web search robot",
id: "id_a_f_161206_2",
link1: "http://www.icerocket.com",
link2: "",
name: "BlogSearch/1.x +http://www.icerocket.com/",
type: "R"
},
%{
comment: "88.198.44.2xx",
description: "Art of Computing blog search project",
id: "id_a_f_020707_1",
link1: "http://artofcomputing.net/blog/?p=4",
link2: "",
name: "blogsearchbot-pumpkin-3",
type: "R"
},
%{
comment: "",
description: "BlogsNow realtime link tracker robot",
id: "id_a_f_241205_1",
link1: "http://www.blogsnow.com/",
link2: "",
name: "BlogsNowBot, V 2.01 (+http://www.blogsnow.com/)",
type: "R"
},
%{
comment: "212.61.21.xx",
description: "BlogVipe news and Blog crawler (Netherlands)",
id: "id_a_f_261107_1",
link1: "http://www.blogvibe.nl",
link2: "",
name: "BlogVibeBot-v1.1 (spider@blogvibe.nl)",
type: "R"
},
%{
comment: "",
description: "blogWatcher robot from Okumura Group Tokyo (131.112.182.xxx)",
id: "id_a_f_122",
link1: "http://www.lr.pi.titech.ac.jp",
link2: "",
name: "blogWatcher_Spider/0.1 (http://www.lr.pi.titech.ac.jp/blogWatcher/)",
type: "R"
},
%{
comment: "s. also BlogSearch ...",
description: "IceRocket Web search robot",
id: "id_a_f_123",
link1: "http://www.icerocket.com",
link2: "",
name: "BlogzIce/1.0 (+http://icerocket.com; rhodes@icerocket.com)",
type: "R"
},
%{
comment: "s. also BlogSearch ...",
description: "IceRocket Web search robot",
id: "id_a_f_124",
link1: "http://www.icerocket.com",
link2: "",
name: "BlogzIce/1.0 +http://www.icerocket.com/",
type: "R"
},
%{
comment: "206.166.206.18x",
description: "Blooby search (beta) robot",
id: "id_a_f_310108_1",
link1: "http://www.blooby.com/",
link2: "",
name: "BloobyBot",
type: "R"
},
%{
comment: "204.228.230.xx",
description: "Balihoo - Search Engine for Advertising Media",
id: "id_a_f_270507_1",
link1: "http://balihoo.com/",
link2: "",
name:
"Bloodhound/Nutch-0.9 (Testing Crawler for Research - obeys robots.txt and robots meta tags ; http://balihoo.com/index.aspx; robot at balihoo dot com)",
type: "R"
},
%{
comment: "",
description: "Bluefish HTML-editor for Linux",
id: "id_a_f_125",
link1: "http://bluefish.openoffice.nl/",
link2: "",
name: "bluefish 0.6 HTML editor",
type: "B"
},
%{
comment: "seems to be a Trojan - see link",
description: "Part of ButtMan remote access tool",
id: "id_a_f_126",
link1: "http://www.glocksoft.com/trojan_list/ButtMan.htm",
link2: "",
name: "BMCLIENT",
type: ""
},
%{
comment: "Website is dead - was:",
description: "Bookmark Express bookmark manager",
id: "id_a_f_120506_1",
link1: "http://www.bookmarkexpress.com/",
link2: "",
name: "BMLAUNCHER",
type: "C"
},
%{
comment: "",
description: "Bobby web accessibility desktop testing tool",
id: "id_a_f_127",
link1: "http://bobby.watchfire.com/bobby/html/en/index.jsp",
link2: "",
name: "Bobby/4.0.x RPT-HTTPClient/0.3-3E",
type: "C"
},
%{
comment: "",
description: "Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx",
id: "id_a_f_128",
link1: "http://www.boitho.com",
link2: "",
name: "boitho.com-dc/0.xx (http://www.boitho.com/dcbot.html)",
type: "R"
},
%{
comment: "",
description: "Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx",
id: "id_a_f_129",
link1: "http://www.boitho.com",
link2: "",
name: "boitho.com-robot/1.x",
type: "R"
},
%{
comment: "",
description: "Boitho search (Norway) robot via 80.202.212.xx / 80.80.111.xx",
id: "id_a_f_130",
link1: "http://www.boitho.com",
link2: "",
name: "boitho.com-robot/1.x (http://www.boitho.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Bookdog - Mac bookmark manager",
id: "id_a_f_060806_1",
link1: "http://www.sheepsystems.com/bookdog/",
link2: "",
name: "Bookdog/x.x",
type: "C"
},
%{
comment: "",
description: "Bookmark Buddy - favorite bookmark manager ",
id: "id_a_f_131",
link1: "http://www.bookmarkbuddy.net",
link2: "",
name: "Bookmark Buddy bookmark checker (http://www.bookmarkbuddy.net/)",
type: "C"
},
%{
comment: "",
description: "Favourites managing program",
id: "id_a_f_132",
link1: "http://www.bookmark.ne.jp",
link2: "",
name: "Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/]",
type: "C"
},
%{
comment: "",
description: "Favourites managing program",
id: "id_a_f_230807_1",
link1: "http://www.bookmark.ne.jp",
link2: "",
name: "Bookmark Renewal Check Agent [http://www.bookmark.ne.jp/] (Version 2.0beta)",
type: "C"
},
%{
comment: "",
description: "Bookmark Base bookmark manager",
id: "id_a_f_300408_1",
link1: "http://www.bookmarkbase.com/",
link2: "",
name: "BookmarkBase(2/;http://bookmarkbase.com)",
type: "C"
},
%{
comment: "",
description: "cybercity.fr user robot / faked user agent ?",
id: "id_a_f_133",
link1: "",
link2: "",
name: "Bot mailto:craftbot@yahoo.com",
type: ""
},
%{
comment: "72.14.164.1xx",
description: "BD-Brandprotect copyright infringement crawler",
id: "id_a_f_160308_1",
link1: "http://www.bdbrandprotect.com/",
link2: "http://www.bdbrandprotect.com/solutions_5.html",
name: "BPImageWalker/2.0 (www.bdbrandprotect.com)",
type: "R"
},
%{
comment: " s. also BStop",
description: "BravoBrian bSTOP parental control",
id: "id_a_f_134",
link1: "http://bstop.bravobrian.it/",
link2: "",
name: "BravoBrian bstop.bravobrian.it",
type: "P R"
},
%{
comment: " s. also BStop",
description: "Robot for BravoBrian bSTOP",
id: "id_a_f_135",
link1: "http://bstop.bravobrian.it/",
link2: "",
name: "BravoBrian SpiderEngine MarcoPolo",
type: "R"
},
%{
comment: "",
description: "BrightCloud web filtering for classifying websites",
id: "id_a_f_220508_1",
link1: "http://www.brightcloud.com/brightcrawler.asp",
link2: "",
name: "BrightCrawler (http://www.brightcloud.com/brightcrawler.asp)",
type: "P R"
},
%{
comment: "",
description: "Webarchive Project Bruinbot crawler",
id: "id_a_f_136",
link1: "http://webarchive.cs.ucla.edu",
link2: "",
name: "BruinBot (+http://webarchive.cs.ucla.edu/bruinbot.html) ",
type: "R"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos NBCi) robot",
id: "id_a_f_137",
link1: "http://www.inktomi.com/",
link2: "",
name: "BSDSeek/1.0",
type: "R"
},
%{
comment: "s. also BravoBrian ..",
description: "BravoBrian bSTOP parental control",
id: "id_a_f_138",
link1: "http://bstop.bravobrian.it/",
link2: "",
name: "BStop.BravoBrian.it Agent Detector",
type: "P R"
},
%{
comment: "",
description: "BitTorrent Search Engine btbot robot",
id: "id_a_f_139",
link1: "http://www.btbot.com",
link2: "",
name: "BTbot/0.x (+http://www.btbot.com/btbot.html)",
type: "R"
},
%{
comment: "",
description: "µTorrent BitTorrent Client",
id: "id_a_f_300408_2",
link1: "http://www.utorrent.com/",
link2: "",
name: "BTWebClient/180B(9704)",
type: "D"
},
%{
comment: "194.24.253.xx",
description: "BuildCMS crawler - market monitoring project of BuildCMS",
id: "id_a_f_080407_2",
link1: "http://www.buildcms.com/index.php",
link2: "http://www.buildcms.com/about_us/crawler",
name: "BuildCMS crawler (http://www.buildcms.com/crawler)",
type: "R"
},
%{
comment: "202.181.96.2xx",
description: "Bulkfeeds: RSS directory link checking",
id: "id_a_f_051206_4",
link1: "http://bulkfeeds.net/",
link2: "",
name: "Bulkfeeds/r1752 (http://bulkfeeds.net/)",
type: "C"
},
%{
comment: "",
description: "BullsEye/Intelliseek robot",
id: "id_a_f_140",
link1: "http://www.intelliseek.com/be/bullseye.htm",
link2: "",
name: "BullsEye",
type: "R"
},
%{
comment: "",
description: "Relevare Portal software robot",
id: "id_a_f_141",
link1: "http://www.relevare.com",
link2: "",
name: "bumblebee@relevare.com",
type: "R"
},
%{
comment: "",
description: "Microsoft server information robot (see link)",
id: "id_a_f_142",
link1: "http://www.webmasterworld.com/forum11/841.htm",
link2: "",
name: "BunnySlippers",
type: "C"
},
%{
comment: "",
description: "BurstFind search crawler (64.34.172.xx)",
id: "id_a_f_070606_1",
link1: "http://www.burstfind.com/",
link2: "",
name:
"BurstFindCrawler/1.1 (crawler.burstfind.com; http://crawler.burstfind.com; crawler@burstfind.com)",
type: "R"
},
%{
comment: "",
description: "Buscaplus (Spain) robot",
id: "id_a_f_143",
link1: "http://www.buscaplus.com",
link2: "",
name: "Buscaplus Robi/1.0 (http://www.buscaplus.com/robi/)",
type: "R"
},
%{
comment: "",
description: "Logitech Desktop Managers (LDM) Backweb (BW) update check",
id: "id_a_f_050807_2",
link1: "http://www.logitech.com/index.cfm/494/3041&cl=de,de",
link2: "",
name: "BW-C-2.0",
type: "D"
},
%{
comment: "",
description: "Basic Web Hacking 3 fake user-agent from Hellbound Hackers challenges",
id: "id_a_f_140508_2",
link1: "http://www.hellboundhackers.org/forum/_basic_web_hacking_3-7-6960_0.html",
link2: "http://vuau.wordpress.com/2008/03/12/hbh-basic-web-3-switch-user-agent/",
name: "bwh3_user_agent",
type: "S"
},
%{
comment: "64.111.217.9x",
description: "Amfibi Search robot",
id: "id_a_f_140508_3",
link1: "http://www.amfibi.com/",
link2: "",
name:
"Cabot/Nutch-0.9 (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)",
type: "R"
},
%{
comment: "64.111.217.9x",
description: "Amfibi Search robot",
id: "id_a_f_280508_1",
link1: "http://www.amfibi.com/",
link2: "",
name:
"Cabot/Nutch-1.0-dev (Amfibi's web-crawling robot; http://www.amfibi.com/cabot/; agent@amfibi.com)",
type: "R"
},
%{
comment: "",
description: "Evolution integrated mail solution Camel TCP stream class",
id: "id_a_f_140506_4",
link1: "http://www.gnome.org/projects/evolution/",
link2: "http://go-evolution.org/Camel.Stream",
name: "CamelHttpStream/1.0",
type: ""
},
%{
comment: "",
description: "Some user agent",
id: "id_a_f_144",
link1: "",
link2: "",
name: "Cancer Information and Support International;",
type: ""
},
%{
comment: "s. also - voyager/1.x - cfetch/1.",
description: "Cosmix project crawler (204.14.48.x / 38.113.234.xxx)",
id: "id_a_f_110206_1",
link1: "http://www.cosmixcorp.com/",
link2: "",
name: "carleson/1.0",
type: "R"
},
%{
comment: "",
description: "Carnegie Mellon University WebBOT",
id: "id_a_f_145",
link1: "http://www.andrew.cmu.edu",
link2: "",
name:
"Carnegie_Mellon_University_Research_WebBOT-->PLEASE READ-->http://www.andrew.cmu.edu/~brgordon/webbot/index.html http://www.andrew.cmu.edu/~brgordon/webbot/index.html",
type: "R"
},
%{
comment: "",
description: "Carnegie Mellon University WebBOT",
id: "id_a_f_146",
link1: "http://www.andrew.cmu.edu",
link2: "",
name:
"Carnegie_Mellon_University_WebCrawler http://www.andrew.cmu.edu/~brgordon/webbot/index.html",
type: "R"
},
%{
comment: "",
description: "Catall.de search & web directory (Germany)",
id: "id_a_f_170206_1",
link1: "http://www.catall.de/",
link2: "",
name: "Catall Spider",
type: "R"
},
%{
comment: "72.36.94.1xx",
description: "UIUCs Cazoodle search based on MetaQuerier",
id: "id_a_f_130807_3",
link1: "http://www.cazoodle.com/",
link2: "http://metaquerier.cs.uiuc.edu/",
name:
"CazoodleBot/CazoodleBot-0.1 (CazoodleBot Crawler; http://www.cazoodle.com/cazoodlebot; cazoodlebot@cazoodle.com)",
type: "R"
},
%{
comment: "38.103.63.1[6-8]",
description: "CommonCrawl Foundation search crawler",
id: "id_a_f_290308_1",
link1: "http://www.commoncrawl.org/faq.htm",
link2: "",
name: "CCBot/1.0 (+http://www.commoncrawl.org/bot.html)",
type: "R"
},
%{
comment: "",
description: "Empyreum Ccubee (Czech) search engine solution",
id: "id_a_f_147",
link1: "http://empyreum.com/technologies/ccubee",
link2: "",
name: "ccubee/x.x",
type: "R"
},
%{
comment: "61.142.xx.x[xx]",
description: "Timewe mobile browser (WAP) simulator (Japan)",
id: "id_a_f_010108_2",
link1: "http://timewe.net/",
link2: "",
name:
"CDR/1.7.1 Simulator/0.7(+http://timewe.net) Profile/MIDP-1.0 Configuration/CLDC-1.0",
type: "B"
},
%{
comment: "",
description: "Cisco Content Engine",
id: "id_a_f_291105_6",
link1: "http://www.cisco.com/en/US/products/hw/contnetw/index.html",
link2: "",
name: "CE-Preload",
type: "P"
},
%{
comment: "87.72.214.9x",
description: "Nordic semantic search engine",
id: "id_a_f_100408_4",
link1: "http://www.centiverse-project.net/post/Educating-the-bots.aspx",
link2: "",
name: "CentiverseBot",
type: "C"
},
%{
comment: "87.72.214.9x",
description: "Nordic semantic search engine",
id: "id_a_f_180408_2",
link1: "http://www.centiverse-project.net/post/Educating-the-bots.aspx",
link2: "",
name: "CentiverseBot - investigator",
type: "C"
},
%{
comment: "87.72.214.9x",
description: "Nordic semantic search engine",
id: "id_a_f_180408_3",
link1: "http://www.centiverse-project.net/post/Educating-the-bots.aspx",
link2: "",
name: "CentiverseBot/3.0 (http://www.centiverse-project.net)",
type: "C"
},
%{
comment: "",
description: "Floortransformed.com robot (link ckecking ??)",
id: "id_a_f_148",
link1: "http://www.floorstransformed.com",
link2: "",
name: "Ceramic Tile Installation Guide (http://www.floorstransformed.com)",
type: "R"
},
%{
comment: "",
description: "CERN Line Mode Browser",
id: "id_a_f_131208_2",
link1: "http://www.w3.org/LineMode/",
link2: "",
name: "CERN-LineMode/2.15",
type: "B"
},
%{
comment: "s. also - voyager/1.x - carleson/1.x",
description: "Cosmix project crawler (204.14.48.x / 38.113.234.xxx)",
id: "id_a_f_149",
link1: "http://www.cosmixcorp.com",
link2: "",
name: "cfetch/1.0",
type: "R"
},
%{
comment: "",
description: "MaxOS X CoreFoundation CFNetwork API",
id: "id_a_f_150",
link1: "http://www.cocoadev.com/index.pl?CFNetwork",
link2: "",
name: "CFNetwork/x.x",
type: ""
},
%{
comment: "",
description: "cg-eye CGI checker",
id: "id_a_f_151",
link1: "http://www.htmlhelp.com",
link2: "",
name: "cg-eye interactive",
type: "C"
},
%{
comment: "",
description: "Charon Amiga download manager",
id: "id_a_f_152",
link1: "http://tesla.rcub.bg.ac.yu/%7Eantony/Charon/",
link2: "",
name: "Charon/1.x (Amiga)",
type: "D"
},
%{
comment: "69.80.208.2xx",
description: "Chat Catcher blog monitoring robot",
id: "id_a_f_131208_3",
link1: "http://chatcatcher.com/cc/",
link2: "",
name: "Chat Catcher/1.0",
type: "C"
},
%{
comment: "",
description: "Checkbot link validation",
id: "id_a_f_153",
link1: "http://degraaff.org/checkbot/",
link2: "",
name: "Checkbot/1.xx LWP/5.xx",
type: "C"
},
%{
comment: "",
description: "Checklinks - Perl link checker",
id: "id_a_f_154",
link1: "http://www.jmarshall.com",
link2: "",
name: "CheckLinks/1.x.x",
type: "C"
},
%{
comment: "",
description: "NTL user agent",
id: "id_a_f_155",
link1: "http://www.ntl.com",
link2: "",
name: "CheckUrl",
type: ""
},
%{
comment: "",
description: "CheckWeb link validation",
id: "id_a_f_156",
link1: "http://p.duby.free.fr/chkweb.htm",
link2: "",
name: "CheckWeb",
type: "C"
},
%{
comment: "",
description: "Chilkat HTTP component user-agent",
id: "id_a_f_030206_2",
link1: "http://www.chilkatsoft.com/HttpDotNet.asp",
link2: "",
name: "Chilkat/1.0.0 (+http://www.chilkatsoft.com/ChilkatHttpUA.asp)",
type: ""
},
%{
comment: "see link:",
description: "Unknown spam bot from telekom.com.my (218.111.83.xxx)",
id: "id_a_f_230506_1",
link1: "http://linuxreviews.org/webdesign/602_Apache_Webalizer/",
link2: "",
name: "China Local Browse 2.6",
type: "S"
},
%{
comment: "67.15.219.[x]x",
description: "Chitika Inc. Blog advertising",
id: "id_a_f_170408_2",
link1: "http://chitika.com/",
link2: "",
name: "Chitika ContentHit 1.0",
type: "C"
},
%{
comment: "- s. also Mozilla/4.0 (compatible; ChristCrawler..)",
description: "Christcentral.com Christcrawler (was www.christcrawler.com)",
id: "id_a_f_157",
link1: "",
link2: "",
name: "ChristCRAWLER 2.0",
type: "R"
},
%{
comment: "",
description: "CHttpClient - C++ class using WinInet",
id: "id_a_f_010607_2",
link1: "http://www.codeproject.com/library/lyoulhttpclient.asp",
link2: "",
name: "CHttpClient by Open Text Corporation",
type: ""
},
%{
comment: "",
description: "CipinetBot -Cipinet Search Engine Web Crawler",
id: "id_a_f_158",
link1: "http://www.cipinet.com",
link2: "",
name: "CipinetBot (http://www.cipinet.com/bot.html)",
type: "R"
},
%{
comment: "88.198.212.5x",
description: "Cityreview regional search (Germany) link checking",
id: "id_a_f_130108_1",
link1: "http://www.cityreview.de/",
link2: "http://www.cityreview.org/crawler/",
name: "Cityreview Robot (+http://www.cityreview.org/crawler/)",
type: "C"
},
%{
comment: "",
description: "Commision Junction link checking spider",
id: "id_a_f_159",
link1: "http://www.cj.com/",
link2: "",
name: "CJ Spider/",
type: "C"
},
%{
comment: "",
description: "CJB Net anonymous socks proxy service (216.194.70.x)",
id: "id_a_f_050606_1",
link1: "http://proxy.cjb.net/",
link2: "",
name: "CJB.NET Proxy",
type: "P"
},
%{
comment: "s. also Diamond",
description: "Claria (ex Gator) SearchScout robot (64.152.73.xx)",
id: "id_a_f_160",
link1: "http://www.searchscout.com",
link2: "",
name: "ClariaBot/1.0",
type: "R"
},
%{
comment: "",
description: "Claymont Search robot",
id: "id_a_f_161",
link1: "http://www.claymont.com",
link2: "",
name: "Claymont.com",
type: "R"
},
%{
comment: "212.80.76.xx",
description: "Seznam Search (Czech Republic) robot",
id: "id_a_f_100307_1",
link1: "http://www.seznam.cz/",
link2: "",
name: "CloakDetect/0.9 (+http://fulltext.seznam.cz/)",
type: "R"
},
%{
comment: "",
description: "Clush clustered search robot",
id: "id_a_f_162",
link1: "http://www.clush.com",
link2: "",
name: "Clushbot/2.x (+http://www.clush.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Clush clustered search robot",
id: "id_a_f_163",
link1: "http://www.clush.com",
link2: "",
name: "Clushbot/3.x-BinaryFury (+http://www.clush.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Clush clustered search robot",
id: "id_a_f_164",
link1: "http://www.clush.com",
link2: "",
name: "Clushbot/3.xx-Ajax (+http://www.clush.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Clush clustered search robot",
id: "id_a_f_165",
link1: "http://www.clush.com",
link2: "",
name: "Clushbot/3.xx-Hector (+http://www.clush.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Clush clustered search robot",
id: "id_a_f_166",
link1: "http://www.clush.com",
link2: "",
name: "Clushbot/3.xx-Peleus (+http://www.clush.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "COAST Webmaster - Web management and maintenance software",
id: "id_a_f_070506_1",
link1: "http://www.extablish.com/cwm.htm",
link2: "",
name: "COAST WebMaster Pro/4.x.x.xx (Windows NT)",
type: "C"
},
%{
comment: "",
description: "Proposed Content-Based Image Tracking System (CoBITS) P2P crawler",
id: "id_a_f_150306_1",
link1: "http://www.iis.sinica.edu.tw/~hungchi/CBIT/",
link2: "",
name: "CoBITSProbe",
type: "R C"
},
%{
comment: "",
description: "Cocoa del.icio.us (social bookmarks manager) client for Mac OS X",
id: "id_a_f_167",
link1: "http://www.scifihifi.com",
link2: "",
name: "Cocoal.icio.us/1.0 (v36) (Mac OS X; http://www.scifihifi.com/cocoalicious)",
type: "C"
},
%{
comment: "72.81.252.9x",
description: "Cogent Search Bot from Cogent Software Solutions for unknown purposes",
id: "id_a_f_070209_2",
link1: "http://www.cogentsoftwaresolutions.com/bot.html",
link2: "",
name: "Cogentbot/1.X (+http://www.cogentsoftwaresolutions.com/bot.html)",
type: "R"
},
%{
comment: "",
description:
"Cold Fusion server used by various IPs i.e.: - NetWORLD web catalogue link checking",
id: "id_a_f_168",
link1: "http://www.networld.com",
link2: "http://www.macromedia.com/software/coldfusion/",
name: "ColdFusion",
type: "P C"
},
%{
comment: "",
description: "Cold Fusion server used by Bookmark Tracker - online favourites managment",
id: "id_a_f_169",
link1: "http://www.bookmarktracker.com",
link2: "http://www.macromedia.com/software/coldfusion/",
name: "ColdFusion (BookmarkTracker.com)",
type: "C"
},
%{
comment: "",
description: "WebCollage Syndicator graphics crawler/collector",
id: "id_a_f_170",
link1: "http://www.webcollage.com",
link2: "",
name: "collage.cgi/1.xx",
type: "R D"
},
%{
comment: "130.235.4.xx",
description: "Combine harvesting & indexing robot",
id: "id_a_f_171",
link1: "http://combine.it.lth.se/",
link2: "",
name: "combine/0.0",
type: "R"
},
%{
comment: "130.235.4.xx",
description: "Combine harvesting & indexing robot",
id: "id_a_f_080406_1",
link1: "http://combine.it.lth.se/",
link2: "",
name: "Combine/2.0 http://combine.it.lth.se/",
type: "R"
},
%{
comment: "130.235.4.xx",
description: "Combine harvesting & indexing robot",
id: "id_a_f_160807_1",
link1: "http://combine.it.lth.se/",
link2: "",
name: "Combine/3 http://combine.it.lth.se/",
type: "R"
},
%{
comment: "130.235.4.xx",
description: "Combine harvesting & indexing robot",
id: "id_a_f_172",
link1: "http://combine.it.lth.se/",
link2: "",
name: "Combine/x.0",
type: "R"
},
%{
comment: "",
description: "cometrics Web Content Mining solution - Germany",
id: "id_a_f_280606_3",
link1: "http://www.cometrics.de/",
link2: "",
name: "cometrics-bot, http://www.cometrics.de",
type: "R"
},
%{
comment: "",
description:
"Wildsoft Germany (closed) Internet client system user-agent (was www.oskarweb.de)",
id: "id_a_f_173",
link1: "",
link2: "",
name: "Commerce Browser Center",
type: "B"
},
%{
comment: "216.182.233.1xx",
description: "UCLA Complex Networks Groups Complex Network Analysis",
id: "id_a_f_240107_1",
link1: "http://cantor.ee.ucla.edu/~networks/",
link2: "",
name:
"complex_network_group/Nutch-0.9-dev (discovering the structure of the world-wide-web; http://cantor.ee.ucla.edu/~networks/crawl; nimakhaj@gmail.com)",
type: "C"
},
%{
comment: "",
description: "Hungarian Academy of Sciences data mining search",
id: "id_a_f_174",
link1: "http://www.ilab.sztaki.hu/websearch/",
link2: "",
name: "Computer_and_Automation_Research_Institute_Crawler crawler@ilab.sztaki.hu",
type: "R"
},
%{
comment: "powered by Nutch",
description: "ComRite Chinese Search Engine for Oversea Web Sites (69.248.26.xx)",
id: "id_a_f_010406_2",
link1: "http://www.comrite.com/",
link2: "http://meidong.comrite.com/",
name:
"Comrite/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
type: "R"
},
%{
comment: "",
description: "unknown",
id: "id_a_f_175",
link1: "",
link2: "",
name: "Contact",
type: ""
},
%{
comment: "64.124.152.xx",
description: "Probably E-Mail harvesting robot - same as LMQueueBot",
id: "id_a_f_200307_1",
link1: "",
link2: "",
name: "ContactBot/0.2",
type: "S"
},
%{
comment: "",
description: "ContentSmartz e-mail harvesting tools",
id: "id_a_f_291105_7",
link1: "",
link2: "",
name: "ContentSmartz",
type: "S"
},
%{
comment: "NOT Contype mime type managment Perl script",
description: "Internet Explorer versions 4.x and 5 plugin content",
id: "id_a_f_176",
link1: "http://support.microsoft.com/default.aspx?scid=kb;en-us;293792",
link2: "",
name: "contype",
type: "B"
},
%{
comment: " s. also - infoConveraCrawler... - CrawlConvera ...",
description: "Converas RetrievalWare Internet Spider (63.241.61.x)",
id: "id_a_f_177",
link1: "http://www.convera.com",
link2: "",
name: "Convera Internet Spider V6.x",
type: "R"
},
%{
comment: " s. also - infoConveraCrawler... - CrawlConvera ...",
description: "Converas RetrievalWare Internet Spider (63.241.61.x)",
id: "id_a_f_178",
link1: "http://www.convera.com",
link2: "",
name: "ConveraCrawler/0.2",
type: "R"
},
%{
comment: " s. also - infoConveraCrawler... - CrawlConvera ...",
description: "Converas RetrievalWare Internet Spider (63.241.61.x)",
id: "id_a_f_051205_1",
link1: "http://www.convera.com/",
link2: "",
name: "ConveraCrawler/0.9d (+http://www.authoritativeweb.com/crawl)",
type: "R"
},
%{
comment: " s. also - infoConveraCrawler... - CrawlConvera ...",
description: "Converas RetrievalWare Internet Spider (63.241.61.x)",
id: "id_a_f_179",
link1: "http://www.convera.com",
link2: "",
name: "ConveraMultiMediaCrawler/0.1 (+http://www.authoritativeweb.com/crawl)",
type: "R"
},
%{
comment: "",
description: "Suchmaschine21 (Germany) robot",
id: "id_a_f_180",
link1: "http://www.suchmaschine21.de/",
link2: "",
name: "CoolBot",
type: "R"
},
%{
comment: "",
description: "Cooliris photo and video browser",
id: "id_a_f_030110_2",
link1: "http://www.cooliris.com/",
link2: "",
name: "Cooliris/1.5 CFNetwork/459 Darwin/10.0.0d3",
type: "B"
},
%{
comment: "",
description: "Coral Content Distribution Network",
id: "id_a_f_040406_1",
link1: "http://coralcdn.org/",
link2: "",
name: "CoralWebPrx/0.1.1x (See http://coralcdn.org/)",
type: "P C"
},
%{
comment: "",
description: "Xyleme SA France robot",
id: "id_a_f_181",
link1: "http://www.xyleme.com/en/index.jsp",
link2: "",
name: "cosmos/0.8_(robot@xyleme.com)",
type: "R"
},
%{
comment: "",
description: "Xyleme SA France robot",
id: "id_a_f_182",
link1: "http://www.xyleme.com/en/index.jsp",
link2: "",
name: "cosmos/0.9_(robot@xyleme.com)",
type: "R"
},
%{
comment: "",
description: "Coteo.com - local French directory link checking",
id: "id_a_f_040607_1",
link1: "http://www.coteo.com/",
link2: "",
name: "CoteoNutchCrawler/Nutch-0.9 (info [at] coteo [dot] com)",
type: "C"
},
%{
comment: "",
description: "Cougarsearch.com robot",
id: "id_a_f_030206_3",
link1: "http://www.cougarsearch.com/",
link2: "",
name: "CougarSearch/0.x (+http://www.cougarsearch.com/faq.shtml)",
type: "R"
},
%{
comment: "s.also ArachBot",
description: "Covac Arachnid Web Crawler",
id: "id_a_f_280408_2",
link1: "http://www.covac-software.com/",
link2: "",
name: "Covac TexAs Arachbot",
type: "R"
},
%{
comment: "",
description: "CoverScout for iTunes - CD cover search tool",
id: "id_a_f_211208_1",
link1: "http://www.equinux.com/de/products/coverscout/index.html",
link2: "",
name: "CoverScout%203/3.0.1 CFNetwork/339.5 Darwin/9.5.0 (i386) (iMac5,1)",
type: "B"
},
%{
comment: " s. also Python-urllib/1.15 - nabot - NaverBot & dloader",
description: "Naver Japan / Korea robot",
id: "id_a_f_183",
link1: "http://www.naver.co.jp",
link2: "",
name: "Cowbot-0.1 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)",
type: "R"
},
%{
comment: " s. also Python-urllib/1.15 - nabot - NaverBot & dloader",
description: "Naver Japan / Korea robot",
id: "id_a_f_184",
link1: "http://www.naver.co.jp",
link2: "",
name: "Cowbot-0.1.x (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)",
type: "R"
},
%{
comment: "s. also - Convera Internet Spider .. - infoConveraCrawler...",
description: "Converas RetrievalWare Internet Spider",
id: "id_a_f_185",
link1: "http://www.convera.com",
link2: "",
name: "CrawlConvera0.1 (CrawlConvera@yahoo.com)",
type: "R"
},
%{
comment: "",
description: "unknown robot via Level3.net",
id: "id_a_f_186",
link1: "",
link2: "",
name: "Crawler",
type: ""
},
%{
comment: "",
description: "Cometsystems Comet Search robot via Findwhat (now Miva)",
id: "id_a_f_187",
link1: "http://www.cometsystems.com",
link2: "http://www.miva.com/",
name: "Crawler (cometsearch@cometsystems.com)",
type: "R"
},
%{
comment: "",
description: "Crawler.de / Abacho robot",
id: "id_a_f_188",
link1: "http://www.crawler.de",
link2: "http://www.abacho.de/",
name: "Crawler admin@crawler.de",
type: "R"
},
%{
comment: "",
description: "Crawler.de / Abacho robot",
id: "id_a_f_189",
link1: "http://www.crawler.de",
link2: "http://www.abacho.de/",
name: "Crawler V 0.2.x admin@crawler.de",
type: "R"
},
%{
comment: "",
description: "Alexa crawler",
id: "id_a_f_190",
link1: "http://www.alexa.com",
link2: "",
name: "crawler@alexa.com",
type: "R"
},
%{
comment: "",
description: "Pinpoint WAP search robot",
id: "id_a_f_191",
link1: "http://www.pinpoint.com",
link2: "",
name: "CrawlerBoy Pinpoint.com",
type: "R"
},
%{
comment: "powered by Nutch",
description: "Crawlly Beta search - Germany (72.232.194.2xx)",
id: "id_a_f_130506_1",
link1: "http://www.crawlly.com/",
link2: "",
name: "Crawllybot/0.1 (Crawllybot; +http://www.crawlly.com; crawler@crawlly.com)",
type: "R"
},
%{
comment: "",
description: "Creatice Commons using Nutch open source robot",
id: "id_a_f_192",
link1: "http://www.nutch.org",
link2: "",
name:
"CreativeCommons/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)",
type: "R"
},
%{
comment: "",
description: "Cricket A100 cell phone browser",
id: "id_a_f_030110_3",
link1: "http://www.mycricket.com/cell-phones/details/Cricket-A100",
link2: "",
name: "Cricket-A100/1.0 UP.Browser/6.3.0.7 (GUI) MMP/2.0",
type: "B"
},
%{
comment: "",
description: "Croccrawler robot",
id: "id_a_f_193",
link1: "http://www.croccrawler.com",
link2: "",
name: "CrocCrawler vx.3 [en] (http://www.croccrawler.com) (X11; I; Linux 2.0.44 i686)",
type: "R"
},
%{
comment: "",
description:
"Web mining project from CSCI 659 (computer science course) at Indiana Univerity",
id: "id_a_f_090306_2",
link1: "http://informatics.indiana.edu/fil/Class/b659/",
link2: "",
name: "csci_b659/0.13",
type: "R"
},
%{
comment: "",
description: "CSE HTML Validator for Windows",
id: "id_a_f_180906_1",
link1: "http://www.htmlvalidator.com/",
link2: "",
name: "CSE HTML Validator Professional (http://www.htmlvalidator.com/)",
type: "C"
},
%{
comment: "site is dead",
description: "Cuam - IE based browser",
id: "id_a_f_194",
link1: "http://cuam.virtualave.net",
link2: "",
name: "Cuam Ver0.050bx",
type: "B"
},
%{
comment: "",
description: "Cuasar (Spain) music / ringtone search spider",
id: "id_a_f_195",
link1: "http://www.cuasar.com",
link2: "",
name: "Cuasarbot/0.9b http://www.cuasar.com/spider_beta/ ",
type: "R"
},
%{
comment: "",
description: "Curl file transferring tool",
id: "id_a_f_196",
link1: "http://curl.haxx.se/",
link2: "",
name: "curl/7.10.x (i386-redhat-linux-gnu) libcurl/7.10.x OpenSSL/0.9.7a ipv6 zlib/1.1.4",
type: "D"
},
%{
comment: "",
description: "Curl file transferring tool",
id: "id_a_f_197",
link1: "http://curl.haxx.se/",
link2: "",
name: "curl/7.7.x (i386--freebsd4.3) libcurl 7.7.x (SSL 0.9.6) (ipv6 enabled)",
type: "D"
},
%{
comment: "",
description: "Curl file transferring tool",
id: "id_a_f_198",
link1: "http://curl.haxx.se/",
link2: "",
name: "curl/7.8 (i686-pc-linux-gnu) libcurl 7.8 (OpenSSL 0.9.6)",
type: "D"
},
%{
comment: "",
description: "Curl file transferring tool",
id: "id_a_f_199",
link1: "http://curl.haxx.se/",
link2: "",
name: "curl/7.9.x (win32) libcurl 7.9.x",
type: "D"
},
%{
comment: "",
description: "CurryGuide UK link check robot",
id: "id_a_f_200",
link1: "http://uk.curryguide.com/",
link2: "",
name: "CurryGuide SiteScan 1.1",
type: "R"
},
%{
comment: "s. also - - Mozilla/5.0 (compatible; Custo 3...",
description: "Custo web site spidering tool (link checking)",
id: "id_a_f_201",
link1: "http://www.netwu.com",
link2: "",
name: "Custo x.x (www.netwu.com)",
type: "C"
},
%{
comment: "",
description: "Bisnisseek (was www.bisnisseek.com) robot",
id: "id_a_f_202",
link1: "",
link2: "",
name: "Custom Spider www.bisnisseek.com /1.0",
type: "R"
},
%{
comment: "",
description: "Cyberdog Mac Browser (was www.cyberdog.org)",
id: "id_a_f_203",
link1: "",
link2: "",
name: "Cyberdog/2.0 (Macintosh; 68k)",
type: "B"
},
%{
comment: "38.103.17.16x",
description: "CyberPatrol LLC robot for web filtering software",
id: "id_a_f_260608_2",
link1: "http://www.cyberpatrol.com/cyberpatrolcrawler.asp",
link2: "",
name: "CyberPatrol SiteCat Webbot (http://www.cyberpatrol.com/cyberpatrolcrawler.asp)",
type: "R"
},
%{
comment: "",
description: "CyberSpyder Link Test software",
id: "id_a_f_204",
link1: "http://www.cyberspyder.com/cslnkts1.html",
link2: "",
name: "CyberSpyder Link Test/2.1.12 (admin@mspennyworth.com)",
type: "C"
},
%{
comment: "",
description: "Cydral image & site search spider",
id: "id_a_f_205",
link1: "http://www.cydral.com",
link2: "",
name: "CydralSpider/1.x (Cydral Web Image Search; http://www.cydral.com)",
type: "R"
},
%{
comment: "",
description: "Cydral image & site search spider",
id: "id_a_f_060508_1",
link1: "http://www.cydral.com",
link2: "",
name: "CydralSpider/3.0 (Cydral Image Search; http://www.cydral.com)",
type: "R"
},
%{
comment: "",
description: "Downloadaccelerator download manager",
id: "id_a_f_206",
link1: "http://www.downloadaccelerator.com",
link2: "",
name: "DA 3.5 (www.lidan.com)",
type: "D"
},
%{
comment: "",
description: "Downloadaccelerator download manager",
id: "id_a_f_207",
link1: "http://www.downloadaccelerator.com",
link2: "",
name: "DA 4.0",
type: "D"
},
%{
comment: "",
description: "Downloadaccelerator download manager",
id: "id_a_f_208",
link1: "http://www.downloadaccelerator.com",
link2: "",
name: "DA 4.0 (www.downloadaccelerator.com)",
type: "D"
},
%{
comment: "",
description: "Downloadaccelerator download manager",
id: "id_a_f_209",
link1: "http://www.downloadaccelerator.com",
link2: "",
name: "DA 5.0",
type: "D"
},
%{
comment: "",
description: "Downloadaccelerator download manager",
id: "id_a_f_210",
link1: "http://www.downloadaccelerator.com",
link2: "",
name: "DA 7.0",
type: "D"
},
%{
comment: "",
description: "Download Accelerator Plus download manager",
id: "id_a_f_070209_3",
link1: "http://www.speedbit.com/",
link2: "",
name: "DAP x.x",
type: "D"
},
%{
comment: "",
description: "PowerTCP ActiveX control tool",
id: "id_a_f_211",
link1: "http://www.dart.com",
link2: "",
name: "Dart Communications PowerTCP",
type: ""
},
%{
comment: "",
description: "Unknown bot from Kornet Korea (218.149.129.xxx) scans for Perl Awstats",
id: "id_a_f_212",
link1: "",
link2: "",
name: "DataCha0s/2.0",
type: "S"
},
%{
comment: "from various IPs",
description: "Unknown UA looking for Awstats Perl components",
id: "id_a_f_101106_1",
link1: "",
link2: "",
name: "DataCha0s/2.0",
type: "S"
},
%{
comment: "138.23.85.xx",
description: "INFOMINE/iVia Scholary Internet Resource Collections robot",
id: "id_a_f_213",
link1: "http://infomine.ucr.edu/",
link2: "http://ivia.ucr.edu/useragents.shtml",
name: "DataFountains/DMOZ Downloader",
type: "R"
},
%{
comment: "138.23.85.xx",
description: "INFOMINE/iVia Scholary Internet Resource Collections robot",
id: "id_a_f_040307_1",
link1: "http://infomine.ucr.edu/",
link2: "http://ivia.ucr.edu/useragents.shtml",
name: "DataFountains/Dmoz Downloader (http://ivia.ucr.edu/useragents.shtml)",
type: "R"
},
%{
comment: "138.23.85.xx",
description: "INFOMINE/iVia Scholary Internet Resource Collections robot",
id: "id_a_f_110307_1",
link1: "http://infomine.ucr.edu/",
link2: "http://ivia.ucr.edu/useragents.shtml",
name:
"DataFountains/DMOZ Feature Vector Corpus Creator (http://ivia.ucr.edu/useragents.shtml)",
type: "R"
},
%{
comment: "",
description: "DataparkSearch open source search engine",
id: "id_a_f_050907_1",
link1: "http://www.dataparksearch.org",
link2: "",
name: "DataparkSearch/4.47 (+http://dataparksearch.org/bot)",
type: "R"
},
%{
comment: "",
description: "DataparkSearch open source search engine",
id: "id_a_f_214",
link1: "http://www.dataparksearch.org",
link2: "",
name: "DataparkSearch/4.xx (http://www.dataparksearch.org/)",
type: "R"
},
%{
comment: "",
description: "DataSpear Directory robot (24.109.29.xx)",
id: "id_a_f_080206_1",
link1: "http://www.dataspear.com/",
link2: "",
name:
"DataSpear/1.0 (Spider; http://www.dataspear.com/spider.html; spider@dataspear.com)",
type: "R"
},
%{
comment: "",
description: "DataSpear Directory robot (24.109.29.xx)",
id: "id_a_f_215",
link1: "http://www.dataspear.com/",
link2: "",
name:
"DataSpearSpiderBot/0.2 (DataSpear Spider Bot; http://dssb.dataspear.com/bot.html; dssb@dataspear.com)",
type: "R"
},
%{
comment: "",
description: "Sicher-durchs-Netz German security related search (62.75.220.xxx)",
id: "id_a_f_161105_1",
link1: "http://www.sicher-durchs-netz.de/suche",
link2: "",
name: "DatenBot( http://www.sicher-durchs-netz.de/bot.html)",
type: "R"
},
%{
comment: "site is closed",
description: "Wholeweb robot",
id: "id_a_f_216",
link1: "http://www.wholeweb.net",
link2: "",
name: "DaviesBot/1.7 (www.wholeweb.net)",
type: "R"
},
%{
comment: "",
description: "Daypop blog - weblog - online mag search spider",
id: "id_a_f_217",
link1: "http://www.daypop.com/info/about.htm",
link2: "",
name: "daypopbot/0.x",
type: "R"
},
%{
comment: "",
description: "dbDig search engine",
id: "id_a_f_218",
link1: "http://www.prairielandconsulting.com",
link2: "",
name: "dbDig(http://www.prairielandconsulting.com)",
type: "R"
},
%{
comment: "UA sometimes - DSurf15a 01 - DBrowse 1.4d",
description:
"Some site scanning tool via diff. IPs i.e.: - wanweb.net (208.6.163.xxx) - cox.net (68.4.xxx.xxx)",
id: "id_a_f_219",
link1: "",
link2: "",
name: "DBrowse 1.4b",
type: "S"
},
%{
comment: "see also DSurf15a 01 - DBrowse 1.4b",
description: "Some site scanning tool via diff. IPs i.e.: - pacbell.net (67.112.xxx.xxx)",
id: "id_a_f_220",
link1: "",
link2: "",
name: "DBrowse 1.4d",
type: "S"
},
%{
comment: "",
description: "DC-Sakura download manager",
id: "id_a_f_221",
link1: "http://www.dc-sakura.com/",
link2: "",
name: "DC-Sakura/x.xx",
type: "D"
},
%{
comment: "",
description: "unknown divine/Openmarket.com robot",
id: "id_a_f_222",
link1: "http://www.openmarket.com/",
link2: "",
name: "dCSbot/1.1",
type: "R"
},
%{
comment: "",
description: "some (website) downloading tool",
id: "id_a_f_223",
link1: "",
link2: "",
name: "DDD",
type: "D"
},
%{
comment: "",
description: "Unknown user agent",
id: "id_a_f_224",
link1: "",
link2: "",
name: "dds explorer v1.0 beta",
type: ""
},
%{
comment: "",
description: "Searchengine.com (Germany) submission checking / robot (84.73.57.xx)",
id: "id_a_f_225",
link1: "http://de.searchengine.com",
link2: "",
name: "de.searchengine.comBot 1.2 (http://de.searchengine.com/spider)",
type: "R"
},
%{
comment: "",
description: "DLC Perl HTTP link checking",
id: "id_a_f_226",
link1: "http://dlc.sourceforge.net/",
link2: "",
name: "DeadLinkCheck/0.4.0 libwww-perl/5.xx",
type: "C"
},
%{
comment: "216.89.111.x",
description: "Sootle Web Directory deep link checker",
id: "id_a_f_111206_3",
link1: "http://directory.sootle.com/deep-links/",
link2: "",
name: "Deep Link Calculator v1.0",
type: "C"
},
%{
comment: "",
description: "deepak-USC/ISI robot from USC/Information Science Institute",
id: "id_a_f_227",
link1: "http://www.isi.edu/%7Eravichan/deepak-usc-isi.html",
link2: "http://www.isi.edu/",
name: "deepak-USC/ISI",
type: "R"
},
%{
comment: "",
description: "Deepindex robot",
id: "id_a_f_228",
link1: "http://www.deepindex.net/utilisateurs.php?referral=deepindex",
link2: "",
name: "DeepIndex",
type: "R"
},
%{
comment: "",
description: "Zetbot search Belgium (213.41.128.xx) using Deepindex robot",
id: "id_a_f_229",
link1: "http://www.zetbot.com/",
link2: "http://www.deepindex.net/utilisateurs.php?referral=deepindex",
name: "DeepIndex ( http://www.zetbot.com )",
type: "R"
},
%{
comment: "",
description: "Deepindex robot",
id: "id_a_f_230",
link1: "http://www.deepindex.net/utilisateurs.php?referral=deepindex",
link2: "",
name: "DeepIndex (www.en.deepindex.com)",
type: "R"
},
%{
comment: "",
description: "Deepindex robot (via Paragon.net Canada)",
id: "id_a_f_231",
link1: "http://www.deepindex.net/utilisateurs.php?referral=deepindex",
link2: "",
name: "DeepIndexer.ca",
type: "R"
},
%{
comment: "66.94.237.1xx",
description: "del.icio.us picture robot for thumbnail preview via Yahoo",
id: "id_a_f_011006_2",
link1: "http://del.icio.us/",
link2: "",
name:
"del.icio.us-thumbnails/1.0 Mozilla/5.0 (compatible; Konqueror/3.4; FreeBSD) KHTML/3.4.2 (like Gecko)",
type: "D"
},
%{
comment: "",
description: "DeleGate application level gateway / proxy server",
id: "id_a_f_250106_1",
link1: "http://www.delegate.org/delegate/",
link2: "",
name: "DeleGate/9.0.5-fix1",
type: "P"
},
%{
comment: "",
description: "Some site scanning tool from 217.34.59.xxx (btopenworld.com)",
id: "id_a_f_232",
link1: "",
link2: "",
name: "Demo Bot DOT 16b",
type: "S"
},
%{
comment: "appears also as - MFC Foundation Class Library - Full Web Bot 0516B",
description: "Some site scanning tool from 68.154.96.xx (bellsouth.net)",
id: "id_a_f_233",
link1: "",
link2: "",
name: "Demo Bot Z 16b",
type: "S"
},
%{
comment: "",
description: "Denmex Websearch robot/link checking",
id: "id_a_f_234",
link1: "http://search.denmex.com",
link2: "",
name: "Denmex websearch (http://search.denmex.com)",
type: "R"
},
%{
comment: "",
description: "DataBecker Bilder Sauger (discontinued) web graphics downloader",
id: "id_a_f_235",
link1: "http://www.databecker.de",
link2: "",
name: "Der große BilderSauger 2.00u",
type: "D"
},
%{
comment: "",
description: "Searchspider.com robot (72.245.225.xxx)",
id: "id_a_f_230206_1",
link1: "http://www.searchspider.com/",
link2: "",
name: "dev-spider2.searchpsider.com/1.3b",
type: "R"
},
%{
comment: "",
description: "DevComponents HTMLDocument Class Library for Visual Studio.net",
id: "id_a_f_236",
link1: "http://www.devcomponents.com",
link2: "",
name: "DevComponents.com HtmlDocument Object",
type: ""
},
%{
comment: "(site is offline)",
description: "DiaGem Japan web crawler",
id: "id_a_f_237",
link1: "http://www.skyrocket.gr.jp",
link2: "",
name: "DiaGem/1.1 (http://www.skyrocket.gr.jp/diagem.html)",
type: "R"
},
%{
comment: "s. also Claria",
description: "Claria (ex Gator) SearchScout robot (64.152.73.xx)",
id: "id_a_f_238",
link1: "http://www.searchscout.com",
link2: "",
name: "Diamond/x.0",
type: "R"
},
%{
comment: "s. also Claria",
description: "Claria (ex Gator) SearchScout robot (64.152.73.xx)",
id: "id_a_f_239",
link1: "http://www.searchscout.com",
link2: "",
name: "DiamondBot",
type: "R"
},
%{
comment: "",
description: "Diggit! robot",
id: "id_a_f_240",
link1: "http://www.diggit.com",
link2: "",
name: "Digger/1.0 JDK/1.3.0rc3",
type: "R"
},
%{
comment: "",
description: "OpenPortal4U robot",
id: "id_a_f_241",
link1: "http://www.arisem.com",
link2: "",
name: "DigOut4U",
type: "R"
},
%{
comment: "",
description: "Findsame.com (site is offline) / Digital-Integrity robot",
id: "id_a_f_242",
link1: "http://www.digital-integrity.com/",
link2: "",
name: "DIIbot/1.2",
type: "R"
},
%{
comment: "",
description: "Dillo Web Browser",
id: "id_a_f_100206_1",
link1: "http://www.dillo.org/",
link2: "",
name: "Dillo/0.8.5-i18n-misc",
type: "B"
},
%{
comment: "",
description: "Dillo Web Browser",
id: "id_a_f_243",
link1: "http://www.dillo.org/",
link2: "",
name: "Dillo/0.x.x",
type: "B"
},
%{
comment: "",
description: "disastrous - a del.icio.us link checker based on Python",
id: "id_a_f_100109_1",
link1: "http://www.bortzmeyer.org/disastrous.html",
link2: "",
name:
"disastrous/1.0.5 (running with Python 2.5.1; http://www.bortzmeyer.org/disastrous.html; archangel77@del.icio.us)",
type: "C"
},
%{
comment: "No active homepage",
description: "DISCo Pump offline browser / website ripper",
id: "id_a_f_140306_1",
link1: "http://www.arssoft.com/",
link2: "http://www.filetransit.com/view.php?id=3870",
name: "DISCo Pump x.x",
type: "D"
},
%{
comment: "208.96.54.xx",
description: "Unkown robot from Discovery Engine Corp.",
id: "id_a_f_300907_1",
link1: "http://www.discoveryengine.com/",
link2: "",
name:
"disco/Nutch-0.9 (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)",
type: "R"
},
%{
comment: "208.96.54.xx",
description: "Unkown robot from Discovery Engine Corp.",
id: "id_a_f_300907_2",
link1: "http://www.discoveryengine.com/",
link2: "",
name:
"disco/Nutch-1.0-dev (experimental crawler; www.discoveryengine.com; disco-crawl@discoveryengine.com)",
type: "R"
},
%{
comment: "",
description: "Ditto picture search robot",
id: "id_a_f_244",
link1: "http://www.ditto.com",
link2: "",
name: "DittoSpyder",
type: "R"
},
%{
comment: "Wildsoft Surfer",
description: "some download agent",
id: "id_a_f_245",
link1: "",
link2: "",
name: "dlman",
type: "D"
},
%{
comment: "s. also Python-urllib/1.15 - nabot - NaverBot & Cowbot",
description: "Naver Japan / Korea robot",
id: "id_a_f_246",
link1: "http://www.naver.co.jp",
link2: "",
name: "dloader(NaverRobot)/1.0",
type: "R"
},
%{
comment: "203.161.71.17x",
description: "DNS Right - Online DNS tools",
id: "id_a_f_100408_1",
link1: "http://www.dnsright.com/",
link2: "",
name: "DNSRight.com WebBot Link Ckeck Tool. Report abuse to: dnsr@dnsright.com",
type: "C"
},
%{
comment: "",
description: "NTT DoCoMo (Japan) robot",
id: "id_a_f_247",
link1: "http://www.nttdocomo.co.jp/",
link2: "",
name: "DoCoMo/1.0/Nxxxi/c10",
type: "R"
},
%{
comment: "",
description: "NTT DoCoMo (Japan) robot",
id: "id_a_f_248",
link1: "http://www.nttdocomo.co.jp/",
link2: "",
name: "DoCoMo/1.0/Nxxxi/c10/TB",
type: "R"
},
%{
comment: "",
description: "Google (216.239.39.x) proxy server",
id: "id_a_f_249",
link1: "",
link2: "",
name: "DoCoMo/1.0/P502i/c10 (Google CHTML Proxy/1.0)",
type: "P"
},
%{
comment: "",
description: "NTT DoCoMo (Japan) robot",
id: "id_a_f_250",
link1: "http://www.nttdocomo.co.jp/",
link2: "",
name: "DoCoMo/2.0 P900iV(c100;TB;W24H11) ",
type: "R"
},
%{
comment: "",
description: "NTT DoCoMo (Japan) proxy server (210.136.161.1xx)",
id: "id_a_f_141205_1",
link1: "http://www.nttdocomo.co.jp/",
link2: "",
name: "DoCoMo/2.0 SH901iS(c100;TB;W24H12),gzip(gfe) (via translate.google.com)",
type: "P"
},
%{
comment: "s. also Y!J-SRD/1.0",
description: "Yahoo Search Japan robot (203.216.197.xxx)",
id: "id_a_f_081207_1",
link1: "http://www.yahoo.co.jp/",
link2: "",
name:
"DoCoMo/2.0 SH902i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)",
type: "R"
},
%{
comment: "s. also Y!J-SRD/1.0",
description: "Yahoo Search Japan robot (203.216.197.xxx)",
id: "id_a_f_271006_3",
link1: "http://www.yahoo.co.jp/",
link2: "",
name:
"DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0; http://help.yahoo.co.jp/help/jp/search/indexing/indexing-27.html)",
type: "R"
},
%{
comment: "",
description: "DocZilla - Mozilla-based SGML/XML/HTML- browser",
id: "id_a_f_251",
link1: "http://www.doczilla.com",
link2: "",
name: "DocZilla/1.0 (Windows; U; WinNT4.0; en-US; rv:1.0.0) Gecko/20020804",
type: "B"
},
%{
comment: "212.174.130.1xx",
description:
"unknown robot from AGMLAB Information Technologies (Information retrieval system ?)",
id: "id_a_f_210607_1",
link1: "http://www.agmlab.com/agmlab_eng.html",
link2: "",
name: "dodgebot/experimental",
type: "R"
},
%{
comment: "",
description: "Donut P - Japanese IE based browser",
id: "id_a_f_180606_1",
link1: "http://donutp.com/",
link2: "",
name: "DonutP; Windows98SE",
type: "B"
},
%{
comment: "59.151.41.xx",
description: "Unknown robot from douban search (China) - maybe image crawling",
id: "id_a_f_250907_2",
link1: "http://www.douban.com/",
link2: "",
name: "Doubanbot/1.0 (bot@douban.com http://www.douban.com)",
type: ""
},
%{
comment: "",
description: "Download Demon/Netzip download manager",
id: "id_a_f_252",
link1: "http://www.netzip.com",
link2: "",
name: "Download Demon/3.x.x.x",
type: "D"
},
%{
comment: "",
description: "Download Druid IE plugin download manager",
id: "id_a_f_191105_4",
link1: "http://www.xemico.com/druid/index.html",
link2: "",
name: "Download Druid 2.x",
type: "D"
},
%{
comment: "",
description: "Download Express download manager",
id: "id_a_f_253",
link1: "http://www.metaproducts.com",
link2: "",
name: "Download Express 1.0",
type: "D"
},
%{
comment: "",
description: "Download Master download manager",
id: "id_a_f_254",
link1: "http://www.westbyte.com/dm/index.phtml",
link2: "",
name: "Download Master",
type: "D"
},
%{
comment: "",
description: "Download Ninja download manager (Japan)",
id: "id_a_f_191105_5",
link1: "http://www.h-fd.org/mkro/mt/archives/2002/09/download_ninja_1.html",
link2: "",
name: "Download Ninja 3.0",
type: "D"
},
%{
comment: "",
description: "Download Wonder download manager",
id: "id_a_f_255",
link1: "http://www.forty.com",
link2: "",
name: "Download Wonder",
type: "D"
},
%{
comment: "",
description: "Download-Tipp Germany link checking",
id: "id_a_f_256",
link1: "http://download-tipp.de/",
link2: "",
name: "Download-Tipp Linkcheck (http://download-tipp.de/)",
type: "R"
},
%{
comment: "",
description: "download.exe .NET based downloading tool",
id: "id_a_f_257",
link1: "http://www.sql-und-xml.de/freeware-tools/",
link2: "",
name: "Download.exe(1.1) (+http://www.sql-und-xml.de/freeware-tools/)",
type: "D"
},
%{
comment: "",
description: "Download Direct download manager",
id: "id_a_f_300907_3",
link1: "http://senbit.com/",
link2: "",
name: "DownloadDirect.1.0",
type: "D"
},
%{
comment: "",
description: "Dr.WEB online virus scanner",
id: "id_a_f_258",
link1: "http://online.drweb.com",
link2: "",
name: "Dr.Web (R) online scanner: http://online.drweb.com/",
type: ""
},
%{
comment: "",
description: "Dragonfly CMS - Open Source content management system",
id: "id_a_f_259",
link1: "http://www.cpgnuke.com",
link2: "",
name: "Dragonfly File Reader",
type: "B"
},
%{
comment: "",
description: "Drecom Japan (210.233.67.xxx) - Blog search ??",
id: "id_a_f_260",
link1: "http://www.drecom.co.jp",
link2: "",
name: "Drecombot/1.0 (http://career.drecom.jp/bot.html)",
type: "R"
},
%{
comment: "",
description: "Drupal - open source content management platform",
id: "id_a_f_3090906_1",
link1: "http://drupal.org/",
link2: "",
name: "Drupal (+http://drupal.org/)",
type: "C"
},
%{
comment: "DBrowse 1.4d",
description:
"Some site scanning tool via diff. IPs i.e.: - cox.net (68.5.xxx.xxx) - pacbell.net (64.16x.xxx.xxx)",
id: "id_a_f_261",
link1: "",
link2: "",
name: "DSurf15a 01",
type: "S"
},
%{
comment: "TRPMFHXE",
description: "Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)",
id: "id_a_f_262",
link1: "",
link2: "",
name: "DSurf15a 71",
type: "S"
},
%{
comment: "WFRIKXVNFL",
description: "Some site scanning tool via diff. IPs i.e.: - verizon.net (4.47.xxx.xxx)",
id: "id_a_f_263",
link1: "",
link2: "",
name: "DSurf15a 81",
type: "S"
},
%{
comment: "",
description:
"Some site scanning tool via diff. IPs i.e.: - eastlink.ca (24.222.xxx.xxx) - cogeco.net (216.221.8x.xxx)",
id: "id_a_f_264",
link1: "",
link2: "",
name: "DSurf15a VA",
type: "S"
},
%{
comment: "",
description: "DTAAgent Java object for data collecting",
id: "id_a_f_020506_2",
link1:
"http://www.ibr.cs.tu-bs.de/courses/ss00/sep-vs/gruppe1/jdoc/DTA/agent/DTAAgent.html",
link2: "",
name: "DTAAgent",
type: "R D"
},
%{
comment: "",
description: "dt Search Spider software",
id: "id_a_f_265",
link1: "http://www.dtsearch.com/spider.html",
link2: "",
name: "dtSearchSpider",
type: "R"
},
%{
comment: "",
description: "Fourelle Venturi proxy server",
id: "id_a_f_266",
link1: "http://www.fourelle.com/news/articles/148457.htm",
link2: "",
name: "Dual Proxy",
type: "P"
},
%{
comment: "72.94.249.34",
description: "Duck Duck Go search crawler",
id: "id_a_f_290308_2",
link1: "http://duckduckgo.com/",
link2: "http://duckduckgo.com/duckduckbot.html",
name: "DuckDuckBot/1.0; (+http://duckduckgo.com/duckduckbot.html)",
type: "R"
},
%{
comment: "",
description: "DumbFind.com robot",
id: "id_a_f_267",
link1: "http://www.dumbfind.com",
link2: "",
name: "Dumbot(version 0.1 beta - dumbfind.com)",
type: "R"
},
%{
comment: "",
description: "DumbFind.com robot",
id: "id_a_f_268",
link1: "http://www.dumbfind.com",
link2: "",
name: "Dumbot(version 0.1 beta - http://www.dumbfind.com/dumbot.html)",
type: "R"
},
%{
comment: "",
description: "DumbFind.com robot",
id: "id_a_f_269",
link1: "http://www.dumbfind.com",
link2: "",
name: "Dumbot(version 0.1 beta)",
type: "R"
},
%{
comment: "",
description: "Vigiltech e-Sense user research robot (website is offline)",
id: "id_a_f_270",
link1: "",
link2: "",
name: "e-sense 1.0 ea(www.vigiltech.com/esensedisclaim.html)",
type: "R"
},
%{
comment: "",
description: "e-Society Project (Japan) crawler (133.9.238.xx)",
id: "id_a_f_271",
link1: "http://www.yama.info.waseda.ac.jp",
link2: "",
name: "e-SocietyRobot(http://www.yama.info.waseda.ac.jp/~yamana/es/)",
type: "R"
},
%{
comment: "",
description: "Global Opto's eApollo Flash based search engine - Taiwan",
id: "id_a_f_280108_1",
link1: "http://www.eapollo.com/eaSE.jsp?language=eng",
link2: "http://www.global-opto.com/",
name:
"eApolloBot/2.0 (compatible; heritrix/2.0.0-SNAPSHOT-20071024.170148 +http://www.eapollo-opto.com)",
type: "R"
},
%{
comment: "s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ...",
description: "Earthcom (Czech Republic) search robot (194.108.39.xx)",
id: "id_a_f_272",
link1: "http://www.earthcom.info",
link2: "",
name: "EARTHCOM.info/1.x [www.earthcom.info]",
type: "R"
},
%{
comment: "s. also Mozilla/5.0 (compatible; EARTHCOM.info/2.01 ...",
description: "Earthcom (Czech Republic) search robot (194.108.39.xx)",
id: "id_a_f_273",
link1: "http://www.earthcom.info",
link2: "",
name: "EARTHCOM.info/1.xbeta [www.earthcom.info]",
type: "R"
},
%{
comment: "",
description: "Keywen Encyclopedia Bot",
id: "id_a_f_274",
link1: "http://keywen.com/Encyclopedia/Bot/",
link2: "",
name: "EasyDL/3.xx",
type: "R"
},
%{
comment: "",
description: "Keywen Encyclopedia Bot",
id: "id_a_f_275",
link1: "http://keywen.com/Encyclopedia/Bot/",
link2: "",
name: "EasyDL/3.xx http://keywen.com/Encyclopedia/Bot",
type: "R"
},
%{
comment: "",
description: "Some site scanning tool via diff. IPs i.e.: - swbell.net (65.66.xxx.xxx)",
id: "id_a_f_276",
link1: "",
link2: "",
name: "EBrowse 1.4b",
type: "S"
},
%{
comment: "",
description: "eCatch (now Wysigot) offline browser",
id: "id_a_f_277",
link1: "http://www.ecatch.com",
link2: "",
name: "eCatch/3.0",
type: "B D"
},
%{
comment: "",
description: "Echo.fr robot",
id: "id_a_f_278",
link1: "http://echo.fr/",
link2: "",
name: "EchO!/2.0",
type: "R"
},
%{
comment:
"s. also DSurf - 66.118.1xx.xxx (sagonet.com) - see also Full Web Bot - Industry Program 1.0.5",
description: "Some site scanning tool via diff. IPs i.e.: - cox.net (68.4.xxx.xxx)",
id: "id_a_f_279",
link1: "",
link2: "",
name: "Educate Search VxB",
type: "S"
},
%{
comment: "",
description: "Xdefine text search engine robot - based on Egothor open source crawler",
id: "id_a_f_280",
link1: "http://www.xdefine.com/",
link2: "http://www.egothor.org/",
name: "egothor/3.0a (+http://www.xdefine.org/robot.html)",
type: "R"
},
%{
comment: "",
description: "Egoto Search robot",
id: "id_a_f_281",
link1: "http://www.egoto.com",
link2: "",
name: "EgotoBot/4.8 (+http://www.egoto.com/about.htm)",
type: "R"
},
%{
comment: "",
description: "eJupiter searcg robot (206.191.49.xx)",
id: "id_a_f_211105_1",
link1: "http://search.ejupiter.com/",
link2: "",
name: "ejupiter.com",
type: "R"
},
%{
comment: "s. also TimelyWeb/...",
description: "TimelyWeb web page monitoring tool",
id: "id_a_f_282",
link1: "http://www.eldos.org/timelyweb/timelyweb.html",
link2: "",
name: "EldoS TimelyWeb/3.x",
type: "C"
},
%{
comment: "",
description: "Elftales crawler for uChoose theme based search (Germany)",
id: "id_a_f_283",
link1: "http://www.uchoose.de",
link2: "",
name: "elfbot/1.0 (+http://www.uchoose.de/crawler/elfbot/)",
type: "R"
},
%{
comment: "211.115.109.1xx",
description: "DAUMOA - RSS search robot of Daum",
id: "id_a_f_300707_1",
link1: "http://ws.daum.net/abouten.html",
link2: "",
name:
"ELI/20070402:2.0 (DAUM RSS Robot, Daum Communications Corp.; +http://ws.daum.net/aboutkr.html)",
type: "R"
},
%{
comment: "",
description: "ELinks text mode browser",
id: "id_a_f_284",
link1: "http://elinks.or.cz/",
link2: "",
name: "ELinks (0.x.x; Linux 2.4.20 i586; 132x60)",
type: "B"
},
%{
comment: "",
description: "ELinks text mode browser",
id: "id_a_f_285",
link1: "http://elinks.or.cz/",
link2: "",
name: "ELinks/0.x.x (textmode; NetBSD 1.6.2 sparc; 132x43)",
type: "B"
},
%{
comment: "",
description: "Sonic E-mail collector",
id: "id_a_f_286",
link1: "http://www.americaint.com/superstore/elist.html",
link2: "",
name: "EmailSiphon",
type: "S"
},
%{
comment: "",
description: "EmailSpider E-mail harvesting software",
id: "id_a_f_220508_2",
link1: "http://www.emailspider.net/index.php?kat=11",
link2: "",
name: "EmailSpider",
type: "S"
},
%{
comment: "",
description: "Trellian EMailWolf E-mail collector",
id: "id_a_f_287",
link1: "http://www.trellian.com",
link2: "",
name: "EmailWolf 1.00",
type: "S"
},
%{
comment: "",
description: "EmeraldShield spam and web filtration services",
id: "id_a_f_288",
link1: "http://www.emeraldshield.com",
link2: "",
name: "EmeraldShield.com WebBot",
type: "P R"
},
%{
comment: "",
description: "EmeraldShield spam and web filtration services",
id: "id_a_f_289",
link1: "http://www.emeraldshield.com",
link2: "",
name: "EmeraldShield.com WebBot (http://www.emeraldshield.com/webbot.aspx)",
type: "P R"
},
%{
comment: "",
description: "Empas search Korea robot (220.95.22x.xxx)",
id: "id_a_f_070606_2",
link1: "http://www.empas.com/",
link2: "",
name: "EMPAS_ROBOT",
type: "R"
},
%{
comment: "",
description: "Enabot - Enaball semantic search project crawler",
id: "id_a_f_280208_1",
link1: "http://www.enaball.com/crawler.html",
link2: "",
name: "EnaBot/1.x (http://www.enaball.com/crawler.html)",
type: "R"
},
%{
comment: "",
description: "endo - Mac news site and blog aggregator",
id: "id_a_f_110506_4",
link1: "http://kula.jp/software/endo/",
link2: "",
name: "endo/1.0 (Mac OS X; ppc i386; http://kula.jp/endo)",
type: "B"
},
%{
comment: "",
description: "Enfish Personal search tool",
id: "id_a_f_290",
link1: "http://www.enfish.com",
link2: "",
name: "Enfish Tracker",
type: "R"
},
%{
comment: " s. also - ES.NET_Crawler - InnerpriseBot",
description: "Enterprise Search engine software (64.202.165.xxx)",
id: "id_a_f_291",
link1: "http://www.innerprise.net",
link2: "",
name: "Enterprise_Search/1.0",
type: "R"
},
%{
comment: " s. also - ES.NET_Crawler - InnerpriseBot",
description: "Enterprise Search engine software (64.202.165.xxx)",
id: "id_a_f_292",
link1: "http://www.innerprise.net",
link2: "",
name: "Enterprise_Search/1.0.xxx",
type: "R"
},
%{
comment: " s. also - ES.NET_Crawler - InnerpriseBot",
description: "Enterprise Search engine software (64.202.165.xxx)",
id: "id_a_f_293",
link1: "http://www.innerprise.net",
link2: "",
name: "Enterprise_Search/1.00.xxx;MSSQL (http://www.innerprise.net/es-spider.asp)",
type: "R"
},
%{
comment: "70.169.191.x",
description: "Envolk Web Search robot",
id: "id_a_f_230706_1",
link1: "http://www.envolk.com/",
link2: "",
name: "envolk/1.7 (+http://www.envolk.com/envolkspiderinfo.php)",
type: "R"
},
%{
comment: "70.169.191.x",
description: "Envolk Web Search robot",
id: "id_a_f_294",
link1: "http://www.envolk.com/",
link2: "",
name: "envolk[ITS]spider/1.6(+http://www.envolk.com/envolkspider.html)",
type: "R"
},
%{
comment: "",
description: "EroCrawler adult search robot",
id: "id_a_f_295",
link1: "http://www.erocrawler.com",
link2: "",
name: "EroCrawler",
type: "R"
},
%{
comment: "s. also - Enterprise_Search - InnerpriseBot",
description: "Enterprise Search engine software (64.202.165.xxx)",
id: "id_a_f_296",
link1: "http://search.innerprise.net",
link2: "",
name: "ES.NET_Crawler/2.0 (http://search.innerprise.net/)",
type: "R"
},
%{
comment: "see also ExactSeek Crawler / eseek-larbin / exactseek.com",
description: "ExactSEEK (Jayde Online) robot",
id: "id_a_f_297",
link1: "http://www.exactseek.com",
link2: "",
name: "eseek-larbin_2.6.2 (crawler@exactseek.com)",
type: "R"
},
%{
comment: "",
description: "ESI Smart-Spider toolkit",
id: "id_a_f_298",
link1: "http://www.smart-spider.com/",
link2: "",
name: "ESISmartSpider",
type: "R"
},
%{
comment: "",
description: "e-Style ISP search (Russia) robot (217.174.103.xxx)",
id: "id_a_f_299",
link1: "http://www.e-styleisp.ru/",
link2: "",
name: "eStyleSearch 4 (compatible; MSIE 6.0; Windows NT 5.0)",
type: "R"
},
%{
comment: "s. also DSurf - PBrowse ...",
description: "Some site scanning tool via diff. IPs",
id: "id_a_f_300",
link1: "",
link2: "",
name: "ESurf15a 15",
type: "S"
},
%{
comment: "",
description: "Eurip.com - European Internet Portal robot",
id: "id_a_f_301",
link1: "http://www.eurip.com",
link2: "",
name: "EuripBot/0.x (+http://www.eurip.com) GetFile",
type: "R"
},
%{
comment: "",
description: "Eurip.com - European Internet Portal robot",
id: "id_a_f_302",
link1: "http://www.eurip.com",
link2: "",
name: "EuripBot/0.x (+http://www.eurip.com) GetRobots",
type: "R"
},
%{
comment: "",
description: "Eurip.com - European Internet Portal robot",
id: "id_a_f_303",
link1: "http://www.eurip.com",
link2: "",
name: "EuripBot/0.x (+http://www.eurip.com) PreCheck",
type: "R"
},
%{
comment: "",
description: "Ayell Euronet business directory robot",
id: "id_a_f_220508_3",
link1: "http://www.ayell.eu/",
link2: "",
name: "Eurobot/1.0 (http://www.ayell.eu)",
type: "R"
},
%{
comment: "based on Nutch",
description: "Evaal Search Engine robot",
id: "id_a_f_030206_4",
link1: "http://www.evaal.com/",
link2: "http://search.evaal.com/en/about.html",
name: "EvaalSE - bot@evaal.com",
type: "R"
},
%{
comment: "",
description: "Eventax event search (Germany)",
id: "id_a_f_304",
link1: "http://www.eventax.de",
link2: "",
name: "eventax/1.3 (eventax; http://www.eventax.de/; info@eventax.de)",
type: "R"
},
%{
comment: "",
description: "Vulcan Inc. Everest crawler (in development)",
id: "id_a_f_291205_1",
link1: "http://www.vulcan.com/",
link2: "",
name:
"Everest-Vulcan Inc./0.1 (R&D project; host=e-1-24; http://everest.vulcan.com/crawlerhelp)",
type: "R"
},
%{
comment: "",
description: "Vulcan Inc. Everest crawler (in development)",
id: "id_a_f_305",
link1: "http://www.vulcan.com/",
link2: "",
name: "Everest-Vulcan Inc./0.1 (R&D project; http://everest.vulcan.com/crawlerhelp)",
type: "R"
},
%{
comment: "Exabot-Images only requests robots.txt - image crawling under UA NG/4.0.1229",
description: "Exalead Websearch image crawler (193.47.80.xx)",
id: "id_a_f_050406_2",
link1: "http://www.exalead.com/search",
link2: "",
name: "Exabot-Images/1.0",
type: "R"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_a_f_211206_1",
link1: "http://www.exabot.com/",
link2: "",
name: "Exabot-Test/1.0",
type: "R"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_a_f_190106_1",
link1: "http://www.exabot.com/",
link2: "",
name: "Exabot/2.0",
type: "R"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_a_f_211206_2",
link1: "http://www.exabot.com/",
link2: "",
name: "Exabot/3.0",
type: "R"
},
%{
comment: "",
description: "eXact Search Bar for IE",
id: "id_a_f_306",
link1: "http://www.exactsearchbar.com/exact04",
link2: "",
name: "ExactSearch",
type: "B"
},
%{
comment: "see also eseek-larbin / exactseek.com",
description: "ExactSEEK (Jayde Online) robot",
id: "id_a_f_307",
link1: "http://www.exactseek.com",
link2: "",
name: "ExactSeek Crawler/0.1",
type: "R"
},
%{
comment: "see also eseek-larbin / exactseek.com",
description: "ExactSEEK (Jayde Online) robot",
id: "id_a_f_308",
link1: "http://www.exactseek.com",
link2: "",
name: "exactseek-crawler-2.63 (crawler@exactseek.com)",
type: "R"
},
%{
comment: "see also eseek-larbin / exactseek.com",
description: "ExactSEEK (Jayde Online) robot",
id: "id_a_f_309",
link1: "http://www.exactseek.com",
link2: "",
name: "exactseek-pagereaper-2.63 (crawler@exactseek.com)",
type: "R"
},
%{
comment: "see also eseek-larbin",
description: "ExactSEEK (Jayde Online) robot (69.9.181.1xx)",
id: "id_a_f_050606_2",
link1: "http://www.exactseek.com",
link2: "",
name: "exactseek.com",
type: "R"
},
%{
comment: "s. Harvest-NG/1.0.2 and NG/1.0",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_a_f_310",
link1: "http://www.exabot.com",
link2: "",
name: "Exalead NG/MimeLive Client (convert/http/0.120)",
type: "R"
},
%{
comment: "",
description: "Excalibur (now Convera) spider software",
id: "id_a_f_311",
link1: "http://www.excalib.com",
link2: "",
name: "Excalibur Internet Spider V6.5.4",
type: "R"
},
%{
comment: "72.36.179.1xx",
description: "Execrawl software search using nutch",
id: "id_a_f_191206_1",
link1: "http://www.execrawl.com/",
link2: "",
name: "Execrawl/1.0 (Execrawl; http://www.execrawl.com/; bot@execrawl.com)",
type: "R"
},
%{
comment: "216.195.184.xx",
description: "exooba crawler for exooba search pre-alpha development",
id: "id_a_f_060608_1",
link1: "http://www.exooba.com/",
link2: "",
name:
"exooba crawler/exooba crawler (crawler for exooba.com; http://www.exooba.com/; info at exooba dot com)",
type: "R"
},
%{
comment: "216.195.184.xx",
description: "exooba crawler for exooba search pre-alpha development",
id: "id_a_f_060608_2",
link1: "http://www.exooba.com/",
link2: "",
name: "exooba/exooba crawler (exooba; exooba)",
type: "R"
},
%{
comment: "",
description: "Mirago UK Robot",
id: "id_a_f_312",
link1: "http://www.mirago.co.uk",
link2: "",
name: "ExperimentalHenrytheMiragoRobot",
type: "R"
},
%{
comment: "",
description: "Expired Domain Sleuth domain name tool",
id: "id_a_f_313",
link1: "http://expireddomainsleuth.com/",
link2: "",
name: "Expired Domain Sleuth",
type: "R C"
},
%{
comment: "",
description: "Express Web Pictures image browser",
id: "id_a_f_314",
link1: "http://www.express-soft.com/",
link2: "",
name: "Express WebPictures (www.express-soft.com)",
type: "B D"
},
%{
comment: "",
description: "Extractor Pro e-mail collector",
id: "id_a_f_315",
link1: "http://www.extractorpro.com",
link2: "",
name: "ExtractorPro",
type: "S"
},
%{
comment: "",
description: "Exisoftware image grabber and downloading tool",
id: "id_a_f_170106_1",
link1: "http://www.exisoftware.com/picture_finder/",
link2: "",
name: "Extreme Picture Finder",
type: "D"
},
%{
comment: "",
description: "Download-Tipp Germany robot",
id: "id_a_f_316",
link1: "http://download-tipp.de",
link2: "",
name: "EyeCatcher (Download-tipp.de)/1.0",
type: "R"
},
%{
comment: "70.86.159.1xx",
description: "Factbites search robot",
id: "id_a_f_091006_1",
link1: "http://www.factbites.com/",
link2: "",
name: "Factbot 1.09 (see http://www.factbites.com/webmasters.php)",
type: "R"
},
%{
comment: "70.86.159.1xx",
description: "Factbites search robot",
id: "id_a_f_220906_1",
link1: "http://www.factbites.com/",
link2: "",
name: "factbot : http://www.factbites.com/robots",
type: "R"
},
%{
comment: "",
description: "FaEdit Professional - Japanese bookmark manager",
id: "id_a_f_221006_1",
link1: "https://sw.vector.co.jp/swreg/step1.reserve?srno=SR040433&site=y",
link2: "",
name: "FaEdit/2.0.x",
type: "C"
},
%{
comment: "",
description: "FairAd user",
id: "id_a_f_317",
link1: "http://www.fairad.de",
link2: "",
name: "FairAd Client",
type: "P"
},
%{
comment: "63.167.160.1xx",
description: "Safe-t.net web filtering service",
id: "id_a_f_051206_1",
link1: "http://www.safe-t.net/",
link2: "",
name: "FANGCrawl/0.01",
type: "P"
},
%{
comment: "",
description: "Drew Curtis' FARK.com link checking",
id: "id_a_f_210206_1",
link1: "http://www.fark.com/",
link2: "",
name: "FARK.com link verifier",
type: "C"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_318",
link1: "http://www.alltheweb.com",
link2: "",
name: "Fast Crawler Gold Edition",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_319",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST Enterprise Crawler 6 (Experimental)",
type: "R"
},
%{
comment: "",
description:
"Fast Enterprise Crawler (66.151.181.xx) for Scirus scienctific information search",
id: "id_a_f_040206_1",
link1: "http://www.scirus.com/srsapp/",
link2: "http://www.alltheweb.com",
name:
"FAST Enterprise Crawler 6 / Scirus scirus-crawler@fast.no; http://www.scirus.com/srsapp/contactus/",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_320",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST Enterprise Crawler 6 used by Cobra Development (admin@fastsearch.com)",
type: "R"
},
%{
comment: "",
description: "Comperio Web Miner based on Fast ESP",
id: "id_a_f_070507_1",
link1:
"http://www.comperio.no/index.php?option=com_content&task=blogcategory&id=7&Itemid=27",
link2: "",
name: "FAST Enterprise Crawler 6 used by Comperio AS (sts@comperio.no)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_321",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST Enterprise Crawler 6 used by FAST (FAST)",
type: "R"
},
%{
comment: "193.252.242.xx",
description: "Pages Jaunes business search (France) robot using Fast Enterprise Crawler",
id: "id_a_f_161106_1",
link1: "http://www.pagesjaunes.fr/",
link2: "",
name: "FAST Enterprise Crawler 6 used by Pages Jaunes (pvincent@pagesjaunes.fr)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler for Sensis.com.au Australian search (66.151.181.xx)",
id: "id_a_f_322",
link1: "http://www.sensis.com.au/",
link2: "http://www.alltheweb.com",
name:
"FAST Enterprise Crawler 6 used by Sensis.com.au Web Crawler (search_comments\\at\\sensis\\dot\\com\\dot\\au)",
type: "R"
},
%{
comment: "202.176.220.xx",
description: "SPH Search - Singapore related search using Fast crawler",
id: "id_a_f_251007_2",
link1: "http://www.sphsearch.sg/",
link2: "",
name: "FAST Enterprise Crawler 6 used by Singapore Press Holdings (crawler@sphsearch.sg)",
type: "R"
},
%{
comment: "128.176.188.2xx",
description: "FAST Enterprise Crawler used by WWU (University of Muenster - Germany)",
id: "id_a_f_280606_2",
link1: "http://www.uni-muenster.de/en/index.html",
link2: "http://www.alltheweb.com",
name: "FAST Enterprise Crawler 6 used by WWU (wardi@uni-muenster.de)",
type: "C"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_323",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST Enterprise Crawler/6 (www.fastsearch.com)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_324",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST Enterprise Crawler/6.4 (helpdesk at fast.no)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_325",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST FirstPage retriever (compatible; MSIE 5.5; Mozilla/4.0)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_326",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST MetaWeb Crawler (helpdesk at fastsearch dot com)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_327",
link1: "http://www.alltheweb.com",
link2: "",
name: "Fast PartnerSite Crawler",
type: "R"
},
%{
comment: "see also Yahoo-MMCrawler/3.x",
description: "Fast/Alltheweb multimedia crawler",
id: "id_a_f_328",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/2.2.10 (Multimedia Search) (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_329",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/2.2.6 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_330",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/2.2.7 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_331",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/2.2.8 (crawler@fast.no; http://www.fast.no/faq/faqfastwebsearch/faqfastwebcrawler.html)http://www.fast.no",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_332",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST-WebCrawler/3.2 test",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_333",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST-WebCrawler/3.3 (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_334",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.4/Nirvana (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_335",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.4/PartnerSite (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_336",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.5 (atw-crawler at fast dot no; http://fast.no/support.php?c=faqs/crawler)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_337",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.6 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_338",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.6/FirstPage (crawler@fast.no; http://fast.no/support.php?c=faqs/crawler)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_339",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.7 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_340",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.7/FirstPage (atw-crawler at fast dot no;http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_341",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.8 (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_a_f_342",
link1: "http://www.alltheweb.com",
link2: "",
name:
"FAST-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "see also Yahoo-MMCrawler/3.x",
description: "Fast/Alltheweb multimedia crawler",
id: "id_a_f_343",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST-WebCrawler/3.x Multimedia",
type: "R"
},
%{
comment: "see also Yahoo-MMCrawler/3.x",
description: "Fast/Alltheweb multimedia crawler",
id: "id_a_f_344",
link1: "http://www.alltheweb.com",
link2: "",
name: "FAST-WebCrawler/3.x Multimedia (mm dash crawler at fast dot no)",
type: "R"
},
%{
comment: "",
description: "Fastbot search Germany crawler (80.252.104.1xx)",
id: "id_a_f_121205_2",
link1: "http://www.fastbot.de/",
link2: "",
name: "fastbot crawler beta 2.0 (+http://www.fastbot.de)",
type: "R"
},
%{
comment: "",
description: "Ay-Up geo sync search robot",
id: "id_a_f_345",
link1: "http://www.ay-up.com",
link2: "",
name: "FastBug http://www.ay-up.com",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler (66.151.181.xx)",
id: "id_a_f_346",
link1: "http://www.alltheweb.com",
link2: "",
name: "FastCrawler 3.0.1 (crawler@1klik.dk)",
type: "R"
},
%{
comment: "",
description: "Fast/Alltheweb crawler used by SuperPages.com",
id: "id_a_f_347",
link1: "http://www.superpages.com",
link2: "http://www.alltheweb.com",
name: "FastSearch Web Crawler for Verizon SuperPages (kevin.watters@fastsearch.com)",
type: "R"
},
%{
comment: "66.207.217.13x",
description: "Favcollector Favicon collecting robot",
id: "id_a_f_170408_3",
link1: "http://www.favcollector.com/",
link2: "",
name: "Favcollector/2.0 (info@favcollector.com http://www.favcollector.com/)",
type: "R"
},
%{
comment: "",
description: "FavIconizer - IE favorites icons refreshing tool",
id: "id_a_f_161006_1",
link1: "http://www.codeproject.com/tools/faviconizer.asp",
link2: "",
name: "FavIconizer",
type: "D"
},
%{
comment: "84.19.186.1xx",
description: "favo.eu (Germany) search robot",
id: "id_a_f_151206_1",
link1: "http://www.favo.eu/",
link2: "",
name: "favo.eu crawler/0.6 (http://www.favo.eu)",
type: "R"
},
%{
comment: "",
description: "ZD's FavOrg favourites managing program",
id: "id_a_f_348",
link1: "http://www.pcmag.com/article2/0,4149,108438,00.asp",
link2: "",
name: "FavOrg",
type: "C"
},
%{
comment: "",
description: "Campulka.net Favorites checking tool",
id: "id_a_f_260108_1",
link1: "http://campulka.net/?dir=Utility",
link2: "",
name: "Favorites Checking (http://campulka.net)",
type: "C"
},
%{
comment: "",
description: "Favorites Sweeper bookmark checker",
id: "id_a_f_349",
link1: "http://www.manitoolssoftware.cjb.net",
link2: "",
name: "Favorites Sweeper v.2.03",
type: "C"
},
%{
comment: "",
description: "FaXo Search robot (69.152.89.xx)",
id: "id_a_f_350",
link1: "http://www.faxo.com",
link2: "",
name: "Faxobot/1.0",
type: "R"
},
%{
comment: "",
description: "Free Download Manager (FDM) download accelerator ",
id: "id_a_f_351",
link1: "http://www.freedownloadmanager.org",
link2: "",
name: "FDM 1.x",
type: "D"
},
%{
comment: "",
description: "Free Download Manager (FDM) download accelerator ",
id: "id_a_f_180207_1",
link1: "http://www.freedownloadmanager.org",
link2: "",
name: "FDM 2.x",
type: "D"
},
%{
comment: "",
description: "RSS Feed Seeker bot (68.225.95.2xx)",
id: "id_a_f_352",
link1: "http://www.MyNewFavoriteThing.com",
link2: "",
name: "Feed Seeker Bot (RSS Feed Seeker http://www.MyNewFavoriteThing.com/fsb.php)",
type: "R"
},
%{
comment: "194.105.139.2xx",
description: "Feed24 news feed and blog search",
id: "id_a_f_241206_1",
link1: "http://www.feed24.com/",
link2: "",
name: "Feed24.com",
type: "R"
},
%{
comment: "",
description: "Feed::Find - Syndication feed (RSS/Atom) auto-discovery",
id: "id_a_f_050306_1",
link1: "http://search.cpan.org/~btrott/Feed-Find-0.06/lib/Feed/Find.pm",
link2: "",
name: "Feed::Find/0.0x",
type: "D"
},
%{
comment: "64.27.19.25x",
description: "Feedable beta web based RSS service",
id: "id_a_f_250707_1",
link1: "http://reader.feedable.com/",
link2: "",
name: "Feedable/0.1 (compatible; MSIE 6.0; Windows NT 5.1)",
type: "B"
},
%{
comment: "reads robots.txt",
description: "Unknown robot from the University of Tokyo (157.82.157.xx)",
id: "id_a_f_230406_2",
link1: "http://www.u-tokyo.ac.jp/index_e.html",
link2: "",
name: "FeedChecker/0.01",
type: "R"
},
%{
comment: "",
description: "FeedDemon RSS reader",
id: "id_a_f_140608_2",
link1: "http://www.newsgator.com/individuals/feeddemon/",
link2: "",
name: "FeedDemon/2.7 (http://www.newsgator.com/; Microsoft Windows XP)",
type: "B"
},
%{
comment: "72.14.[1-2]xx.[X]xx",
description: "Google news feed feetcher for iGoogle gadgets",
id: "id_a_f_160308_2",
link1: "http://www.google.com/feedfetcher.html",
link2: "",
name: "Feedfetcher-Google-iGoogleGadgets; (+http://www.google.com/feedfetcher.html)",
type: "C"
},
%{
comment: "72.14.199.x[xx]",
description: "Google Feedfetcher - RSS and Atom feed crawler",
id: "id_a_f_010906_1",
link1: "http://www.google.com/feedfetcher.html",
link2: "",
name: "Feedfetcher-Google; (+http://www.google.com/feedfetcher.html)",
type: "R"
},
%{
comment: "216.92.192.1xx",
description: "FeedForAll RSS feed robot",
id: "id_a_f_010307_1",
link1: "http://www.feedforall.com/",
link2: "",
name: "FeedForAll rss2html.php v2",
type: "C"
},
%{
comment: "216.134.194.xx",
description: "FeedHub news feed personalization engine powered by mSpoke",
id: "id_a_f_010308_1",
link1: "http://www.feedhub.com/",
link2: "http://www.mspoke.com/",
name: "FeedHub FeedDiscovery/1.0 (http://www.feedhub.com)",
type: "R"
},
%{
comment: "216.134.194.xx",
description: "FeedHub news feed personalization engine powered by mSpoke",
id: "id_a_f_060608_3",
link1: "http://www.feedhub.com/",
link2: "http://www.mspoke.com/",
name: "FeedHub MetaDataFetcher/1.0 (http://www.feedhub.com)",
type: "R"
},
%{
comment: "69.46.36.x",
description: "Feedjit news feed service favicon crawler",
id: "id_a_f_260608_3",
link1: "http://feedjit.com/",
link2: "",
name: "Feedjit Favicon Crawler 1.0",
type: "R"
},
%{
comment: "",
description: "Newsbrain Feedreader3",
id: "id_a_f_150108_1",
link1: "http://www.feedreader.com/",
link2: "",
name: "Feedreader 3.xx (Powered by Newsbrain)",
type: "B"
},
%{
comment: "",
description: "FeedShow online RSS feed reader",
id: "id_a_f_281106_3",
link1: "http://www.feedshow.com/",
link2: "",
name: "Feedshow/x.0 (http://www.feedshow.com; 1 subscriber)",
type: "B"
},
%{
comment: "",
description: "FeedShow online RSS feed reader",
id: "id_a_f_051206_2",
link1: "http://www.feedshow.com/",
link2: "",
name: "FeedshowOnline (http://www.feedshow.com)",
type: "B"
},
%{
comment: "",
description: "FeedZcollector - Feed (RSS, ATOM and RDF) capturing software",
id: "id_a_f_040207_1",
link1: "http://www.feeds4all.com/feedzcollector/",
link2: "",
name: "FeedZcollector v1.x (Platinum) http://www.feeds4all.com/feedzcollector",
type: "B"
},
%{
comment: "s. also Morris",
description: "MixCat robot",
id: "id_a_f_353",
link1: "http://mixcat.com",
link2: "",
name: "Felix - Mixcat Crawler (+http://mixcat.com)",
type: "R"
},
%{
comment: "",
description: "FreeBSD download tool",
id: "id_a_f_354",
link1: "",
link2: "",
name: "fetch libfetch/2.0",
type: "D"
},
%{
comment: "",
description: "Frequent Finders spider via Sitefusion.com",
id: "id_a_f_355",
link1: "http://www.frequentfinders.com",
link2: "",
name: "FFC Trap Door Spider",
type: "R"
},
%{
comment: "",
description: "Filangy search and bookmark service",
id: "id_a_f_356",
link1: "http://www.filangy.com",
link2: "",
name:
"Filangy/0.01-beta (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)",
type: "R C"
},
%{
comment: "",
description: "Filangy search and bookmark service",
id: "id_a_f_357",
link1: "http://www.filangy.com",
link2: "",
name:
"Filangy/1.0x (Filangy; http://www.filangy.com/filangyinfo.jsp?inc=robots.jsp; filangy-agent@filangy.com)",
type: "R C"
},
%{
comment: "",
description: "Filangy search and bookmark service",
id: "id_a_f_358",
link1: "http://www.filangy.com",
link2: "",
name:
"Filangy/1.0x (Filangy; http://www.nutch.org/docs/en/bot.html; filangy-agent@filangy.com)",
type: "R C"
},
%{
comment: "",
description: "File Boost Network link checking",
id: "id_a_f_359",
link1: "http://www.fileboost.net",
link2: "",
name: "fileboost.net/1.0 (+http://www.fileboost.net)",
type: "R C"
},
%{
comment: "",
description: "FileHound download manager",
id: "id_a_f_360",
link1: "http://www.allabout.com",
link2: "",
name: "FileHound x.x",
type: "D"
},
%{
comment: "72.47.203.8x",
description: "filtrbox media content (news) monitoring",
id: "id_a_f_180208_1",
link1: "http://www.filtrbox.com/",
link2: "",
name: "Filtrbox/1.0",
type: "R"
},
%{
comment: "site is down",
description: "Find An ISP robot",
id: "id_a_f_361",
link1: "http://www.findanisp.com/",
link2: "",
name: "FindAnISP.com_ISP_Finder_v99a",
type: "R C"
},
%{
comment: "",
description: "Yelo.no business search (Norway) via Findexa",
id: "id_a_f_141205_2",
link1: "http://www.findexa.no/english/article27709.ece",
link2: "",
name: "Findexa Crawler (http://www.findexa.no/gulesider/article26548.ece)",
type: "R"
},
%{
comment: "",
description: "NextLinks - German vocabulary and hyperlink search",
id: "id_a_f_362",
link1: "http://wortschatz.uni-leipzig.de/nextlinks/findlinks.html",
link2: "",
name: "findlinks/x.xxx (+http://wortschatz.uni-leipzig.de/findlinks/) ",
type: "R"
},
%{
comment: "",
description: "Finesearch robot",
id: "id_a_f_363",
link1: "http://www.finesearch.com",
link2: "",
name: "FineBot",
type: "R"
},
%{
comment: "",
description: "Finjan Vital Security Web Appliance security solution",
id: "id_a_f_080306_1",
link1: "http://www.finjan.com/",
link2: "",
name: "Finjan-prefetch",
type: "P"
},
%{
comment: "",
description: "Fireball.de robot",
id: "id_a_f_364",
link1: "http://www.fireball.de",
link2: "",
name: "Firefly/1.0",
type: "R"
},
%{
comment: "",
description: "Fireball.de robot",
id: "id_a_f_365",
link1: "http://www.fireball.de",
link2: "",
name: "Firefly/1.0 (compatible; Mozilla 4.0; MSIE 5.5)",
type: "R"
},
%{
comment: "reads robots.txt",
description: "Unknown robot from Czech Technical University Prague (147.32.141.xx)",
id: "id_a_f_210906_1",
link1: "http://www.cvut.cz/",
link2: "",
name: "Firefox (kastaneta03@hotmail.com)",
type: "R"
},
%{
comment: "reads robots.txt",
description: "Unknown robot from Czech Technical University Prague (147.32.141.xx)",
id: "id_a_f_190306_2",
link1: "http://www.cvut.cz/",
link2: "",
name: "Firefox_1.0.6 (kasparek@naparek.cz)",
type: "R"
},
%{
comment: "",
description: "AT&T/Fast Search robot for FirstGov (U.S.Government) portal",
id: "id_a_f_366",
link1: "http://www.firstgov.gov",
link2: "",
name: "FirstGov.gov Search - POC:firstgov.webmasters@gsa.gov",
type: "R"
},
%{
comment: "",
description: "Firstsfind Germany robot / link checking",
id: "id_a_f_367",
link1: "http://www.firstsfind.de",
link2: "",
name: "firstsbot",
type: "R"
},
%{
comment: "",
description: "Flaptor information retrieval solutions robot",
id: "id_a_f_020906_1",
link1: "http://www.flaptor.com/index.htm",
link2: "",
name:
"Flapbot/0.7.2 (Flaptor Crawler; http://www.flaptor.com; crawler at flaptor period com)",
type: "R"
},
%{
comment: "",
description: "JetCar/FlashGet download manager",
id: "id_a_f_368",
link1: "http://www.amazesoft.com",
link2: "",
name: "FlashGet",
type: "D"
},
%{
comment: "",
description: "FlatArts Favorites Icon Tool",
id: "id_a_f_161205_1",
link1: "http://flatarts.jp/contents/software/information.php?name=rico",
link2: "",
name: "FLATARTS_FAVICO",
type: "C D"
},
%{
comment: "81.176.76.93",
description: "Flexum.ru search service",
id: "id_a_f_100308_1",
link1: "http://www.flexum.ru/",
link2: "",
name: "Flexum spider",
type: "R"
},
%{
comment: "81.176.76.93",
description: "Flexum.ru search service",
id: "id_a_f_280508_2",
link1: "http://www.flexum.ru/",
link2: "",
name: "Flexum/2.0",
type: "R"
},
%{
comment: "",
description: "DivX.com Movie Find robot",
id: "id_a_f_369",
link1: "http://www.divx.com",
link2: "",
name: "FlickBot 2.0 RPT-HTTPClient/0.3-3",
type: "R"
},
%{
comment: "",
description: "Metacarta / Cogent robot",
id: "id_a_f_370",
link1: "http://www.metacarta.com",
link2: "",
name: "flunky",
type: "R"
},
%{
comment: "",
description: "unknown",
id: "id_a_f_371",
link1: "",
link2: "",
name: "fly/6.01 libwww/4.0D",
type: ""
},
%{
comment: "62.141.52.2xx",
description: "FLY Index Metasearch link checking",
id: "id_a_f_110107_1",
link1: "http://www.flyindex.net/",
link2: "",
name: "flyindex.net 1.0/http://www.flyindex.net",
type: "C"
},
%{
comment: "209.205.65.9x",
description: "Fnoole news crawler",
id: "id_a_f_021108_1",
link1: "http://www.fnoole.com/",
link2: "",
name: "FnooleBot/2.5.2 (+http://www.fnoole.com/addurl.html)",
type: "R"
},
%{
comment: " s. also: - - WFARC",
description: "IBM's Almaden Research robot",
id: "id_a_f_372",
link1: "http://www.almaden.ibm.com",
link2: "",
name: "FocusedSampler/1.0",
type: "R"
},
%{
comment: "212.227.95.3x",
description: "folkd.com social search robot",
id: "id_a_f_080108_1",
link1: "http://www.folkd.com/",
link2: "",
name: "Folkd.com Spider/0.1 beta 1 (www.folkd.com)",
type: "R"
},
%{
comment: "77.232.77.13x",
description: "FollowSite robot - website monitoring",
id: "id_a_f_070209_4",
link1: "http://www.followsite.com/bot.html",
link2: "",
name: "FollowSite Bot ( http://www.followsite.com/bot.html )",
type: "C"
},
%{
comment: "77.232.77.13x",
description: "FollowSite robot - website monitoring",
id: "id_a_f_140209_1",
link1: "http://www.followsite.com/bot.html",
link2: "",
name: "FollowSite.com ( http://www.followsite.com/b.html )",
type: "C"
},
%{
comment: "",
description: "Fooky search Scorpionbots robot (65.12.170.xxx)",
id: "id_a_f_141105_1",
link1: "http://www.fooky.com/",
link2: "",
name: "Fooky.com/ScorpionBot/ScoutOut; http://www.fooky.com/scorpionbots",
type: "R"
},
%{
comment: "",
description: "Neomo Search (Germany) robot (85.10.197.1xx)",
id: "id_a_f_373",
link1: "http://www.neomo.de",
link2: "",
name: "Francis/1.0 (francis@neomo.de http://www.neomo.de/)",
type: "R"
},
%{
comment: "",
description: "Some spam bot",
id: "id_a_f_374",
link1: "",
link2: "",
name: "Franklin Locator 1.8",
type: "S"
},
%{
comment: "",
description: "Free Downloads shareware directory link checking",
id: "id_a_f_110506_1",
link1: "http://www.free-downloads.net/",
link2: "",
name: "free-downloads.net download-link validator /0.1",
type: "C"
},
%{
comment: "",
description: "FreeFind.com robot",
id: "id_a_f_375",
link1: "http://freefind.com",
link2: "",
name: "FreeFind.com-SiteSearchEngine/1.0 (http://freefind.com; spiderinfo@freefind.com)",
type: "R"
},
%{
comment: "",
description: "Frelics backlink checking bot (beta)",
id: "id_a_f_221008_2",
link1: "http://www.frelic.com/",
link2: "",
name: "Frelicbot/1.0 +http://www.frelic.com/",
type: "C"
},
%{
comment: "",
description: "Fresh Download download manager",
id: "id_a_f_376",
link1: "http://www.freshdevices.com",
link2: "",
name: "FreshDownload/x.xx",
type: "D"
},
%{
comment: "",
description: "FreshNotes - music related artist search (72.3.225.xx)",
id: "id_a_f_230306_2",
link1: "http://freshnotes.com/fn/",
link2: "",
name: "FreshNotes crawler< report problems to crawler-at-freshnotes-dot-com",
type: "R"
},
%{
comment: "s. also DSurf - PBrowse ...",
description: "Some site scanning tool via diff. IPs",
id: "id_a_f_377",
link1: "",
link2: "",
name: "FSurf15a 01",
type: "S"
},
%{
comment: "83.105.71.16x",
description: "Find the Best search robot",
id: "id_a_f_070209_5",
link1: "http://www.findthebest.co.uk/",
link2: "",
name: "FTB-Bot http://www.findthebest.co.uk/",
type: "R"
},
%{
comment: "",
description:
"Some site scanning tool from diff. IPs i.e.: - 66.28.240.xx (cogentco.com) - 68.5.174.xx (cox.net)",
id: "id_a_f_378",
link1: "",
link2: "",
name: "Full Web Bot 0416B",
type: "S"
},
%{
comment:
"appears also as MFC Foundation Class Library & Demo Bot Z 16b - 66.118.1xx.xxx (sagonet.com) - s. also Educate Search VxB - Industry Program 1.0.5",
description: "Some site scanning tool i.e. from - 68.154.96.xx (bellsouth.net)",
id: "id_a_f_379",
link1: "",
link2: "",
name: "Full Web Bot 0516B",
type: "S"
},
%{
comment: "",
description: "Some site scanning tool from 66.255.6.xxx (uslec.com)",
id: "id_a_f_380",
link1: "",
link2: "",
name: "Full Web Bot 2816B",
type: "S"
},
%{
comment: "208.109.126.1xx",
description: "FuseBulb search",
id: "id_a_f_190807_1",
link1: "http://www.fusebulb.com/",
link2: "",
name: "FuseBulb.Com",
type: "R"
},
%{
comment: "",
description: "FyberSearch FyberSpider robot",
id: "id_a_f_381",
link1: "http://www.fybersearch.com",
link2: "",
name: "FyberSpider (+http://www.fybersearch.com/fyberspider.php)",
type: "R"
},
%{
comment: "",
description: "Some user from bbnplanet.net (4.63.218.2xx) using an Innerprise robot tool",
id: "id_g_m_382",
link1: "http://www.innerprise.net",
link2: "",
name: "Gagglebot",
type: "R C ?"
},
%{
comment: "",
description: "Seed Search robot",
id: "id_g_m_383",
link1: "http://www.seed.net.tw",
link2: "",
name: "GAIS Robot/1.0B2",
type: "R"
},
%{
comment: "140.123.100.x",
description: "Gaislab Taiwan robot",
id: "id_g_m_384",
link1: "http://gais.cs.ccu.edu.tw",
link2: "",
name: "Gaisbot/3.0 (indexer@gais.cs.ccu.edu.tw; http://gais.cs.ccu.edu.tw/robot.php)",
type: "R"
},
%{
comment: "140.123.100.x",
description: "Gaislab Taiwan robot",
id: "id_g_m_160706_1",
link1: "http://gais.cs.ccu.edu.tw",
link2: "",
name: "Gaisbot/3.0+(robot06@gais.cs.ccu.edu.tw;+http://gais.cs.ccu.edu.tw/robot.php)",
type: "R"
},
%{
comment: " s. also Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com....)",
description: "Galaxy robot (63.121.41.xxx)",
id: "id_g_m_385",
link1: "http://www.galaxy.com",
link2: "",
name: "GalaxyBot/1.0 (http://www.galaxy.com/galaxybot.html)",
type: "R"
},
%{
comment: "88.208.223.xx",
description: "Gallent Search directory (UK)",
id: "id_g_m_130407_2",
link1: "http://www.gallent.co.uk/",
link2: "http://robot.gallentsearch.com/",
name: "Gallent Search Spider v1.4 Robot 2 (http://robot.GallentSearch.com)",
type: "R"
},
%{
comment: "80.65.45.xx",
description: "Gamekit game search engine - Germany",
id: "id_g_m_010107_1",
link1: "http://www.gamekit.de/",
link2: "",
name: "gamekitbot/1.0 (+http://www.uchoose.de/crawler/gamekitbot/)",
type: "R"
},
%{
comment: "GameSpy Arcade download manager (FilePlanet)",
description: "GameSpyHTTP/1.0",
id: "id_g_m_386",
link1: "http://www.gamespyarcade.com/features/",
link2: "",
name: "Gamespy_Arcade",
type: "D"
},
%{
comment: "",
description: "GammaWare GammaSpider",
id: "id_g_m_387",
link1: "http://www.gammasite.com",
link2: "",
name: "GammaSpider/1.0",
type: "R"
},
%{
comment: "",
description: "nttrd.com / Infobee.ne.jp robot",
id: "id_g_m_388",
link1: "",
link2: "",
name: "gazz/x.x (gazz@nttrd.com)",
type: "R"
},
%{
comment: "no active website",
description: "Geckobot user robot",
id: "id_g_m_389",
link1: "http://www.geckobot.com/",
link2: "",
name: "geckobot",
type: ""
},
%{
comment: "66.249.72.1xx",
description: "Google Mobile Search crawler",
id: "id_g_m_280406_1",
link1: "http://www.google.com/mobile/formats.html",
link2: "",
name:
"Generic Mobile Phone (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)",
type: "R P"
},
%{
comment: "",
description: "Unknown robot from Carnegie Mellon University (128.2.211.xxx)",
id: "id_g_m_390",
link1: "http://www.cmu.edu",
link2: "",
name: "generic_crawler/01.0217/",
type: "R"
},
%{
comment: "",
description: "Lunascape Genesis browser",
id: "id_g_m_100109_2",
link1: "http://www.lunascape.tv/",
link2: "",
name: "GenesisBrowser (HTTP 1.1; 0.9; XP SP2; .NET CLR 2.0.50727)",
type: "B"
},
%{
comment: " s. also: - larbin_2.6.3 (wgao@genieknows.com)",
description: "GenieKnows.com search",
id: "id_g_m_231205_1",
link1: "http://www.genieknows.com/",
link2: "",
name: "genieBot (http://64.5.245.11/faq/faq.html)",
type: "R"
},
%{
comment: " s. also: - larbin_2.6.3 (wgao@genieknows.com)",
description: "GenieKnows.com search",
id: "id_g_m_391",
link1: "http://www.genieknows.com/",
link2: "",
name: "geniebot wgao@genieknows.com",
type: "R"
},
%{
comment: "no active website",
description: "Unknown robot from wavepath.com (65.254.33.1xx)",
id: "id_g_m_050606_3",
link1: "",
link2: "",
name: "GeoBot/1.0",
type: ""
},
%{
comment: "",
description: "Geona Search robot / link checking",
id: "id_g_m_392",
link1: "http://www.geona.com",
link2: "",
name: "GeonaBot 1.x; http://www.geona.com/",
type: "R"
},
%{
comment: "",
description: "GeoURL ICBM Address Server - a location-to-URL reverse directory",
id: "id_g_m_160206_3",
link1: "http://geourl.org/",
link2: "",
name: "geourl/2.0b2",
type: "C"
},
%{
comment: "",
description: "GeoURL ICBM Address Server - a location-to-URL reverse directory",
id: "id_g_m_160206_2",
link1: "http://geourl.org/",
link2: "",
name: "GeoURLBot 1.0 (http://geourl.org)",
type: "C"
},
%{
comment: "",
description: "Getbot web downloading tool / site grabber",
id: "id_g_m_393",
link1: "http://www.getbot.com",
link2: "",
name: "GetBot",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_394",
link1: "http://www.getright.com",
link2: "",
name: "GetRight/3.x.x",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_395",
link1: "http://www.getright.com",
link2: "",
name: "GetRight/4.5xx",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_396",
link1: "http://www.getright.com",
link2: "",
name: "GetRight/4.x",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_397",
link1: "http://www.getright.com",
link2: "",
name: "GetRight/4.x[a-e]",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_260807_1",
link1: "http://www.getright.com",
link2: "",
name: "GetRight/6.1 (Pro)",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_398",
link1: "http://www.getright.com",
link2: "",
name: "GetRightPro/6.0beta2",
type: "D"
},
%{
comment: "216.204.133.xxx",
description: "GetWeb - web page to email service",
id: "id_g_m_170706_3",
link1: "http://www.healthnet.org/getweb.php",
link2: "",
name: "GetWeb/0.1 libwww-perl/5.16",
type: "D"
},
%{
comment: "",
description: "Sixxs Ghost Route Hunter",
id: "id_g_m_399",
link1: "http://www.sixxs.net/tools/grh/",
link2: "",
name: "GhostRouteHunter/20021130 (https://www.sixxs.net/tools/grh/; info@sixxs.net)",
type: "C"
},
%{
comment: " s. also - MicroBaz",
description: "GigaBaz Brainbot (Germany) robot",
id: "id_g_m_400",
link1: "http://gigabaz.com",
link2: "",
name: "gigabaz/3.1x (baz@gigabaz.com; http://gigabaz.com/gigabaz/)",
type: "R"
},
%{
comment: "",
description: "Gigablast robot (64.62.168.xx)",
id: "id_g_m_401",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/2.0 (gigablast.com)",
type: "R"
},
%{
comment: "comes from 64.62.168.xx AND 66.154.102.xx",
description: "Gigablast robot",
id: "id_g_m_140106_1",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/2.0/gigablast.com/spider.html",
type: "R"
},
%{
comment: "comes from 64.62.168.xx AND 66.154.102.xx",
description: "Gigablast robot",
id: "id_g_m_170506_1",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/2.0; http://www.gigablast.com/spider.html",
type: "R"
},
%{
comment: "66.231.188.1xx",
description: "Gigablast robot",
id: "id_g_m_190507_1",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/2.0att",
type: "R"
},
%{
comment: "66.231.18x.[x]xx",
description: "Gigablast robot",
id: "id_g_m_230508_1",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/3.0 (http://www.gigablast.com/spider.html)",
type: "R"
},
%{
comment: "",
description: "Gigablast robot (64.62.168.xx)",
id: "id_g_m_402",
link1: "http://www.gigablast.com",
link2: "",
name: "Gigabot/x.0",
type: "R"
},
%{
comment: "",
description: "Gigablast robot (64.62.168.xx)",
id: "id_g_m_403",
link1: "http://www.gigablast.com",
link2: "",
name: "GigabotSiteSearch/2.0 (sitesearch.gigablast.com)",
type: "R"
},
%{
comment: "",
description: "www.gnod.net spider",
id: "id_g_m_404",
link1: "http://www.gnod.net",
link2: "",
name: "GNODSPIDER (www.gnod.net)",
type: "R"
},
%{
comment: "",
description: "Go!Zilla download manager",
id: "id_g_m_406",
link1: "http://www.gozilla.com",
link2: "",
name: "Go!Zilla 3.x (www.gozilla.com)",
type: "D"
},
%{
comment: "",
description: "Go!Zilla download manager",
id: "id_g_m_407",
link1: "http://www.gozilla.com",
link2: "",
name: "Go!Zilla/4.x.x.xx",
type: "D"
},
%{
comment: "",
description: "GotIt web accelerator (discontinued)",
id: "id_g_m_405",
link1: "",
link2: "",
name: "Go-Ahead-Got-It/1.1",
type: "P D"
},
%{
comment: "",
description: "GoGuides.Org (195.226.137.xx) robot",
id: "id_g_m_408",
link1: "http://www.goguides.org/goblin-info.html",
link2: "",
name: "Goblin/0.9 (http://www.goguides.org/)",
type: "R"
},
%{
comment: "",
description: "GoGuides.Org (195.226.137.xx) robot",
id: "id_g_m_409",
link1: "http://www.goguides.org/goblin-info.html",
link2: "",
name: "Goblin/0.9.x (http://www.goguides.org/goblin-info.html)",
type: "R"
},
%{
comment: "208.109.236.xx",
description: "GoForIt Search robot",
id: "id_g_m_410",
link1: "http://www.goforit.com",
link2: "",
name: "GoForIt.com",
type: "R"
},
%{
comment: "208.109.236.xx",
description: "GoForIt Search robot",
id: "id_g_m_411",
link1: "http://www.goforit.com",
link2: "",
name: "GOFORITBOT ( http://www.goforit.com/about/ )",
type: "R"
},
%{
comment: "",
description: "GoGuides.org directory & search link checking",
id: "id_g_m_020306_1",
link1: "http://www.goguides.org/",
link2: "",
name: "GoGuides.Org Link Check",
type: "C"
},
%{
comment: "74.52.41.1xx",
description: "GoldenFeed.com - RSS search engine",
id: "id_g_m_230207_2",
link1: "http://www.goldenfeed.com/",
link2: "",
name: "GoldenFeed Spider 1.0 (http://www.goldenfeed.com)",
type: "C"
},
%{
comment: "",
description: "Invention Machines Goldfire Server",
id: "id_g_m_412",
link1: "http://www.invention-machine.com/custsupport/GFR_install.cfm",
link2: "",
name: "Goldfire Server",
type: "P"
},
%{
comment: "212.34.185.xx",
description: "suchen.de German local search robot",
id: "id_g_m_041006_1",
link1: "http://www.suchen.de/",
link2: "",
name: "gonzo1[P] +http://www.suchen.de/popups/faq.jsp",
type: "R"
},
%{
comment: "212.34.185.xx",
description: "suchen.de German local search robot",
id: "id_g_m_130108_2",
link1: "http://www.suchen.de/",
link2: "",
name: "gonzo2[P] +http://www.suchen.de/faq.html",
type: "R"
},
%{
comment: "",
description: "Some private robot (Wanadoo.fr client)",
id: "id_g_m_413",
link1: "",
link2: "",
name: "Goofer/0.2",
type: "R"
},
%{
comment: "",
description: "Google instant messenger",
id: "id_g_m_300606_1",
link1: "http://www.google.com/talk/",
link2: "",
name: "Google Talk",
type: "B"
},
%{
comment: "",
description: "Packard Bell Net user robot (*not* Google)",
id: "id_g_m_414",
link1: "",
link2: "",
name: "googlebot (larbin2.6.0@unspecified.mail)",
type: ""
},
%{
comment: "",
description: "Google image crawler (66.249.72.xxx)",
id: "id_g_m_050106_1",
link1: "http://www.google.com",
link2: "",
name: "Googlebot-Image/1.0",
type: "R"
},
%{
comment: "",
description: "Google image crawler (66.249.72.xxx)",
id: "id_g_m_415",
link1: "http://www.google.com",
link2: "",
name: "Googlebot-Image/1.0 ( http://www.googlebot.com/bot.html)",
type: "R"
},
%{
comment:
" s. also: - Mozilla/4.0 (MobilePhone SCP ... - Mozilla/5.0 (compatible; Googlebot/2.1...",
description: "Google robot 66.249.64.XXX",
id: "id_g_m_416",
link1: "http://www.google.com",
link2: "",
name: "Googlebot/2.1 ( http://www.google.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Google robot 66.249.64.XXX",
id: "id_g_m_417",
link1: "http://www.google.com",
link2: "",
name: "Googlebot/2.1 ( http://www.googlebot.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Google robot 66.249.64.XXX",
id: "id_g_m_418",
link1: "http://www.google.com",
link2: "",
name: "Googlebot/Test ( http://www.googlebot.com/bot.html)",
type: "R"
},
%{
comment: "174.129.242.x",
description: "ShareThis social networking service via Amazon Web Services",
id: "id_g_m_280209_2",
link1: "http://sharethis.com/",
link2: "http://www.amazonaws.com/",
name: "Gordon's Spider/Nutch-0.9 (http://www.sharethis.com; gordon@sharethis.com)",
type: "C"
},
%{
comment: "",
description: "Grapeshot web search system API",
id: "id_g_m_419",
link1: "http://www.grapeshot.co.uk/html/Index.html",
link2: "",
name: "GrapeFX/0.3 libwww/5.4.0",
type: "R"
},
%{
comment: "74.62.161.xx",
description: "Flatland Industries vertical search solution",
id: "id_g_m_300907_4",
link1: "http://www.flatlandindustries.com/",
link2: "http://www.flatlandindustries.com/flatlandbot.php",
name:
"great-plains-web-spider/flatlandbot (Flatland Industries Web Spider; http://www.flatlandindustries.com/flatlandbot.php; jason@flatlandindustries.com)",
type: "R"
},
%{
comment: "",
description: "GreatNews 1.0 Beta RSS reader",
id: "id_g_m_250707_2",
link1: "http://www.curiostudio.com/",
link2: "",
name: "GreatNews/1.0",
type: "B"
},
%{
comment: "",
description: "GreenBrowser - IE based browser (China)",
id: "id_g_m_170207_2",
link1: "http://www.morequick.com/indexen.htm",
link2: "",
name: "GreenBrowser",
type: "B"
},
%{
comment: "212.227.127.xx",
description: "search gridwell favicon display",
id: "id_g_m_100307_2",
link1: "http://search.gridwell.com/",
link2: "",
name: "gridwell (http://search.gridwell.com)",
type: "D"
},
%{
comment: "",
description: "Grigor Search bot",
id: "id_g_m_420",
link1: "http://www.grigor.biz",
link2: "",
name: "GrigorBot 0.8 (http://www.grigor.biz/bot.html)",
type: "R"
},
%{
comment: "",
description: "Australasian Legal Information Institute (AustLII) robot",
id: "id_g_m_161206_1",
link1: "http://www.austlii.edu.au/",
link2: "http://www2.austlii.edu.au/~dan/gromit/",
name: "Gromit/1.0",
type: "R"
},
%{
comment: "",
description: "Grub open source crawler",
id: "id_g_m_421",
link1: "http://www.grub.org",
link2: "",
name: "grub crawler(http://www.grub.org)",
type: "R"
},
%{
comment: "",
description: "Grub open source crawler",
id: "id_g_m_422",
link1: "http://www.grub.org",
link2: "",
name: "grub-client",
type: "R"
},
%{
comment: "",
description: "Google Search Appliance robot (216.239.xx.xx)",
id: "id_g_m_423",
link1: "http://www.google.com/enterprise/gsa/",
link2: "",
name: "gsa-crawler (Enterprise; GID-01422; jplastiras@google.com)",
type: "R"
},
%{
comment: "",
description: "Google Search Appliance robot (216.239.xx.xx)",
id: "id_g_m_424",
link1: "http://www.google.com/enterprise/gsa/",
link2: "",
name: "gsa-crawler (Enterprise; GID-01742;gsatesting@rediffmail.com)",
type: "R"
},
%{
comment: "",
description: "Google Enterprise Search Appliance used by Enhesa (212.35.100.1xx)",
id: "id_g_m_060506_1",
link1: "http://www.enhesa.com/enhesa/en/default.asp",
link2: "http://www.google.com/enterprise/gsa/",
name: "gsa-crawler (Enterprise; GIX-02057; dm@enhesa.com)",
type: "R"
},
%{
comment: "",
description: "Google Enterprise Search Appliance used by IBM (129.41.20.1xx)",
id: "id_g_m_311205_1",
link1: "http://www.google.com/enterprise/gsa/",
link2: "",
name: "gsa-crawler (Enterprise; GIX-03519; cknuetter@stubhub.com)",
type: "R"
},
%{
comment: "",
description: "Google Search Appliance robot (216.239.xx.xx)",
id: "id_g_m_425",
link1: "http://www.google.com/enterprise/gsa/",
link2: "",
name: "gsa-crawler (Enterprise; GIX-0xxxx; enterprise-training@google.com)",
type: "R"
},
%{
comment: "",
description: "GSiteCrawler - Google sitemap generator for Windows",
id: "id_g_m_081006_1",
link1: "http://gsitecrawler.com/",
link2: "",
name: "GSiteCrawler/v1.xx rev. xxx (http://gsitecrawler.com/)",
type: "C"
},
%{
comment: "",
description: "Guestbook spamming tool",
id: "id_g_m_260207_1",
link1: "",
link2: "",
name: "Guestbook Auto Submitter",
type: "S"
},
%{
comment: "",
description: "Northernlight robot",
id: "id_g_m_426",
link1: "http://www.northernlight.com",
link2: "",
name: "Gulliver/1.3",
type: "R"
},
%{
comment: "",
description: "Yuntis Collaborative Web Resource Categorization and Ranking Project robot",
id: "id_g_m_427",
link1: "http://www.ecsl.cs.sunysb.edu/yuntis/",
link2: "",
name: "Gulper Web Bot 0.2.4 (www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)",
type: "R"
},
%{
comment: "",
description: "Gungho - Extensible web crawler written in Perl by Google Code",
id: "id_g_m_140907_1",
link1: "http://code.google.com/p/gungho-crawler/wiki/Index",
link2: "",
name: "Gungho/0.08004 (http://code.google.com/p/gungho-crawler/wiki/Index)",
type: "R"
},
%{
comment: "209.128.80.1xx / 72.20.109.xx",
description: "guruji : the Indian search engine robot",
id: "id_g_m_211106_1",
link1: "http://www.guruji.com/",
link2: "",
name: "GurujiBot/1.0 (+http://www.guruji.com/WebmasterFAQ.html)",
type: "R"
},
%{
comment: "72.20.109.xx",
description: "guruji : the Indian search engine picture crawler",
id: "id_g_m_100508_2",
link1: "http://www.guruji.com/",
link2: "",
name: "GurujiImageBot/1.0 (+http://www.guruji.com/en/WebmasterFAQ.html)",
type: "R"
},
%{
comment: "",
description: "Openwave Mobile Browser on Haier T10C mobile",
id: "id_g_m_291108_3",
link1: "http://www.openwave.com",
link2: "",
name:
"Haier-T10C/1.0 iPanel/2.0 WAP2.0 (compatible; UP.Browser/6.2.2.4; UPG1; UP/4.0; Embedded)",
type: "B"
},
%{
comment: "",
description: "Happy Fun Search robot",
id: "id_g_m_171105_5",
link1: "http://www.happyfunsearch.com/bot.html",
link2: "",
name: "HappyFunBot/1.1",
type: "R"
},
%{
comment: "see also Exalead NG and NG/1.0",
description: "Harvest-NG web crawler used by search.yahoo.com",
id: "id_g_m_428",
link1: "http://search.yahoo.com",
link2: "",
name: "Harvest-NG/1.0.2",
type: "R"
},
%{
comment: "site is closed",
description: "Haste - web mapping and monitoring system",
id: "id_g_m_429",
link1: "http://haste.kytoon.com",
link2: "",
name: "Haste/0.12 (HOME: http://haste.kytoon.com/)",
type: "R C"
},
%{
comment: "221.186.146.xx",
description: "Hatena::Antenna Japan robot",
id: "id_g_m_430",
link1: "http://a.hatena.ne.jp",
link2: "",
name: "Hatena Antenna/0.4 (http://a.hatena.ne.jp/help#robot)",
type: "R"
},
%{
comment: "221.186.146.xx",
description: "Hatena Japan proxy for handheld/mobile clients",
id: "id_g_m_110606_2",
link1: "http://www.hatena.ne.jp/",
link2: "",
name: "Hatena Mobile Gateway/1.0",
type: "P"
},
%{
comment: "221.186.146.xx",
description: "Hatena Japan robot",
id: "id_g_m_431",
link1: "http://www.hatena.ne.jp",
link2: "",
name: "Hatena Pagetitle Agent/1.0",
type: "R"
},
%{
comment: "221.186.146.xx",
description: "Hatena Japan RSS feed robot",
id: "id_g_m_240207_1",
link1: "http://www.hatena.ne.jp",
link2: "",
name: "Hatena RSS/0.3 (http://r.hatena.ne.jp)",
type: "R"
},
%{
comment: "221.186.146.xx",
description: "Hatena::Diary (Japan) web page screenshot robot",
id: "id_g_m_110606_1",
link1: "http://www.hatena.ne.jp/",
link2: "",
name: "HatenaScreenshot/1.0 (checker)",
type: "R D"
},
%{
comment: "89.110.157.*",
description: "hbtronix.spider - Domain name spider (Germany)",
id: "id_g_m_120108_1",
link1: "http://hbtronix.de/spider.php",
link2: "",
name: "hbtronix.spider.2 -- http://hbtronix.de/spider.php",
type: "R"
},
%{
comment: "",
description: "Mirago Germany robot",
id: "id_g_m_432",
link1: "http://www.mirago.de/",
link2: "",
name: "HeinrichderMiragoRobot",
type: "R"
},
%{
comment: "",
description: "Mirago Germany robot",
id: "id_g_m_433",
link1: "http://www.mirago.de/",
link2: "",
name: "HeinrichderMiragoRobot (http://www.miragorobot.com/scripts/deinfo.asp)",
type: "R"
},
%{
comment: "",
description: "Helix - The SiteSearch (Canada) web crawler",
id: "id_g_m_434",
link1: "http://www.sitesearch.ca",
link2: "",
name: "Helix/1.x ( http://www.sitesearch.ca/helix/)",
type: "R"
},
%{
comment: "",
description: "Mirago France robot",
id: "id_g_m_080206_3",
link1: "http://www.mirago.fr/",
link2: "",
name: "HenriLeRobotMirago (http://www.miragorobot.com/scripts/frinfo.asp)",
type: "R"
},
%{
comment: "217.154.245.2xx",
description: "Mirago search (UK) robot",
id: "id_g_m_435",
link1: "http://www.mirago.co.uk",
link2: "",
name: "HenrytheMiragoRobot",
type: "R"
},
%{
comment: "217.154.245.2xx",
description: "Mirago search (UK) robot",
id: "id_g_m_060806_3",
link1: "http://www.mirago.co.uk",
link2: "",
name: "HenryTheMiragoRobot (http://www.miragorobot.com/scripts/mrinfo.asp)",
type: "R"
},
%{
comment: "",
description:
"O'Reilly's Perl LWP example client program from Web Client Programming with Perl",
id: "id_g_m_436",
link1: "",
link2: "",
name: "hgrepurl/1.0",
type: ""
},
%{
comment: "",
description: "University of Kassel Germany CsCrawler using the HTTPClient library",
id: "id_g_m_437",
link1: "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html",
link2: "http://www.innovation.ch/java/HTTPClient/",
name:
"Hi! I'm CsCrawler my homepage: http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html RPT-HTTPClient/0.3-3",
type: "R"
},
%{
comment: "",
description: "HiDownload download manager",
id: "id_g_m_438",
link1: "http://www.streamingstar.com/hidownload.htm",
link2: "",
name: "HiDownload",
type: "D"
},
%{
comment: "site is offline",
description: "Hippias robot",
id: "id_g_m_439",
link1: "http://hippias.evansville.edu",
link2: "",
name: "Hippias/0.9 Beta",
type: "R"
},
%{
comment: "",
description: "Pilot Hitlist web analytics solution",
id: "id_g_m_440",
link1: "http://www.pilotsoftware.com/products_solutions/hitlist.html",
link2: "",
name: "HitList",
type: "R"
},
%{
comment: "",
description: "Hitwise spider",
id: "id_g_m_441",
link1: "http://www.hitwise.com",
link2: "",
name: "Hitwise Spider v1.0 http://www.hitwise.com",
type: "R"
},
%{
comment: " i.e.: - 204.95.207.xxx user agent ? - 66.27.113.xx link checking ?",
description: "diff. IPs / unknown services",
id: "id_g_m_442",
link1: "",
link2: "",
name: "HLoader",
type: ""
},
%{
comment: "",
description: "Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx",
id: "id_g_m_040907_1",
link1: "http://morfeo.centrum.cz/",
link2: "",
name: "holmes/3.11 (http://morfeo.centrum.cz/bot)",
type: "R"
},
%{
comment: "213.180.137.xx",
description: "Onet.pl (Poland) search robot",
id: "id_g_m_220906_2",
link1: "http://szukaj.onet.pl/",
link2: "",
name: "holmes/3.9 (onet.pl)",
type: "R"
},
%{
comment: "213.180.137.xx",
description: "Onet.pl (Poland) search robot",
id: "id_g_m_181006_1",
link1: "http://szukaj.onet.pl/",
link2: "",
name: "holmes/3.xx (OnetSzukaj/5.0; +http://szukaj.onet.pl)",
type: "R"
},
%{
comment: "",
description: "Morfeo / Centrum Search (Czech Republic) robot from 65.102.46.xxx",
id: "id_g_m_443",
link1: "http://morfeo.centrum.cz/",
link2: "",
name: "holmes/x.x",
type: "R"
},
%{
comment: "77.92.229.3x",
description: "Holes search robot (Georgia)",
id: "id_g_m_021108_2",
link1: "http://holmes.ge/",
link2: "",
name: "HolmesBot (http://holmes.ge)",
type: "R"
},
%{
comment: "",
description: "HomePageSearch robot",
id: "id_g_m_444",
link1: "http://hpsearch.uni-trier.de/",
link2: "",
name: "HomePageSearch(hpsearch.uni-trier.de)",
type: "R"
},
%{
comment: "",
description: "Homerweb search robot",
id: "id_g_m_445",
link1: "http://www.homerweb.com",
link2: "",
name: "Homerbot: www.homerweb.com",
type: "R"
},
%{
comment: "69.16.227.1xx",
description: "Honda-Search.com - Honda cars related search robot",
id: "id_g_m_220606_1",
link1: "http://www.honda-search.com/",
link2: "",
name:
"Honda-Search/0.7.2 (Nutch; http://lucene.apache.org/nutch/bot.html; search@honda-search.com)",
type: "R"
},
%{
comment: "",
description: "HooWWer - Next Generation Information Retrieval robot ",
id: "id_g_m_090206_1",
link1: "http://cosco.hiit.fi",
link2: "",
name:
"HooWWWer/2.1.3 (debugging run) (+http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info<at>hiit.fi)",
type: "R"
},
%{
comment: "",
description: "HooWWer - Next Generation Information Retrieval robot (128.214.112.xx)",
id: "id_g_m_446",
link1: "http://cosco.hiit.fi/",
link2: "",
name:
"HooWWWer/2.1.x ( http://cosco.hiit.fi/search/hoowwwer/ | mailto:crawler-info<at>hiit.fi)",
type: "R"
},
%{
comment: "",
description: "HotJava browser plus HTML Component 1.1.x",
id: "id_g_m_447",
link1: "",
link2: "",
name: "HotJava/1.0.1/JRE1.1.x",
type: "B"
},
%{
comment: "",
description: "Hotzuno - Japanese BBS reader client",
id: "id_g_m_448",
link1: "http://hotzonu.hp.infoseek.co.jp/",
link2: "",
name: "Hotzonu/x.0",
type: "B"
},
%{
comment: "15.203.249.12x",
description: "Unknown robot from HP Labs",
id: "id_g_m_040507_1",
link1: "http://hpl.hp.com/",
link2: "",
name: "HPL/Nutch-0.9 -",
type: "R"
},
%{
comment: "",
description: "COMPUTERorgs.com robot (205.134.190.xxx) using htdig",
id: "id_g_m_449",
link1: "http://www.computerorgs.com/",
link2: "http://www.htdig.org",
name: "htdig/3.1.6 (http://computerorgs.com)",
type: "R"
},
%{
comment: "reads robots.txt",
description: "htdig used by the Academie de Toulouse",
id: "id_g_m_210106_1",
link1: "http://www.ac-toulouse.fr/html/_.php",
link2: "http://www.htdig.org",
name: "htdig/3.1.6 (unconfigured@htdig.searchengine.maintainer)",
type: "R"
},
%{
comment: "",
description: "htdig search tool",
id: "id_g_m_450",
link1: "http://www.htdig.org",
link2: "",
name: "htdig/3.1.x (root@localhost)",
type: "R"
},
%{
comment: "",
description: "Lithops Software link validation tool",
id: "id_g_m_451",
link1: "http://www.lithopssoft.com",
link2: "",
name: "Html Link Validator (www.lithopssoft.com)",
type: "C"
},
%{
comment: "",
description: "HTML2JPG webpage to image converter",
id: "id_g_m_110506_3",
link1: "http://www.html2jpg.com",
link2: "",
name: "HTML2JPG Blackbox, http://www.html2jpg.com",
type: "D"
},
%{
comment: "",
description: "HTML2JPG webpage to image converter",
id: "id_g_m_452",
link1: "http://www.html2jpg.com",
link2: "",
name: "HTML2JPG Enterprise",
type: "D"
},
%{
comment: "",
description: "HTML Parser Java library to parse HTML",
id: "id_g_m_101205_1",
link1: "http://sourceforge.net/projects/htmlparser",
link2: "",
name: "HTMLParser/1.x",
type: "D"
},
%{
comment: "",
description: "PHP HTTP client to access Web servers",
id: "id_g_m_071006_1",
link1: "http://code.blitzaffe.com/pages/home/",
link2: "",
name: "HTTP Retriever",
type: "D"
},
%{
comment: "",
description: "Anonymous web proxy service",
id: "id_g_m_240306_1",
link1: "http://anonymouse.org/",
link2: "",
name: "http://Anonymouse.org/ (Unix)",
type: "P"
},
%{
comment: "",
description: "Ask 24x Info (Germany) DMOZ related robot",
id: "id_g_m_453",
link1: "http://narres.it",
link2: "",
name: "http://Ask.24x.Info/ (http://narres.it/)",
type: "R"
},
%{
comment: "82.149.246.2x",
description: "ACONTBOT - Acont search Germany robot",
id: "id_g_m_070209_6",
link1: "http://acont.de/",
link2: "http://hilfe.acont.de/bot.htm",
name: "http://hilfe.acont.de/bot.html ACONTBOT",
type: "R"
},
%{
comment: "202.173.141.x",
description: "OzySoftware.com software directory link checking",
id: "id_g_m_230408_1",
link1: "http://ozysoftware.com/index.html",
link2: "",
name: "http://OzySoftware.com/Index.html",
type: "C"
},
%{
comment: " s. also: - FocusedSampler - WFARC",
description: "IBM's Almaden Research robot",
id: "id_g_m_454",
link1: "http://www.almaden.ibm.com",
link2: "",
name: "http://www.almaden.ibm.com/cs/crawler",
type: "R"
},
%{
comment: "",
description: "IBM's Almaden Research robot",
id: "id_g_m_455",
link1: "http://www.almaden.ibm.com",
link2: "",
name: "http://www.almaden.ibm.com/cs/crawler [rc1.wf.ibm.com]",
type: "R"
},
%{
comment: "",
description: "IBM's Almaden Research robot",
id: "id_g_m_456",
link1: "http://www.almaden.ibm.com",
link2: "",
name: "http://www.almaden.ibm.com/cs/crawler [wf216]",
type: "R"
},
%{
comment: "",
description: "Istarthere.com search robot",
id: "id_g_m_271105_4",
link1: "http://www.istarthere.com/",
link2: "",
name: "http://www.istarthere.com_spider@istarthere.com",
type: "R"
},
%{
comment: "",
description: "Monogol - German open source search engine project (195.226.167.1xx)",
id: "id_g_m_070106_1",
link1: "http://www.monogol.de/",
link2: "",
name: "http://www.monogol.de",
type: "R"
},
%{
comment: "87.104.18.xx",
description: "TrendTech Search Engine (Denmark) robot",
id: "id_g_m_060806_4",
link1: "http://www.trendtech.dk/",
link2: "",
name: "http://www.trendtech.dk/spider.asp)",
type: "R"
},
%{
comment: "",
description: "HTTP::Lite - Standalone Perl module for retreiving HTTP documents",
id: "id_g_m_290106_1",
link1: "http://www.toybox.ca/http-lite/",
link2: "",
name: "HTTP::Lite/2.x.x",
type: "D"
},
%{
comment: "",
description: "HTTPEyes - Web proxy cache",
id: "id_g_m_050108_1",
link1: "http://bachue.com/httpeyes/",
link2: "",
name: "HTTPEyes",
type: "P"
},
%{
comment: "",
description: "HTTPResume Amiga download manager",
id: "id_g_m_457",
link1: "http://tesla.rcub.bg.ac.yu/%7Eantony/HTTPResume/",
link2: "",
name: "HTTPResume v. 1.x",
type: "D"
},
%{
comment: "",
description: "HttpUnit - Java test code for emulating browser behaviour",
id: "id_g_m_031107_2",
link1: "http://httpunit.sourceforge.net/",
link2: "",
name: "httpunit/1.5",
type: "B"
},
%{
comment: "",
description: "HttpUnit - Java browser behavior simulation tool",
id: "id_g_m_090306_1",
link1: "http://httpunit.sourceforge.net/",
link2: "",
name: "httpunit/1.x",
type: "B"
},
%{
comment: "",
description: "Hybrid Share mono C#/Gtk# application for file sharing",
id: "id_g_m_010807_1",
link1: "http://hybrid-share.sourceforge.net/index.php",
link2: "",
name: "Hybrid/1.2 [en] (OS Independent)",
type: ""
},
%{
comment: "",
description: "Hyper Estraier full-text search system",
id: "id_g_m_300507_1",
link1: "http://hyperestraier.sourceforge.net/",
link2: "",
name: "HyperEstraier/1.x.xx",
type: "D"
},
%{
comment: "65.111.164.1xx",
description: "i1search robot",
id: "id_g_m_170906_1",
link1: "http://www.i1search.com/",
link2: "",
name:
"i1searchbot/2.0 (i1search web crawler; http://www.i1search.com; crawler@i1search.com)",
type: "R"
},
%{
comment: "",
description: "Alexa / The Internet Archive (209.237.238.1xx)",
id: "id_g_m_461",
link1: "http://www.alexa.com",
link2: "",
name: "IAArchiver-1.0",
type: "R"
},
%{
comment: "Not from iask.com.cn - s. also Mozilla/5.0 (compatible; iaskspider/1.0 ..",
description: "Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)",
id: "id_g_m_091205_2",
link1: "",
link2: "",
name: "iaskspider",
type: ""
},
%{
comment: "202.106.184.xxx",
description: "Iask search / Sina portal robot (China)",
id: "id_g_m_111106_1",
link1: "http://iask.com/",
link2: "http://english.sina.com/index.html",
name: "iaskspider2 (iask@staff.sina.com.cn)",
type: "R"
},
%{
comment: "",
description: "Alexa / The Internet Archive (209.237.238.1xx)",
id: "id_g_m_458",
link1: "http://www.alexa.com",
link2: "",
name: "ia_archiver",
type: "R"
},
%{
comment: "",
description: "Alexa / The Internet Archive (209.237.238.1xx)",
id: "id_g_m_459",
link1: "http://www.alexa.com",
link2: "",
name: "ia_archiver-web.archive.org",
type: "R"
},
%{
comment: "",
description: "Alexa / The Internet Archive (209.237.238.1xx)",
id: "id_g_m_460",
link1: "http://www.alexa.com",
link2: "",
name: "ia_archiver/1.6",
type: "R"
},
%{
comment: "was Hisoft (http://www.hisoft.co.uk)",
description: "IOSpirit iBrowse Amiga Browser",
id: "id_g_m_462",
link1: "http://amiga.iospirit.de/",
link2: "",
name: "IBrowse/2.2 (AmigaOS 3.5)",
type: "B"
},
%{
comment: "was Hisoft (http://www.hisoft.co.uk)",
description: "IOSpirit iBrowse Amiga Browser",
id: "id_g_m_463",
link1: "http://amiga.iospirit.de/",
link2: "",
name: "IBrowse/2.2 (Windows 3.1)",
type: "B"
},
%{
comment: "",
description: "iCab MAC Web browser",
id: "id_g_m_464",
link1: "http://www.icab.de",
link2: "",
name: "iCab/2.5.2 (Macintosh; I; PPC)",
type: "B"
},
%{
comment: "202.180.34.1xx",
description: "Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)",
id: "id_g_m_110207_2",
link1: "http://kc.nict.go.jp/icc/crawl.html",
link2: "",
name:
"ICC-Crawler(Mozilla-compatible; http://kc.nict.go.jp/icc/crawl.html; icc-crawl(at)ml(dot)nict(dot)go(dot)jp)",
type: "R"
},
%{
comment: "202.180.34.1xx",
description: "Knowledge Clustered Group ICC-Crawler (University of Tokyo - Japan)",
id: "id_g_m_250607_1",
link1: "http://kc.nict.go.jp/icc/crawl.html",
link2: "",
name:
"ICC-Crawler(Mozilla-compatible;http://kc.nict.go.jp/icc/crawl.html;icc-crawl-contact(at)ml(dot)nict(dot)go(dot)jp)",
type: "R"
},
%{
comment: "212.227.76.xx",
description: "ICJobs - Intelligence Competence Center (Germany) robot",
id: "id_g_m_465",
link1: "http://www.iccenter.net",
link2: "",
name: "iCCrawler (http://www.iccenter.net)",
type: "R"
},
%{
comment: "212.227.76.xx",
description: "ICJobs - Intelligence Competence Center (Germany) robot",
id: "id_g_m_121006_1",
link1: "http://www.iccenter.net",
link2: "",
name: "ICCrawler - ICjobs (http://www.icjobs.de/bot.htm)",
type: "R"
},
%{
comment: "",
description: "ICE Java browser",
id: "id_g_m_466",
link1: "http://www.ii.uib.no/~alexey/jb/",
link2: "",
name: "ICE Browser/5.05 (Java 1.4.0; Windows 2000 5.0 x86)",
type: "B"
},
%{
comment: " s. also moget / mogimogi",
description: "Goo Japan / Inktomi robot (210.173.179.xx)",
id: "id_g_m_040206_2",
link1: "http://www.goo.ne.jp",
link2: "",
name: "ichiro/x.0 (http://help.goo.ne.jp/door/crawler.html)",
type: "R"
},
%{
comment: " s. also moget / mogimogi",
description: "Goo Japan / Inktomi robot (210.173.179.xx)",
id: "id_g_m_468",
link1: "http://www.goo.ne.jp",
link2: "",
name: "ichiro/x.0 (ichiro@nttr.co.jp)",
type: "R"
},
%{
comment: "",
description: "Iconsurf.com - Visual Surf Engine / favicon finder",
id: "id_g_m_469",
link1: "http://iconsurf.com",
link2: "",
name: "IconSurf/2.0 favicon finder (see http://iconsurf.com/robot.html)",
type: "R"
},
%{
comment: "",
description: "Iconsurf.com - Visual Surf Engine / favicon finder",
id: "id_g_m_470",
link1: "http://iconsurf.com",
link2: "",
name: "IconSurf/2.0 favicon monitor (see http://iconsurf.com/robot.html)",
type: "R"
},
%{
comment: "",
description: "icooLoader download manager",
id: "id_g_m_471",
link1: "http://www.icoonet.com",
link2: "",
name: "ICOO Loader v.x.x.x",
type: "D"
},
%{
comment: "",
description: "ICRA (Internet Content Rating Association) label spider",
id: "id_g_m_472",
link1: "http://www.icra.org",
link2: "",
name: "ICRA_label_spider/x.0",
type: "R"
},
%{
comment: "",
description: "ICS Robot Search Engine (International Christian school of Seoul)",
id: "id_g_m_473",
link1: "http://icseoul.org/",
link2: "",
name: "icsbot-0.1",
type: "R"
},
%{
comment: "",
description: "Internet Download Accelerator",
id: "id_g_m_260306_1",
link1: "http://www.westbyte.com/ida/",
link2: "",
name: "IDA",
type: "D"
},
%{
comment: "",
description: "Janas (Ideare.com / Tiscali.it) robot",
id: "id_g_m_474",
link1: "",
link2: "",
name: "ideare - SignSite/1.x",
type: "R"
},
%{
comment: "202.165.105.x",
description: "Unknown UA from Yahoo China",
id: "id_g_m_200806_1",
link1: "",
link2: "",
name: "iearthworm/1.0, iearthworm@yahoo.com.cn",
type: ""
},
%{
comment: " possibly Visit URL ??",
description: "Some bookmark manager",
id: "id_g_m_475",
link1: "http://www.lodz.pdi.net/%7Eeristic/free/index.html",
link2: "",
name: "IEFav172Free",
type: "C"
},
%{
comment: "67.15.2[3-4][X].xxx",
description: "iFeed.jp - online rss aggregator (in development)",
id: "id_g_m_060608_4",
link1: "http://www.ifeed.jp/",
link2: "",
name: "iFeed.jp/2.0 (www.psychedelix.com/agents/agents.rss; 0 subscribers)",
type: "R"
},
%{
comment: "87.118.118.12x",
description: "Igde search (Russia) robot",
id: "id_g_m_281207_1",
link1: "http://igde.ru/",
link2: "",
name: "igdeSpyder (compatible; igde.ru; +http://igde.ru/doc/tech.html)",
type: "R"
},
%{
comment: "",
description: "iGetter download manager",
id: "id_g_m_476",
link1: "http://www.igetter.net",
link2: "",
name: "iGetter/1.x (Macintosh;G;PPC)",
type: "D"
},
%{
comment: "",
description: "iGetter download manager",
id: "id_g_m_477",
link1: "http://www.igetter.net",
link2: "",
name: "iGetter/2 (Macintosh; U; PPC Mac OS X; en)",
type: "D"
},
%{
comment: "196.12.53.xx",
description: "Webkhoj - Indian language search engine",
id: "id_g_m_120507_1",
link1: "http://webkhoj.iiit.net/",
link2: "",
name:
"IIITBOT/1.1 (Indian Language Web Search Engine; http://webkhoj.iiit.net; pvvpr at iiit dot ac dot in)",
type: "R"
},
%{
comment: "72.44.58.2xx",
description: "Ilial Knowledge Search robot",
id: "id_g_m_040607_2",
link1: "http://www.ilial.com/crawler/",
link2: "",
name:
"ilial/Nutch-0.9 (Ilial, Inc. is a Los Angeles based Internet startup company. For more information please visit http://www.ilial.com/crawler; http://www.ilial.com/crawler; crawl@ilial.com)",
type: "R"
},
%{
comment: "164.67.195.xx",
description: "Unknown robot from UCLA using Nutch",
id: "id_g_m_290906_1",
link1: "http://www.ucla.edu/",
link2: "http://lucene.apache.org/nutch/",
name: "ilial/Nutch-0.9-dev",
type: "R"
},
%{
comment: "s. also INGRID/3.0 .. / Mozilla/3.0 (INGRID/3.0 ..",
description: "Ilse Netherlands robot (62.69.178.xx)",
id: "id_g_m_270806_1",
link1: "http://www.ilse.nl/",
link2: "",
name: "IlseBot/1.x",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_478",
link1: "http://www.iltrovatore.it",
link2: "",
name: "IlTrovatore-Setaccio ( http://www.iltrovatore.it)",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_479",
link1: "http://www.iltrovatore.it",
link2: "",
name:
"Iltrovatore-Setaccio/0.3-dev (Indexing; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_480",
link1: "http://www.iltrovatore.it",
link2: "",
name: "IlTrovatore-Setaccio/1.2 ( http://www.iltrovatore.it/aiuto/faq.html)",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_481",
link1: "http://www.iltrovatore.it",
link2: "",
name:
"Iltrovatore-Setaccio/1.2 (It-bot; http://www.iltrovatore.it/bot.html; info@iltrovatore.it)",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_482",
link1: "http://www.iltrovatore.it",
link2: "",
name: "iltrovatore-setaccio/1.2-dev (spidering; http://www.iltrovatore.it/aiuto/.....)",
type: "R"
},
%{
comment: "213.215.201.2xx",
description: "Il Trovatore - Italian search engine robot",
id: "id_g_m_040506_1",
link1: "http://www.iltrovatore.it",
link2: "",
name:
"IlTrovatore/1.2 (IlTrovatore; http://www.iltrovatore.it/bot.html; bot@iltrovatore.it)",
type: "R"
},
%{
comment: "",
description:
"ImageVisu image and graphics viewer - display files from the Web (HTTP and ECWP)",
id: "id_g_m_060107_2",
link1: "http://geovisu.free.fr/imagvisu/english/",
link2: "",
name: "ImageVisu/v4.x.x",
type: "B"
},
%{
comment: "72.14.164.1xx",
description: "BD-Brandprotect copyright infringement crawler",
id: "id_g_m_080907_1",
link1: "http://www.bdbrandprotect.com/",
link2: "http://www.bdbrandprotect.com/solutions_5.html",
name: "ImageWalker/2.0 (www.bdbrandprotect.com)",
type: "R"
},
%{
comment: "",
description: "HttpClient - a PHP Web Client Class",
id: "id_g_m_110306_1",
link1: "http://scripts.incutio.com/httpclient/index.php",
link2: "",
name: "Incutio HttpClient v0.x",
type: ""
},
%{
comment: "",
description: "IncyWincy search engine using DMOZ Open Directory database",
id: "id_g_m_483",
link1: "http://www.loopimprovements.com",
link2: "",
name: "IncyWincy data gatherer(webmaster@loopimprovements.com",
type: "R"
},
%{
comment: "",
description: "IncyWincy search engine using DMOZ Open Directory database",
id: "id_g_m_484",
link1: "http://www.loopimprovements.com",
link2: "",
name: "IncyWincy page crawler(webmaster@loopimprovements.com",
type: "R"
},
%{
comment: "",
description: "Look.com robot using IncyWincy search engine",
id: "id_g_m_485",
link1: "http://www.loopimprovements.com",
link2: "",
name: "IncyWincy(http://www.look.com)",
type: "R"
},
%{
comment: "",
description: "IncyWincy search engine using DMOZ Open Directory database",
id: "id_g_m_486",
link1: "http://www.loopimprovements.com",
link2: "",
name: "IncyWincy(http://www.loopimprovements.com/robot.html)",
type: "R"
},
%{
comment: "",
description: "IncyWincy search engine using DMOZ Open Directory database",
id: "id_g_m_487",
link1: "http://www.loopimprovements.com",
link2: "",
name: "IncyWincy/2.1(loopimprovements.com/robot.html)",
type: "R"
},
%{
comment: "",
description: "Index the Web (69.57.134.xx) crawler",
id: "id_g_m_488",
link1: "http://www.indextheweb.com/",
link2: "",
name: "IndexTheWeb.com Crawler7",
type: "R"
},
%{
comment: "see also Educate Search VxB - Full Web Bot",
description: "Spam bot from diff. IPs",
id: "id_g_m_489",
link1: "",
link2: "",
name: "Industry Program 1.0.x",
type: "S"
},
%{
comment: "",
description: "Inet Library Resource Center robot",
id: "id_g_m_490",
link1: "http://www.inetlibrary.com",
link2: "",
name: "Inet library",
type: "R"
},
%{
comment: "",
description: "InetURL IVM (phone software) plugin for web server access ?",
id: "id_g_m_491",
link1: "http://www.nch.com.au/ivm/plugins.html",
link2: "",
name: "InetURL/1.0",
type: ""
},
%{
comment: "88.149.164.2xx",
description: "Pubblisito.com search - Italia",
id: "id_g_m_270607_1",
link1: "http://www.pubblisito.com/search/",
link2: "",
name: "info@pubblisito.com- (http://www.pubblisito.com) il Sud dei Motori di Ricerca",
type: "R"
},
%{
comment: "75.126.48.17x",
description: "Infoaxe - search history and bookmark service",
id: "id_g_m_211208_2",
link1: "http://www.infoaxe.com/",
link2: "",
name: "Infoaxe./Nutch-0.9",
type: "C"
},
%{
comment:
"s.also - Convera... Maybe does guestbook / forum spamming s. here http://www.webmasterworld.com/forum11/2871.htm",
description: "Converas RetrievalWare Internet Spider (63.241.61.x)",
id: "id_g_m_492",
link1: "http://www.convera.com/Products/",
link2: "",
name: "infoConveraCrawler/0.8 ( http://www.authoritativeweb.com/crawl)",
type: "R S ?"
},
%{
comment: "",
description: "Versions-project.org Ingelin spider",
id: "id_g_m_493",
link1: "http://www.versions-project.org/",
link2: "",
name: "InfoFly/1.0 (http://www.versions-project.org/)",
type: "R"
},
%{
comment: "",
description: "InfoLink link checking tool",
id: "id_g_m_494",
link1: "http://www.biggbyte.com/biggbyte3/index.html",
link2: "",
name: "InfoLink/1.x",
type: "C"
},
%{
comment: "",
description: "INFOMINE Scholary Internet Resource Collection crawler",
id: "id_g_m_495",
link1: "http://infomine.ucr.edu",
link2: "",
name: "INFOMINE/8.0 Adders",
type: "R"
},
%{
comment: "",
description: "INFOMINE Scholary Internet Resource Collection crawler",
id: "id_g_m_496",
link1: "http://infomine.ucr.edu",
link2: "",
name: "INFOMINE/8.0 RemoteServices",
type: "R"
},
%{
comment: "",
description: "INFOMINE Scholary Internet Resource Collection crawler",
id: "id_g_m_497",
link1: "http://infomine.ucr.edu",
link2: "",
name: "INFOMINE/8.0 VLCrawler (http://infomine.ucr.edu/useragents)",
type: "R"
},
%{
comment: "",
description: "164.71.1.1xx jp.co.fujitsu.t2 Robot",
id: "id_g_m_498",
link1: "",
link2: "",
name: "InfoNaviRobot(F107)",
type: "R"
},
%{
comment: "",
description: "Infoseek robot",
id: "id_g_m_499",
link1: "http://www.infoseek.com",
link2: "",
name: "InfoSeek Sidewinder/0.9",
type: "R"
},
%{
comment: "",
description: "Infoseek robot",
id: "id_g_m_500",
link1: "http://www.infoseek.com",
link2: "",
name: "InfoSeek Sidewinder/1.0A",
type: "R"
},
%{
comment: "",
description: "Infoseek robot",
id: "id_g_m_501",
link1: "http://www.infoseek.com",
link2: "",
name: "InfoSeek Sidewinder/1.1A",
type: "R"
},
%{
comment: "",
description: "Infoseek robot",
id: "id_g_m_502",
link1: "http://www.infoseek.com",
link2: "",
name: "Infoseek SideWinder/1.45 (Compatible; MSIE 10.0; UNIX)",
type: "R"
},
%{
comment: "210.148.160.1xx",
description: "Infoseek Japan robot",
id: "id_g_m_503",
link1: "http://www.infoseek.com",
link2: "",
name: "Infoseek SideWinder/2.0B (Linux 2.4 i686)",
type: "R"
},
%{
comment: " s.also - Mozilla/3.0 (INGRID/3.0 .. / IlseBot/1.0 ..",
description: "Ilse Netherlands robot (62.69.178.xx)",
id: "id_g_m_504",
link1: "http://www.ilse.nl/",
link2: "",
name:
"INGRID/3.0 MT (webcrawler@NOSPAMexperimental.net; http://webmaster.ilse.nl/jsp/webmaster.jsp)",
type: "R"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos NBCi etc.) robot",
id: "id_g_m_505",
link1: "http://www.inktomi.com/",
link2: "",
name: "Inktomi Search",
type: "R"
},
%{
comment: "s. also - Enterprise_Search - ES.NET_Crawler",
description: "Enterprise Search engine software (64.202.165.xxx) ",
id: "id_g_m_506",
link1: "http://www.innerprise.net",
link2: "",
name: "InnerpriseBot/1.0 (http://www.innerprise.com/)",
type: "R"
},
%{
comment: "s. also Insitornaut",
description: "Insitor Search robot (80.67.20.1xx)",
id: "id_g_m_111205_4",
link1: "http://www.insitor.com/",
link2: "",
name: "Insitor.com search and find world wide!",
type: "R"
},
%{
comment: "s. also Insitor.com",
description: "Insitor Search robot (80.67.20.1xx)",
id: "id_g_m_121205_3",
link1: "http://www.insitor.com/",
link2: "",
name: "Insitornaut",
type: "R"
},
%{
comment: "",
description: "download manager",
id: "id_g_m_507",
link1: "",
link2: "",
name: "InstallShield DigitalWizard",
type: "D"
},
%{
comment: "",
description: "Integrity - website broken link checker for MAC OSx",
id: "id_g_m_200308_1",
link1: "http://peacockmedia.co.uk/index.php/products/7-products/4-integrity",
link2: "",
name: "integrity/1.6",
type: "C"
},
%{
comment: "",
description: "Microton Intelix robot for Eurotran translation software ?",
id: "id_g_m_010907_1",
link1: "http://www.microton.cz/intelix/",
link2: "",
name: "Intelix/0.x (cs; http://www.microton.cz/intelix/; microton@@microton.cz)",
type: "D"
},
%{
comment: "",
description: "Interarchy file transfer software - SFTP/FTP client for Mac OS X",
id: "id_g_m_508",
link1: "http://www.interarchy.com",
link2: "",
name: "Interarchy/x.x.x (InterarchyCrawler)",
type: "D"
},
%{
comment: "",
description: "Dream Train (Japan) Internet search robot",
id: "id_g_m_509",
link1: "http://www.dti.ne.jp",
link2: "",
name: "Internet Ninja x.0",
type: "R"
},
%{
comment: "s.also - archive.org_bot - Mozilla/5.0 (compatible;archive.org_bot/...",
description:
"Heritrix - The Internet Archive's open-source crawler based on Nutch (207.241.225.2xx)",
id: "id_g_m_510",
link1: "http://www.archive.org/",
link2: "http://lucene.apache.org",
name:
"InternetArchive/0.8-dev(Nutch;http://lucene.apache.org/nutch/bot.html;nutch-agent@lucene.apache",
type: "R"
},
%{
comment: "",
description: "Internet Link Agent - link checking tool",
id: "id_g_m_511",
link1: "http://www.osk.3web.ne.jp/~goronyan/winprg/sub.shtml",
link2: "",
name: "InternetLinkAgent/3.1",
type: "C"
},
%{
comment: "",
description: "Internetseer Web site monitoring / Claymont robot",
id: "id_g_m_512",
link1: "http://www.internetseer.com",
link2: "",
name: "InternetSeer.com",
type: "R"
},
%{
comment: "",
description: "intraVNews - Feed reader & RSS aggregator for Outlook",
id: "id_g_m_513",
link1: "http://www.intravnews.com",
link2: "",
name: "intraVnews/1.x",
type: "B"
},
%{
comment: "149.20.54.1xx",
description: "Internet Open Index crawler using Nutch",
id: "id_g_m_061208_1",
link1: "http://index.isc.org/",
link2: "http://www.nutch.org",
name: "IOI/2.0 (ISC Open Index crawler; http://index.isc.org/; bot@index.isc.org)",
type: "R"
},
%{
comment: "",
description: "IP*Works! HTTP Component",
id: "id_g_m_514",
link1: "http://www.nsoftware.com/products/controls/?ctl=HTTP",
link2: "",
name: "IP*Works! V5 HTTP/S Component - by /n software - www.nsoftware.com",
type: ""
},
%{
comment: "",
description: "IP2Location - Reverse lookup geographical data and ISP by IP",
id: "id_g_m_515",
link1: "http://www.ip2location.com",
link2: "",
name: "http://www.ip2location.com",
type: "R C"
},
%{
comment: "",
description: "IP2Map - geographical IP mapping",
id: "id_g_m_270106_1",
link1: "http://www.ip2map.com/",
link2: "",
name: "IP2MapBot/1.1 <a href=http://www.ip2map.com>http://www.ip2map.com</a>",
type: "R C"
},
%{
comment: "",
description: "Laurions Ipium robot",
id: "id_g_m_516",
link1: "http://www.laurion.com",
link2: "",
name: "IPiumBot laurion(dot)com",
type: "R"
},
%{
comment: "",
description: "Ipselon Web Search robot",
id: "id_g_m_517",
link1: "http://www.ipselon.com",
link2: "",
name: "IpselonBot/0.xx-beta (Ipselon; http://www.ipselon.com; ipselonbot@ipselon.com)",
type: "R"
},
%{
comment: "",
description: "Iria download manager",
id: "id_g_m_518",
link1: "http://www5.tok2.com/home/koteturamu/soft/iria.htm",
link2: "",
name: "Iria/1.xxa",
type: "D"
},
%{
comment: "128.194.135.xx",
description: "IRL-crawler - Texas A&M University research project crawler",
id: "id_g_m_519",
link1: "http://irl.cs.tamu.edu",
link2: "",
name: "IRLbot/1.0 ( http://irl.cs.tamu.edu/crawler)",
type: "R"
},
%{
comment: "128.194.135.xx",
description: "IRL-crawler - Texas A&M University research project crawler",
id: "id_g_m_240308_4",
link1: "http://irl.cs.tamu.edu",
link2: "",
name: "IRLbot/3.0 (compatible; MSIE 6.0; http://irl.cs.tamu.edu/crawler/)",
type: "R"
},
%{
comment: "",
description: "url_log - Irssi Perl url grabber",
id: "id_g_m_520",
link1: "http://www.irssi.org/scripts/html/url_log.pl.html",
link2: "",
name: "IrssiUrlLog/0.2",
type: ""
},
%{
comment: "",
description: "Irvine downloading tool",
id: "id_g_m_521",
link1: "http://hp.vector.co.jp/authors/VA024591/",
link2: "",
name: "Irvine/1.x.x",
type: "D"
},
%{
comment: "",
description: "Unknown spambot / harvester from diff. IPs",
id: "id_g_m_140506_1",
link1:
"http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1",
link2: "",
name: "ISC Systems iRc Search 2.1",
type: "S"
},
%{
comment: "",
description: "iSiloX document converter for iSilo reader",
id: "id_g_m_030106_1",
link1: "http://www.isilox.com/",
link2: "",
name: "iSiloX/4.xx Windows/32",
type: "B"
},
%{
comment: "",
description: "Unknown University of Alberta link-checking ?",
id: "id_g_m_522",
link1: "http://www.ualberta.ca",
link2: "",
name: "isurf (tszhu@canada.com)",
type: "C"
},
%{
comment: "",
description: "iTunes UA name for access and decrypt the iTunes music store pages",
id: "id_g_m_150408_5",
link1: "http://www.apple.com/itunes/",
link2: "",
name: "iTunes/x.x.x",
type: "B"
},
%{
comment: "",
description: "Some spam bot from 66.139.78.xx(x)",
id: "id_g_m_523",
link1: "",
link2: "",
name: "IUPUI Research Bot v 1.9a",
type: "S"
},
%{
comment: "",
description: "iVia robot - Open source Internet portal & virtual library system software",
id: "id_g_m_280906_1",
link1: "http://ivia.ucr.edu/",
link2: "",
name: "iVia Page Fetcher (http://ivia.ucr.edu/useragents.shtml)",
type: "D"
},
%{
comment: "",
description: "iVia robot - Open source Internet portal & virtual library system software",
id: "id_g_m_524",
link1: "http://ivia.ucr.edu/",
link2: "",
name: "iVia/4.0 CanonizeUrl (http://infomine.ucr.edu/iVia/useragents.shtml",
type: "D"
},
%{
comment: "72.14.164.1xx",
description: "BD BrandProtect - brand, company or trademarks online monitoring",
id: "id_g_m_180707_1",
link1: "http://www.brandprotect.com/",
link2: "",
name: "IWAgent/ 1.0 - www.brandprotect.com",
type: "R"
},
%{
comment: "",
description: "Proxy message from jp-q.ne.jp",
id: "id_g_m_525",
link1: "",
link2: "",
name: "J-PHONE/3.0/J-SH07",
type: "P"
},
%{
comment: "",
description: "ODIN Directory Japan robot (163.138.95.xx)",
id: "id_g_m_526",
link1: "http://www.ingrid.org",
link2: "",
name: "Jabot/6.x (http://odin.ingrid.org/)",
type: "R"
},
%{
comment: "",
description: "ODIN Directory Japan robot (163.138.95.xx)",
id: "id_g_m_527",
link1: "http://www.ingrid.org",
link2: "",
name: "Jabot/7.x.x (http://odin.ingrid.org/)",
type: "R"
},
%{
comment: "",
description: "German Domanova (offline since Feb.02) robot",
id: "id_g_m_528",
link1: "",
link2: "",
name: "Jack",
type: "R"
},
%{
comment: "",
description: "Jakarta Commons (Java based) HTTP client",
id: "id_g_m_529",
link1: "http://jakarta.apache.org/commons/httpclient/",
link2: "",
name: "Jakarta Commons-HttpClient/2.0xxx",
type: "B"
},
%{
comment: "",
description: "Jakarta Commons (Java based) HTTP client",
id: "id_g_m_530",
link1: "http://jakarta.apache.org/commons/httpclient/",
link2: "",
name: "Jakarta Commons-HttpClient/3.0-rcx",
type: "B"
},
%{
comment: "",
description: "JamBot search robot (70.146.82.xx)",
id: "id_g_m_240306_3",
link1: "http://www.jambot.com/",
link2: "",
name: "Jambot/0.1.x (Jambot; http://www.jambot.com/blog; crawler@jambot.com)",
type: "R"
},
%{
comment: "70.146.82.xx",
description: "JamBot search robot",
id: "id_g_m_130108_1",
link1: "http://www.jambot.com/",
link2: "",
name:
"Jambot/0.2.1 (Jambot; http://www.jambot.com/blog/static.php?page=webmaster-robot; crawler@jambot.com)",
type: "R"
},
%{
comment: "",
description: "Java VM",
id: "id_g_m_531",
link1: "http://java.sun.com/",
link2: "",
name: "Java 1.1",
type: ""
},
%{
comment: " used as robot from 194.203.40.xx",
description: "Java VM",
id: "id_g_m_532",
link1: "http://java.sun.com/",
link2: "",
name: "Java/1.4.1_01",
type: "R B D"
},
%{
comment: "",
description: "Java VM",
id: "id_g_m_533",
link1: "http://java.sun.com/",
link2: "",
name: "Java1.0.21.0",
type: "B"
},
%{
comment: "",
description: "Java VM",
id: "id_g_m_534",
link1: "http://java.sun.com/",
link2: "",
name: "Java1.1.xx.x",
type: ""
},
%{
comment: "",
description: "Java VM",
id: "id_g_m_535",
link1: "http://java.sun.com/",
link2: "",
name: "Java1.3.0rc1",
type: ""
},
%{
comment: "",
description: "Java VM",
id: "id_g_m_536",
link1: "http://java.sun.com/",
link2: "",
name: "Java1.3.x",
type: ""
},
%{
comment:
"used by diff. IPs for various purposes i.e.: - Dortmund University Java based robot - Roadrunner.net (66.108.xxx.xxx) user robot in conjunction w. RPT-HTTPClient/0.3-3",
description: "Java VM",
id: "id_g_m_537",
link1: "http://java.sun.com/",
link2: "http://www.informatik.uni-dortmund.DE",
name: "Java1.4.0",
type: "R B D"
},
%{
comment: "",
description: "Jayde B2B Search robot (66.28.139.xx)",
id: "id_g_m_538",
link1: "http://www.jayde.com",
link2: "",
name: "Jayde Crawler. http://www.jayde.com",
type: "R"
},
%{
comment: "",
description: "some site downloading tool ? via 61.77.51.xxx",
id: "id_g_m_539",
link1: "",
link2: "",
name: "JBH Agent 2.0",
type: "D"
},
%{
comment: "",
description: "WAP 2.0 / jBrowser for handhelds",
id: "id_g_m_540",
link1: "http://www.jataayusoft.com/DbWAPHH.htm",
link2: "",
name: "jBrowser/J2ME Profile/MIDP-1.0 Configuration/CLDC-1.0 (Google WAP Proxy/1.0)",
type: "B"
},
%{
comment: "",
description: "JCheckLinks Java hyperlink validator",
id: "id_g_m_541",
link1: "http://web.purplefrog.com/%7Ethoth/jchecklinks/",
link2: "",
name: "JCheckLinks/0.1 RPT-HTTPClient/0.3-1",
type: "C"
},
%{
comment: "",
description: "Java Development Kit",
id: "id_g_m_542",
link1: "http://developers.sun.com/index.html",
link2: "",
name: "JDK/1.1",
type: ""
},
%{
comment: "",
description: "Insignias Jeode (PDA) Java platform",
id: "id_g_m_543",
link1: "http://www.insignia.com/content/products/jvmProducts.shtml",
link2: "",
name: "Jeode/1.x.x",
type: "B"
},
%{
comment: "",
description: "JetEye Search robot (64.62.142.xxx / 64.71.144.xxx)",
id: "id_g_m_544",
link1: "http://www.jeteye.com",
link2: "",
name: "Jetbot/1.0",
type: "R"
},
%{
comment: "",
description: "Omea RSS - Atom - newsgroups web page reader ",
id: "id_g_m_545",
link1: "http://www.jetbrains.com/omea_reader/",
link2: "",
name: "JetBrains Omea Reader 1.0.x (http://www.jetbrains.com/omea_reader/)",
type: "B"
},
%{
comment: "",
description: "Omea RSS - Atom - newsgroups web page reader ",
id: "id_g_m_546",
link1: "http://www.jetbrains.com/omea_reader/",
link2: "",
name:
"JetBrains Omea Reader 2.0 Release Candidate 1 (http://www.jetbrains.com/omea_reader/)",
type: "B"
},
%{
comment: "",
description: "JetCar / Flashget download manager",
id: "id_g_m_547",
link1: "http://www.amazesoft.com",
link2: "",
name: "JetCar",
type: "D"
},
%{
comment: "",
description: "Jigsaw - W3C's CSS Validator Server",
id: "id_g_m_548",
link1: "http://jigsaw.w3.org/css-validator/validator-uri.html",
link2: "",
name: "Jigsaw/2.2.x W3C_CSS_Validator_JFouffa/2.0",
type: "C"
},
%{
comment: "",
description: "Jobo website downloading program",
id: "id_g_m_550",
link1: "http://www.matuschek.net/software/jobo/index.html",
link2: "",
name: "JoBo/1.x (http://www.matuschek.net/jobo.html)",
type: "D B"
},
%{
comment: "",
description: "Jobo website downloading program",
id: "id_g_m_549",
link1: "http://www.matuschek.net/software/jobo/index.html",
link2: "",
name: "JoBo/@JOBO_VERSION@(http://www.matuschek.net/jobo.html)",
type: "D B"
},
%{
comment: "",
description: "Finacialbot.com - German (213.61.218.xx) job search JobRoboter",
id: "id_g_m_551",
link1: "http://www.finbot.com/jr1.html",
link2: "",
name: "JobSpider_BA/1.1",
type: "R"
},
%{
comment: "",
description: "Jocsoft Web Spider - website downloading tool",
id: "id_g_m_552",
link1: "http://www.jocsoft.com/jws/index.htm",
link2: "",
name: "JOC Web Spider",
type: "D B"
},
%{
comment: "216.227.208.1xx",
description: "Jordo Media RSS / Atom feed directory link checking",
id: "id_g_m_051206_5",
link1: "http://www.jordomedia.com/",
link2: "",
name: "JordoMedia/1.0 RSS File Reader (http://www.jordomedia.com)",
type: "C"
},
%{
comment: "",
description: "Journster.com RSS/Atom aggregator",
id: "id_g_m_090206_2",
link1: "http://beta.journster.com/",
link2: "",
name: "Journster [alpha] (http://journster.com/)",
type: "C"
},
%{
comment: "",
description: "Journster.com RSS/Atom aggregator",
id: "id_g_m_090206_3",
link1: "http://beta.journster.com/",
link2: "",
name: "Journster.com RSS/Atom aggregator 0.5 (http://www.journster.com/bot.phtml)",
type: "C"
},
%{
comment: "",
description: "Check Favorites bookmark checking",
id: "id_g_m_553",
link1: "http://www.jrtwine.com/Products/CheckFavs/",
link2: "",
name: "JRTS Check Favorites Utility",
type: "C"
},
%{
comment: "",
description: "Check Favorites bookmark checking",
id: "id_g_m_554",
link1: "http://www.jrtwine.com/Products/CheckFavs/",
link2: "",
name: "JRTwine Software Check Favorites Utility",
type: "C"
},
%{
comment: "",
description: "Jyxo search (Czech Republic) robot (212.71.128.xx)",
id: "id_g_m_555",
link1: "http://jyxo.cz/",
link2: "",
name: "Jyxobot/x",
type: "R"
},
%{
comment: "",
description: "K-meleon browser - Windows 2000",
id: "id_g_m_556",
link1: "http://kmeleon.sourceforge.net/",
link2: "",
name: "K-Meleon/0.6 (Windows; U; Windows NT 5.1; en-US; rv:0.9.5) Gecko/20011011",
type: "B"
},
%{
comment: "",
description: "Verity K2 Spider ( Network search software)",
id: "id_g_m_557",
link1: "http://www.verity.com/products/pdf/MK0368a_K2_Spider.pdf",
link2: "",
name: "k2spider",
type: "R"
},
%{
comment: "143.248.134.22x",
description:
"Unknown robot from AITrc (Advanced Information Technology Research Center) - Korea",
id: "id_g_m_010108_3",
link1: "http://aitrc.kaist.ac.kr/english/",
link2: "",
name: "KAIST AITrc Crawler",
type: "R"
},
%{
comment: "216.139.221.1xx",
description: "Kakle ranked metasearch robot",
id: "id_g_m_010506_1",
link1: "http://www.kakle.com/",
link2: "",
name:
"KakleBot - www.kakle.com/0.1 (KakleBot - www.kakle.com; http:// www.kakle.com/bot.html; support@kakle.com)",
type: "R"
},
%{
comment: "195.210.57.1xx",
description: "Kalooga image crawler",
id: "id_g_m_250408_3",
link1: "http://www.kalooga.com/",
link2: "",
name:
"kalooga/kalooga-4.0-dev-datahouse (Kalooga; http://www.kalooga.com; info@kalooga.com)",
type: "R"
},
%{
comment: "195.210.57.1xx",
description: "Kalooga image crawler",
id: "id_g_m_011108_3",
link1: "http://www.kalooga.com/",
link2: "",
name:
"kalooga/KaloogaBot (Kalooga; http://www.kalooga.com/info.html?page=crawler; crawler@kalooga.com)",
type: "R"
},
%{
comment: "",
description: "Kapere site grapper / web downloader",
id: "id_g_m_558",
link1: "http://www.kapere.com",
link2: "",
name: "Kapere (http://www.kapere.com)",
type: "D"
},
%{
comment: "",
description: "Kazehakase - Gecko based browser (Japan)",
id: "id_g_m_090807_1",
link1: "http://kazehakase.sourceforge.jp/",
link2: "",
name: "Kazehakase/0.x.x.[x]",
type: "B"
},
%{
comment: "",
description: "Openwave UP.Browser for mobiles via Google WAP Proxy (216.239.33.x)",
id: "id_g_m_559",
link1: "http://www.openwave.com",
link2: "",
name: "KDDI-SN22 UP.Browser/6.0.7 (GUI) MMP/1.1 (Google WAP Proxy/1.0)",
type: "P"
},
%{
comment: "",
description: "Kenjin Spider search agent",
id: "id_g_m_561",
link1: "http://www.kenjin.ne.jp",
link2: "",
name: "Kenjin Spider",
type: "R"
},
%{
comment: "",
description:
"Dznet.com Kevin crawler (link checking ?) via 68.39.148.xx (nj.comcast.net)",
id: "id_g_m_562",
link1: "http://www.dznet.com",
link2: "",
name: "Kevin http://dznet.com/kevin/",
type: "R"
},
%{
comment: "",
description:
"Website AlertsKevin crawler (website monitoring) via 68.39.148.xx (nj.comcast.net)",
id: "id_g_m_563",
link1: "http://www.websitealert.net",
link2: "",
name: "Kevin http://websitealert.net/kevin/",
type: "R"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_g_m_560",
link1: "http://www.voila.fr",
link2: "",
name: "KE_1.0/2.0 libwww/5.2.8",
type: "R"
},
%{
comment: "",
description: "Some Perl search script from KFSW (Germany)",
id: "id_g_m_301105_5",
link1: "http://www.kfsw.de/",
link2: "",
name: "KFSW-Bot (Version: 1.01 powered by KFSW www.kfsw.de)",
type: "R"
},
%{
comment: "",
description: "kinja weblog search robot",
id: "id_g_m_100206_4",
link1: "http://www.kinja.com/",
link2: "",
name: "kinja-imagebot (http://www.kinja.com/)",
type: "R"
},
%{
comment: "",
description: "kinja weblog search robot",
id: "id_g_m_100206_3",
link1: "http://www.kinja.com/",
link2: "",
name: "kinjabot (http://www.kinja.com)",
type: "R"
},
%{
comment: "",
description: "Fireball search (Germany) robot",
id: "id_g_m_564",
link1: "http://www.fireball.de",
link2: "",
name: "KIT-Fireball/2.0",
type: "R"
},
%{
comment: "",
description: "Fireball search (Germany) robot",
id: "id_g_m_565",
link1: "http://www.fireball.de",
link2: "",
name: "KIT-Fireball/2.0 (compatible; Mozilla 4.0; MSIE 5.5)",
type: "R"
},
%{
comment: "",
description: "Klondike WAP Browser",
id: "id_g_m_566",
link1: "http://www.apachesoftware.com",
link2: "",
name: "Klondike/1.50 (WSP Win32) (Google WAP Proxy/1.0)",
type: "B"
},
%{
comment: "",
description: "University of Washington KnowItAll - web information extraction",
id: "id_g_m_567",
link1: "http://www.cs.washington.edu",
link2: "",
name: "KnowItAll(knowitall@cs.washington.edu)",
type: "R"
},
%{
comment: "",
description: "The knowledge.com (ODP) directory robot",
id: "id_g_m_568",
link1: "http://www.knowledge.com",
link2: "",
name: "Knowledge.com/0.x",
type: "R"
},
%{
comment: "",
description: "Kontiki Client download manager",
id: "id_g_m_569",
link1: "http://www.kontiki.com/client/userhelp_f.shtml",
link2: "",
name: "Kontiki Client x.xx",
type: "D"
},
%{
comment: "powered by Nutch",
description: "Krugle source code search engine for developers (64.71.164.1xx) ",
id: "id_g_m_280406_2",
link1: "http://www.krugle.com/",
link2: "",
name:
"Krugle/Krugle,Nutch/0.8+ (Krugle web crawler; http://www.krugle.com/crawler/info.html; webcrawler@krugle.com)",
type: "R"
},
%{
comment: "12.129.110.xx",
description: "KnowledgeStorm technology industry crawler for Findtech.com",
id: "id_g_m_180606_2",
link1: "http://www.findtech.com/",
link2: "http://www.knowledgestorm.com/resources/content/crawler/index.html",
name:
"KSbot/1.0 (KnowledgeStorm crawler; http://www.knowledgestorm.com/resources/content/crawler/index.html; crawleradmin@knowledgestorm.com)",
type: "R"
},
%{
comment: "",
description: "Kuloko contextual search robot",
id: "id_g_m_570",
link1: "http://www.kuloko.com/",
link2: "",
name: "kuloko-bot/0.x",
type: "R"
},
%{
comment: "",
description: "Kuloko contextual search robot",
id: "id_g_m_571",
link1: "http://www.kuloko.com",
link2: "",
name: "kulokobot www.kuloko.com kuloko@backweave.com",
type: "R"
},
%{
comment: "",
description: "National Library of Sweden Heritage Project robot",
id: "id_g_m_572",
link1: "http://www.kb.se/ENG/kbstart.htm",
link2: "",
name: "kulturarw3/0.1",
type: "R"
},
%{
comment: "Sanoma also runs some web-portals i.e. http://www.startlap.com/",
description: "Link or server checking from Sanoma Budapest (195.70.35.xxx)",
id: "id_g_m_301105_2",
link1: "http://sanomabp.hu/",
link2: "",
name: "KummHttp/1.1 (compatible; KummClient; Linux rulez)",
type: "C R"
},
%{
comment: "",
description: "UP.Browser for mobiles on Kyocera KWC-KX9 cellphone",
id: "id_g_m_280209_3",
link1: "http://www.openwave.com",
link2: "",
name: "KWC-KX9/1109 UP.Browser/6.2.3.9.g.1.107 (GUI) MMP/2.0 UP.Link/6.3.0.0.0",
type: "B"
},
%{
comment: "http://ir.dcs.gla.ac.uk/wiki/TREC-Blog",
description: "TREC Blog Track - Blog and news feed crawler",
id: "id_g_m_211208_3",
link1: "",
link2: "",
name: "Labrador/0.2; http://ir.dcs.gla.ac.uk/labrador; craigm@dcs.gla.ac.uk",
type: "130.209.241.2xx"
},
%{
comment: "",
description: "Intels Lachesis web site response time monitoring tool",
id: "id_g_m_573",
link1: "ftp://ftp.imag.fr/pub/labo-LSR/DRAKKAR/internet-performance/lachesis/",
link2: "",
name: "Lachesis",
type: "C"
},
%{
comment: "reads robots.txt",
description: "Unknown robot from Easten Network China (202.96.51.1xx)",
id: "id_g_m_140406_1",
link1: "",
link2: "",
name: "lanshanbot/1.0",
type: ""
},
%{
comment: "reads robots.txt",
description: "Unknown robot from Easten Network China (202.96.51.1xx)",
id: "id_g_m_021206_2",
link1: "",
link2: "",
name: "lanshanbot/1.0 (+http://search.msn.com/msnbot.htm)",
type: ""
},
%{
comment: "",
description: "Lapozz search (Hungary) robot (82.131.195.xx)",
id: "id_g_m_271105_1",
link1: "http://www.lapozz.com/",
link2: "",
name: "LapozzBot/1.4 ( http://robot.lapozz.com)",
type: "R"
},
%{
comment: "",
description: "Lapozz search (Hungary) robot (82.131.195.xx)",
id: "id_g_m_280508_3",
link1: "http://www.lapozz.com/",
link2: "",
name: "LapozzBot/1.5 (+http://robot.lapozz.hu)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Metacarta.com (66.28.xx.xxx) robot",
id: "id_g_m_574",
link1: "http://www.metacarta.com/",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin (samualt9@bigfoot.com)",
type: "R"
},
%{
comment: "maybe an e-mail collector - see also Mozilla/4.0 efp@gmx.net",
description: "Unknown robot from 66.230.140.xx (argon.oxeo.com)",
id: "id_g_m_592",
link1: "",
link2: "",
name: "LARBIN-EXPERIMENTAL (efp@gmx.net)",
type: "S"
},
%{
comment: "",
description: "Larbin indexer used by Mitsubishi Electric Research Labs",
id: "id_g_m_575",
link1: "http://www.merl.com",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.1.1 larbin2.1.1@somewhere.com",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Compete.com crawler",
id: "id_g_m_576",
link1: "http://www.compete.com",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.2.0 (crawl@compete.com)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Inria robot",
id: "id_g_m_577",
link1: "http://www.inria.fr/index.en.html",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.2.1_de_Viennot (Laurent.Viennot@inria.fr)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Kyoto University robot",
id: "id_g_m_578",
link1: "http://www.kyoto-u.ac.jp/",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.2.2 (sugayama@lab7.kuis.kyoto-u.ac.jp)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Inria robot",
id: "id_g_m_579",
link1: "http://www.inria.fr/index.en.html",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.2.2_guillaume (guillaume@liafa.jussieu.fr)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by an unknown dsl.net client",
id: "id_g_m_581",
link1: "http://larbin.sourceforge.net/index-eng.html",
link2: "",
name: "larbin_2.6.0 (larbin2.6.0@unspecified.mail)",
type: "R"
},
%{
comment: " ie.: -Central Host Inc. (client) robot ? - Colt Net France robot",
description: "Larbin indexer used by diff. IPs / services",
id: "id_g_m_582",
link1: "http://www.centralhost.com",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.1 (larbin2.6.1@unspecified.mail)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by National Institut of Informatics (NII/Japan)",
id: "id_g_m_583",
link1: "http://www.nii.ac.jp",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.2 (hamasaki@grad.nii.ac.jp)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by diff. IPs",
id: "id_g_m_584",
link1: "http://larbin.sourceforge.net/index-eng.html",
link2: "",
name: "larbin_2.6.2 (larbin2.6.2@unspecified.mail)",
type: "R"
},
%{
comment: "",
description:
"Larbin indexer used as robot by Georgia Institute of Technology http://www.gatech.edu/",
id: "id_g_m_585",
link1: "http://www.gatech.edu",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.2 (listonATccDOTgatechDOTedu)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by Technical University of Crete",
id: "id_g_m_586",
link1: "http://www.systems.tuc.gr",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.2 (pimenas@systems.tuc.gr)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Lemur Consulting robot",
id: "id_g_m_587",
link1: "http://www.lemurconsulting.com",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.2 (tom@lemurconsulting.com)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as robot via cloud9.net (168.100.192.xxx)",
id: "id_g_m_588",
link1: "http://larbin.sourceforge.net/index-eng.html",
link2: "",
name: "larbin_2.6.2 (vitalbox1@hotmail.com)",
type: "R"
},
%{
comment: "reads robots.txt",
description: "Unknown robot from EPFL Lausanne Switzerland (128.178.155.1xx)",
id: "id_g_m_261205_1",
link1: "http://www.epfl.ch/Eindex.html",
link2: "",
name: "larbin_2.6.3 (ltaa_web_crawler@groupes.epfl.ch)",
type: "R"
},
%{
comment: " s. also: - geniebot wgao@genieknows.com",
description: "Larbin indexer used by GenieKnows.com search",
id: "id_g_m_589",
link1: "http://www.genieknows.com",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.3 (wgao@genieknows.com)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by Next Generation Information Retrieval (NGIR)",
id: "id_g_m_590",
link1: "http://cosco.hiit.fi",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6.3_for_(http://cosco.hiit.fi/search/) tsilande@hiit.fi",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used by CEA / DCom Rechercher",
id: "id_g_m_580",
link1: "http://www.cea.fr",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_2.6_basileocaml (basile.starynkevitch@cea.fr)",
type: "R"
},
%{
comment: "",
description: "Larbin indexer used as Inria robot",
id: "id_g_m_591",
link1: "http://pauillac.inria.fr",
link2: "http://larbin.sourceforge.net/index-eng.html",
name: "larbin_devel (http://pauillac.inria.fr/~ailleret/prog/larbin/)",
type: "R"
},
%{
comment: "216.86.137.xx",
description: "LawInfo - Lawyer and attorney directory",
id: "id_g_m_160807_2",
link1: "http://www.lawinfo.com/",
link2: "",
name:
"lawinfo-crawler/Nutch-0.9-dev (Crawler for lawinfo.com pages; http://www.lawinfo.com; webmaster@lawinfo.com)",
type: "R"
},
%{
comment: "",
description: "ROADS - Perl web based subject based gateway tool",
id: "id_g_m_020506_3",
link1: "http://roads.opensource.ac.uk/",
link2: "",
name: "lc/$ROADS::Version libwww-perl/5.00",
type: ""
},
%{
comment: "142.177.168.xxx",
description: "unknown robot via MTT.ca / Aliant.ca",
id: "id_g_m_593",
link1: "",
link2: "",
name: "lcabotAccept: */*",
type: ""
},
%{
comment: "",
description: "LeapTag news reader and content discovery tool",
id: "id_g_m_140408_1",
link1: "http://www.leaptag.com/",
link2: "",
name: "LeapTag/0.8.1.beta081.r3750 (compatible; Mozilla 4.0; MSIE 5.5; robot@yoriwa.com)",
type: "B"
},
%{
comment: "",
description: "Linkexchange crawler",
id: "id_g_m_594",
link1: "http://www.linkexchange.com",
link2: "",
name: "LECodeChecker/3.0 libgetdoc/1.0",
type: "R"
},
%{
comment: "",
description: "Leechget download manager",
id: "id_g_m_595",
link1: "http://www.leechget.de",
link2: "",
name: "LeechGet 200x (www.leechget.de)",
type: "D"
},
%{
comment: "",
description: "Gseek.com (site is offline) robot",
id: "id_g_m_596",
link1: "",
link2: "",
name: "LEIA/2.90",
type: "R"
},
%{
comment: "",
description: "Gseek.com (site is offline) robot",
id: "id_g_m_597",
link1: "",
link2: "",
name: "LEIA/3.01pr (LEIAcrawler; [SNIP])",
type: "R"
},
%{
comment: "website has no function",
description: "Maybe logfile spamming for Lets crawl! search (Germany)",
id: "id_g_m_210106_2",
link1: "http://letscrawl.com/",
link2: "",
name: "LetsCrawl.com/1.0 +http://letscrawl.com/",
type: "S"
},
%{
comment: "",
description: "Lexibot (exMataHari) search software",
id: "id_g_m_598",
link1: "http://www.lexibot.com/index.asp",
link2: "",
name: "LexiBot/1.00",
type: "R"
},
%{
comment: "",
description: "Polaris mobile browser on LG LX 260 Sprint Rumor phone",
id: "id_g_m_140209_2",
link1: "http://www.infraware.co.kr/eng/01_product/product10.asp",
link2: "",
name: "LG-LX260 POLARIS-LX260/2.0 MMP/2.0 Profile/MIDP-2.0 Configuration/CLDC-1.1",
type: "B"
},
%{
comment: "",
description: "LG 8138 Mobile Phone browser",
id: "id_g_m_599",
link1: "",
link2: "",
name: "LG/U8138/v1.0",
type: "B"
},
%{
comment: "",
description: "About.com robot",
id: "id_g_m_600",
link1: "http://www.about.com/",
link2: "",
name: "Libby_1.1/libwww-perl/5.47",
type: "R"
},
%{
comment: "",
description: "libcurl's (multiprotocol file transfer library) standard user-agent name",
id: "id_g_m_100306_1",
link1: "http://curl.haxx.se/libcurl/",
link2: "",
name: "libcurl-agent/1.0",
type: "D"
},
%{
comment: "213.251.135.2xx",
description: "LibertyW search for mobile (France)",
id: "id_g_m_080507_1",
link1: "http://www.lw01.com/en/",
link2: "",
name: "LibertyW (+http://www.lw01.com)",
type: "R"
},
%{
comment: "",
description: "Korea Telecom Search robot",
id: "id_g_m_601",
link1: "http://www.kt.co.kr/kt_home/eng/index.jsp",
link2: "",
name: "libWeb/clsHTTP -- hiongun@kt.co.kr",
type: "R"
},
%{
comment: "",
description: "CMP United Media robot",
id: "id_g_m_602",
link1: "http://www.cmpnet.com",
link2: "",
name: "libwww-perl/5.41",
type: "R"
},
%{
comment: "",
description: "SplatSearch robot (207.44.142.xx)",
id: "id_g_m_603",
link1: "http://www.splatsearch.com",
link2: "",
name: "libwww-perl/5.45",
type: "R"
},
%{
comment: "",
description: "Alexa robot",
id: "id_g_m_604",
link1: "http://www.alexa.com",
link2: "",
name: "libwww-perl/5.48",
type: "R"
},
%{
comment:
" ie.: - secure-netz.de link checking (in conjunction w. LWP::Simple/5.50) -N2H2 Internet filtering",
description: "diff. IPs / services",
id: "id_g_m_605",
link1: "http://www.n2h2.com",
link2: "",
name: "libwww-perl/5.50",
type: "R C P"
},
%{
comment: "",
description: "Fast Search robot",
id: "id_g_m_606",
link1: "http://www.alltheweb.com",
link2: "",
name: "libwww-perl/5.52 FP/2.1",
type: "R"
},
%{
comment: "",
description: "Fast Search robot",
id: "id_g_m_607",
link1: "http://www.alltheweb.com",
link2: "",
name: "libwww-perl/5.52 FP/4.0",
type: "R"
},
%{
comment: " ie.: -iPrism Web filtering software - softclub.net link checking",
description: "diff. IPs / services",
id: "id_g_m_608",
link1: "http://www.stbernard.com/default.asp",
link2: "",
name: "libwww-perl/5.53",
type: "R C P"
},
%{
comment: "",
description: "Profile for You internet profiling (?)",
id: "id_g_m_609",
link1: "http://www.profile4u.com",
link2: "",
name: "libwww-perl/5.63",
type: "R C"
},
%{
comment: "",
description: "unknown link checking from Wanadoo.fr (193.253.33.xxx)",
id: "id_g_m_610",
link1: "",
link2: "",
name: "libwww-perl/5.64",
type: "R C"
},
%{
comment: " s. also amibot",
description: "Amidalla search engine robot (62.241.33.xx)",
id: "id_g_m_611",
link1: "http://www.amidalla.com",
link2: "",
name: "libwww-perl/5.65",
type: "R"
},
%{
comment: "",
description: "SplatSearch robot (72.36.210.xx)",
id: "id_g_m_612",
link1: "http://www.splatsearch.com/",
link2: "",
name: "libwww-perl/5.800",
type: "R"
},
%{
comment: "",
description: "Mediater Rechercher robot",
id: "id_g_m_613",
link1: "http://www.mediater.net",
link2: "",
name: "libwww/5.3.2",
type: "R"
},
%{
comment: "",
description: "Liferea - Linux feed reader",
id: "id_g_m_160206_1",
link1: "http://liferea.sourceforge.net/",
link2: "",
name: "Liferea/0.x.x (Linux; en_US.UTF-8; http://liferea.sf.net/)",
type: "B"
},
%{
comment: "",
description: "Liferea (Linux Feed Reader) news aggregator for Unix and Linux",
id: "id_g_m_140508_4",
link1: "http://liferea.sourceforge.net/",
link2: "",
name: "Liferea/1.x.x (Linux; es_ES.UTF-8; http://liferea.sf.net/)",
type: "B"
},
%{
comment: "",
description: "Lightning Download manager",
id: "id_g_m_614",
link1: "http://www.lightningdownload.com",
link2: "",
name: "LightningDownload/1.0beta2",
type: "D"
},
%{
comment: "",
description: "Lightning Download manager",
id: "id_g_m_615",
link1: "http://www.lightningdownload.com",
link2: "",
name: "LightningDownload/1.x.x",
type: "D"
},
%{
comment: "",
description: "Lightning Download manager",
id: "id_g_m_616",
link1: "http://www.lightningdownload.com",
link2: "",
name: "LightningDownload/1.x.x [Accelerated x]",
type: "D"
},
%{
comment: "216.24.131.1xx",
description: "Lijit blog search spider",
id: "id_g_m_131207_1",
link1: "http://www.lijit.com/",
link2: "",
name:
"LijitSpider/Nutch-0.9 (Reports crawler; http://www.lijit.com/; info(a)lijit(d)com)",
type: "R"
},
%{
comment: "s. this Guestbook http://www.donotenter.com/guestbook/gbook.html",
description: "Some spam bot",
id: "id_g_m_617",
link1: "http://www.donotenter.com/guestbook/gbook.html",
link2: "",
name: "Lincoln State Web Browser",
type: "S"
},
%{
comment: "",
description: "Link Valet online link checking",
id: "id_g_m_618",
link1: "http://www.htmlhelp.com",
link2: "",
name: "Link Valet Online 1.x",
type: "C"
},
%{
comment: "",
description: "Linkalarm link validation",
id: "id_g_m_620",
link1: "http://www.linkalarm.com",
link2: "",
name: "LinkAlarm/2.x",
type: "C"
},
%{
comment: "",
description: "Linkbot Pro link checking software",
id: "id_g_m_621",
link1: "http://www.watchfire.com",
link2: "",
name: "Linkbot",
type: "C"
},
%{
comment: "",
description: "Rpsoft 2000 Site-Crawler",
id: "id_g_m_622",
link1: "http://www.rpsoft2000.com/rps-site-crawler.htm",
link2: "",
name: "linkbot",
type: "R"
},
%{
comment: "",
description: "Linkbot Pro link checking software",
id: "id_g_m_623",
link1: "http://www.watchfire.com",
link2: "",
name: "Linkbot x.0",
type: "C"
},
%{
comment: "",
description: "Linkcheck - linkchecking tool for Unix/Linux",
id: "id_g_m_624",
link1: "http://www.inter7.com",
link2: "",
name: "LinkCheck (linkcheck@inter7.com http://www.inter7.com/linkcheck)",
type: "C"
},
%{
comment: "",
description: "Linklint - Perl html link checker",
id: "id_g_m_625",
link1: "http://www.linklint.org",
link2: "",
name: "LinkLint-checkonly/2.x.x",
type: "C"
},
%{
comment: "",
description: "Linklint - Perl html link checker",
id: "id_g_m_626",
link1: "http://www.linklint.org",
link2: "",
name: "LinkLint-spider/2.x.x",
type: "C"
},
%{
comment: "",
description: "Linknz - The Kiwi Search Engine (New Zealand)",
id: "id_g_m_627",
link1: "http://www.linknz.co.nz",
link2: "",
name: "linknzbot",
type: "R"
},
%{
comment: "216.89.111.x",
description: "Link-Pimp web directory link checking",
id: "id_g_m_280606_1",
link1: "http://www.link-pimp.com/",
link2: "",
name: "LinkPimpin v1.0",
type: "C"
},
%{
comment: "",
description: "TafWeb link checking program",
id: "id_g_m_628",
link1: "http://www.tafweb.com",
link2: "",
name: "LinkProver 2.1",
type: "C"
},
%{
comment: "",
description: "Links text browser for Unix & OS/2",
id: "id_g_m_630",
link1: "http://artax.karlin.mff.cuni.cz/%7Emikulas/links/",
link2: "",
name: "Links (0.9x; Linux 2.4.7-10 i686)",
type: "B"
},
%{
comment: "",
description: "Links text browser for Unix & OS/2",
id: "id_g_m_631",
link1: "http://artax.karlin.mff.cuni.cz/%7Emikulas/links/",
link2: "",
name: "Links (0.9xpre12; Linux 2.2.14-5.0 i686; 80x24)",
type: "B"
},
%{
comment: "",
description: "Links text browser for Unix & OS/2",
id: "id_g_m_632",
link1: "http://artax.karlin.mff.cuni.cz/%7Emikulas/links/",
link2: "",
name: "Links (2.xpre7; Linux 2.4.18 i586; x)",
type: "B"
},
%{
comment: "",
description: "Links SQL directory management program",
id: "id_g_m_629",
link1: "http://gossamer-threads.com/scripts/links/",
link2: "",
name: "Links - http://gossamer-threads.com/scripts/links/",
type: "C"
},
%{
comment: "",
description: "Links SQL directory management program",
id: "id_g_m_633",
link1: "http://gossamer-threads.com/scripts/links/",
link2: "",
name: "Links 2.0 (http://gossamer-threads.com/scripts/links/)",
type: "R"
},
%{
comment: "",
description: "Links SQL directory management program",
id: "id_g_m_634",
link1: "http://gossamer-threads.com/scripts/links-sql/",
link2: "",
name: "Links SQL (http://gossamer-threads.com/scripts/links-sql/)",
type: "R"
},
%{
comment: "209.190.5.2xx",
description: "Links4us ODP based directory link checking",
id: "id_g_m_280406_3",
link1: "http://links4us.com/",
link2: "",
name: "Links4US-Crawler, (+http://links4us.com/)",
type: "C"
},
%{
comment: "",
description: "Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)",
id: "id_g_m_635",
link1: "http://www.elsop.com",
link2: "http://indiafocus.indiainfo.com/",
name:
"LinkScan/11.0beta2 UnixShareware robot from Elsop.com (used by Indiafocus/Indiainfo)",
type: "R"
},
%{
comment: "",
description: "Shareware robot from Elsop.com (used by Indiafocus/Indiainfo and others)",
id: "id_g_m_636",
link1: "http://www.elsop.com",
link2: "http://indiafocus.indiainfo.com/",
name: "LinkScan/9.0g Unix",
type: "R"
},
%{
comment: "",
description: "Shareware robot from Elsop.com",
id: "id_g_m_637",
link1: "http://www.elsop.com",
link2: "",
name: "LinkScan/x.x Unix",
type: "R"
},
%{
comment: "s.also Mozilla/5.0 (compatible; LinksManager.com_bot...",
description: "Linksmanager bookmark checking",
id: "id_g_m_638",
link1: "http://linksmanager.com/linkchecker.html",
link2: "",
name: "LinksManager.com (http://linksmanager.com/linkchecker.html)",
type: "C"
},
%{
comment: "",
description: "LinkSonar (Japan) link checking tool",
id: "id_g_m_639",
link1: "http://hp.vector.co.jp/authors/VA014575/chicchi/linksonar/readme.html",
link2: "",
name: "LinkSonar/1.35",
type: "C"
},
%{
comment: "",
description: "Left Side Software's LinkSweeper (ceased) bookmark utility",
id: "id_g_m_640",
link1: "http://www.lss.com.au/lss/lss_main.htm",
link2: "",
name: "LinkSweeper/1.x",
type: "C"
},
%{
comment: "",
description: "Seventwentyfour link checking robot",
id: "id_g_m_641",
link1: "http://www.seventwentyfour.com",
link2: "",
name: "LinkWalker",
type: "C"
},
%{
comment: "",
description: "link check 3 - Perl HTML link checker (from Perl for Web Site Management)",
id: "id_g_m_619",
link1: "http://www.elanus.net/cgi/examples.cgi/view/ex_1102.txt",
link2: "",
name: "link_check3.plx libwww-perl/5.65",
type: "C"
},
%{
comment: "",
description: "Listbid.com / Directnic.com link checking ?",
id: "id_g_m_642",
link1: "http://listbid.com",
link2: "",
name:
"ListBidBot (freelance job spider http://listbid.com)<a href=http://listbid.com>Freelance</a>",
type: "R C"
},
%{
comment: "140.109.19.1xx",
description: "WKD Lab: LiveTrans - Online query and terminology translation service",
id: "id_g_m_031107_3",
link1: "http://wkd.iis.sinica.edu.tw/LiveTrans/",
link2: "",
name:
"LiveTrans/Nutch-0.9 (maintainer: cobain at iis dot sinica dot edu dot tw; http://wkd.iis.sinica.edu.tw/LiveTrans/)",
type: "R"
},
%{
comment: "",
description: "llaut robot - Universitat de les Illes Balears (Spain)",
id: "id_g_m_643",
link1: "http://mnm.uib.es",
link2: "",
name: "Llaut/1.0 (http://mnm.uib.es/~gallir/llaut/bot.html)",
type: "R"
},
%{
comment: "64.124.152.xx",
description: "E-Mail harvesting robot - same as ContactBot",
id: "id_g_m_200307_2",
link1: "",
link2: "",
name: "LMQueueBot/0.2",
type: "S"
},
%{
comment: "see here",
description: "lmspider from Scansoft (192.133.61.xx) - Web text collector",
id: "id_g_m_644",
link1: "http://www.kahunaburger.com/blog/archives/000117.html",
link2: "",
name: "lmspider (lmspider@scansoft.com)",
type: "R"
},
%{
comment: "",
description: "Lexis-Nexis robot",
id: "id_g_m_645",
link1: "http://www.lexis-nexis.com/",
link2: "",
name: "LNSpiderguy",
type: "R"
},
%{
comment: "",
description: "LocalBot company information collector",
id: "id_g_m_300106_4",
link1: "http://www.localbot.co.uk/",
link2: "",
name: "LocalBot/1.0 ( http://www.localbot.co.uk/)",
type: "R"
},
%{
comment: "",
description: "Local.com local search robot (216.52.252.xxx)",
id: "id_g_m_646",
link1: "http://www.local.com/",
link2: "",
name: "LocalcomBot/1.2.x ( http://www.local.com/bot.htm)",
type: "R"
},
%{
comment: "",
description: "Lockstep (website content protection tool) user agent",
id: "id_g_m_647",
link1: "http://www.lockstep.com",
link2: "",
name: "Lockstep Spider/1.0",
type: "R"
},
%{
comment: "",
description: "GlobalQueue spider (64.40.105.xxx)",
id: "id_g_m_648",
link1: "http://www.multi-mode.com/",
link2: "",
name: "Look.com",
type: "R"
},
%{
comment: "",
description: "Lotus Notes browser",
id: "id_g_m_649",
link1: "",
link2: "",
name: "Lotus-Notes/4.5 ( Windows-NT )",
type: "B"
},
%{
comment: "",
description: "IBM Lotus Discovery Server",
id: "id_g_m_650",
link1:
"http://www-142.ibm.com/software/sw-lotus/products/product3.nsf/wdocs/644012e0434859b585256ec9006d37b8",
link2: "",
name: "LotusDiscovery/x.0 (compatible; Mozilla 4.0; MSIE 4.01; Windows NT)",
type: ""
},
%{
comment: "80.91.191.2xx",
description: "Everatom.com song lyrics search",
id: "id_g_m_051207_1",
link1: "http://www.everatom.com",
link2: "",
name: "Lovel as 1.0 ( +http://www.everatom.com)",
type: "R"
},
%{
comment: "68.180.139.12x",
description:
"LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo",
id: "id_g_m_100308_2",
link1: "http://www.lemurproject.org/",
link2: "http://www.yahoo.com/",
name:
"LTI/LemurProject Nutch Spider/Nutch-1.0-dev (lti crawler for CMU; http://www.lti.cs.cmu.edu; changkuk at cmu dot edu)",
type: "R"
},
%{
comment: "68.180.139.12x",
description:
"LTI - The Lemur Toolkit for Language Modeling and Information Retrieval via Yahoo",
id: "id_g_m_050208_3",
link1: "http://www.lemurproject.org/",
link2: "http://www.yahoo.com/",
name:
"LTI/LemurProject Nutch Spider/Nutch-1.0-dev (Research spider using Nutch; http://www.lemurproject.org; mhoy@cs.cmu.edu)",
type: "R"
},
%{
comment: "",
description: "Luchs.at (Linux Wiki) link checking",
id: "id_g_m_651",
link1: "http://web.luchs.at/information/linkchecker.php",
link2: "",
name: "luchs.at URL checker",
type: "C"
},
%{
comment: "s. also Mozilla/4.0 (... Lunascape ...)",
description: "Lunascape IE based browser (Japan)",
id: "id_g_m_090106_1",
link1: "http://www2.lunascape.jp/index.aspx",
link2: "",
name: "Lunascape",
type: "B"
},
%{
comment: "",
description: "Ultimate Search / Smartdesk (no website) robot",
id: "id_g_m_652",
link1: "",
link2: "",
name: "lwp-trivial/1.32",
type: "R"
},
%{
comment: "",
description: "Search4free robot",
id: "id_g_m_653",
link1: "http://www.search4free.com",
link2: "",
name: "lwp-trivial/1.34",
type: "R"
},
%{
comment: "",
description: "Search4free robot",
id: "id_g_m_654",
link1: "http://www.search4free.com",
link2: "",
name: "lwp-trivial/1.34",
type: "R"
},
%{
comment: "",
description: "Expert HTML online source viewer",
id: "id_g_m_656",
link1: "http://www.expert-html.com/",
link2: "",
name: "lwp-trivial/1.35",
type: "B"
},
%{
comment: "",
description: "Expert HTML online source viewer",
id: "id_g_m_655",
link1: "http://www.expert-html.com/",
link2: "",
name: "lwp-trivial/1.35",
type: "B"
},
%{
comment: "",
description: "Perl LWP:Collective module",
id: "id_g_m_657",
link1: "http://www.thatrobotsite.com",
link2: "",
name: "LWP::Simple/5.22",
type: "R"
},
%{
comment: "",
description: "Perl LWP:Collective module",
id: "id_g_m_658",
link1: "http://www.thatrobotsite.com",
link2: "",
name: "LWP::Simple/5.36",
type: "R"
},
%{
comment: "",
description: "Perl LWP:Collective module - Linkomatic robot",
id: "id_g_m_659",
link1: "http://www.linkomatic.com/",
link2: "http://www.thatrobotsite.com",
name: "LWP::Simple/5.48",
type: "R"
},
%{
comment: "",
description:
"Perl LWP:Collective module - secure-netz.de link checking (in conjunction w. libwww-perl/5.50)",
id: "id_g_m_660",
link1: "http://www.secure-netz.de",
link2: "http://www.thatrobotsite.com",
name: "LWP::Simple/5.50",
type: "R"
},
%{
comment: "",
description: "Perl LWP:Collective module - Inktomi (62.253.64.x) robot",
id: "id_g_m_661",
link1: "http://www.inktomi.com/",
link2: "http://www.thatrobotsite.com",
name: "LWP::Simple/5.51",
type: "R"
},
%{
comment: "in conjunction w. Spida/0.1",
description: "Perl LWP:Collective module - Only.com ",
id: "id_g_m_662",
link1: "http://www.only.com",
link2: "http://www.thatrobotsite.com",
name: "LWP::Simple/5.53",
type: "R"
},
%{
comment: "",
description: "Perl LWP:Collective module",
id: "id_g_m_663",
link1: "http://www.thatrobotsite.com",
link2: "",
name: "LWP::Simple/5.63",
type: "R"
},
%{
comment:
"appears also as Poirot - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)",
description:
"ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx",
id: "id_g_m_291105_3",
link1: "http://spamhuntress.com/wiki/Manila_Industries",
link2: "",
name: "LWP::Simple/5.803",
type: "S"
},
%{
comment: "",
description: "Lycos spider",
id: "id_g_m_664",
link1: "http://www.lycos.com",
link2: "",
name: "Lycos_Spider_(modspider)",
type: "R"
},
%{
comment: "",
description: "Lycos spider",
id: "id_g_m_665",
link1: "http://www.lycos.com",
link2: "",
name: "Lycos_Spider_(T-Rex)",
type: "R"
},
%{
comment: "",
description: "Bobcat - Text and Lynx based DOS browser",
id: "id_g_m_200308_2",
link1: "http://www.fdisk.com/doslynx/bobcat.htm",
link2: "",
name: "Lynx/2-4-2 (Bobcat/0.5 [DOS] Jp Beta04)",
type: "B"
},
%{
comment: "",
description: "Lynx 2.x text mode browser",
id: "id_g_m_666",
link1: "http://lynx.browser.org/",
link2: "",
name: "Lynx/2.6 libwww-FM/2.14",
type: "B"
},
%{
comment: "208.113.176.x[xx]",
description:
"seebot.org online service - uses lynx browser for crawlers view of web pages",
id: "id_g_m_180108_1",
link1: "http://seebot.org/",
link2: "",
name: "Lynx/2.8 (;http://seebot.org)",
type: "B"
},
%{
comment: "",
description: "Lynx 2.x text mode browser",
id: "id_g_m_667",
link1: "http://lynx.browser.org/",
link2: "",
name: "Lynx/2.8.3dev.9 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6",
type: "B"
},
%{
comment: "",
description: "Lynx 2.x text mode browser used as robot via cogentco.com",
id: "id_g_m_668",
link1: "",
link2: "",
name:
"Lynx/2.8.4rel.1 libwww-FM/2.14 SSL-MM/1.4.1 OpenSSL/0.9.6c (human-guided@lerly.net)",
type: "R"
},
%{
comment: "",
description: "Some spam bot",
id: "id_g_m_669",
link1: "http://www.kloth.net/internet/badbots.php",
link2: "",
name: "Mac Finder 1.0.xx",
type: "S"
},
%{
comment: "s. also UKWizz/Nutch",
description: "UKWizz search robot",
id: "id_g_m_670",
link1: "http://www.ukwizz.com",
link2: "",
name: "Mackster( http://www.ukwizz.com )",
type: "R"
},
%{
comment: "",
description: "Wind.it client user-agent ?",
id: "id_g_m_671",
link1: "",
link2: "",
name: "Mag-Net",
type: ""
},
%{
comment: "",
description: "All Magic/Wap wml service for mobile devices",
id: "id_g_m_180606_3",
link1: "http://allmagic3.com/wap/",
link2: "",
name: "MagicWML/1.0 (forcewml)",
type: "P"
},
%{
comment: "",
description: "Magpie RSS - PHP RSS Parser",
id: "id_g_m_061206_1",
link1: "http://magpierss.sourceforge.net/",
link2: "",
name: "MagpieRSS/0.7x (+http://magpierss.sf.net)",
type: "B"
},
%{
comment: "72.167.143.1x",
description: "Mahiti.com India search crawler",
id: "id_g_m_030308_1",
link1: "http://mahiti.com/",
link2: "",
name: "Mahiti.Com/Mahiti Crawler-1.0 (Mahiti.Com; http://mahiti.com ; mahiti.com)",
type: "R"
},
%{
comment: "194.186.55.2xx",
description: "Mail.ru search",
id: "id_g_m_020707_2",
link1: "http://www.mail.ru/",
link2: "",
name: "Mail.Ru/1.0",
type: "R"
},
%{
comment: "",
description: "Unknown Bea robot",
id: "id_g_m_672",
link1: "http://www.beasys.com",
link2: "",
name: "mailto:webcraft@bea.com",
type: "R"
},
%{
comment: "s. also Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1",
description: "SLI Systems mammoth robot",
id: "id_g_m_673",
link1: "http://www.sli-systems.com/",
link2: "http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M",
name: "mammoth/1.0 ( http://www.sli-systems.com/)",
type: "R"
},
%{
comment: "",
description: "Looksmart robot",
id: "id_g_m_674",
link1: "http://www.looksmart.com",
link2: "",
name: "MantraAgent",
type: "R"
},
%{
comment: "",
description: "Map of the Internet visual search engine index robot",
id: "id_g_m_675",
link1: "http://MapoftheInternet.com",
link2: "",
name: "MapoftheInternet.com ( http://MapoftheInternet.com)",
type: "R"
},
%{
comment: "",
description: "Kolibri.de robot",
id: "id_g_m_676",
link1: "http://www.kolibri.de",
link2: "",
name: "Mariner/5.1b [de] (Win95; I ;Kolibri gncwebbot)",
type: "R"
},
%{
comment: "",
description: "Pilot Hitlist web site analysis",
id: "id_g_m_677",
link1: "http://www.marketwave.com/products_solutions/hitlist.html",
link2: "",
name: "Marketwave Hit List",
type: "R"
},
%{
comment: "",
description: "Looksmart directory page analysis",
id: "id_g_m_678",
link1: "http://www.looksmart.com",
link2: "",
name: "Martini",
type: "R"
},
%{
comment: "",
description: "Looksmart directory page analysis",
id: "id_g_m_679",
link1: "http://www.looksmart.com",
link2: "",
name: "MARTINI",
type: "R"
},
%{
comment: "",
description: "Marvin Medhunt robot",
id: "id_g_m_680",
link1: "http://www.hon.ch/MedHunt/Marvin.html",
link2: "",
name: "Marvin v0.3",
type: "R"
},
%{
comment: "124.32.246.xx",
description: "Sagool search Japan robot",
id: "id_g_m_270606_1",
link1: "http://sagool.jp/",
link2: "",
name: "MaSagool/1.0 (MaSagool; http://sagool.jp/; info@sagool.jp)",
type: "R"
},
%{
comment: "",
description: "Mass Downloader download manager",
id: "id_g_m_681",
link1: "http://www.metaproducts.com",
link2: "",
name: "Mass Downloader 2.x",
type: "D"
},
%{
comment: "",
description: "Masterseek (Scandinavia) Beta business search ?",
id: "id_g_m_682",
link1: "http://www.masterseek.com",
link2: "",
name: "MasterSeek",
type: "R"
},
%{
comment: "",
description: "Lexibot (exMataHari) search software",
id: "id_g_m_683",
link1: "http://www.lexibot.com",
link2: "",
name: "Mata Hari/2.00 ",
type: "R"
},
%{
comment: "",
description: "Virgilio Italy robot (212.48.11.xxx) using Fast Enterprise Search",
id: "id_g_m_684",
link1: "http://www.virgilio.it",
link2: "",
name: "Matrix S.p.A. - FAST Enterprise Crawler 6 (Unknown admin e-mail address)",
type: "R"
},
%{
comment: "",
description: "Maxomo multimedia search robot",
id: "id_g_m_685",
link1: "http://www.maxomo.com",
link2: "",
name:
"maxomobot/dev-20051201 (maxomo; http://67.102.134.34:4047/MAXOMO/MAXOMObot.html; maxomobot@maxomo.com)",
type: "R"
},
%{
comment: "",
description: "Unknown robot from McAfee Austria (80.123.144.xx)",
id: "id_g_m_686",
link1: "",
link2: "",
name: "McBot/5.001 (windows; U; NT4.0; en-us)",
type: ""
},
%{
comment: "91.121.83.19x",
description: "MegaDownload files search robot",
id: "id_g_m_290108_1",
link1: "http://www.megadownload.net/",
link2: "http://www.megadownload.net/bot.html",
name: "MDbot/1.0 (+http://www.megadownload.net/bot.html)",
type: "R"
},
%{
comment: "",
description: "Substitute for Windows Media Player",
id: "id_g_m_170306_1",
link1: "http://sourceforge.net/projects/guliverkli/",
link2: "",
name: "Media Player Classic",
type: "B"
},
%{
comment: "",
description: "Media Find crawler",
id: "id_g_m_687",
link1: "http://www.mediacrawler.de",
link2: "",
name: "MediaCrawler-1.0 (Experimental)",
type: "R"
},
%{
comment: "",
description: "Google AdSense robot",
id: "id_g_m_688",
link1: "http://www.google.com/ads/",
link2: "",
name: "Mediapartners-Google/2.1 ( http://www.googlebot.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "WWW.fi Media Search",
id: "id_g_m_689",
link1: "http://www.fi/haku/",
link2: "",
name: "MediaSearch/0.1",
type: "R"
},
%{
comment: "",
description: "Search UK robot",
id: "id_g_m_690",
link1: "http://www.searchuk.com",
link2: "",
name: "MegaSheep v1.0 (www.searchuk.com internet sheep)",
type: "R"
},
%{
comment: "",
description: "Megite web2.0 RSS and news service software",
id: "id_g_m_131107_1",
link1: "http://www.megite.com/",
link2: "",
name: "Megite2.0 (http://www.megite.com)",
type: "R"
},
%{
comment: "",
description: "Mercator crawler software (used by Altavista)",
id: "id_g_m_691",
link1: "http://www.research.compaq.com",
link2: "",
name: "Mercator-1.x",
type: "R"
},
%{
comment: "",
description: "Mercator crawler software (used by Altavista)",
id: "id_g_m_692",
link1: "http://www.research.compaq.com",
link2: "",
name: "Mercator-2.0",
type: "R"
},
%{
comment: "",
description: "Mercator crawler software (used by Altavista)",
id: "id_g_m_693",
link1: "http://www.research.compaq.com",
link2: "",
name: "Mercator-Scrub-1.1",
type: "R"
},
%{
comment: "83.97.31.1xx",
description: "MetaEuro.com Clustering Web Search Engine crawler",
id: "id_g_m_070207_1",
link1: "http://www.metaeuro.com/",
link2: "",
name:
"Metaeuro Web Crawler/0.2 (MetaEuro Web Search Clustering Engine; http://www.metaeuro.com; crawler at metaeuro dot com)",
type: "R"
},
%{
comment: "130.75.2.xx",
description: "MetaGer search robot (Germany)",
id: "id_g_m_694",
link1: "http://www.metager.de/",
link2: "",
name: "MetaGer-LinkChecker",
type: "R"
},
%{
comment: "130.75.2.xx",
description: "MetaGer search robot (Germany)",
id: "id_g_m_270706_1",
link1: "http://www.metager.de/",
link2: "",
name: "MetagerBot/0.8-dev (MetagerBot; http://metager.de; )",
type: "R"
},
%{
comment: "130.75.2.xx",
description: "MetaGer search robot (Germany)",
id: "id_g_m_060307_1",
link1: "http://www.metager.de/",
link2: "",
name: "MetaGer_PreChecker0.1",
type: "R"
},
%{
comment: "",
description: "Download Express download manager",
id: "id_g_m_695",
link1: "http://www.metaproducts.com",
link2: "",
name: "MetaProducts Download Express/1.x",
type: "D"
},
%{
comment: "",
description: "Metaspinner search robot - Germany",
id: "id_g_m_696",
link1: "http://www.meta-spinner.de/",
link2: "",
name:
"Metaspinner/0.01 (Metaspinner; http://www.meta-spinner.de/; support@meta-spinner.de/)",
type: "R"
},
%{
comment: "206.196.111.2xx",
description: "Metatagsdir.com directory index spider",
id: "id_g_m_300407_1",
link1: "http://metatagsdir.com/directory/",
link2: "",
name: "metatagsdir/0.7 (+http://metatagsdir.com/directory/)",
type: "R"
},
%{
comment: "appears also as Full Web Bot 0516B or Demo Bot Z 16b",
description:
"Microsoft Foundation Class Library - i.e. used for e-mail harvesting from 68.154.96.xx (bellsouth.net)",
id: "id_g_m_697",
link1: "",
link2: "",
name: "MFC Foundation Class Library 4.0",
type: "S"
},
%{
comment: "",
description: "Microsoft.com user agent",
id: "id_g_m_698",
link1: "",
link2: "",
name: "MFC_Tear_Sample",
type: ""
},
%{
comment: "",
description: "Advanced Site Crawler web site ripper and extractor",
id: "id_g_m_699",
link1: "http://www.innovative.go.ro/sitecrawler/index.htm",
link2: "",
name: "MFHttpScan",
type: "D"
},
%{
comment: " s. also - gigabaz/3.1x ...",
description: "GigaBaz Brainbot (Germany) robot (213.139.152.xx)",
id: "id_g_m_700",
link1: "http://brainbot.com//site3",
link2: "",
name: "MicroBaz",
type: "R"
},
%{
comment: "",
description: "MS Office 2000 acting as WebDAV client",
id: "id_g_m_701",
link1: "",
link2: "",
name: "Microsoft Data Access Internet Publishing Provider Cache Manager",
type: "B P"
},
%{
comment: "",
description: "MS Office 2000 acting as WebDAV client",
id: "id_g_m_702",
link1: "",
link2: "",
name: "Microsoft Data Access Internet Publishing Provider DAV",
type: "B"
},
%{
comment: "",
description:
"Server probe for data access operations using MS Frontpage with OPTION header",
id: "id_g_m_704",
link1: "",
link2: "",
name: "Microsoft Data Access Internet Publishing Provider Protocol Discovery",
type: "B C"
},
%{
comment: "",
description: "MS Office 2000 acting as WebDAV client",
id: "id_g_m_703",
link1: "",
link2: "",
name: "Microsoft Data Access Internet Publishing Provider Protocol Discovery",
type: "B C"
},
%{
comment: "",
description: "Microsoft Log Parser text query tool",
id: "id_g_m_190807_2",
link1: "http://www.microsoft.com/technet/scriptcenter/tools/logparser/default.mspx",
link2: "",
name: "Microsoft Log Parser 2.2",
type: "D"
},
%{
comment: "Indexing from Microsoft: 204.71.191.xx",
description: "MS Small Business Server content indexer",
id: "id_g_m_180306_1",
link1: "http://www.microsoft.com/windowsserver2003/sbs/default.mspx",
link2: "",
name: "Microsoft Small Business Indexer",
type: "R"
},
%{
comment: "",
description: "user agent looks for form-mail components (spam-bot)",
id: "id_g_m_705",
link1: "",
link2: "",
name: "Microsoft URL Control - 6.00.8xxx",
type: "S"
},
%{
comment: "",
description: "Unknown robot from Microsoft.com (131.107.163.xx)",
id: "id_g_m_707",
link1: "",
link2: "",
name: "MicrosoftPrototypeCrawler (How's my crawling? mailto:newbiecrawler@hotmail.com)",
type: "R"
},
%{
comment: "",
description: "Secure Computing SmartFilterWhere / Bess web filter (192.55.214.xx)",
id: "id_g_m_706",
link1: "http://www.securecomputing.com/index.cfm?skey=22",
link2: "",
name: "Microsoft_Internet_Explorer_5.00.438 (fjones@isd.net)",
type: "P"
},
%{
comment: "",
description: "xpc-mii.net HTTP server message",
id: "id_g_m_708",
link1: "",
link2: "",
name: "MIIxpc/4.2",
type: "P"
},
%{
comment: "80.229.1xx",
description: "The Mindjet blog MindManager category",
id: "id_g_m_130807_2",
link1: "http://blog.mindjet.com/category/mindjet/mindmanager/",
link2: "",
name: "Mindjet MindManager",
type: "D"
},
%{
comment: "",
description: "unknown robot via Korea Telecom (211.218.xxx.xxx)",
id: "id_g_m_709",
link1: "",
link2: "",
name: "minibot",
type: ""
},
%{
comment: "64.230.71.2xx",
description: "mini- Rank website popularity tool",
id: "id_g_m_110506_2",
link1: "http://www.minirank.com/",
link2: "",
name: "miniRank/1.6 (Website ranking; www.minirank.com; robot)",
type: "C"
},
%{
comment: "",
description: "unknown robot via nec.co.jp Telecom (210.143.35.xx)",
id: "id_g_m_710",
link1: "",
link2: "",
name: "MiracleAlphaTest",
type: ""
},
%{
comment: "",
description: "Some spam bot",
id: "id_g_m_711",
link1: "http://www.neilgunton.com/spambot_trap/appendix/",
link2: "",
name: "Missauga Locate 1.0.0",
type: "S"
},
%{
comment: "",
description: "Some spam bot",
id: "id_g_m_712",
link1: "http://www.neilgunton.com/spambot_trap/appendix/",
link2: "",
name: "Missigua Locator 1.9",
type: "S"
},
%{
comment: "",
description: "Some spam bot",
id: "id_g_m_713",
link1: "",
link2: "",
name: "Missouri College Browse",
type: "S"
},
%{
comment: "",
description: "Mister PiX picture finding software",
id: "id_g_m_714",
link1: "http://www.mister-pix.com/",
link2: "",
name: "Mister Pix II 2.02a",
type: "D R"
},
%{
comment: "",
description: "Mister PiX picture finding software",
id: "id_g_m_715",
link1: "http://www.mister-pix.com/",
link2: "",
name: "Mister PiX version.dll",
type: "D R"
},
%{
comment: "",
description: "Misterbot search France robot",
id: "id_g_m_110206_3",
link1: "http://www.misterbot.fr/",
link2: "",
name:
"Misterbot-Nutch/0.7.1 (Misterbot-Nutch; http://www.misterbot.fr; admin@misterbot.fr)",
type: "R"
},
%{
comment: "",
description: "Miva / ex Findwhat.com search robot (66.150.55.2xx)",
id: "id_g_m_716",
link1: "http://www.miva.com/",
link2: "",
name: "Miva (AlgoFeedback@miva.com)",
type: "R"
},
%{
comment: "s. link ",
description: "Some spam bot from Jasmine Internet - Bangkok (203.147.0.xx)",
id: "id_g_m_141105_2",
link1:
"http://www.projecthoneypot.org/ip_inspector.php?iph=7bc2eae614063a45b0e1d0786dbe6a2e",
link2: "",
name: "Mizzu Labs 2.2",
type: "S"
},
%{
comment: "",
description: "Majestic-12 DSearch MJ12bot (Experimental distributed crawler)",
id: "id_g_m_080706_3",
link1: "http://www.majestic12.co.uk/projects/dsearch/",
link2: "",
name: "MJ12bot/vx.x.x (http://majestic12.co.uk/bot.php?+)",
type: "R"
},
%{
comment: "",
description: "Majestic-12 DSearch MJ12bot (Experimental distributed crawler)",
id: "id_g_m_717",
link1: "http://www.majestic12.co.uk/projects/dsearch/mj12bot.php",
link2: "",
name: "MJ12bot/vx.x.x (http://www.majestic12.co.uk/projects/dsearch/mj12bot.php)",
type: "R"
},
%{
comment: "217.8.248.19x",
description: "MJB SEO Club MJBot",
id: "id_g_m_200108_1",
link1: "http://www.mjbdata.com/information/",
link2: "",
name: "MJBot (SEO assessment)",
type: "R"
},
%{
comment: "",
description: "MLBot - metadata labs web crawler for building a media index (beta)",
id: "id_g_m_030308_2",
link1: "http://www.metadatalabs.com/",
link2: "",
name: "MLBot (www.metadatalabs.com)",
type: "R"
},
%{
comment: "",
description: "mnoGoSearch (ex UdmSearch) software robot",
id: "id_g_m_718",
link1: "http://mnogosearch.org/",
link2: "",
name: "MnogoSearch/3.2.xx",
type: "R"
},
%{
comment: "see link:",
description: "Unknown bad bot - maybe guestbook spamming or email harvesting",
id: "id_g_m_260306_3",
link1: "http://www.kloth.net/internet/badbots.php",
link2: "",
name: "Mo College 1.9",
type: "S"
},
%{
comment: "s. also ichiro",
description: "Goo Japan / Inktomi robot (210.173.179.xx)",
id: "id_g_m_719",
link1: "http://www.goo.ne.jp",
link2: "",
name: "moget/x.x (moget@goo.ne.jp)",
type: "R"
},
%{
comment: "s. also ichiro",
description: "Goo Japan / Inktomi robot (210.173.179.xx)",
id: "id_g_m_720",
link1: "http://www.goo.ne.jp",
link2: "",
name: "mogimogi/1.0",
type: "R"
},
%{
comment: "",
description: "moiNag - net.art generator",
id: "id_g_m_721",
link1: "http://soundwarez.org/generator/moiNAG/",
link2: "",
name: "moiNAG 0.02",
type: "R D"
},
%{
comment: "s.also Mozilla/5.0 (compatible; MojeekBot/2.0 ...",
description: "Mojeek Search Preview robot (217.155.205.xx)",
id: "id_g_m_722",
link1: "http://www.mojeek.com",
link2: "",
name: "MojeekBot/0.x (archi; http://www.mojeek.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Greasemonkey Firefox extension",
id: "id_g_m_150407_1",
link1: "http://www.greasespot.net/",
link2: "http://diveintogreasemonkey.org/install/what-is-greasemonkey.html",
name: "monkeyagent",
type: "D"
},
%{
comment: "",
description: "Moonbrowser - IE based browser (Japan)",
id: "id_g_m_090106_2",
link1: "http://www.geocities.co.jp/SiliconValley-Cupertino/8986/",
link2: "",
name: "MoonBrowser (version 0.41 Beta4)",
type: "B"
},
%{
comment: "72.13.32.x",
description: "Moreover / FeedDirect RSS feed robot",
id: "id_g_m_010307_2",
link1: "http://w.moreover.com/",
link2: "http://www.feeddirect.com/",
name: "Moreoverbot/x.00 (+http://www.moreover.com)",
type: "C"
},
%{
comment: "",
description: "MixCat robot s. also Felix",
id: "id_g_m_723",
link1: "http://mixcat.com",
link2: "",
name: "Morris - Mixcat Crawler ( http://mixcat.com)",
type: "R"
},
%{
comment: "",
description: "Robots.txt online checker",
id: "id_g_m_100206_2",
link1: "http://tool.motoricerca.info/robots-checker.phtml",
link2: "",
name:
"Motoricerca-Robots.txt-Checker/1.0 (http://tool.motoricerca.info/robots-checker.phtml)",
type: "C"
},
%{
comment: "",
description: "Obigo WAP browser for mobiles on Motorola V3",
id: "id_g_m_240108_1",
link1: "http://www.obigo.com/",
link2: "http://en.wikipedia.org/wiki/Obigo_Browser",
name: "Motorola-V3m Obigo",
type: "B"
},
%{
comment: "",
description: "MPRM Group Ltd. Spider Monkey robot",
id: "id_g_m_724",
link1: "http://www.spidermonkey.ca/sm.shtml",
link2: "",
name: "Mouse-House/7.4 (spider_monkey spider info at www.mobrien.com/sm.shtml)",
type: "R"
},
%{
comment: "",
description: "Movable Type web-based personal publishing system",
id: "id_g_m_725",
link1: "http://www.movabletype.org",
link2: "",
name: "MovableType/x.x",
type: "B"
},
%{
comment: "",
description: "Mozdex Open search engine spider (65.98.100.2xx)",
id: "id_g_m_726",
link1: "http://www.mozdex.com/",
link2: "",
name: "mozDex/0.xx-dev (mozDex; http://www.mozdex.com/en/bot.html; spider@mozdex.com)",
type: "R"
},
%{
comment: "",
description: "Bell Nexxia / Sympatico Canada user robot & spoofed referer from diff. IPs",
id: "id_g_m_727",
link1: "",
link2: "",
name: "Mozi!",
type: ""
},
%{
comment: "",
description: "Unknown robots from diff. IPs",
id: "id_moz_728",
link1: "",
link2: "",
name: "Mozilla",
type: ""
},
%{
comment: "",
description: "libwhisker - HTTP client and utility - Perl library",
id: "id_moz_100109_3",
link1: "http://www.wiretrip.net/rfp/lw.asp",
link2: "",
name: "Mozilla (libwhisker/2.4)",
type: ""
},
%{
comment: "",
description: "http://www.somewhere.com robot",
id: "id_moz_729",
link1: "http://www.somewhere.com",
link2: "",
name: "Mozilla (Mozilla@somewhere.com)",
type: "R"
},
%{
comment: "130.203.154.2xx",
description: "BotSeer search engine for robots.txt",
id: "id_moz_041007_1",
link1: "http://botseer.ist.psu.edu/",
link2: "http://botseer.ist.psu.edu/about.html",
name: "Mozilla 4.0(compatible; BotSeer/1.0; +http://botseer.ist.psu.edu)",
type: "R"
},
%{
comment: "",
description: "PDA Pocket IE 2.x Windows CE",
id: "id_moz_731",
link1: "",
link2: "",
name: "Mozilla/1.1 (compatible; MSPIE 2.0; Windows CE)",
type: "B"
},
%{
comment: "",
description: "Oregano browser for RISC OS",
id: "id_moz_732",
link1: "http://www.crashnet.org.uk",
link2: "",
name: "Mozilla/1.10 [en] (Compatible; RISC OS 3.70; Oregano 1.10)",
type: "B"
},
%{
comment: "",
description: "IE 2.x WinNT",
id: "id_moz_730",
link1: "",
link2: "",
name: "Mozilla/1.22 (compatible; MSIE 2.0d; Windows NT)",
type: "B"
},
%{
comment: "",
description: "EudoraWeb 2.0 browser (Eudora Internet Suite) for PalmOS",
id: "id_moz_733",
link1: "http://www.eudora.com/products/unsupported/internetsuite/",
link2: "",
name: "Mozilla/1.22 (compatible; MSIE 5.01; PalmOS 3.0) EudoraWeb 2",
type: "B"
},
%{
comment: "",
description: "Dummy user agent - i.e. used by Namo Web Editor",
id: "id_moz_1552",
link1: "http://www.namo.com/",
link2: "",
name: "Mozilla/2.0",
type: "B"
},
%{
comment: "",
description: "AOL Mac",
id: "id_moz_734",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; AOL 3.0; Mac_PowerPC)",
type: "B"
},
%{
comment: "",
description: "AOL Win 3.x",
id: "id_moz_735",
link1: "",
link2: "",
name: "Mozilla/2.0 (Compatible; AOL-IWENG 3.0; Win16)",
type: "B"
},
%{
comment: " 65.214.45.[x]xx",
description: "Ask Jeeves /Teoma robot",
id: "id_moz_736",
link1: "http://sp.ask.com",
link2: "",
name: "Mozilla/2.0 (compatible; Ask Jeeves)",
type: "R"
},
%{
comment: "65.214.45.[x]xx",
description: "Ask Jeeves /Teoma robot",
id: "id_moz_040707_2",
link1: "http://sp.ask.com",
link2: "",
name: "Mozilla/2.0 (compatible; Ask Jeeves/Teoma)",
type: "R"
},
%{
comment: " 65.214.45.[x]xx",
description: "Ask Jeeves /Teoma robot",
id: "id_moz_160506_3",
link1: "http://sp.ask.com",
link2: "",
name:
"Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml) ",
type: "R"
},
%{
comment: " 65.214.45.[x]xx",
description: "Ask Jeeves /Teoma robot",
id: "id_moz_737",
link1: "http://sp.ask.com",
link2: "",
name:
"Mozilla/2.0 (compatible; Ask Jeeves/Teoma; http://sp.ask.com/docs/about/tech_crawling.html)",
type: "R"
},
%{
comment: "",
description: "Direct Hit Robot",
id: "id_moz_738",
link1: "http://www.directhit.com",
link2: "",
name: "Mozilla/2.0 (compatible; EZResult -- Internet Search Engine)",
type: "R"
},
%{
comment: "",
description: "MS Frontpage x.x web editor",
id: "id_moz_739",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MS FrontPage x.0)",
type: "B"
},
%{
comment: "",
description: "IE 2.x Mac Power PC",
id: "id_moz_740",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 2.1; Mac_PowerPC)",
type: "B"
},
%{
comment: "",
description: "IE 3.x WinNT",
id: "id_moz_743",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 3.02; Update a; AK; Windows NT)",
type: "B"
},
%{
comment: "",
description: "IE 3.x AOL Win95",
id: "id_moz_744",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 3.02; Update a; AOL 3.0; Windows 95)",
type: "B"
},
%{
comment: "",
description: "IE 3.x Win95",
id: "id_moz_741",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 3.0; AK; Windows 95)",
type: "B"
},
%{
comment: "",
description: "IE 3.x Win 3.1",
id: "id_moz_742",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 3.0; Windows 3.1)",
type: "B"
},
%{
comment: "",
description: "IE 3.x WinXP",
id: "id_moz_745",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; MSIE 3.0B; Win32)",
type: "B"
},
%{
comment: "",
description: "Borland Delphi .OCX component used by WebCollector email harverster",
id: "id_moz_746",
link1: "",
link2: "",
name: "Mozilla/2.0 (compatible; NEWT ActiveX; Win32)",
type: "S"
},
%{
comment: "",
description: "Thunderstone's Webinator Web indexing program",
id: "id_moz_747",
link1: "http://www.thunderstone.com/texis/site/pages/Products.html",
link2: "",
name: "Mozilla/2.0 (compatible; T-H-U-N-D-E-R-S-T-O-N-E)",
type: "R"
},
%{
comment: "",
description: "Check&Get bookmark and link checking tool",
id: "id_moz_748",
link1: "http://www.activeurls.com",
link2: "",
name: "Mozilla/2.0 compatible; Check&Get 1.1x (Windows 98)",
type: "C"
},
%{
comment: "",
description: "Netscape 2.x Win3.x International",
id: "id_moz_749",
link1: "",
link2: "",
name: "Mozilla/2.01 (Win16; I)",
type: "B"
},
%{
comment: "",
description: "Netscape 2.x Gold Win95",
id: "id_moz_750",
link1: "",
link2: "",
name: "Mozilla/2.02Gold (Win95; I)",
type: "B"
},
%{
comment: "",
description:
"Faked user agent for diff. purposes i.e.: - some download manager - E-mail harvesting",
id: "id_moz_771",
link1: "",
link2: "",
name: "Mozilla/3.0 (compatible)",
type: "S D"
},
%{
comment: "",
description: "AvantGo PDA browser",
id: "id_moz_751",
link1: "http://avantgo.com/products/solutions/sfa.html",
link2: "",
name: "Mozilla/3.0 (compatible; AvantGo 3.2)",
type: "B"
},
%{
comment: "",
description: "Searchhippo robot",
id: "id_moz_752",
link1: "http://www.searchhippo.com",
link2: "",
name:
"Mozilla/3.0 (compatible; Fluffy the spider; http://www.searchhippo.com/; info@searchhippo.com)",
type: "R"
},
%{
comment: "",
description: "HP Web PrintSmart (discontinued) - web page printing software",
id: "id_moz_753",
link1: "",
link2: "",
name: "Mozilla/3.0 (compatible; HP Web PrintSmart 04b0 1.0.1.34)",
type: "B D"
},
%{
comment: "",
description:
"Internet Direct Library for Borland (often used as e-mail address collector and mass mailing tool)",
id: "id_moz_754",
link1: "http://forge.novell.com/modules/xfmod/project/?indy-net",
link2: "http://www.indyproject.org/",
name: "Mozilla/3.0 (compatible; Indy Library)",
type: "S"
},
%{
comment: "",
description: "Outertechs Linkman bookmark tool",
id: "id_moz_755",
link1: "http://www.outertech.com",
link2: "",
name: "Mozilla/3.0 (compatible; Linkman)",
type: "C"
},
%{
comment: "",
description: "Euroferret robot",
id: "id_moz_757",
link1: "http://www.euroferret.com",
link2: "",
name: "Mozilla/3.0 (compatible; MuscatFerret/1.5.4; claude@euroferret.com)",
type: "R"
},
%{
comment: "",
description: "Euroferret robot",
id: "id_moz_756",
link1: "http://www.euroferret.com",
link2: "",
name: "Mozilla/3.0 (compatible; MuscatFerret/1.5; olly@muscat.co.uk)",
type: "R"
},
%{
comment: "",
description: "Euroferret robot",
id: "id_moz_758",
link1: "http://www.euroferret.com",
link2: "",
name: "Mozilla/3.0 (compatible; MuscatFerret/1.6.x; claude@euroferret.com)",
type: "R"
},
%{
comment: "",
description: "Netart Generator - script generated random websites",
id: "id_moz_759",
link1: "http://www.obn.org/generator/",
link2: "",
name: "Mozilla/3.0 (compatible; netart generator/1.0; libwww-perl/5.64)",
type: "R D"
},
%{
comment: "",
description: "NetPositive BEOS browser",
id: "id_moz_760",
link1:
"http://www.tunetrackersystems.com/bedocs/documentation/User's%20Guide/03_network/Network07_NetPositive.html",
link2: "",
name: "Mozilla/3.0 (compatible; NetPositive/2.2)",
type: "B"
},
%{
comment: "",
description: "Opera 3.x Win3.x",
id: "id_moz_761",
link1: "",
link2: "",
name: "Mozilla/3.0 (compatible; Opera/3.0; Windows 3.1) v3.1",
type: "B"
},
%{
comment: "",
description: "Opera 3.x Win95/NT",
id: "id_moz_762",
link1: "",
link2: "",
name: "Mozilla/3.0 (compatible; Opera/3.0; Windows 95/NT4) 3.2",
type: "B"
},
%{
comment: "",
description: "Perman Surfer bookmark tool",
id: "id_moz_763",
link1: "http://www.bug.co.jp/nami-nori/",
link2: "",
name: "Mozilla/3.0 (compatible; PerMan Surfer 3.0; Win95)",
type: "C"
},
%{
comment: "",
description: "Web Link Validator link validation software",
id: "id_moz_764",
link1: "http://www.relsoftware.com",
link2: "",
name: "Mozilla/3.0 (compatible; REL Software Web Link Validator 2.x)",
type: "C"
},
%{
comment: "",
description: "Scan4Mail online mail extraction service",
id: "id_moz_765",
link1: "http://www.peterspages.net",
link2: "",
name:
"Mozilla/3.0 (compatible; scan4mail (advanced version) http://www.peterspages.net/?scan4mail)",
type: "S"
},
%{
comment: "s. also ScollSpider",
description: "WebWobot UK search engine robot (82.43.129.2xx)",
id: "id_moz_220606_2",
link1: "http://www.webwobot.com/",
link2: "",
name: "Mozilla/3.0 (compatible; ScollSpider; http://www.webwobot.com)",
type: "R"
},
%{
comment: "",
description: "Web Link Validator link validation software",
id: "id_moz_766",
link1: "http://www.relsoftware.com",
link2: "",
name:
"Mozilla/3.0 (compatible; Web Link Validator 2.x)Web Link Validator http://www.relsoftware.com/ link validation software",
type: "C"
},
%{
comment: "",
description: "Xelios Web Capture (now Wysigot) website downloading tool (Discontinued)",
id: "id_moz_767",
link1: "http://www.xelios.com/",
link2: "http://www.wysigot.com/int/about.html",
name: "Mozilla/3.0 (compatible; WebCapture x.x; Auto; Windows)",
type: "D"
},
%{
comment: "",
description: "Iprospect search engine positioning using Thunderstone's Webinator",
id: "id_moz_768",
link1: "http://www.iprospect.com",
link2: "http://www.thunderstone.com/texis/site/pages/Products.html",
name: "Mozilla/3.0 (compatible; Webinator-DEV01.home.iprospect.com/2.56)",
type: "R"
},
%{
comment: "",
description: "CyberAlert's Media Monitor using Thunderstone's Webinator",
id: "id_moz_769",
link1: "http://www.cyberalert.com",
link2: "http://www.thunderstone.com/texis/site/pages/Products.html",
name: "Mozilla/3.0 (compatible; Webinator-indexer.cyberalert.com/2.56)",
type: "R"
},
%{
comment: "",
description: "Viking server user/client",
id: "id_moz_770",
link1: "http://www.robtex.com",
link2: "",
name: "Mozilla/3.0 (Compatible;Viking/1.8)",
type: "P"
},
%{
comment: "",
description: "One of DC-Sakuras download manager user-agent names",
id: "id_moz_772",
link1: "http://www.dc-sakura.com",
link2: "",
name: "Mozilla/3.0 (DreamPassport/3.0)",
type: "D"
},
%{
comment: "s. also - INGRID/3.0 .. / IlseBot/1.0 ..",
description: "Ilse Netherlands robot (62.69.178.xx)",
id: "id_moz_773",
link1: "http://www.ilse.nl/",
link2: "",
name:
"Mozilla/3.0 (INGRID/3.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints)",
type: "R"
},
%{
comment: "",
description: "Liberate DTV server suite / TV-emulator",
id: "id_moz_774",
link1: "http://www.liberate.com",
link2: "",
name: "Mozilla/3.0 (Liberate DTV 1.1)",
type: "B P"
},
%{
comment: "",
description: "Planetweb 2.1 Browser (discontinued) for Dreamcast",
id: "id_moz_775",
link1: "http://www.planetweb.com",
link2: "",
name: "Mozilla/3.0 (Planetweb/2.100 JS SSL US; Dreamcast US)",
type: "B"
},
%{
comment: "",
description: "http://www.goo.ne.jp /Inktomi robot",
id: "id_moz_776",
link1: "http://www.goo.ne.jp",
link2: "",
name: "Mozilla/3.0 (Slurp.so/Goo; slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "s. also Slurpy Verifier ...",
description: "Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)",
id: "id_moz_777",
link1: "http://www.inktomi.com/",
link2: "",
name: "Mozilla/3.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "s. also Slurpy Verifier ...",
description: "Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)",
id: "id_moz_778",
link1: "http://www.inktomi.com/",
link2: "",
name: "Mozilla/3.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "s. also Vagabondo",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_moz_779",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/3.0 (Vagabondo/1.1 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "s. also Vagabondo",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_moz_780",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/3.0 (Vagabondo/1.x MT; webagent@wise-guys.nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "",
description: "Ilse Netherlands robot",
id: "id_moz_781",
link1: "http://www.ilse.nl",
link2: "",
name:
"Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMexperimental.net; http://aanmelden.ilse.nl/?aanmeld_mode=webhints)",
type: "R"
},
%{
comment: "s. also Vagabondo",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_moz_782",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/3.0 (Vagabondo/2.0 MT; webcrawler@NOSPAMwise-guys.nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "",
description: "Netscape 3.x Win3.x",
id: "id_moz_783",
link1: "",
link2: "",
name: "Mozilla/3.0 (Win16; I)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x Win95",
id: "id_moz_784",
link1: "",
link2: "",
name: "Mozilla/3.0 (Win95; I)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x WinNT",
id: "id_moz_785",
link1: "",
link2: "",
name: "Mozilla/3.0 (WinNT; I)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x FreeBSD",
id: "id_moz_786",
link1: "",
link2: "",
name: "Mozilla/3.0 (WorldGate Gazelle 3.5.1 build 11; FreeBSD2.2.8-STABLE)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x OSF1 V4.0 alpha ",
id: "id_moz_787",
link1: "",
link2: "",
name: "Mozilla/3.0 (X11; I; OSF1 V4.0 alpha)",
type: "B"
},
%{
comment: "",
description: "AOL Web TV",
id: "id_moz_788",
link1: "",
link2: "",
name:
"Mozilla/3.0 NAVIO_AOLTV (11; 13; Philips; PH200; 1; R2.0C36_AOL.0110OPTIK; R2.0.0139d_OPTIK)",
type: "B"
},
%{
comment: "",
description: "WebTV",
id: "id_moz_789",
link1: "",
link2: "",
name: "Mozilla/3.0 WebTV/1.2 (compatible; MSIE 2.0)",
type: "B"
},
%{
comment: "",
description: "Amiga Voyager Browser Amiga",
id: "id_moz_790",
link1: "",
link2: "",
name: "Mozilla/3.01 (compatible; AmigaVoyager/2.95; AmigaOS/MC680x0)",
type: "B"
},
%{
comment: "",
description: "Links2Go robot",
id: "id_moz_791",
link1: "http://www.links2go.com",
link2: "",
name: "Mozilla/3.01 (Compatible; Links2Go Similarity Engine)",
type: "R"
},
%{
comment: "",
description: "Netgem Netbox cable modem TV Box Linux",
id: "id_moz_792",
link1: "http://www.netgem.com",
link2: "",
name: "Mozilla/3.01 (compatible; Netbox/3.5 R92; Linux 2.2)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x Mac",
id: "id_moz_793",
link1: "",
link2: "",
name: "Mozilla/3.01-C-MACOS8 (Macintosh; I; PPC)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x Linux",
id: "id_moz_794",
link1: "",
link2: "",
name: "Mozilla/3.01Gold (X11; I; Linux 2.0.32 i486)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x SunOS",
id: "id_moz_795",
link1: "",
link2: "",
name: "Mozilla/3.01Gold (X11; I; SunOS 5.5.1 sun4m)",
type: "B"
},
%{
comment: "",
description: "Netscape 3.x Irix",
id: "id_moz_796",
link1: "",
link2: "",
name: "Mozilla/3.01SGoldC-SGI (X11; I; IRIX 6.3 IP32)",
type: "B"
},
%{
comment: "",
description: "ANT Fresco Browser Risc OS",
id: "id_moz_797",
link1: "http://www.antlimited.com",
link2: "",
name: "Mozilla/3.04 (compatible; ANTFresco/2.13; RISC OS 4.02)",
type: "B"
},
%{
comment: "",
description: "NCBrowser ANT Fresco Browser Risc OS",
id: "id_moz_798",
link1: "http://www.antlimited.com",
link2: "",
name:
"Mozilla/3.04 (compatible; NCBrowser/2.35; ANTFresco/2.17; RISC OS-NC 5.13 Laz1UK1309)",
type: "B"
},
%{
comment: "",
description: "QNX OS Voyager embedded browser",
id: "id_moz_281106_1",
link1: "http://www.qnx.com/products/browsers/",
link2: "",
name: "Mozilla/3.04 (compatible;QNX Voyager 2.03B ;Photon)",
type: "B"
},
%{
comment: "",
description: "I-Opener (was www.netpliance.com/) web PC",
id: "id_moz_799",
link1: "",
link2: "",
name: "Mozilla/3.x (I-Opener 1.1; Netpliance)",
type: "B"
},
%{
comment: "s. also Yahoo! Mindset",
description: "Yahoo Mindset: Intent-driven Search (66.228.182.1xx)",
id: "id_moz_100406_3",
link1: "http://mindset.research.yahoo.com/",
link2: "",
name: "Mozilla/4.0",
type: "R"
},
%{
comment: "s. also agadine/1.x.x",
description: "Agada search (Germany) robot",
id: "id_moz_800",
link1: "http://www.agada.de",
link2: "",
name: "Mozilla/4.0 (agadine3.0) www.agada.de",
type: "R"
},
%{
comment: "s. also URLBase/6.x",
description: "URLBase 6 bookmark manager",
id: "id_moz_290406_1",
link1: "http://www.terriadev.com/products/urlbase/",
link2: "",
name: "Mozilla/4.0 (Compatible); URLBase 6",
type: "C"
},
%{
comment: "",
description: "Astrafind! adult search robot (66.98.252.xx)",
id: "id_moz_895",
link1: "http://www.astrafind.com",
link2: "",
name: "Mozilla/4.0 (compatible: AstraSpider V.2.1 : astrafind.com)",
type: "R"
},
%{
comment: "s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_moz_021205_1",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/4.0 (compatible; Vagabondo/2.2; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_moz_240906_1",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/4.0 (compatible; Vagabondo/4.0Beta; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "",
description: "ReGet Deluxe! download manager",
id: "id_moz_100208_1",
link1: "http://deluxe.reget.com/en/",
link2: "",
name:
"Mozilla/4.0 (compatible; <a href=http://www.reget.com>ReGet Deluxe 5.1</a>; Windows NT 5.1)",
type: "D"
},
%{
comment: "",
description: "Advanced Email Extractor e-mail collector (spam bot)",
id: "id_moz_801",
link1: "http://www.mailutilities.com",
link2: "",
name: "Mozilla/4.0 (compatible; Advanced Email Extractor v2.xx)",
type: "S"
},
%{
comment: "",
description: "Arachmo Spider - web site file extraction tool",
id: "id_moz_802",
link1: "http://bbbearchan.hp.infoseek.co.jp/",
link2: "",
name: "Mozilla/4.0 (compatible; Arachmo)",
type: "D"
},
%{
comment: "",
description: "Novell Border Manager security suite",
id: "id_moz_804",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; BorderManager 3.0)",
type: "P"
},
%{
comment: "209.11.177.1xx",
description: "Best of the Web directory link checking",
id: "id_moz_090807_3",
link1: "http://botw.org/",
link2: "",
name: "Mozilla/4.0 (compatible; BOTW Spider; +http://botw.org)",
type: "C"
},
%{
comment: "s. BlitzBOT@tricus.net",
description: "Blitzsuche Germany robot",
id: "id_moz_803",
link1: "http://blitzsuche.rp-online.de/",
link2: "",
name: "Mozilla/4.0 (compatible; B_L_I_T_Z_B_O_T)",
type: "R"
},
%{
comment: "",
description: "Content Control from Blue Coat",
id: "id_moz_805",
link1: "http://www.cerberian.com",
link2: "",
name: "Mozilla/4.0 (compatible; Cerberian Drtrs Version-3.2-Build-0)",
type: "P"
},
%{
comment: "",
description: "Check&Get bookmark manager, web change monitor and archiver",
id: "id_moz_080706_1",
link1: "http://activeurls.com/en/",
link2: "",
name: "Mozilla/4.0 (compatible; Check&Get 3.0; Windows NT)",
type: "C"
},
%{
comment: "s.also ChristCRAWLER",
description: "Christcentral.com Christcrawler (was www.christcrawler.com)",
id: "id_moz_806",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; ChristCrawler.com ChristCrawler@ChristCENTRAL.com)",
type: "R"
},
%{
comment: "",
description: "Yahoo Search Marketing crawler (68.142.211.1xx)",
id: "id_moz_301105_4",
link1: "http://www.content.overture.com/d/",
link2: "",
name: "Mozilla/4.0 (compatible; crawlx, crawler@trd.overture.com)",
type: "R"
},
%{
comment: "s. also RaBot",
description: "DAUMOA - Daum search Korea robot (211.115.109.xxx)",
id: "id_moz_011207_1",
link1: "http://www.daum.net/",
link2: "http://ws.daum.net/abouten.html",
name: "Mozilla/4.0 (compatible; DAUMOA-video; +http://ws.daum.net/aboutkr.html)",
type: "R"
},
%{
comment: "",
description: "DepSpid distributed web crawler for link dependencies",
id: "id_moz_131206_1",
link1: "http://depspid.net/",
link2: "http://about.depspid.net/",
name: "Mozilla/4.0 (compatible; DepSpid/5.0x; +http://about.depspid.net)",
type: "C"
},
%{
comment: "",
description: "Download Mage download manager",
id: "id_moz_807",
link1: "http://www.dlmage.com",
link2: "",
name: "Mozilla/4.0 (compatible; DnloadMage 1.0)",
type: "D"
},
%{
comment: "",
description: "Fast/Alltheweb crawler",
id: "id_moz_808",
link1: "http://www.alltheweb.com",
link2: "",
name: "Mozilla/4.0 (compatible; FastCrawler3 support-fastcrawler3@fast.no)",
type: "R"
},
%{
comment: "",
description: "Fluid Dynamics Search Engine (FDSE) robot used by Abadoor.de",
id: "id_moz_809",
link1: "http://www.xav.com/scripts/search/",
link2: "http://www.abadoor.de/",
name: "Mozilla/4.0 (compatible; FDSE robot)",
type: "R"
},
%{
comment: "",
description: "GPU Distributed Search Engine crawler",
id: "id_moz_161105_2",
link1: "http://gpu.sourceforge.net/search_engine.php",
link2: "",
name:
"Mozilla/4.0 (compatible; GPU p2p crawler http://gpu.sourceforge.net/search_engine.php)",
type: "R"
},
%{
comment: "",
description: "Grub open source crawler",
id: "id_moz_810",
link1: "http://www.grub.org",
link2: "",
name:
"Mozilla/4.0 (compatible; grub-client-0.2.x; Crawl your stuff with http://grub.org)",
type: "R"
},
%{
comment: "",
description: "Grub open source crawler",
id: "id_moz_811",
link1: "http://www.grub.org",
link2: "",
name:
"Mozilla/4.0 (compatible; grub-client-0.3.x; Crawl your own stuff with http://grub.org)",
type: "R"
},
%{
comment: "",
description: "Grub open source crawler used by Looksmart ( 64.241.242.xx)",
id: "id_moz_812",
link1: "http://www.grub.org",
link2: "",
name: "Mozilla/4.0 (compatible; grub-client-2.x)",
type: "R"
},
%{
comment: "",
description: "ibisBrowser Japanese mobile browser",
id: "id_moz_261205_2",
link1: "http://www.ibis.ne.jp/products/ibisBrowser/index.html",
link2: "",
name: "Mozilla/4.0 (compatible; ibisBrowser)",
type: "B"
},
%{
comment: "",
description: "Novell iChain Cool Solutions caching",
id: "id_moz_813",
link1: "http://www.novell.com",
link2: "",
name: "Mozilla/4.0 (compatible; ICS 1.2.xxx)",
type: "P"
},
%{
comment: "",
description: "IE Favorites Check - Bookmark manager",
id: "id_moz_220206_1",
link1: "http://secure.sintraweb.net/public/soft/iefc/",
link2: "",
name: "Mozilla/4.0 (compatible; IE-Favorites-Check-0.5)",
type: "C"
},
%{
comment: "",
description: "Iplexx Austria (webhosting company) logfile spamming bot",
id: "id_moz_814",
link1: "http://www.iplexx.at",
link2: "",
name: "Mozilla/4.0 (compatible; Iplexx Spider/1.0 http://www.iplexx.at)",
type: "S"
},
%{
comment: "",
description: "KeepNi Monitors - Web site monitoring / link checking tool",
id: "id_moz_020208_1",
link1: "http://www.keepni.com/",
link2: "",
name: "Mozilla/4.0 (compatible; KeepNI web site monitor)",
type: "C"
},
%{
comment: "s. also - Mozilla/4.0 (compatible; NetPromoter Spider ...",
description: "NetPromoter Link Utility link checking tool",
id: "id_moz_815",
link1: "http://www.net-promoter.com/",
link2: "",
name: "Mozilla/4.0 (compatible; Link Utility; http://net-promoter.com)",
type: "C"
},
%{
comment: "",
description: "Lotus Notes 5.0 browser",
id: "id_moz_816",
link1:
"http://www-10.lotus.com/ldd/whatisnotes#Release%205.0%3A%20Web%20integration%20by%20d",
link2: "",
name: "Mozilla/4.0 (compatible; Lotus-Notes/5.0; Windows-NT)",
type: "B"
},
%{
comment: "",
description: "IE 4.x AOL Win98",
id: "id_moz_819",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; AOL 4.0; Windows 98)",
type: "B"
},
%{
comment: "",
description: "IE 4.x Mac Power PC",
id: "id_moz_820",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Mac_PowerPC)",
type: "B"
},
%{
comment: "",
description: "Internet Explorer 4.0 URL check",
id: "id_moz_821",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; MSIECrawler; Windows 95)",
type: "B C"
},
%{
comment: "",
description: "Vonna search robot",
id: "id_moz_090506_1",
link1: "http://www.vonna.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Vonna.com b o t)",
type: "R"
},
%{
comment: "",
description: "IE 4.x Win95",
id: "id_moz_822",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Windows 95)",
type: "B"
},
%{
comment: "",
description: "IE PDA Browser Windows CE",
id: "id_moz_823",
link1: "",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; MSN Companion 2.0; 800x600; Compaq)",
type: "B"
},
%{
comment: "81.52.143.xx",
description: "Orange France robot for mobiles",
id: "id_moz_100109_4",
link1: "http://www.orange.com/en_EN/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPC; 240x320; SPV M700; OpVer 19.123.2.733) OrangeBot-Mobile 2008.0 (mobilesearch.support@orange-ftgroup.com)",
type: "R"
},
%{
comment: "",
description: "IE for Windows CE on a PocketPC (HP iPAQ)",
id: "id_moz_010308_2",
link1: "http://www.hp.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Windows CE; PPS; 240x320)",
type: "B"
},
%{
comment: "",
description: "IE PDA Browser Windows CE",
id: "id_moz_824",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Windows NT Windows CE)",
type: "B"
},
%{
comment: "",
description: "IE 4.x WinNT",
id: "id_moz_826",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Windows NT)",
type: "B"
},
%{
comment: "",
description:
"diff. IPs / services i.e.: - Microsoft server information robot (see link) - Okanagan Internet Junction web filter (robot)",
id: "id_moz_825",
link1: "http://www.webmasterworld.com/forum11/841.htm",
link2: "http://www.junction.net/",
name: "Mozilla/4.0 (compatible; MSIE 4.01; Windows NT; MS Search 4.0 Robot) Microsoft",
type: ""
},
%{
comment: "208.236.180.xx",
description:
"Unknown robot from American College of Radiology (ACR) running MS Site Server",
id: "id_moz_010406_3",
link1: "http://www.acr.org/s_acr/index.asp",
link2: "http://www.microsoft.com/commerceserver/default.mspx",
name: "Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) ACR",
type: "R C"
},
%{
comment: "",
description: "Indonesia Interactive Web-portal robot on MS Site Server",
id: "id_moz_817",
link1: "http://www.i-2.co.id/",
link2: "http://www.microsoft.com/commerceserver/default.mspx",
name:
"Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) Indonesia Interactive",
type: "R"
},
%{
comment: "",
description: "Webquestdesigns hosting",
id: "id_moz_818",
link1: "http://www.webquestdesigns.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 4.0; Windows NT; Site Server 3.0 Robot) WebQuest Designs",
type: ""
},
%{
comment: "",
description: "Avirt Gateway proxy server",
id: "id_moz_841",
link1: "http://www.avirt.com/products/gateway.html",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.01; Windows 95) via <B>Avirt Gateway Server</B> v4.0",
type: "P"
},
%{
comment: "s. Larbin....",
description: "Metacarta.com (66.28.xx.xxx) robot",
id: "id_moz_843",
link1: "http://www.metacarta.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0) (samualt9@bigfoot.com)",
type: "R"
},
%{
comment: "",
description: "NetCaptor IE browser addon",
id: "id_moz_842",
link1: "http://www.netcaptor.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.01; Windows NT 5.0; NetCaptor 6.5.0RC1)",
type: "B"
},
%{
comment: "",
description: "IE 5.x AOL Win95 Sureseeker search plugin",
id: "id_moz_827",
link1: "http://www.sureseeker.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; AOL 5.0; Windows 95; DigExt; Gateway2000; sureseeker.com)",
type: "B"
},
%{
comment: "",
description: "IE 5.x Mac PowerPC AtHome user",
id: "id_moz_828",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; Mac_PowerPC; AtHome021)",
type: "B"
},
%{
comment: "parked domain",
description: "www.netnose.com crawler",
id: "id_moz_829",
link1: "http://www.netnose.com/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; NetNose-Crawler 2.0; A New Search Experience: http://www.netnose.com)",
type: "R"
},
%{
comment: "",
description: "WinXP via CERN httpd proxy server ",
id: "id_moz_830",
link1: "http://www.w3.org",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; Win32) via proxy gateway CERN-HTTPD/3.0 libwww/2.17",
type: "P"
},
%{
comment: "",
description: "Echo.com robot",
id: "id_moz_831",
link1: "http://www.echo.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) TrueRobot; 1.5",
type: "R"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_moz_832",
link1: "http://www.voila.fr",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot BETA 1.2 (http://www.voila.com/)",
type: "R"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_moz_833",
link1: "http://www.voila.fr",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; Windows 95) VoilaBot; 1.6",
type: "R"
},
%{
comment: "",
description: "WinME Opera 5.x",
id: "id_moz_835",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; Windows ME) Opera 5.11 [en]",
type: "B"
},
%{
comment: "",
description: "Kyosoft's Link Checker",
id: "id_moz_834",
link1: "http://www.kyosoft.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; Windows ME; Link Checker 2.x.xx http://www.kyosoft.com)",
type: "C"
},
%{
comment: "site is closed",
description:
"Beijing Express Email Address Extractor via DHCP Data Transport Services (DTS)",
id: "id_moz_836",
link1: "http://www.zstools.com",
link2: "http://esupport.ca.com/index.html?/public/dto_transportit/infodocs/dto1013.asp",
name: "Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; DigExt; DTS Agent",
type: "S"
},
%{
comment: "",
description: "Girafa (browser plug-in) robot",
id: "id_moz_837",
link1: "http://www.girafa.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; Windows NT; Girafabot; girafabot at girafa dot com; http://www.girafa.com)",
type: "B R"
},
%{
comment: "s. also GalaxyBot..",
description: "Galaxy robot (63.121.41.xxx) ",
id: "id_moz_838",
link1: "http://www.galaxy.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com)",
type: "R"
},
%{
comment: "s. also GalaxyBot..",
description: "Galaxy robot (63.121.41.xxx)",
id: "id_moz_839",
link1: "http://www.galaxy.com/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.0; www.galaxy.com; www.psychedelix.com/; http://www.galaxy.com/info/crawler.html)",
type: "R"
},
%{
comment: "s. also Yandex/1...",
description: "Yandex Search Russia link checking (213.180.206.2xx)",
id: "id_moz_840",
link1: "http://www.yandex.ru",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)",
type: "R"
},
%{
comment: "site is offline",
description: "Gobeez starting page plugin",
id: "id_moz_844",
link1: "http://www.gobeez.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; AOL 4.0; Windows 98; GoBeez (www.gobeez.com))",
type: "C"
},
%{
comment: "",
description: "IE 5.5 Win95 Hotbar plug-in",
id: "id_moz_845",
link1: "http://hotbar.com/install/firstvisit.asp",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 95; Transmission Segment; Hotbar 2.0)",
type: ""
},
%{
comment: "",
description: "Crazy Browser - IE based tabbed Browser",
id: "id_moz_846",
link1: "http://www.crazybrowser.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Crazy Browser 1.x.x)",
type: "B"
},
%{
comment: "",
description: "Wanadoo Internet services",
id: "id_moz_847",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; KITV4.7 Wanadoo)",
type: "B"
},
%{
comment: "",
description: "Safexplorer (safexplorer.com - site is offline) kids browser",
id: "id_moz_848",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SAFEXPLORER TL)",
type: "B"
},
%{
comment: "",
description:
"Katiesoft Scroll (ex www.katiesoft.com now discarded) & SimulBrowse (ex www.simulbrowse.com now dead) IE browser plugins",
id: "id_moz_849",
link1: "",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; SYMPA; Katiesoft 7; SimulBrowse 3.0)",
type: "B"
},
%{
comment: "",
description: "Windows ME BTOpenworld Internet services",
id: "id_moz_850",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; BTinternet V8.1)",
type: "B"
},
%{
comment: "",
description: "Windows ME Internet Explorer URL check",
id: "id_moz_851",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows 98; Win 9x 4.90; MSIECrawler)",
type: "B C"
},
%{
comment: "",
description: "Cobion Germany Brand Protection Services robot",
id: "id_moz_852",
link1: "http://www.cobion.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; obot)",
type: "R"
},
%{
comment: "",
description: "Cobion Germany Brand Protection Services robot",
id: "id_moz_853",
link1: "http://www.cobion.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 4.0; QXW03018)",
type: "R"
},
%{
comment: "",
description: "IE 5.5 Win2000 / user agent",
id: "id_moz_858",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Active Cache Request",
type: "B"
},
%{
comment: "",
description:
"Maybe: - MS Internet Security & Acceleration Server (ISA) cache refreshing request (see link) or - IE 5.5 Win2000 probably with some (website) API request component (see 2nd link) - suspected as email-harvester / site scanning tool (see http://www.byte.com/documents/s=493/byt20010208s0001/index.htm",
id: "id_moz_859",
link1:
"http://groups.google.com/groups?hl=en&lr=&ie=UTF-8&safe=off&threadm=uGoenyodBHA.1472%40tkmsftngp07&rnum=1&prev=/groups%3Fq%3DFetch%2BAPI%26hl%3Den%26lr%3D%26ie%3DUTF-8%26safe%3Doff%26selm%3DuGoenyodBHA.1472%2540tkmsftngp07%26rnum%3D1",
link2:
"http://groups.google.de/groups?q=%22fetch+api+request%22&hl=de&lr=&ie=UTF-8&oe=UTF-8&selm=3CAD577B.C29BA3B2%40execpc.com&rnum=2",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0) Fetch API Request",
type: "P S ?"
},
%{
comment: "",
description: "IE 5.5 Win2000 with MS.NET SDK",
id: "id_moz_854",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; .NET CLR 1.0.3705)",
type: "B"
},
%{
comment: "",
description: "IE 5.5 Win2000 / user agent w. AI RoboForm (AIRF) password manager",
id: "id_moz_855",
link1: "http://www.roboform.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AIRF)",
type: "B"
},
%{
comment: "",
description: "AspTear URL fetching program component / Download32.com spider",
id: "id_moz_856",
link1: "http://www.alphasierrapapa.com/IisDev/Components/AspTear/",
link2: "http://www.download32.com",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; AspTear 1.5)",
type: "R D"
},
%{
comment: "",
description: "Nokia.com network",
id: "id_moz_857",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; N_o_k_i_a)",
type: "B"
},
%{
comment: "",
description: "Unknown Object Sciences Corp. robot using the HTTPClient",
id: "id_moz_051102_1",
link1: "http://www.objectsciences.com",
link2: "http://www.innovation.ch/java/HTTPClient/",
name: "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT 5.0; T312461) RPT-HTTPClient/0.3-3E",
type: ""
},
%{
comment: "s. also asterias/2.0",
description: "Singingfish media spider (64.12.186.2xx) via AOL search",
id: "id_moz_060406_2",
link1: "http://search.singingfish.com/sfw/home.jsp",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0 compatible; Asterias Crawler v4; +http://www.singingfish.com/help/spider.html; webmaster@singingfish.com); SpiderThread Revision: 3.10",
type: "R"
},
%{
comment: "",
description: "Megaupload Mega Manager - Download manager toolbar for IE",
id: "id_moz_200108_2",
link1: "http://www.megaupload.com/manager/de/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows 98; .NET CLR 1.1.4322; MEGAUPLOAD 2.0)",
type: "D"
},
%{
comment: "Adware / Spyware component",
description: "Hotbar IE graphical skin",
id: "id_moz_010106_1",
link1: "http://hotbar.com/Installation/Browsing/WhatIs/Hotbar.htm",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; AOL 9.0; Windows NT 5.1; SV1; HbTools 4.7.2)",
type: "B"
},
%{
comment: "s. also Skampy",
description: "Skaffe.com directory link checker",
id: "id_moz_860",
link1: "http://www.skaffe.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; MSIE 5.5; Windows NT 5.1) Skampy/0.9.x [en]",
type: "R"
},
%{
comment: "71.161.205.2xx",
description: "TargetSeek Crawler concerning electronics industry product announcements",
id: "id_moz_100606_1",
link1: "http://www.targetgroups.net/TargetSeek.html",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; TargetSeek/1.0; +http://www.targetgroups.net/TargetSeek.html)",
type: "R"
},
%{
comment: "",
description: "IE 6.0 WebWasher ad filter",
id: "id_moz_861",
link1: "http://www.webwasher.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Win32) WebWasher 3.0",
type: "B P"
},
%{
comment: "",
description: "Web Link Validator link validation software",
id: "id_moz_864",
link1: "http://www.relsoftware.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) REL Software Web Link Validator 2.x)",
type: "C"
},
%{
comment: "",
description: "Web Link Validator link validation software",
id: "id_moz_865",
link1: "http://www.relsoftware.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows 98) Web Link Validator 2.x)",
type: "C"
},
%{
comment: "",
description: "IE 6.0 Netmanager IE add-on",
id: "id_moz_862",
link1: "http://www.vinn.com.au",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Net M@nager V3.02 - www.vinn.com.au)",
type: "B"
},
%{
comment: "s. also WebLight/4.x.x ...",
description: "WebLight web analyzer & link checker",
id: "id_moz_290306_1",
link1: "http://www.illumit.com/Products/weblight/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com; http://www.illumit.com/Products/weblight/)",
type: "C"
},
%{
comment: "",
description: "Abolimba Multibrowser - IE based browser",
id: "id_moz_863",
link1: "http://www.autag.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; Win 9x 4.90; http://www.Abolimba.de)",
type: "C"
},
%{
comment: "s. also Lunascape",
description: "Lunascape IE based browser (Japan)",
id: "id_moz_866",
link1: "http://www2.lunascape.jp/index.aspx",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; .NET CLR 1.1.4322; Lunascape 2.1.3)",
type: "B"
},
%{
comment: "209.85.136.xxx",
description: "Google wireless transcoder (GWT) proxy for rewriting websites for mobiles",
id: "id_moz_290708_4",
link1: "http://www.google.com/gwt/n",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; Google Wireless Transcoder;)",
type: "P"
},
%{
comment: "81.169.154.xx",
description: "Tüzilla (Germany) - ODP link checking using Robozilla",
id: "id_moz_150906_1",
link1: "http://tuezilla.de",
link2: "http://dmoz.org/profiles/robozilla.html",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP entries t_st; http://tuezilla.de/t_st-odp-entries-agent.html)",
type: "R"
},
%{
comment: "81.169.154.xx",
description: "Tüzilla (Germany) - ODP link checking using Robozilla",
id: "id_moz_867",
link1: "http://tuezilla.de",
link2: "http://dmoz.org/profiles/robozilla.html",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ODP links test; http://tuezilla.de/test-odp-links-agent.html)",
type: "R"
},
%{
comment: "70.94.232.2xx",
description: "ZoomSpider.Net indexing robot for several directorys",
id: "id_moz_080606_1",
link1: "http://www.zoomspider.net/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0; ZoomSpider.net bot; .NET CLR 1.1.4322)",
type: "R"
},
%{
comment: "",
description: "unknown robot from 64.246.44.xx",
id: "id_moz_882",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1) (dns_admin@c-a-s-h.com)",
type: ""
},
%{
comment: "",
description:
"Covac Software UPPS (Universal PHP Proxy Server) - free public proxy server",
id: "id_moz_280408_1",
link1: "http://www.covac-software.com/proxy/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Covac UPPS Cathan 1.2.5;)",
type: "P"
},
%{
comment: "",
description: "GetNetWise Crayon Crawler web filter",
id: "id_moz_160406_1",
link1: "http://kids.getnetwise.org/tools/tool_info.php?tool_id=931919301.7202",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Crayon Crawler; snprtz|T04056566514940; (R1 1.5))",
type: "P"
},
%{
comment: "",
description: "Deepnet Explorer - IE based browser",
id: "id_moz_868",
link1: "http://deepnetexplorer.com/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Deepnet Explorer)",
type: "B"
},
%{
comment: "",
description:
"Heritrix Internet Archive's open-source web project used by Analysis Projects at UW",
id: "id_moz_869",
link1: "http://crawler.archive.org/",
link2: "http://www.cs.washington.edu/research/networking/websys/",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; heritrix/1.3.0 http://www.cs.washington.edu/research/networking/websys/)",
type: "R"
},
%{
comment: "",
description: "IE 6x WinXP Hotbar plug-in",
id: "id_moz_870",
link1: "http://hotbar.com/install/firstvisit.asp",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Hotbar 3.0)",
type: "B"
},
%{
comment: "",
description: "IE 6x WinXP iOpus Internet Macros - Internet-based macro recorder ",
id: "id_moz_871",
link1: "http://www.iopus.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iOpus-I-M)",
type: "B"
},
%{
comment: "",
description: "iRider - IE based browser / Free Download Manager (FDM)",
id: "id_moz_872",
link1: "http://www.irider.com/irider/index.htm",
link2: "http://www.freedownloadmanager.org/",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; iRider 2.21.1108; FDM)",
type: "D"
},
%{
comment: "",
description: "KKman http://www.kkman.com/ - Japanese IE based browser",
id: "id_moz_873",
link1: "http://www.kkman.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; KKman3.0)",
type: "B"
},
%{
comment: "",
description: "IE 6x WinXP MathPlayer mathematical notation plugin ",
id: "id_moz_874",
link1: "http://www.mathtype.com/en/products/mathplayer/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MathPlayer2.0)",
type: "B"
},
%{
comment: "",
description: "Maxton (ex MyIE2) - IE based browser",
id: "id_moz_875",
link1: "http://www.maxthon.com",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Maxthon) ",
type: "B"
},
%{
comment: "",
description: "IE 6x WinXP peoplepc online PeoplePal IE toolbar",
id: "id_moz_876",
link1: "http://home.vfw-online.com/peoplepal/default.asp",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; PeoplePal 3.0; MSIECrawler)",
type: "B"
},
%{
comment: "",
description: "IE 6x WinXP / I-Opener (was www.netpliance.com/) web PC",
id: "id_moz_877",
link1: "",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; Q312461; IOpener Release 1.1.04)",
type: "B"
},
%{
comment: "220.181.34.1xx",
description: "Qihoo search (China) robot",
id: "id_moz_050307_1",
link1: "http://www.qihoo.com/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; QihooBot 1.0 qihoobot@qihoo.net)",
type: "R"
},
%{
comment: "",
description:
"SimBar IE toolbar for accessing The Sims sites / Infopath IE form & spreadsheet plugin",
id: "id_moz_070306_1",
link1: "http://www.simstools.com/simbar.php",
link2: "http://office.microsoft.com/en-us/fx010857921033.aspx",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SIMBAR Enabled; InfoPath.1)",
type: "B"
},
%{
comment: "",
description: "IE 6x WinXP Stumble Upon IE toolbar",
id: "id_moz_878",
link1: "http://www.stumbleupon.com",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; StumbleUpon.com 1.760; .NET CLR 1.1.4322)",
type: "B"
},
%{
comment: "",
description: "Balsa Productions embedded web browser package for Borland Delphi",
id: "id_moz_150807_1",
link1: "http://bsalsa.com/product.html",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; Embedded Web Browser from: http://bsalsa.com/; MSIECrawler)",
type: "B"
},
%{
comment: "68.166.223.x",
description: "ChangeDetection robot for web page monitoring",
id: "id_moz_030807_2",
link1: "http://www.changedetection.com/",
link2: "http://www.changedetection.com/bot.html",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://www.changedetection.com/bot.html )",
type: "C"
},
%{
comment: "",
description: "IE 6x WinXP also used by WebSite Pro HTML editor",
id: "id_moz_879",
link1: "http://www.gtpcc.org/gtpcc/websitepro.htm",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; .NET CLR 1.1.4322)",
type: "B"
},
%{
comment: "was http://www.dx-soft.net/ (expired)",
description: "DX-Browser - German IE based browser",
id: "id_moz_880",
link1: "http://www.zdnet.de/downloads/prg/t/p/deDCTP-wc.html",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; DX-Browser 5.0.0.0)",
type: "B"
},
%{
comment: "",
description: "ezPeer+ P2P IE addon",
id: "id_moz_271006_1",
link1: "http://web.ezpeer.com/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; FunWebProducts; ezPeer+ v1.0 Beta (0.4.1.98); ezPeer+ v1.0 (0.5.0.00); .NET CLR 1.1.4322; MSIECrawler)",
type: "B"
},
%{
comment: "",
description: "Axandra IBP website promotion software ?",
id: "id_moz_881",
link1: "http://www.axandra-web-site-promotion-software-tool.com/index.htm",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; IBP; .NET CLR 1.1.4322)",
type: "C B"
},
%{
comment: "",
description: "MRA = Mail.ru Agent - Instant Messenger / VoIP",
id: "id_moz_290606_3",
link1: "http://agent.mail.ru/",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; MRA 4.3 (build 01218))",
type: "B"
},
%{
comment: "s. also: - MSNBOT",
description: "MSN Search robot (207.46.89.xx)",
id: "id_moz_883",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search 4.0 Robot)",
type: "R"
},
%{
comment: "",
description: "Link Commander bookmark manager",
id: "id_moz_170207_3",
link1: "http://www.resortlabs.com/bookmark-manager/linkcommander.php",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 7.0; Win32) Link Commander 4.0",
type: "C"
},
%{
comment: "",
description: "IE 7.0 - WinXP",
id: "id_moz_170706_2",
link1: "http://www.microsoft.com/windows/ie/default.mspx",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; bgft)",
type: "B"
},
%{
comment: "",
description: "GTB = Google Toolbar Internet Explorer add-on",
id: "id_moz_080209_1",
link1: "http://toolbar.google.com/T4/index.html",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 5.1; GTB5; User-agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1; http://bsalsa.com) ; .NET CLR 2.0.50727)",
type: "B"
},
%{
comment: "",
description:
"MSIE 7.0 *and* Trident token used by Internet Explorer 8 in compatibility view mode",
id: "id_moz_080209_2",
link1:
"http://blogs.msdn.com/ie/archive/2009/01/09/the-internet-explorer-8-user-agent-string-updated-edition.aspx",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 7.0; Windows NT 6.1; Trident/4.0; SLCC2; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30729; Media Center PC 6.0; Tablet PC 2.0)",
type: "B"
},
%{
comment: "",
description: "Internet Explorer 8",
id: "id_moz_080209_3",
link1: "http://www.microsoft.com/windows/internet-explorer/beta/default.aspx",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 5.1; Trident/4.0; .NET CLR 2.0.50727; .NET CLR 1.1.4322; .NET CLR 3.0.04506.30; .NET CLR 3.0.04506.648)",
type: "B"
},
%{
comment: "",
description: "IE 8.0 (beta) on Win Vista",
id: "id_moz_150408_4",
link1: "http://www.microsoft.com/windows/products/winfamily/ie/ie8/default.mspx",
link2: "",
name: "Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0)",
type: "B"
},
%{
comment: "",
description: "Bsalsa embedded browser",
id: "id_moz_030110_1",
link1: "http://bsalsa.com/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE 8.0; Windows NT 6.0; Trident/4.0; Orange 8.0; GTB6.3; Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1) ; Embedded Web Browser from: http://bsalsa.com/; SLCC1; .NET CLR 2.0.50727; .NET CLR 3.5.30729; .NET CLR 3.0.30618; OfficeLiveConnector.1.3; OfficeLivePatch.1.3)",
type: "B"
},
%{
comment: "s. also RaBot",
description: "DAUMOA - Daum search Korea robot (211.115.109.xxx)",
id: "id_moz_010108_4",
link1: "http://www.daum.net/",
link2: "http://ws.daum.net/abouten.html",
name:
"Mozilla/4.0 (compatible; MSIE enviable; DAUMOA 2.0; DAUM Web Robot; Daum Communications Corp., Korea; +http://ws.daum.net/aboutkr.html)",
type: "R"
},
%{
comment: "s. also RaBot",
description: "DAUMOA - Daum search Korea robot (211.115.109.xxx)",
id: "id_moz_311206_1",
link1: "http://www.daum.net/",
link2: "",
name:
"Mozilla/4.0 (compatible; MSIE is not me; DAUMOA/1.0.1; DAUM Web Robot; Daum Communications Corp., Korea)",
type: "R"
},
%{
comment: "",
description: "Naver Search Korea Naverbot",
id: "id_moz_281106_2",
link1: "http://www.naver.com/",
link2: "",
name: "Mozilla/4.0 (compatible; NaverBot/1.0; http://help.naver.com/delete_main.asp)",
type: "R"
},
%{
comment: "",
description: "Netcraft webserver info",
id: "id_moz_884",
link1: "http://www.netcraft.com",
link2: "",
name: "Mozilla/4.0 (compatible; Netcraft Web Server Survey)",
type: "R C"
},
%{
comment: "s. also - Mozilla/4.0 (compatible; Link Utility ...",
description: "NetPromoter Link Utility link checking tool ",
id: "id_moz_885",
link1: "http://www.net-promoter.com/",
link2: "",
name: "Mozilla/4.0 (compatible; NetPromoter Spider;http://www.net-promoter.com/)",
type: "C"
},
%{
comment: "",
description: "Opera 3.x WinNT",
id: "id_moz_886",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; Opera/3.0; Windows 4.10) 3.51 [en]",
type: "B"
},
%{
comment: "",
description: "Powermarks bookmark manager",
id: "id_moz_887",
link1: "http://www.kaylon.com",
link2: "",
name: "Mozilla/4.0 (compatible; Powermarks/3.5; Windows 95/98/2000/NT)",
type: "C"
},
%{
comment: "",
description: "RSS Popper - MS Outlook RSS reader plugin",
id: "id_moz_230607_1",
link1: "http://rsspopper.unknown/2004/10/home.html",
link2: "",
name: "Mozilla/4.0 (compatible; RSS Popper)",
type: "B"
},
%{
comment: "",
description: "SiteKiosk public terminal browser",
id: "id_moz_888",
link1: "http://www.sitekiosk.com",
link2: "",
name: "Mozilla/4.0 (compatible; SiteKiosk 4.0; MSIE 5.0; Windows 98; SiteCoach 1.0)",
type: "B"
},
%{
comment: "s. also Worldlight",
description: "Entireweb Search Speedyspider (62.13.25.xxx)",
id: "id_moz_889",
link1: "http://www.entireweb.com",
link2: "",
name: "Mozilla/4.0 (compatible; SpeedySpider; www.entireweb.com)",
type: "R"
},
%{
comment: "",
description: "SiteProbe - website status checking",
id: "id_moz_890",
link1: "http://www.siteprobe.com",
link2: "",
name: "Mozilla/4.0 (compatible; SPENG)",
type: "R C"
},
%{
comment: "",
description: "Super Cleaner privacy tool (bookmark checking)",
id: "id_moz_891",
link1: "http://www.southbaypc.com/SuperCleaner/",
link2: "",
name: "Mozilla/4.0 (compatible; SuperCleaner 2.xx; Windows 98)",
type: "C"
},
%{
comment: "",
description: "Synapse - Apache web service for processing XML documents",
id: "id_moz_020406_1",
link1: "http://wiki.apache.org/incubator/SynapseProposal",
link2: "",
name: "Mozilla/4.0 (compatible; Synapse)",
type: "P"
},
%{
comment: "",
description:
"Web2PDF - Adobe Acrobat plugin for site traversal and other services for the Web Capture feature",
id: "id_moz_150207_1",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; WebCapture 3.0; Windows)",
type: "D"
},
%{
comment: "",
description: "Windows HTTP Services (WinHTTP / XML-parser)",
id: "id_moz_892",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; Win32; WinHttp.WinHttpRequest.5)",
type: ""
},
%{
comment: "",
description: "WSN Links PHP directory software",
id: "id_moz_170108_1",
link1: "http://scripts.webmastersite.net/wsnlinks/",
link2: "",
name: "Mozilla/4.0 (compatible; WSN Links)",
type: "C"
},
%{
comment: "",
description: "Euro Directory (German / Austrian) directory link checking",
id: "id_moz_111205_6",
link1: "http://www.euro-directory.com/",
link2: "",
name: "Mozilla/4.0 (compatible; www.euro-directory.com; urlchecker1.0)",
type: "R C"
},
%{
comment: "",
description: "Galaxy robot",
id: "id_moz_893",
link1: "http://www.galaxy.com",
link2: "",
name: "Mozilla/4.0 (compatible; www.galaxy.com)",
type: "R"
},
%{
comment: "",
description: "Linkguard.com link validation (service is offline)",
id: "id_moz_894",
link1: "",
link2: "",
name: "Mozilla/4.0 (compatible; www.linkguard.com Linkguard Online 1.0; Windows NT)",
type: "C"
},
%{
comment: "s. also Y!J-BSC/1.0...",
description: "Yahoo Search Japan robot (203.141.52.)",
id: "id_moz_240106_1",
link1: "http://www.yahoo.co.jp/",
link2: "",
name: "Mozilla/4.0 (compatible; Y!J; for robot study; keyoshid)",
type: "R"
},
%{
comment: "",
description: "Yahoo Japan robot (202.93.76.xx)",
id: "id_moz_170706_1",
link1: "http://www.yahoo.co.jp/",
link2: "",
name: "Mozilla/4.0 (compatible; Yahoo Japan; for robot study; kasugiya)",
type: "R"
},
%{
comment: "",
description: "Faked IE id string used by DeepTrawl link checking tool",
id: "id_moz_210207_1",
link1: "http://deeptrawl.com/",
link2: "",
name: "Mozilla/4.0 (compatible;MSIE 6.0; Windows NT 5.0; H010818)",
type: "C"
},
%{
comment: "",
description: "spoofed referer by Fantomaster (Multiblocker) anonymity products",
id: "id_moz_896",
link1: "http://fantomaster.com",
link2: "http://multiblocker.com/home.html",
name: "Mozilla/4.0 (fantomBrowser)",
type: "P"
},
%{
comment: "",
description: "spoofed referer by Fantomaster (Multiblocker) anonymity products",
id: "id_moz_897",
link1: "http://fantomaster.com",
link2: "http://multiblocker.com/home.html",
name: "Mozilla/4.0 (fantomCrew Browser)",
type: "P"
},
%{
comment: "",
description: "unknown robot from - 64.57.223.40 - 66.28.233.xxx (cogentco.com)",
id: "id_moz_898",
link1: "",
link2: "",
name: "Mozilla/4.0 (hhjhj@yahoo.com)",
type: ""
},
%{
comment: "",
description: "Activtourist Jemma spider",
id: "id_moz_899",
link1: "http://www.activtourist.com",
link2: "",
name: "Mozilla/4.0 (JemmaTheTourist;http://www.activtourist.com)",
type: "R"
},
%{
comment: "",
description: "NetFront (v3.x) for Pocket PC (here on Sanyo PM-8200 cell phone)",
id: "id_moz_900",
link1: "http://nfppc.access.co.jp/english/",
link2: "",
name: "Mozilla/4.0 (MobilePhone PM-8200/US/1.0) NetFront/3.x MMP/2.0",
type: "B"
},
%{
comment: "s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...",
description: "Google robot from 66.249.66.xxx ",
id: "id_moz_901",
link1: "http://www.google.com",
link2: "",
name:
"Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html)",
type: "R"
},
%{
comment: "s. also: - Googlebot - Mozilla/5.0 (compatible; Googlebot/2.1...",
description: "Google robot from 66.249.66.xxx ",
id: "id_moz_902",
link1: "http://www.google.com",
link2: "",
name:
"Mozilla/4.0 (MobilePhone SCP-5500/US/1.0) NetFront/3.0 MMP/2.0 FAKE (compatible; Googlebot/2.1; http://www.google.com/bot.html)",
type: "R"
},
%{
comment: "63.209.222.xx",
description: "Unknown robot from Mozilla.org",
id: "id_moz_081106_1",
link1: "http://www.mozilla.org/",
link2: "",
name:
"Mozilla/4.0 (Mozilla; http://www.mozilla.org/docs/en/bot.html; master@mozilla.com)",
type: "R"
},
%{
comment: "",
description: "ASI - Any Search Info robot",
id: "id_moz_903",
link1: "http://search-info.com/",
link2: "",
name: "Mozilla/4.0 (Sleek Spider/1.2)",
type: "R"
},
%{
comment: "64.242.88.xx",
description: "Furl (Looksmart) online bookmark tool robot",
id: "id_moz_170406_1",
link1: "http://www.furl.net/",
link2: "",
name:
"Mozilla/4.0 compatible FurlBot/Furl Search 2.0 (FurlBot; http://www.furl.net; wn.furlbot@looksmart.net)",
type: "R"
},
%{
comment: "",
description: "Wisenut robot",
id: "id_moz_905",
link1: "http://www.wisenut.com/",
link2: "",
name:
"Mozilla/4.0 compatible ZyBorg/1.0 (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)",
type: "R"
},
%{
comment: "",
description: "Wisenut robot",
id: "id_moz_906",
link1: "http://www.wisenut.com/",
link2: "",
name:
"Mozilla/4.0 compatible ZyBorg/1.0 (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)",
type: "R"
},
%{
comment: "",
description: "Wisenut robot",
id: "id_moz_907",
link1: "http://www.wisenut.com/",
link2: "",
name:
"Mozilla/4.0 compatible ZyBorg/1.0 Dead Link Checker (wn.zyborg@looksmart.net; http://www.WISEnutbot.com)",
type: "R"
},
%{
comment: "",
description: "Wisenut robot",
id: "id_moz_908",
link1: "http://www.wisenut.com/",
link2: "",
name:
"Mozilla/4.0 compatible ZyBorg/1.0 for Homepage (ZyBorg@WISEnutbot.com; http://www.WISEnutbot.com)",
type: "R"
},
%{
comment: "see also LARBIN-EXPERIMENTAL",
description:
"Unknown robot from 66.230.140.xx (argon.oxeo.com) maybe an e-mail collector",
id: "id_moz_909",
link1: "",
link2: "",
name: "Mozilla/4.0 efp@gmx.net",
type: "S"
},
%{
comment: "",
description: "WebTV",
id: "id_moz_910",
link1: "",
link2: "",
name: "Mozilla/4.0 WebTV/2.6 (compatible; MSIE 4.0)",
type: "B"
},
%{
comment: "",
description: "Ask / Ask Jeeves robot",
id: "id_moz_904",
link1: "http://www.Ask.com",
link2: "",
name: "Mozilla/4.0 [en] (Ask Jeeves Corporate Spider)",
type: "R"
},
%{
comment: "",
description: "LookSmart spider",
id: "id_moz_913",
link1: "http://www.looksmart.com",
link2: "",
name: "Mozilla/4.0(compatible; Zealbot 1.0)",
type: "R"
},
%{
comment: "",
description: "HideMe - Web based anonymous proxy server service",
id: "id_moz_290807_1",
link1: "http://www.hideme.biz/",
link2: "http://www.cnn.com/TECH/computing/9901/25/hacktracts.idg/index.html",
name: "Mozilla/4.01 (compatible; NORAD National Defence Network)",
type: "P"
},
%{
comment: "",
description: "Some download manager spoofing Netscape 4.01",
id: "id_moz_914",
link1: "",
link2: "",
name: "Mozilla/4.01 [en](Win95;I)",
type: "D"
},
%{
comment: "",
description: "Netscape 4.x SunOS 5.6",
id: "id_moz_915",
link1: "",
link2: "",
name: "Mozilla/4.02 [en] (X11; I; SunOS 5.6 sun4u)",
type: "B"
},
%{
comment: "",
description: "Dulance Bot - Dulance automated price comparison engine",
id: "id_moz_161105_3",
link1: "http://www.dulance.com/",
link2: "",
name: "Mozilla/4.04 (compatible; Dulance bot; +http://www.dulance.com/bot.jsp)",
type: "R"
},
%{
comment: "",
description: "Netscape 4.x HP-Unix",
id: "id_moz_916",
link1: "",
link2: "",
name: "Mozilla/4.04 [en] (X11; I; HP-UX B.10.20 9000/712)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.x IRIX",
id: "id_moz_917",
link1: "",
link2: "",
name: "Mozilla/4.04 [en] (X11; I; IRIX 5.3 IP22)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.x Macintosh 68k",
id: "id_moz_918",
link1: "",
link2: "",
name: "Mozilla/4.05 (Macintosh; I; 68K Nav)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.x Macintosh PowerPC",
id: "id_moz_919",
link1: "",
link2: "",
name: "Mozilla/4.05 (Macintosh; I; PPC Nav)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.x SunOS 4.1.4",
id: "id_moz_920",
link1: "",
link2: "",
name: "Mozilla/4.05 [en] (X11; I; SunOS 4.1.4 sun4m)",
type: "B"
},
%{
comment: "",
description: "Version 4.08 [en]-98306",
id: "id_moz_921",
link1: "",
link2: "",
name: "Mozilla/4.08 [en] (Win98; U ;Nav)",
type: "Someone copied the help function in the referrer field ?"
},
%{
comment: "",
description: "Netscape 4.x WinNT",
id: "id_moz_922",
link1: "",
link2: "",
name: "Mozilla/4.08 [en] (WinNT; U)",
type: "B"
},
%{
comment: "",
description: "Echo.com robot",
id: "id_moz_911",
link1: "http://www.echo.com",
link2: "",
name: "Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_TrueRobot/1.4 libwww/5.2.8",
type: "R"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_moz_912",
link1: "http://www.voila.fr",
link2: "",
name: "Mozilla/4.0_(compatible;_MSIE_5.0;_Windows_95)_VoilaBot/1.6 libwww/5.3.2",
type: "R"
},
%{
comment: "",
description: "HTTrack Offline Browser",
id: "id_moz_923",
link1: "http://www.httrack.com/",
link2: "",
name: "Mozilla/4.5 (compatible; HTTrack 3.0x; Windows 98)",
type: "B D"
},
%{
comment: "",
description: "iCab MAC Web browser MAC Power PC",
id: "id_moz_924",
link1: "http://www.icab.de",
link2: "",
name: "Mozilla/4.5 (compatible; iCab 2.5.3; Macintosh; I; PPC)",
type: "B"
},
%{
comment: "",
description: "OmniWeb 4.x.x Mac browser",
id: "id_moz_925",
link1: "http://www.omnigroup.com",
link2: "",
name: "Mozilla/4.5 (compatible; OmniWeb/4.0.5; Mac_PowerPC)",
type: "B"
},
%{
comment: "",
description: "OmniWeb 4.x.x Mac browser",
id: "id_moz_926",
link1: "http://www.omnigroup.com",
link2: "",
name: "Mozilla/4.5 (compatible; OmniWeb/4.1-beta-1; Mac_PowerPC)",
type: "B"
},
%{
comment: "",
description: "different IPs using the HTTPClient library (mostly link checking)",
id: "id_moz_928",
link1: "http://www.innovation.ch",
link2: "",
name: "Mozilla/4.5 RPT-HTTPClient/0.3-2",
type: "C R"
},
%{
comment: "",
description: "RuralNet Internet Services",
id: "id_moz_927",
link1: "http://www.ruralnet.net.au",
link2: "",
name: "Mozilla/4.5 [en]C-CCK-MCD {RuralNet} (Win98; I)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.x Linux",
id: "id_moz_929",
link1: "",
link2: "",
name: "Mozilla/4.5b1 [en] (X11; I; Linux 2.0.35 i586)",
type: "B"
},
%{
comment: "",
description: "Cnet robot for Search.com (216.239.114.xx)",
id: "id_moz_301105_3",
link1: "http://www.search.com/",
link2: "http://www.cnet.com/",
name: "Mozilla/4.6 [en] (http://www.cnet.com/)",
type: "R"
},
%{
comment: "",
description: "Netscape 4.x OS/2",
id: "id_moz_930",
link1: "",
link2: "",
name: "Mozilla/4.61 [de] (OS/2; I)",
type: "B"
},
%{
comment: "",
description: "BrowseX cross-platform browser",
id: "id_moz_931",
link1: "http://browsex.com/",
link2: "",
name: "Mozilla/4.61 [en] (X11; U; ) - BrowseX (2.0.0 Windows)",
type: "B"
},
%{
comment: "",
description: "Nameprotect (12.148.196.128 - 12.148.196.255) snoopbot",
id: "id_moz_932",
link1: "http://www.nameprotect.com",
link2: "",
name: "Mozilla/4.7",
type: "R"
},
%{
comment: "",
description: "Eidetica earch and text mining spider",
id: "id_moz_933",
link1: "http://eidetica.com/",
link2: "",
name: "Mozilla/4.7 (compatible; http://eidetica.com/spider)",
type: "R"
},
%{
comment: "",
description: "Intelliseek (64.158.138.xx) robot",
id: "id_moz_934",
link1: "http://www.intelliseek.com",
link2: "",
name: "Mozilla/4.7 (compatible; Intelliseek; http://www.intelliseek.com)",
type: "R"
},
%{
comment: "",
description: "OffByOne Browser",
id: "id_moz_935",
link1: "http://www.offbyone.com",
link2: "",
name: "Mozilla/4.7 (compatible; OffByOne; Windows 98) Webster Pro V3.2",
type: "B"
},
%{
comment: "closed since May 2002",
description: "WhizBang! Labs information extraction robot",
id: "id_moz_937",
link1: "http://www.whizbang.com",
link2: "",
name: "Mozilla/4.7 (compatible; Whizbang)",
type: "R"
},
%{
comment: "closed since May 2002",
description: "WhizBang! Labs information extraction robot",
id: "id_moz_936",
link1: "http://www.whizbang.com",
link2: "",
name: "Mozilla/4.7 (compatible; WhizBang; http://www.whizbang.com/crawler)",
type: "R"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Becomecom shopping search (64.124.85.xx(x))",
id: "id_moz_938",
link1: "http://www.become.com",
link2: "",
name: "Mozilla/4.7 [en](BecomeBot@exava.com)",
type: "R"
},
%{
comment: "",
description: "Exabot - exava shopping search (64.124.85.xx(x))",
id: "id_moz_939",
link1: "http://www.exava.com",
link2: "",
name: "Mozilla/4.7 [en](Exabot@exava.com)",
type: "R"
},
%{
comment: "",
description: "unknown",
id: "id_moz_940",
link1: "",
link2: "",
name: "Mozilla/4.7 [en]C-CCK-MCD {Yahoo;YIP052400} (Win95; I)",
type: ""
},
%{
comment: "",
description: "http://www.ba.be robot",
id: "id_moz_941",
link1: "http://www.ba.be",
link2: "",
name: "Mozilla/4.72 [en] (BACS http://www.ba.be)",
type: "R"
},
%{
comment: "",
description: "Netscpape 4.7x Caldera Open Linux Pentium III",
id: "id_moz_942",
link1: "",
link2: "",
name: "Mozilla/4.72C-CCK-MCD Caldera Systems OpenLinux [en] (X11; U; Linux 2.2.14 i686)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.7x Japan OSF1 alpha",
id: "id_moz_943",
link1: "",
link2: "",
name: "Mozilla/4.75C-ja [ja] (X11; U; OSF1 V5.1 alpha)",
type: "B"
},
%{
comment: "",
description: "Opera 5.x Win 98",
id: "id_moz_944",
link1: "",
link2: "",
name: "Mozilla/4.76 (Windows 98; U) Opera 5.12 [en]",
type: "B"
},
%{
comment: "",
description: "Netscape 4.7x FreeBSD",
id: "id_moz_945",
link1: "",
link2: "",
name: "Mozilla/4.76 [en] (X11; U; FreeBSD 4.4-STABLE i386)",
type: "B"
},
%{
comment: "",
description: "Netscape 4.7x SunOS",
id: "id_moz_946",
link1: "",
link2: "",
name: "Mozilla/4.76 [en] (X11; U; SunOS 5.7 sun4u)",
type: "B"
},
%{
comment: "",
description: "IRIX 6.5",
id: "id_moz_947",
link1: "",
link2: "",
name: "Mozilla/4.77C-SGI [en] (X11; U; IRIX 6.5 IP32)",
type: "B"
},
%{
comment: "",
description: "GigaMedia / NTT DoCoMo robot",
id: "id_moz_948",
link1: "http://ir.giga.net.tw/products.htm",
link2: "",
name: "Mozilla/5.0",
type: "R"
},
%{
comment: "64.106.253.1xx",
description:
"Eurekster Swicki community search using SLI-Systems site search engine Mammoth",
id: "id_moz_040707_3",
link1: "http://www.eurekster.com/",
link2: "http://www.sli-systems.com/",
name: "Mozilla/5.0 (+http://www.eurekster.com/mammoth) Mammoth/0.1",
type: "R"
},
%{
comment: "s. also mammoth/1.0 ...",
description: "SLI Systems mammoth robot",
id: "id_moz_240306_2",
link1: "http://www.sli-systems.com/",
link2: "http://www.tenspider.com/business-blog/more.php?id=A45_0_1_0_M",
name: "Mozilla/5.0 (+http://www.sli-systems.com/) Mammoth/0.1",
type: "R"
},
%{
comment: "",
description: "Clush search robot",
id: "id_moz_949",
link1: "http://www.clush.com",
link2: "",
name: "Mozilla/5.0 (Clustered-Search-Bot/1.0; support@clush.com; http://www.clush.com/)",
type: "R"
},
%{
comment: "",
description: "Greasemonkey RSS panel Firefox plugin",
id: "id_moz_020807_1",
link1: "http://www.xs4all.nl/~jlpoutre/BoT/Javascript/RSSpanel/",
link2: "",
name: "Mozilla/5.0 (compatible) GM RSS Panel X",
type: "B"
},
%{
comment: "216.168.43.1xx",
description: "Evri search robot",
id: "id_moz_140209_3",
link1: "http://www.evri.com/",
link2: "",
name: "Mozilla/5.0 (compatible; +http://www.evri.com/evrinid)",
type: "R"
},
%{
comment: "",
description: "008 distributed crawler for 80legs",
id: "id_moz_250310_1",
link1: "http://www.80legs.com/spider.html",
link2: "",
name:
"Mozilla/5.0 (compatible; 008/0.83; http://www.80legs.com/spider.html;) Gecko/2008032620",
type: "R"
},
%{
comment: "77.233.225.11x",
description: "Abonti WebSearch beta robot",
id: "id_moz_140209_4",
link1: "http://www.abonti.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Abonti/0.8 - http://www.abonti.com)",
type: "R"
},
%{
comment: "195.128.18.xx",
description: "HitCompanies Aihit crawler",
id: "id_moz_030110_4",
link1: "http://hitcompanies.aihit.com/search.htm",
link2: "",
name: "Mozilla/5.0 (compatible; aiHitBot/1.0; +http://www.aihit.com/)",
type: "R"
},
%{
comment: "203.206.162.x",
description: "Ansearch Australian search robot",
id: "id_moz_300406_1",
link1: "http://www.ansearch.com.au/",
link2: "",
name: "Mozilla/5.0 (compatible; AnsearchBot/1.x; +http://www.ansearch.com.au/)",
type: "R"
},
%{
comment: "207.241.232.1xx",
description: "The Library of Congress Minerva crawler",
id: "id_moz_011107_1",
link1: "http://www.loc.gov/minerva/crawl.html",
link2: "",
name:
"Mozilla/5.0 (compatible; archive.org_bot/1.10.0 +http://www.loc.gov/minerva/crawl.html)",
type: "R"
},
%{
comment: "s.also - InternetArchive/0.8-dev - Mozilla/5.0 (compatible;archive.org_bot/...",
description: "Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)",
id: "id_moz_230607_2",
link1: "http://www.archive.org/",
link2: "",
name: "Mozilla/5.0 (compatible; archive.org_bot/1.13.1x http://crawler.archive.org)",
type: "R"
},
%{
comment: "s. also - InternetArchive/0.8-dev... - mozilla/5.0 (compatible; heritrix/...",
description: "Heritrix - The Internet Archive's open-source crawler",
id: "id_moz_141105_1",
link1: "http://www.archive.org/",
link2: "",
name:
"Mozilla/5.0 (compatible; archive.org_bot/1.5.0-200506132127 http://crawler.archive.org) Hurricane Katrina",
type: "R"
},
%{
comment: " 65.214.45.[x]xx",
description: "Ask Jeeves /Teoma robot",
id: "id_moz_150207_2",
link1: "http://sp.ask.com",
link2: "",
name:
"Mozilla/5.0 (compatible; Ask Jeeves/Teoma; http://about.ask.com/en/docs/about/webmasters.shtml)",
type: "R"
},
%{
comment: "s. also BanBots/1.2...",
description: "Project BanBots Perl script robot",
id: "id_moz_291205_2",
link1: "http://www.banbots.com/",
link2: "",
name: "Mozilla/5.0 (compatible; BanBots/2.0b; Fetch; +http://www.banbots.com)",
type: "C"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Become.com shopping search (64.124.85.xx(x))",
id: "id_moz_950",
link1: "http://www.become.com",
link2: "",
name: "Mozilla/5.0 (compatible; BecomeBot/1.23; http://www.become.com/webmasters.html)",
type: "R"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Become.com shopping search (64.124.85.xx(x))",
id: "id_moz_951",
link1: "http://www.become.com",
link2: "",
name:
"Mozilla/5.0 (compatible; BecomeBot/1.xx; MSIE 6.0 compatible; http://www.become.com/webmasters.html)",
type: "R"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Become.com shopping search (64.124.85.xx(x))",
id: "id_moz_952",
link1: "http://www.become.com",
link2: "",
name:
"Mozilla/5.0 (compatible; BecomeBot/2.0beta; http://www.become.com/webmasters.html)",
type: "R"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Become.com shopping search (64.124.85.xx(x))",
id: "id_moz_953",
link1: "http://www.become.com",
link2: "",
name:
"Mozilla/5.0 (compatible; BecomeBot/2.x; MSIE 6.0 compatible; http://www.become.com/site_owners.html)",
type: "R"
},
%{
comment: "64.124.85.[x]xx",
description: "BecomeBot - Become.com shopping search (64.124.85.xx(x))",
id: "id_moz_090506_2",
link1: "http://www.become.com",
link2: "",
name:
"Mozilla/5.0 (compatible; BecomeJPBot/2.3; MSIE 6.0 compatible; +http://www.become.co.jp/site_owners.html)",
type: "R"
},
%{
comment: "69.90.42.xx",
description: "BlogRefsBot.com blog robot",
id: "id_moz_020907_1",
link1: "http://www.blogrefs.com/",
link2: "http://www.blogrefs.com/about/bloggers",
name: "Mozilla/5.0 (compatible; BlogRefsBot/0.1; http://www.blogrefs.com/about/bloggers)",
type: "R"
},
%{
comment: "87.164.242.1xx",
description: "Pressemitteilungen Webservice RSS / news crawler (Germany)",
id: "id_moz_171107_1",
link1: "http://pressemitteilung.ws/",
link2: "",
name: "Mozilla/5.0 (compatible; Bot; +http://pressemitteilung.ws/spamfilter",
type: "R"
},
%{
comment: "213.251.187.1xx",
description: "BuzzRanking internet content analysis",
id: "id_moz_031206_1",
link1: "http://www.buzzrankingbot.com/",
link2: "",
name: "Mozilla/5.0 (compatible; BuzzRankingBot/1.0; +http://www.buzzrankingbot.com/)",
type: "R"
},
%{
comment: "209.249.86.x",
description: "Charlotte indexing spider for Searchme / Wikiseek",
id: "id_moz_310506_1",
link1: "http://www.searchme.com/",
link2: "http://www.wikiseek.com/",
name: "Mozilla/5.0 (compatible; Charlotte/1.0b; charlotte@betaspider.com)",
type: "R"
},
%{
comment: "209.249.86.x",
description: "Charlotte indexing spider for Searchme / Wikiseek",
id: "id_moz_080307_1",
link1: "http://www.searchme.com/",
link2: "http://www.wikiseek.com/",
name: "Mozilla/5.0 (compatible; Charlotte/1.0b; http://www.searchme.com/support/)",
type: "R"
},
%{
comment: "doesn't read robots.txt",
description:
"Unknown graphics crawler or downloading agent from Yamana Laboratory - Waseda Univerity Japan (133.9.238.xx)",
id: "id_moz_220106_1",
link1: "http://www.yama.info.waseda.ac.jp/eng/index.html",
link2: "",
name: "Mozilla/5.0 (compatible; Crawling jpeg; http://www.yama.info.waseda.ac.jp)",
type: "R"
},
%{
comment: "s. also - Custo x.x (www.netwu.com)",
description: "Custo web site spidering tool (link checking)",
id: "id_moz_954",
link1: "http://www.netwu.com",
link2: "",
name: "Mozilla/5.0 (compatible; Custo 3 (Netwu.com); Windows NT 5.1)",
type: "C"
},
%{
comment: "67.202.29.xx",
description: "De.com German travel related search via Amazon Web Services",
id: "id_moz_071207_1",
link1: "http://www.de.com/start.php?homepage=true",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name: "Mozilla/5.0 (compatible; de/1.13.2 +http://www.de.com)",
type: "R"
},
%{
comment: "64.71.190.13x",
description: "Diffbot beta - RSS and news feed crawler",
id: "id_moz_170109_1",
link1: "http://www.diffbot.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Diffbot/0.1; +http://www.diffbot.com)",
type: "R"
},
%{
comment: "212.214.165.2xx",
description: "DNS-Digger - DNS server neighbourhood search",
id: "id_moz_030207_1",
link1: "http://www.dnsdigger.com/",
link2: "",
name: "Mozilla/5.0 (compatible; DNS-Digger-Explorer/1.0; +http://www.dnsdigger.com)",
type: "R"
},
%{
comment: "212.214.165.2xx",
description: "DNS-Digger - DNS server neighbourhood search",
id: "id_moz_100606_2",
link1: "http://www.dnsdigger.com/",
link2: "",
name: "Mozilla/5.0 (compatible; DNS-Digger/1.0; +http://www.dnsdigger.com)",
type: "R"
},
%{
comment: "s. also EARTHCOM ..",
description: "Earthcom (Czech Republic) search robot (194.108.39.xx)",
id: "id_moz_020506_1",
link1: "http://www.earthcom.info",
link2: "",
name: "Mozilla/5.0 (compatible; EARTHCOM.info/2.01; http://www.earthcom.info)",
type: "R"
},
%{
comment: "",
description: "enter4u / Earthcom.info search (Czech Republic)",
id: "id_moz_190807_3",
link1: "http://enter4u.eu/",
link2: "http://www.earthcom.info",
name: "Mozilla/5.0 (compatible; EARTHCOM/2.2; +http://enter4u.eu)",
type: "R"
},
%{
comment: "195.113.20.125",
description:
"Prague Faculty of Mathematics and Physics using Egothor open source crawler",
id: "id_moz_050107_1",
link1: "http://ego.ms.mff.cuni.cz/",
link2: "http://www.egothor.org/",
name: "Mozilla/5.0 (compatible; egothor/8.0g; +http://ego.ms.mff.cuni.cz/)",
type: "P"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_moz_310507_1",
link1: "http://www.exabot.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Exabot Test/3.0; +http://www.exabot.com/go/robot)",
type: "R"
},
%{
comment: "64.124.148.xx[x]",
description: "TheFind.com - Shopping search robot",
id: "id_moz_221207_1",
link1: "http://www.thefind.com/",
link2: "",
name:
"Mozilla/5.0 (compatible; FatBot 2.0; http://www.thefind.com/main/CrawlerFAQs.fhtml)",
type: "R"
},
%{
comment: "",
description: "Galbot tagging robot (beta) - Denmark",
id: "id_moz_170109_2",
link1: "http://www.galbot.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Galbot/1.0; +http://www.galbot.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Geneva Single-Site Search Engine used by Healthdash health search",
id: "id_moz_955",
link1: "http://www.healthdash.com",
link2: "",
name: "mozilla/5.0 (compatible; genevabot http://www.healthdash.com)",
type: "R"
},
%{
comment: "",
description: "Paros - a Java based HTTP/HTTPS proxy",
id: "id_moz_170207_4",
link1: "http://sourceforge.net/projects/paros",
link2: "",
name: "Mozilla/5.0 (compatible; Google Desktop) Paros/3.2.12",
type: "P"
},
%{
comment: "s. also: - Googlebot - Mozilla/4.0 (MobilePhone SCP ...",
description: "Google robot",
id: "id_moz_956",
link1: "http://www.google.com",
link2: "",
name: "Mozilla/5.0 (compatible; Googlebot/2.1; http://www.google.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Unknown robot using Heritrix",
id: "id_moz_957",
link1: "http://innovationblog.com",
link2: "http://crawler.archive.org/",
name: "mozilla/5.0 (compatible; heritrix/1.0.4 http://innovationblog.com)",
type: "R"
},
%{
comment: "171.67.73.1x",
description: "The Stanford University InfoLab robot using Heritrix",
id: "id_moz_280207_1",
link1: "http://i.stanford.edu/",
link2: "http://www.archive.org/",
name: "Mozilla/5.0 (compatible; heritrix/1.10.2 +http://i.stanford.edu/)",
type: "R"
},
%{
comment: "195.39.35.1xx",
description: "Newstin news feed search using Heritrix",
id: "id_moz_280108_2",
link1: "http://www.newstin.com/",
link2: "",
name: "Mozilla/5.0 (compatible; heritrix/1.12.1 +http://newstin.com/)",
type: "R"
},
%{
comment: "72.44.62.1xx",
description: "Page-store.com vertical search via Amazon Web Services",
id: "id_moz_210807_1",
link1: "http://www.page-store.com/",
link2: "http://www.amazonaws.com/",
name: "Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com)",
type: "R"
},
%{
comment: "72.44.62.1xx",
description: "Page-store.com vertical search via Amazon Web Services",
id: "id_moz_230108_1",
link1: "http://www.page-store.com/",
link2: "http://www.amazonaws.com/",
name:
"Mozilla/5.0 (compatible; heritrix/1.12.1 +http://www.page-store.com) [email:paul@page-store.com]",
type: "R"
},
%{
comment: "",
description: "Heritrix Internet Archive's open-source web project ",
id: "id_moz_958",
link1: "http://archive.crawler.org",
link2: "",
name: "mozilla/5.0 (compatible; heritrix/1.3.0 http://archive.crawler.org)",
type: "R"
},
%{
comment: "",
description: "Chepi Beta search Spain (194.116.240.1xx) using Heritrix",
id: "id_moz_270106_2",
link1: "http://www.chepi.net/",
link2: "http://lucene.apache.org",
name: "Mozilla/5.0 (compatible; heritrix/1.4.0 +http://www.chepi.net)",
type: "R"
},
%{
comment: "",
description: "Truveo data mining robot using Heritrix",
id: "id_moz_959",
link1: "http://www.truveo.com/home/",
link2: "http://crawler.archive.org/",
name: "Mozilla/5.0 (compatible; heritrix/1.4t http://www.truveo.com/)",
type: "R"
},
%{
comment: "",
description: "L3S WebCrawling Project (Germany) using Heritrix",
id: "id_moz_960",
link1: "http://www.l3s.de/~kohlschuetter/projects/crawling/",
link2: "http://crawler.archive.org/",
name:
"Mozilla/5.0 (compatible; heritrix/1.5.0 http://www.l3s.de/~kohlschuetter/projects/crawling/)",
type: "R"
},
%{
comment: "",
description: "Pandora Internet Archive crawler (Australia) using Heritrix",
id: "id_moz_961",
link1: "http://pandora.nla.gov.au",
link2: "http://crawler.archive.org/",
name:
"Mozilla/5.0 (compatible; heritrix/1.5.0-200506231921 http://pandora.nla.gov.au/crawl.html)",
type: "R"
},
%{
comment: "137.82.84.xx",
description:
"WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler",
id: "id_moz_250706_3",
link1: "http://www.worio.com/",
link2: "http://www.archive.org/",
name: "Mozilla/5.0 (compatible; heritrix/1.6.0 http://www.worio.com/)",
type: "R"
},
%{
comment: "63.209.222.",
description: "greatarea.com website collection project using Heritrix",
id: "id_moz_190607_1",
link1: "http://www.greaterera.com/",
link2: "",
name: "Mozilla/5.0 (compatible; heritrix/1.7.0 +http://www.greaterera.com/)",
type: "R"
},
%{
comment: "216.182.238.",
description: "hanzo:web social web archiving service",
id: "id_moz_230307_1",
link1: "http://www.hanzoweb.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Heritrix/1.8.0 http://www.hanzoarchives.com)",
type: "D"
},
%{
comment: "72.20.99.xx",
description: "Accelobot - Accelovation Market Discovery software robot",
id: "id_moz_151106_1",
link1: "http://www.accelobot.com/",
link2: "http://www.accelovation.com/solutions.html",
name: "Mozilla/5.0 (compatible; heritrix/1.x.x +http://www.accelobot.com)",
type: "R"
},
%{
comment: "64.236.128.x",
description: "Unknown AOL robot using Heritrix",
id: "id_moz_030208_1",
link1: "http://www.aol.com/",
link2: "",
name: "Mozilla/5.0 (compatible; heritrix/2.0.0-RC1 +http://www.aol.com)",
type: "R"
},
%{
comment: "72.55.165.11x",
description: "Hermits Search.com - Products and service search robot",
id: "id_moz_051207_2",
link1: "http://www.hermitsearch.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Hermit Search. Com; +http://www.hermitsearch.com)",
type: "R"
},
%{
comment: "142.179.247.xx",
description: "IsMySiteUp? - Online website monitoring service",
id: "id_moz_161006_2",
link1: "http://www.ismysiteup.net/",
link2: "",
name: "Mozilla/5.0 (compatible; http://www.IsMySiteUp.Net/bot/ )",
type: "C"
},
%{
comment: "142.179.247.xx",
description: "UptimeAuditor - real time web monitoring",
id: "id_moz_101106_2",
link1: "http://www.uptimeauditor.com/",
link2: "",
name: "Mozilla/5.0 (compatible; http://www.UptimeAuditor.com/bot/ )",
type: "C"
},
%{
comment: "64.40.113.[x]xx",
description: "Hyperix vertical search crawler",
id: "id_moz_180508_1",
link1: "http://www.hyperix.com/",
link2: "",
name: "Mozilla/5.0 (compatible; HyperixScoop/1.3; +http://www.hyperix.com)",
type: "R"
},
%{
comment: "Not from iask.com.cn - s. also iaskspider",
description: "Unknown robot (reads robots.txt) from chinatelecom (219.142.78.xx)",
id: "id_moz_070406_1",
link1: "",
link2: "",
name: "Mozilla/5.0 (compatible; iaskspider/1.0; MSIE 6.0)",
type: ""
},
%{
comment: "67.159.44.2xx",
description: "ID-Search.org - Russian search project",
id: "id_moz_280607_1",
link1: "http://id-search.org/bot.html",
link2: "",
name: "Mozilla/5.0 (compatible; IDBot/1.0; +http://www.id-search.org/bot.html)",
type: "R"
},
%{
comment: "",
description: "Najdi.si (Slovenia) search using Interseek/Web Interseek/API Search Engine",
id: "id_moz_962",
link1: "http://www.najdi.si/pomoc/eng/index.jsp",
link2: "",
name: "Mozilla/5.0 (compatible; InterseekWeb/3.x)",
type: "R"
},
%{
comment: "216.182.238.",
description: "hanzo:web social web archiving service",
id: "id_moz_130807_4",
link1: "http://www.hanzoweb.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Jim +http://www.hanzoarchives.com)",
type: "D"
},
%{
comment: "",
description: "Konqueror 2.0.x X11",
id: "id_moz_963",
link1: "http://www.konqueror.org/",
link2: "",
name:
"Mozilla/5.0 (compatible; Konqueror/2.0.1; X11); Supports MD5-Digest; Supports gzip encoding",
type: "B"
},
%{
comment: "",
description: "Konqueror 2.1.x X11",
id: "id_moz_964",
link1: "http://www.konqueror.org/",
link2: "",
name: "Mozilla/5.0 (compatible; Konqueror/2.1.1; X11)",
type: "B"
},
%{
comment: "",
description: "Konqueror 2.2.x",
id: "id_moz_966",
link1: "http://www.konqueror.org/",
link2: "",
name: "Mozilla/5.0 (compatible; Konqueror/2.2.2)",
type: "B"
},
%{
comment: "",
description: "Konqueror 2.2.x Linux",
id: "id_moz_965",
link1: "http://www.konqueror.org/",
link2: "",
name: "Mozilla/5.0 (compatible; Konqueror/2.2.2; Linux 2.4.14-xfs; X11; i686)",
type: "B"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_moz_050108_2",
link1: "http://www.exabot.com/",
link2: "",
name:
"Mozilla/5.0 (compatible; Konqueror/3.5; Linux) KHTML/3.5.5 (like Gecko) (Exabot-Thumbnails)",
type: "R"
},
%{
comment: "",
description: "Lemur Consulting LemIR spider",
id: "id_moz_967",
link1: "http://www.lemurconsulting.com",
link2: "",
name: "Mozilla/5.0 (compatible; LemSpider 0.1)",
type: "R"
},
%{
comment: "s.also LinksManager.com",
description: "Linksmanager.com online link checking service",
id: "id_moz_968",
link1: "http://www.linksmanager.com",
link2: "",
name:
"Mozilla/5.0 (compatible; LinksManager.com_bot http://linksmanager.com/linkchecker.html)",
type: "C"
},
%{
comment: "",
description: "LinkStash Bookmark Manager",
id: "id_moz_140408_2",
link1: "http://www.xrayz.co.uk/",
link2: "",
name: "Mozilla/5.0 (compatible; LinkStash Bookmark Manager; http://www.xrayz.co.uk/)",
type: "C"
},
%{
comment: "s. also MojeekBot/0.x",
description: "Mojeek Search Preview robot (217.155.205.xx)",
id: "id_moz_060706_2",
link1: "http://www.mojeek.com",
link2: "",
name: "Mozilla/5.0 (compatible; MojeekBot/2.0; http://www.mojeek.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Joomla!/Mambo component - MosBookmarks (bot) link checking",
id: "id_moz_290107_1",
link1: "http://www.tegdesign.ch/",
link2: "",
name: "Mozilla/5.0 (compatible; MOSBookmarks/v2.6-Plus; Link Checker)",
type: "C"
},
%{
comment: "71.134.235.xx",
description: "PodTech entertainment and video network crawler",
id: "id_moz_091007_1",
link1: "http://www.podtech.net/home/",
link2: "",
name: "Mozilla/5.0 (compatible; MSIE 6.0; Podtech Network; crawler_admin@podtech.net)",
type: "R"
},
%{
comment: "s. also - Onet.pl SA",
description: "onet.pl Szukaj (Search) robot (213.180.128.1xx)",
id: "id_moz_969",
link1: "http://szukaj.onet.pl",
link2: "",
name: "Mozilla/5.0 (compatible; OnetSzukaj/5.0; http://szukaj.onet.pl)",
type: "R"
},
%{
comment: "70.85.129.12x",
description: "Pagestacker online bookmark service",
id: "id_moz_181207_1",
link1: "http://www.pagestacker.com/",
link2: "",
name: "Mozilla/5.0 (compatible; PagestackerBot; http://www.pagestacker.com)",
type: "C"
},
%{
comment: "80.59.111.2xx",
description: "PalmeraBot - Links24h.com search engine robot",
id: "id_moz_020307_1",
link1: "http://www.links24h.com/",
link2: "http://www.links24h.com/help/palmera/",
name:
"Mozilla/5.0 (compatible; PalmeraBot; http://www.links24h.com/help/palmera) Version 0.001",
type: "R"
},
%{
comment: "210.188.205.2xx",
description: "FeedMo feed search (Japan) using Pear HTTP",
id: "id_moz_130806_1",
link1: "http://feed.moo.jp/",
link2: "http://pear.php.net/",
name: "Mozilla/5.0 (compatible; PEAR HTTP_Request class; http://feed.moo.jp/)",
type: "C ?"
},
%{
comment: "",
description: "PHONifier mobile access to web content",
id: "id_moz_190607_2",
link1: "http://www.phonifier.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Phonifier; +http://www.phonifier.com)",
type: "D B"
},
%{
comment: "74.208.25.118 / 216.15.74.85",
description: "pmoz.info ODP link checking bot",
id: "id_moz_240208_2",
link1: "http://pmoz.info/doc/botinfo.htm",
link2: "http://www.dmoz.org/",
name:
"Mozilla/5.0 (compatible; pmoz.info ODP link checker; +http://pmoz.info/doc/botinfo.htm)",
type: "C"
},
%{
comment: "89.143.229.1xx",
description: "Pogodak search (Slovenia) robot via Interseek",
id: "id_moz_970",
link1: "http://www.pogodak.hr",
link2: "http://www.interseek.com/",
name: "Mozilla/5.0 (compatible; pogodak.ba/3.x)",
type: "R"
},
%{
comment: "89.143.229.1xx",
description: "Pogodak search (Slovenia) robot via Interseek",
id: "id_moz_100408_2",
link1: "http://www.pogodak.hr",
link2: "http://www.interseek.com/",
name: "Mozilla/5.0 (compatible; Pogodak.hr/3.1)",
type: "R"
},
%{
comment: "",
description: "Proximic Publisher Widget - RSS and news content generator",
id: "id_moz_101107_1",
link1: "http://www.proximic.com/",
link2: "",
name:
"Mozilla/5.0 (compatible; Proximic crawler; +http://www.proximic.com/en/about-us/contact-us.html)",
type: "C"
},
%{
comment: "62.149.236.2xx",
description: "ProgramacionWeb.net PWeBot crawler (Argentina)",
id: "id_moz_230907_1",
link1: "http://www.programacionweb.net/robot-en.php",
link2: "http://www.programacionweb.net/",
name: "Mozilla/5.0 (compatible; PWeBot/3.1; http://www.programacionweb.net/robot.php)",
type: "R"
},
%{
comment: "",
description: "Quantcast - Open Internet Ratings Service",
id: "id_moz_130507_1",
link1: "http://www.quantcast.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Quantcastbot/1.0; www.quantcast.com)",
type: "R"
},
%{
comment: "",
description: "robtex - Multi-RBL check and AS-numbercheck",
id: "id_moz_190706_1",
link1: "http://www.robtex.com/",
link2: "",
name: "Mozilla/5.0 (compatible; robtexbot/1.0; http://www.robtex.com/ )",
type: "C"
},
%{
comment: "",
description: "ScoutJet (Blekko) search web crawler",
id: "id_moz_050408_1",
link1: "http://www.scoutjet.com/",
link2: "",
name: "Mozilla/5.0 (compatible; ScoutJet; +http://www.scoutjet.com/)",
type: "R"
},
%{
comment: "s.also Scrubby/2.x ",
description: "Scrub the web robot (66.93.156.xx)",
id: "id_moz_300106_3",
link1: "http://www.scrubtheweb.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Scrubby/2.2; http://www.scrubtheweb.com/)",
type: "R"
},
%{
comment: "",
description: "Shunixbot (France) beta / test semantic web indexing robot",
id: "id_moz_031107_4",
link1: "http://www.shunix.com/",
link2: "",
name: "Mozilla/5.0 (compatible; ShunixBot/1.x.x +http://www.shunix.com/robot.htm)",
type: "R"
},
%{
comment: "",
description: "Shunixbot (France) beta / test semantic web indexing robot",
id: "id_moz_971",
link1: "http://www.shunix.com/",
link2: "",
name: "Mozilla/5.0 (compatible; ShunixBot/1.x; http://www.shunix.com/bot.htm)",
type: "R"
},
%{
comment: "64.15.69.x",
description: "Skreemr - Audio search engine",
id: "id_moz_280607_2",
link1: "http://skreemr.com/",
link2: "",
name: "Mozilla/5.0 (compatible; SkreemRBot +http://skreemr.com)",
type: "R"
},
%{
comment: "",
description: "Snap Firefox Search Plugin",
id: "id_moz_070207_2",
link1: "http://www.snap.com/about/spa1A.php",
link2: "",
name:
"Mozilla/5.0 (compatible; SnapPreviewBot; en-US; rv:1.8.0.9) Gecko/20061206 Firefox/1.5.0.9",
type: "B"
},
%{
comment: "",
description: "Spurl.net bookmark service & search engine (84.40.30.xxx)",
id: "id_moz_972",
link1: "http://www.spurl.net",
link2: "",
name: "Mozilla/5.0 (compatible; SpurlBot/0.2) ",
type: "R C"
},
%{
comment: "208.79.17.x[x]",
description: "Summize - Opinion and review search robot",
id: "id_moz_190108_1",
link1: "http://www.summize.com/",
link2: "",
name: "Mozilla/5.0 (compatible; SummizeBot +http://www.summize.com)",
type: "R"
},
%{
comment: "",
description: "Syclik Control web content management system",
id: "id_moz_973",
link1: "http://www.syclik.com",
link2: "",
name: "Mozilla/5.0 (compatible; SYCLIKControl/LinkChecker;)",
type: "R C"
},
%{
comment: "212.12.114.2xx",
description: "Synoo web directory robot",
id: "id_moz_070607_1",
link1: "http://www.synoo.com/search/bot.html",
link2: "",
name: "Mozilla/5.0 (compatible; Synoobot/0.9; http://www.synoo.com/search/bot.html)",
type: "R"
},
%{
comment: "",
description: "Theophrastus Internet Spider for a basic search engine project",
id: "id_moz_261105_1",
link1: "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php",
link2: "",
name:
"Mozilla/5.0 (compatible; Theophrastus/x.x; http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php)",
type: "R"
},
%{
comment: "213.253.92.x",
description: "Interseek - Java search engine technology used for Pogodak search",
id: "id_moz_030207_2",
link1: "http://www.interseek.com/",
link2: "http://www.pogodak.com/",
name: "Mozilla/5.0 (compatible; TridentSpider/3.1)",
type: "R"
},
%{
comment: "s.also - Mozilla/3.0 (Vagabondo... - Vagabondo..",
description: "WiseGuys robot",
id: "id_moz_974",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Mozilla/5.0 (compatible; Vagabondo/2.1; webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)",
type: "R"
},
%{
comment: "",
description: "Webdunia search (India) robot",
id: "id_moz_280209_4",
link1: "http://www.webdunia.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Webduniabot/1.0; +http://search.webdunia.com/bot.aspx)",
type: "R"
},
%{
comment: "",
description: "phpwebbrain online bookmark service (Germany)",
id: "id_moz_151205_1",
link1: "http://www.monsterli.ch/phpwebbrain/",
link2: "",
name:
"Mozilla/5.0 (compatible; Windows NT 5.0; phpwebbrainBot/0.1 - http://www.monsterli.ch/phpwebbrain/)",
type: "C"
},
%{
comment: "137.82.84.xx",
description:
"WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler",
id: "id_moz_150307_1",
link1: "http://www.worio.com/",
link2: "http://www.archive.org/",
name: "Mozilla/5.0 (compatible; worio bot heritrix/1.10.0 +http://worio.com)",
type: "R"
},
%{
comment: "76.12.83.24x",
description:
"Kathune spider for World of Warcraft guild data. Used to power WoW Lemmings",
id: "id_moz_221008_1",
link1: "http://www.wowlemmings.com/kathune.html",
link2: "http://www.wowlemmings.com/",
name:
"Mozilla/5.0 (compatible; WoW Lemmings Kathune/2.0;http://www.wowlemmings.com/kathune.html)",
type: "R"
},
%{
comment: "",
description: "eXternalTest - Server and online services monitoring",
id: "id_moz_260407_1",
link1: "http://www.externaltest.com/",
link2: "",
name: "Mozilla/5.0 (compatible; XTbot/1.0v; +http://www.externaltest.com)",
type: "C"
},
%{
comment: "66.196.77.1xx / 72.30.98.2xx",
description: "Yahoo / Inktomi search robot",
id: "id_moz_290606_2",
link1: "",
link2: "",
name:
"Mozilla/5.0 (compatible; Yahoo! DE Slurp; http://help.yahoo.com/help/us/ysearch/slurp)",
type: "R"
},
%{
comment: "",
description: "Inktomi robot (202.160.180.xxx) for Yahoo China",
id: "id_moz_181105_1",
link1: "http://www.yahoo.com.cn/",
link2: "http://www.inktomi.com/",
name: "Mozilla/5.0 (compatible; Yahoo! Slurp China; http://misc.yahoo.com.cn/help.html)",
type: "R"
},
%{
comment: "",
description: "Inktomi robot for Yahoo (via 66.196.xx.xxx)",
id: "id_moz_975",
link1: "http://www.inktomi.com",
link2: "",
name:
"Mozilla/5.0 (compatible; Yahoo! Slurp; http://help.yahoo.com/help/us/ysearch/slurp)",
type: "R"
},
%{
comment: "66.48.78.1xx",
description: "Yesup Seo - Toronto SEO Service",
id: "id_moz_061208_2",
link1: "http://yesupseo.com/",
link2: "",
name: "Mozilla/5.0 (compatible; YesupBot/1.0; +http://www.yesup.net/bot.html)",
type: "C"
},
%{
comment: "s. also yoono/1.0 web-crawler - yoofind/yoofind ..",
description: "Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)",
id: "id_moz_250107_1",
link1: "http://www.yoono.com/",
link2: "",
name: "Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/)",
type: "R"
},
%{
comment: "202.108.7.1xx",
description: "Youdao search (China) robot",
id: "id_moz_061208_3",
link1: "http://www.youdao.com/",
link2: "",
name:
"Mozilla/5.0 (compatible; YoudaoBot/1.0; http://www.youdao.com/help/webmaster/spider/; )",
type: "R"
},
%{
comment: "196.46.116.x[x] / 196.23.180.x[x]",
description: "Zenbot robot for the Southern African Zen search service",
id: "id_moz_050807_1",
link1: "http://zen.co.za/",
link2: "http://zen.co.za/webmasters/",
name: "Mozilla/5.0 (compatible; Zenbot/1.3; +http://zen.co.za/webmasters/)",
type: "R"
},
%{
comment: "67.202.34.xxx",
description:
"Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services",
id: "id_moz_110408_1",
link1: "http://www.powerset.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name:
"Mozilla/5.0 (compatible; zermelo +http://www.powerset.com) [email:paul@page-store.com,crawl@powerset.com]",
type: "R"
},
%{
comment: "s.also - InternetArchive/0.8-dev - archive.org_bot",
description: "Heritrix - The Internet Archive's open-source crawler (207.241.225.2xx)",
id: "id_moz_030606_1",
link1: "http://www.archive.org/",
link2: "",
name:
"Mozilla/5.0 (compatible;archive.org_bot/1.7.1; collectionId=316; Archive-It; +http://www.archive-it.org)",
type: "R"
},
%{
comment: "207.241.233.2xx",
description: "Wayback Machine Internet Archive crawler",
id: "id_moz_180906_2",
link1: "http://www.archive.org/index.php",
link2: "",
name:
"Mozilla/5.0 (compatible;archive.org_bot/heritrix-1.9.0-200608171144 +http://pandora.nla.gov.au/crawl.html)",
type: "R"
},
%{
comment: "74.93.15.249",
description: "FindITAnswers - Search engine for software developers",
id: "id_moz_180107_1",
link1: "http://www.finditanswers.com/",
link2: "",
name:
"Mozilla/5.0 (compatible;FindITAnswersbot/1.0;+http://search.it-influentials.com/bot.htm)",
type: "B"
},
%{
comment: "80.190.213.xx",
description: "Mainseek search (Poland) robot",
id: "id_moz_170906_2",
link1: "http://www.mainseek.com/",
link2: "",
name: "Mozilla/5.0 (compatible;MAINSEEK_BOT)",
type: "R"
},
%{
comment: "",
description: "MozShot - Technical demo to take screenshot of any URL",
id: "id_moz_290708_1",
link1: "http://mozshot.nemui.org/",
link2: "",
name: "Mozilla/5.0 (Gecko/20070310 Mozshot/0.0.20070628; http://mozshot.nemui.org/)",
type: "B"
},
%{
comment: "",
description: "Mozilla Firefox 3.0 beta (Gran Paradiso) for MacOS",
id: "id_moz_150408_2",
link1: "http://developer.mozilla.org/en/docs/Firefox_3_for_developers",
link2: "",
name:
"Mozilla/5.0 (Macintosh; U; Intel Mac OS X 10.4; en-US; rv:1.9b5) Gecko/2008032619 Firefox/3.0b5",
type: "B"
},
%{
comment: "",
description: "Chimera browser (Mozilla/Gecko engine) - now Camino Mac PowerPC",
id: "id_moz_976",
link1: "http://www.mozilla.org",
link2: "",
name:
"Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20021219 Chimera/0.6 ",
type: "B"
},
%{
comment: "",
description: "Camino browser (Mozilla/Gecko engine) - ex Chimera Mac PowerPC",
id: "id_moz_977",
link1: "http://www.mozilla.org",
link2: "",
name:
"Mozilla/5.0 (Macintosh; U; PPC Mac OS X Mach-O; en-US; rv:1.0.1) Gecko/20030306 Camino/0.7",
type: "B"
},
%{
comment: "",
description: "OmniWeb 5.x.x Mac OS X browser",
id: "id_moz_978",
link1: "http://www.omnigroup.com",
link2: "",
name:
"Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-US) AppleWebKit/xx (KHTML like Gecko) OmniWeb/v5xx.xx",
type: "B"
},
%{
comment: "",
description: "Safari 1.2x browser (Mozilla/Gecko engine) MAC OS X",
id: "id_moz_979",
link1: "http://www.apple.com",
link2: "",
name:
"Mozilla/5.0 (Macintosh; U; PPC Mac OS X; en-us) AppleWebKit/xxx.x (KHTML like Gecko) Safari/12x.x",
type: "B"
},
%{
comment: "",
description: "Netscape 6.x Mac PowerPC",
id: "id_moz_980",
link1: "",
link2: "",
name: "Mozilla/5.0 (Macintosh; U; PPC; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1",
type: "B"
},
%{
comment: "",
description: "unknown robot from gw.ocg-corp.com",
id: "id_moz_981",
link1: "",
link2: "",
name: "Mozilla/5.0 (research@mediatrec.com)",
type: ""
},
%{
comment: "",
description: "Sage - RSS and Atom feed reader extension for Mozilla Firefox",
id: "id_moz_260806_1",
link1: "http://sage.mozdev.org/",
link2: "",
name: "Mozilla/5.0 (Sage)",
type: "B"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos - NBCi etc.) robot",
id: "id_moz_982",
link1: "http://www.inktomi.com",
link2: "",
name: "Mozilla/5.0 (Slurp/cat; slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos - NBCi etc.) robot",
id: "id_moz_983",
link1: "http://www.inktomi.com",
link2: "",
name: "Mozilla/5.0 (Slurp/si; slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "",
description: "Opera 5.x SunOS",
id: "id_moz_984",
link1: "",
link2: "",
name: "Mozilla/5.0 (SunOS 5.8 sun4u; U) Opera 5.0 [en]",
type: "B"
},
%{
comment: "64.62.136.xxx",
description: "Twiceler experimental web crawler",
id: "id_moz_020507_1",
link1: "http://www.cuill.com/",
link2: "",
name: "Mozilla/5.0 (Twiceler-0.9 http://www.cuill.com/twiceler/robot.html)",
type: "R"
},
%{
comment: "UA sometimes have random letters like: vkfjkgo...",
description:
"Some spambot from Romania (82.208.139.1xx & 86.123.65.xx) - Maybe email harvesting",
id: "id_moz_070106_2",
link1: "",
link2: "",
name: "Mozilla/5.0 (Version: xxxx Type:xx)",
type: "S"
},
%{
comment: "",
description: "GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)",
id: "id_moz_985",
link1: "http://www.genieknows.com/",
link2: "",
name: "Mozilla/5.0 (wgao@genieknows.com)",
type: "R"
},
%{
comment: "",
description: "Netscape 6.x Win98",
id: "id_moz_986",
link1: "",
link2: "",
name: "Mozilla/5.0 (Windows; U; Win98; en-US; rv:0.9.2) Gecko/20010726 Netscape6/6.1",
type: "B"
},
%{
comment: "",
description: "Firebird browser (Mozilla/Gecko engine) - ex Phoenix Win98",
id: "id_moz_987",
link1: "http://www.mozilla.org",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Win98; en-US; rv:x.xx) Gecko/20030423 Firebird Browser/0.6",
type: "B"
},
%{
comment: "",
description: "Beonex Communicator browser (Mozilla/Gecko engine)",
id: "id_moz_988",
link1: "http://www.beonex.com",
link2: "",
name: "Mozilla/5.0 (Windows; U; Win9x; en; Stable) Gecko/20020911 Beonex/0.8.1-stable",
type: "B"
},
%{
comment: "",
description: "Healthline health related search robot (72.5.115.xx)",
id: "id_moz_111205_1",
link1: "http://www.healthline.com/",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.0; en-US; rv:1.7.7) NimbleCrawler 1.11 obeys UserAgent NimbleCrawler For problems contact: crawler_at_dataalchemy.com",
type: "R"
},
%{
comment: "",
description: "Google Chrome browser based on WebKit (Safari)",
id: "id_moz_171008_2",
link1: "http://www.google.com/chrome",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US) AppleWebKit/525.19 (KHTML, like Gecko) Chrome/0.2.153.1 Safari/525.19",
type: "B"
},
%{
comment: "",
description: "Flock web browser built on Mozilla technologies",
id: "id_moz_170207_1",
link1: "http://www.flock.com/",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.0.5) Gecko/20060731 Firefox/1.5.0.5 Flock/0.7.4.1",
type: "B"
},
%{
comment: "",
description: "Megaupload Mega Manager - Download manager plugin for Firefox",
id: "id_moz_190108_3",
link1: "http://www.megaupload.com/manager/de/",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.8.1.11) Gecko/20071127 Firefox/2.0.0.4/Megaupload x.0",
type: "D"
},
%{
comment: "",
description: "Orca browser - based on Gecko",
id: "id_moz_171008_1",
link1: "http://www.orcabrowser.com",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:1.9.0.1) Gecko/2008092215 Firefox/3.0.1 Orca/1.1 beta 3",
type: "B"
},
%{
comment: "",
description: "Firefox browser (Mozilla/Gecko engine) - ex Firebird WinXP",
id: "id_moz_989",
link1: "http://www.mozilla.org",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.x.x) Gecko/20041107 Firefox/x.x",
type: "B"
},
%{
comment: "",
description: "Firebird browser (Mozilla/Gecko engine) - ex Phoenix WinXP",
id: "id_moz_990",
link1: "http://www.mozilla.org",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xx) Gecko/20030504 Mozilla Firebird/0.6",
type: "B"
},
%{
comment: "",
description: "Mnenhy - enhanced mail & news Mozilla based browser",
id: "id_moz_991",
link1: "http://mnenhy.mozdev.org/index-de.html",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; en-US; rv:x.xxx) Gecko/20041027 Mnenhy/0.6.0.104",
type: "B"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_moz_060508_2",
link1: "http://www.voila.fr",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)",
type: "R"
},
%{
comment: "",
description: "Voila.fr robot",
id: "id_moz_080608_2",
link1: "http://www.voila.fr",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; fr; rv:1.8.1) VoilaBot BETA 1.2 (support.voilabot@orange-ftgroup.com)",
type: "R"
},
%{
comment: "",
description: "Mozilla Firefox 3.0 beta (Gran Paradiso) for Win",
id: "id_moz_150408_3",
link1: "http://developer.mozilla.org/en/docs/Firefox_3_for_developers",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 6.0; en-US; rv:1.9b5) Gecko/2008032620 Firefox/3.0b5",
type: "B"
},
%{
comment: "",
description: "Tiscali Communicator - Online services suite",
id: "id_moz_300407_2",
link1: "http://im.tiscali.com/index.html",
link2: "",
name:
"Mozilla/5.0 (Windows; U;XMPP Tiscali Communicator v.10.0.1; Windows NT 5.1; it; rv:1.8.1.3) Gecko/20070309 Firefox/2.0.0.3",
type: "B"
},
%{
comment: "",
description: "Healthline health related search robot (72.5.115.xx)",
id: "id_moz_300106_1",
link1: "http://www.healthline.com/",
link2: "",
name:
"Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@health",
type: "R"
},
%{
comment: "",
description: "Healthline health related search robot (72.5.115.xx)",
id: "id_moz_161205_2",
link1: "http://www.healthline.com/",
link2: "",
name:
"Mozilla/5.0 (Windows;) NimbleCrawler 1.12 obeys UserAgent NimbleCrawler For problems contact: crawler@healthline.com",
type: "R"
},
%{
comment: "",
description: "Kazehakase - Gecko based browser (Japan)",
id: "id_moz_090807_2",
link1: "http://kazehakase.sourceforge.jp/",
link2: "",
name: "Mozilla/5.0 (X11; Linux i686; U;rv: 1.7.13) Gecko/20070322 Kazehakase/0.4.4.1",
type: "B"
},
%{
comment: "",
description: "Netscape 6.x Linux",
id: "id_moz_992",
link1: "",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux 2.4.2-2 i586; en-US; m18) Gecko/20010131 Netscape6/6.01",
type: "B"
},
%{
comment: "",
description: "SeaMonkey browser suite (ex Mozilla) on Linux",
id: "id_moz_160306_1",
link1: "http://www.mozilla.org/projects/seamonkey/",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; de-AT; rv:1.8.0.2) Gecko/20060309 SeaMonkey/1.0",
type: "B"
},
%{
comment: "",
description: "Epiphany (Mozilla/Gecko engine) browser Linux",
id: "id_moz_993",
link1: "http://www.gnome.org/projects/epiphany/",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux i686; en-GB; rv:1.7.6) Gecko/20050405 Epiphany/1.6.1 (Ubuntu) (Ubuntu package 1.0.2)",
type: "B"
},
%{
comment: "",
description: "Nautilus (developed by Eazel.com) 1.x Browser Linux",
id: "id_moz_994",
link1:
"http://swin05.dyndns.biz/Doc/Docrh7.03us/DocRH7.3us/sunsite.mff.cuni.cz/pub/redhat/linux/7.3/fr/doc/RH-DOCS/rhl-gsg-en-7.3/s1-browsers-nautilus.html",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; en-US; Nautilus/1.0Final) Gecko/20020408",
type: "B"
},
%{
comment: "",
description: "Mozilla (Gecko) 0.9x browser Linux",
id: "id_moz_995",
link1: "",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:0.9.3) Gecko/20010801",
type: "B"
},
%{
comment: "64.34.195.1xx",
description: "Spinn3r social network crawler",
id: "id_moz_030110_5",
link1: "http://spinn3r.com/",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2.1; aggregator:Spinn3r (Spinn3r 3.1); http://spinn3r.com/robot) Gecko/20021130",
type: "R"
},
%{
comment: "",
description: "Phoenix 0.3 browser (Mozilla/Gecko engine) - now Firebird Linux",
id: "id_moz_996",
link1: "http://www.firebirdsql.org/",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.2b) Gecko/20021007 Phoenix/0.3",
type: "B"
},
%{
comment: "",
description: "Epiphany (Mozilla/Gecko engine) browser Linux",
id: "id_moz_997",
link1: "http://www.gnome.org/projects/epiphany/",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.6) Gecko/20040413 Epiphany/1.2.1",
type: "B"
},
%{
comment: "",
description: "Snap Firefox Search Plugin",
id: "id_moz_190107_1",
link1: "http://www.snap.com/about/spa1A.php",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.0.7) Gecko/20060909 Firefox/1.5.0.7 SnapPreviewBot",
type: "B"
},
%{
comment: "",
description: "Bon Echo Alpha - developer preview of future Firefox browser",
id: "id_moz_240107_2",
link1: "http://www.mozilla.org/projects/bonecho/releases/2.0a1.html",
link2: "",
name: "Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1) Gecko/20061129 BonEcho/2.0",
type: "B"
},
%{
comment: "",
description: "IceWeasel - the GNU version of the Firefox browser",
id: "id_moz_240207_2",
link1: "http://www.gnu.org/software/gnuzilla/",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.8.1.1) Gecko/20061205 Iceweasel/2.0.0.1 (Debian-2.0.0.1+dfsg-2)",
type: "B"
},
%{
comment: "",
description: "Mozilla Firefox 3.0 beta (Gran Paradiso) for Linux",
id: "id_moz_150408_1",
link1: "http://developer.mozilla.org/en/docs/Firefox_3_for_developers",
link2: "",
name:
"Mozilla/5.0 (X11; U; Linux x86_64; en-US; rv:1.9a8) Gecko/2007100619 GranParadiso/3.0a8",
type: "B"
},
%{
comment: "",
description: "Galeon 1.x Browser Linux",
id: "id_moz_999",
link1: "http://galeon.sourceforge.net/",
link2: "",
name: "Mozilla/5.0 Galeon/1.0.2 (X11; Linux i686; U;) Gecko/20011224",
type: "B"
},
%{
comment: "",
description: "gURLChecker - GNOME link checking tool",
id: "id_moz_1000",
link1: "http://www.nongnu.org",
link2: "",
name: "Mozilla/5.0 gURLChecker/0.x.x (Linux)",
type: "C"
},
%{
comment: "",
description: "URL Spider - used by usww.net",
id: "id_moz_1001",
link1: "http://www.url-spider.com/",
link2: "",
name: "Mozilla/5.0 URL-Spider",
type: "R"
},
%{
comment: "",
description: "W8net spider",
id: "id_moz_1002",
link1: "http://www.usww.com",
link2: "",
name: "Mozilla/5.0 usww.com-Spider-for-w8.net",
type: "R"
},
%{
comment: "",
description: "GenieKnows.com search robot (64.5.245.xx / 64.5.220.xxx)",
id: "id_moz_1003",
link1: "http://www.genieknows.com",
link2: "",
name: "Mozilla/5.0 wgao@genieknows.com",
type: "R"
},
%{
comment: "",
description: "axxus.de German business directory",
id: "id_moz_111205_7",
link1: "http://www.axxus.de/",
link2: "",
name: "Mozilla/5.0 whoiam [http://www.axxus.de/]",
type: "R C"
},
%{
comment: "",
description:
"Yuntis : Collaborative Web Resource Categorization and Ranking Project robot",
id: "id_moz_998",
link1: "http://www.ecsl.cs.sunysb.edu/yuntis/",
link2: "",
name:
"Mozilla/5.0 [en] (compatible; Gulper Web Bot 0.2.4 www.ecsl.cs.sunysb.edu/~maxim/cgi-bin/Link/GulperBot)",
type: "R"
},
%{
comment: "192.17.11.xx",
description: "MetaExplorer project's MetaQuerier robot",
id: "id_g_m_190606_1",
link1: "http://metaquerier.cs.uiuc.edu/",
link2: "",
name: "MQbot metaquerier.cs.uiuc.edu/crawler",
type: "R"
},
%{
comment: "192.17.11.xx",
description: "MetaExplorer project's MetaQuerier robot",
id: "id_g_m_251006_1",
link1: "http://metaquerier.cs.uiuc.edu/",
link2: "",
name:
"MQBOT/Nutch-0.9-dev (MQBOT Nutch Crawler; http://falcon.cs.uiuc.edu; mqbot@cs.uiuc.edu)",
type: "R"
},
%{
comment: "",
description: "MS Frontpage 4.x",
id: "id_g_m_1004",
link1: "",
link2: "",
name: "MSFrontPage/4.0",
type: "B"
},
%{
comment: "",
description: "Some faked UA - maybe for a download manager",
id: "id_g_m_1005",
link1: "",
link2: "",
name: "MSIE 4.0 (Win95)",
type: "D"
},
%{
comment: "see also: - Opera/6.01 (larbin@.....) - WinampMPEG/2.00 larbin@....",
description: "unknown robot from gw.ocg-corp.com (209.126.176.x)",
id: "id_g_m_1006",
link1: "",
link2: "",
name: "MSIE-5.13 (larbin@unspecified.mail)",
type: ""
},
%{
comment: "65.55.235.1xx",
description: "MSN media search robot",
id: "id_g_m_190506_1",
link1: "http://search.msn.com",
link2: "",
name: "msnbot-media/1.0 (+http://search.msn.com/msnbot.htm)",
type: "R"
},
%{
comment: "207.68.157.xxx",
description: "Windows Live product search (Beta) robot",
id: "id_g_m_290806_1",
link1: "http://products.live.com",
link2: "http://productsearch.spaces.live.com/",
name: "msnbot-Products/1.0 (+http://search.msn.com/msnbot.htm)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...",
description:
"MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx",
id: "id_g_m_1007",
link1: "http://search.msn.com",
link2: "",
name: "MSNBOT/0.xx (http://search.msn.com/msnbot.htm)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...",
description:
"MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx",
id: "id_g_m_1008",
link1: "http://search.msn.com",
link2: "",
name: "msnbot/x.xx ( http://search.msn.com/msnbot.htm)",
type: "R"
},
%{
comment: "65.55.241.2xx",
description: "Microsoft search for mobiles",
id: "id_g_m_190108_2",
link1: "http://livesearchmobile.com/?mid=1011",
link2: "",
name: "MSNBOT_Mobile MSMOBOT Mozilla/2.0 (compatible; MSIE 4.02; Windows CE; Default)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows NT; MS Search...",
description:
"MSN Search robot - 131.107.xxx.xxx 204.95.96.xxx - 204.95.111.xxx 207.46.xxx.xxx",
id: "id_g_m_1009",
link1: "http://search.msn.com",
link2: "",
name: "MSNPTC/1.0",
type: "R"
},
%{
comment: "",
description: "Microsoft proxy server",
id: "id_g_m_1010",
link1: "http://www.microsoft.com/isaserver/evaluation/previousversions/default.mspx",
link2: "",
name: "MSProxy/2.0",
type: "P"
},
%{
comment: "",
description: "MacEdition CodeBitch link checking",
id: "id_g_m_181205_3",
link1: "http://www.macedition.com/cb/cb_20030310.php",
link2: "",
name: "MSRBOT",
type: "C"
},
%{
comment: "",
description: "Microsoft MSRBot",
id: "id_g_m_270407_1",
link1: "http://research.microsoft.com/research/sv/msrbot/",
link2: "",
name: "MSRBOT (http://research.microsoft.com/research/sv/msrbot)",
type: "R"
},
%{
comment: "",
description: "StreamBox VCR user agent",
id: "id_g_m_070406_3",
link1:
"http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm",
link2: "",
name: "Mulder, VCR-1.0",
type: "D"
},
%{
comment: "",
description: "Multiblocker (Fantomaster) anonymity software user",
id: "id_g_m_1011",
link1: "http://multiblocker.com/home.html",
link2: "http://fantomaster.com",
name: "multiBlocker browser",
type: "P"
},
%{
comment: "140.203.154.1xx",
description: "MultiCrawler for DERI Galway's Semantic Web Search Engine cluster",
id: "id_g_m_030807_1",
link1: "http://sw.deri.org/2006/04/multicrawler/robots.html",
link2: "http://sw.deri.ie/",
name: "multicrawler ( http://sw.deri.org/2006/04/multicrawler/robots.html)",
type: "R"
},
%{
comment: "",
description: "Virginia Tech Digital Library Research Laboratory robot",
id: "id_g_m_1012",
link1: "http://www.dlib.vt.edu",
link2: "",
name: "MultiText/0.1",
type: "R"
},
%{
comment: "",
description: "SoMusical! musical directory link checking",
id: "id_g_m_1013",
link1: "http://www.somusical.com",
link2: "",
name: "MusicWalker2.0 ( http://www.somusical.com)",
type: "R"
},
%{
comment: "see this blog:",
description: "Unknown bad bot from diff. Taiwanese IPs",
id: "id_g_m_270306_1",
link1: "http://www.tenspider.com/business-blog/weblog.php",
link2: "",
name: "MVAClient",
type: "S"
},
%{
comment: "",
description: "Windows HTTP Services (WinHTTP)",
id: "id_g_m_241105_1",
link1:
"http://msdn.microsoft.com/library/?url=/library/en-us/winhttp/http/about_winhttp.asp",
link2: "",
name: "My WinHTTP Connection",
type: ""
},
%{
comment: "",
description: "unknown user robot (24.124.34.42)",
id: "id_g_m_1014",
link1: "",
link2: "",
name: "myDaemon",
type: ""
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_1015",
link1: "http://www.getright.com",
link2: "",
name: "MyGetRight/1.0.0",
type: "D"
},
%{
comment: "",
description: "GetRight download manager",
id: "id_g_m_1016",
link1: "http://www.getright.com",
link2: "",
name: "MyGetRight/1.0b",
type: "D"
},
%{
comment: "",
description: "Mylinea France web catalogue crawler",
id: "id_g_m_1017",
link1: "http://www.mylinea.com",
link2: "",
name: "Mylinea.com Crawler 2.0",
type: "R"
},
%{
comment: "",
description: "VDOG - SEO webdirecory (Germany) link checking",
id: "id_g_m_040906_1",
link1: "http://www.vdog.de/",
link2: "",
name: "mylinkcheck/1.02",
type: "C"
},
%{
comment: "",
description: "Blogbot (Germany) robot",
id: "id_n_s_1018",
link1: "http://blogbot.de/",
link2: "",
name: "Naamah 1.0.1/Blogbot (http://blogbot.de/)",
type: "R"
},
%{
comment: "",
description: "Blogbot (Germany) robot",
id: "id_n_s_1019",
link1: "http://blogbot.de/",
link2: "",
name: "Naamah 1.0a/Blogbot (http://blogbot.de/)",
type: "R"
},
%{
comment: "s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot",
description: "Naver Japan / Korea robot ",
id: "id_n_s_1021",
link1: "http://www.naver.co.jp/",
link2: "",
name: "NABOT/5.0",
type: "R"
},
%{
comment: "s.also Python-urllib/1.15 - dloader(NaverRobot)/1.0 & Cowbot",
description: "Naver Japan / Korea robot ",
id: "id_n_s_1020",
link1: "http://www.naver.co.jp/",
link2: "",
name: "nabot_1.0",
type: "R"
},
%{
comment: "",
description: "Badbot searching for Wordpress wp-login.php",
id: "id_n_s_180408_4",
link1: "",
link2: "",
name: "NameOfAgent (CMS Spider)",
type: "S"
},
%{
comment: "",
description: "naoFavicon4IE",
id: "id_n_s_071205_1",
link1: "http://nao4u.com/software/naoFavicon4IE/",
link2: "",
name: "naoFavicon4IE/1.xx",
type: "D"
},
%{
comment: "",
description: "Unknown spambot / harvester from diff. IPs",
id: "id_n_s_140506_2",
link1:
"http://www.projecthoneypot.org/ip_inspector.php?iph=978231e229521680d11cb93f32de0fa1",
link2: "",
name: "NASA Search 1.0",
type: "S"
},
%{
comment: "",
description: "Nationaldirectory spider",
id: "id_n_s_1022",
link1: "http://www.nationaldirectory.com/",
link2: "",
name: "NationalDirectory-WebSpider/1.3",
type: "R"
},
%{
comment: "",
description: "Nationaldirectory spider",
id: "id_n_s_1023",
link1: "http://www.nationaldirectory.com/",
link2: "",
name: "NationalDirectoryAddURL/1.0",
type: "R"
},
%{
comment: "s. also Python-urllib/1.15- nabot- cowbot & dloader",
description: "Naver Japan / Korea robot",
id: "id_n_s_1025",
link1: "http://www.naver.co.jp/",
link2: "",
name: "NaverBot-1.0 (NHN Corp. / +82-2-3011-1954 / nhnbot@naver.com)",
type: "R"
},
%{
comment: "s. also Python-urllib/1.15 - nabot - cowbot & dloader",
description: "Naver Japan / Korea robot",
id: "id_n_s_1024",
link1: "http://www.naver.co.jp/",
link2: "",
name: "NaverBot_dloader/1.5",
type: "R"
},
%{
comment: "",
description: "Navisso closed beta robot (69.41.162.1xx)",
id: "id_n_s_181205_1",
link1: "http://navisso.com/",
link2: "",
name: "NavissoBot",
type: "R"
},
%{
comment: "",
description: "Navisso closed beta robot (69.41.162.1xx)",
id: "id_n_s_181205_2",
link1: "http://navisso.com/",
link2: "",
name: "NavissoBot/1.7 (+http://navisso.com/)",
type: "R"
},
%{
comment: "",
description: "Vias Information Archival robot",
id: "id_n_s_1026",
link1: "http://vias.ncsa.uiuc.edu/",
link2: "",
name: "NCSA Beta 1 (http://vias.ncsa.uiuc.edu/viasarchivinginformation.html)",
type: "R"
},
%{
comment: "81.169.180.2xx",
description: "Nebulla.info distributed crawler (Germany)",
id: "id_n_s_250507_1",
link1: "http://www.nebulla.info/",
link2: "http://bot.nebulla.info/",
name: "Nebullabot/2.2 (http://bot.nebulla.info)",
type: "R"
},
%{
comment: "",
description: "NEC Researchindex robot - now CiteSeer.IST scientific document index",
id: "id_n_s_1027",
link1: "http://citeseer.ist.psu.edu/",
link2: "",
name: "NEC Research Agent -- compuman at research.nj.nec.com",
type: "R"
},
%{
comment: "s. NEC Research Agent",
description: "rcn.com user agent ? NEC Researchindex robot ?",
id: "id_n_s_1028",
link1: "",
link2: "",
name: "NEC-Hayek/1.0",
type: ""
},
%{
comment: "78.129.201.19x",
description: "Net Seekr search robot",
id: "id_n_s_291108_4",
link1: "http://www.net-seekr.com/",
link2: "",
name: "Net-Seekr Bot/Net-Seekr Bot V1 (http://www.net-seekr.com)",
type: "R"
},
%{
comment: "",
description: "NetAnts download manager",
id: "id_n_s_1029",
link1: "http://www.netants.com/en/index.html",
link2: "",
name: "NetAnts/1.2x",
type: "D"
},
%{
comment: "",
description: "NetComplete IE browser package",
id: "id_n_s_1030",
link1: "http://www.netcom.net.uk/",
link2: "",
name: "NETCOMplete/x.xx",
type: "B"
},
%{
comment: "194.153.145.x[xx]",
description: "Netinfo.bg search (Bulgaria) robot",
id: "id_n_s_010807_2",
link1: "http://netinfo.bg/",
link2: "",
name: "NetinfoBot/1.0 (http://netinfo.bg/netinfobot.html)",
type: "R"
},
%{
comment: "site is offline",
description: "Netlookout internet notifier",
id: "id_n_s_1031",
link1: "http://www.frugalsoft.com",
link2: "",
name: "NetLookout/2.24",
type: "R"
},
%{
comment: "Same IP-range as Metager search - powered by Nutch",
description: "Netluchs (Germany) search (193.164.8.xx)",
id: "id_n_s_230406_3",
link1: "http://www.netluchs.de/",
link2: "",
name: "Netluchs/0.8-dev ( ; http://www.netluchs.de/; ___don't___spam_me_@netluchs.de)",
type: "R"
},
%{
comment: "",
description: "NetMechanic link checker",
id: "id_n_s_1032",
link1: "http://www.netmechanic.com/",
link2: "",
name: "NetMechanic Vx.0",
type: "C"
},
%{
comment: "",
description: "NewsGator NetNewsWire - Mac RSS feed reader",
id: "id_n_s_030906_1",
link1: "http://www.newsgator.com/NGOLProduct.aspx?ProdID=NetNewsWire",
link2: "",
name: "NetNewsWire/2.x (Mac OS X; http://ranchero.com/netnewswire/)",
type: "B"
},
%{
comment: "",
description: "unknown InCom (216.0.107.xx) robot",
id: "id_n_s_1033",
link1: "http://www.incom.net/",
link2: "",
name: "NetNoseCrawler/v1.0",
type: "R"
},
%{
comment: "",
description: "Netprospector metasearch software",
id: "id_n_s_1034",
link1: "http://www.actaddons.com/products/netprospector.asp",
link2: "",
name: "Netprospector JavaCrawler",
type: "R"
},
%{
comment: "",
description: "Netpumper download manager",
id: "id_n_s_1035",
link1: "http://www.netpumper.com/",
link2: "",
name: "NetPumper/x.xx",
type: "D"
},
%{
comment: "",
description: "Look.com robot (209.87.232.x)",
id: "id_n_s_1036",
link1: "http://www.look.com/",
link2: "",
name: "NetResearchServer(http://www.look.com)",
type: "R"
},
%{
comment: "",
description: "IncyWincy search engine using DMOZ database",
id: "id_n_s_1037",
link1: "http://www.loopimprovements.com/",
link2: "",
name: "NetResearchServer/x.x(loopimprovements.com/robot.html)",
type: "R"
},
%{
comment: "67.202.26.1xx",
description: "NetSeer search (beta) crawler via Amazon Web Services - see also Teemer",
id: "id_n_s_140209_5",
link1: "http://www.netseer.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name: "NetSeer/Nutch-0.9 (NetSeer Crawler; http://www.netseer.com; crawler@netseer.com)",
type: "R"
},
%{
comment: "212.77.102.1xx",
description: "Wirtualna Polska / Netsprint search (Poland) robot",
id: "id_n_s_150906_2",
link1: "http://www.wp.pl/",
link2: "http://www.netsprint.pl/serwis/",
name: "NetSprint -- 2.0",
type: "R"
},
%{
comment: "",
description: "NetWhat Search crawler (69.9.167.1xx)",
id: "id_n_s_190306_1",
link1: "http://www.netwhat.com/",
link2: "",
name:
"NetWhatCrawler/0.06-dev (NetWhatCrawler from NetWhat.com; http://www.netwhat.com; support@netwhat.com)",
type: "R"
},
%{
comment: "site is closed",
description: "Netzippy robot",
id: "id_n_s_1038",
link1: "http://www.netzippy.com/",
link2: "",
name: "NetZippy",
type: "R"
},
%{
comment: "",
description: "unknown",
id: "id_n_s_1039",
link1: "",
link2: "",
name: "NeuralBot/0.2",
type: ""
},
%{
comment: "",
description: "Unknown (12.238.4.xxx) attbi.com client robot",
id: "id_n_s_1040",
link1: "",
link2: "",
name: "newsearchengine (ThisUser@unspecified.mail)",
type: ""
},
%{
comment: "",
description: "FetchLinks plugin for NewsGator RSS reader",
id: "id_n_s_250707_3",
link1: "http://graemef.com/project/fetchlinks",
link2: "",
name: "NewsGator FetchLinks extension/0.2.0 (http://graemef.com)",
type: "B"
},
%{
comment: "64.78.155.1xx",
description: "NewsGator online RSS reader",
id: "id_n_s_250707_4",
link1: "http://www.newsgator.com/",
link2: "",
name: "NewsGatorOnline/2.0 (http://www.newsgator.com; 1 subscribers)",
type: "B"
},
%{
comment: "",
description: "Eliyon Crawler for Business People Search",
id: "id_n_s_1041",
link1: "http://www.eliyon.com/NextGenSearchBot",
link2: "",
name: "NextGenSearchBot 1 (for information visit http://www.eliyon.com/NextGenSearchBot)",
type: "R"
},
%{
comment: "",
description: "Nextopia crawler",
id: "id_n_s_1042",
link1: "http://www.nextopia.com/",
link2: "",
name: "NextopiaBOT (+http://www.nextopia.com) distributed crawler client beta v0.x",
type: "R"
},
%{
comment: "84.56.87.1xx",
description: "find your keywords - semantic search (Germany) robot",
id: "id_n_s_060906_1",
link1: "http://www.ng-search.com/",
link2: "",
name: "NG-Search/0.90 (NG-SearchBot; http://www.ng-search.com; )",
type: "R"
},
%{
comment: "s. Harvest-NG/1.0.2 and Exalead NG...",
description: "Exalead (France) search robot (193.47.80.xx)",
id: "id_n_s_1043",
link1: "http://www.exabot.com/",
link2: "",
name: "NG/1.0",
type: "R"
},
%{
comment: "s. also Exabot-Images/1.0",
description: "Exalead Websearch image crawler (193.47.80.xx)",
id: "id_n_s_050406_3",
link1: "http://www.exalead.com/search",
link2: "",
name: "NG/4.0.1229",
type: "R"
},
%{
comment: "128.8.126.xx",
description: "Unknown UA from PlanetLab distributed network",
id: "id_n_s_071106_1",
link1: "http://planetlab2.cs.umd.edu/",
link2: "",
name: "nicebot",
type: ""
},
%{
comment: "-site is offline-",
description: "NicoZone childsafe search robot ",
id: "id_n_s_1044",
link1: "http://www.nicozone.net/",
link2: "",
name: "NICO/1.0",
type: "R P"
},
%{
comment: "69.61.23.11x",
description: "Nikita the Spider - Online HTML validation , link checking",
id: "id_n_s_291007_2",
link1: "http://nikitathespider.com/",
link2: "",
name: "Nikita the Spider (http://NikitaTheSpider.com/)",
type: "C"
},
%{
comment: "",
description: "Experimental LSI (?) robot from 140.233.69.xx (Middlebury.edu)",
id: "id_n_s_1045",
link1: "http://javelina.cet.middlebury.edu/lsa/out/lsa_intro.htm",
link2: "",
name: "NITLE Blog Spider/0.01",
type: "R"
},
%{
comment: "",
description: "Download manager",
id: "id_n_s_1046",
link1: "http://www.klsofttools.com",
link2: "",
name: "Nitro Downloader 1.x (www.klsofttools.com)",
type: "D"
},
%{
comment: "",
description: "Noago spider",
id: "id_n_s_1047",
link1: "http://www.noago.com/",
link2: "",
name: "Noago Spider",
type: "R"
},
%{
comment: "",
description: "telefonica.es user robot",
id: "id_n_s_1048",
link1: "",
link2: "",
name: "Nocilla/1.0",
type: ""
},
%{
comment: "",
description: "Google WAP robot",
id: "id_n_s_1049",
link1: "http://www.google.com/",
link2: "",
name: "Nokia-WAPToolkit/1.2 googlebot(at)googlebot.com",
type: "R"
},
%{
comment: "",
description: "Botmobi crawler for Find.mobi mobile search",
id: "id_n_s_290708_3",
link1: "http://find.mobi/bot.html",
link2: "http://find.mobi/",
name:
"Nokia6300/2.0 (05.50) Profile/MIDP-2.0 Configuration/CLDC-1.1 (botmobi http://find.mobi/bot.html abuse@mtld.mobi)",
type: "C"
},
%{
comment: "68.180.2xx.[x]xx",
description: "YahooSeeker/M1A1-R2D2 - Yahoo mobile web crawling robot",
id: "id_n_s_200108_3",
link1: "http://help.yahoo.com/l/us/yahoo/search/mobilecrawler/mobilecrawler-01.html",
link2: "",
name:
"Nokia6610/1.0 (3.09) Profile/MIDP-1.0 Configuration/CLDC-1.0 (compatible;YahooSeeker/M1A1-R2D2; http://help.yahoo.com/help/us/ysearch/crawling/crawling-01.html)",
type: "R"
},
%{
comment: "",
description: "Google WAP proxy",
id: "id_n_s_1050",
link1: "http://www.google.com/",
link2: "",
name: "Nokia7110/1.0 (05.01) (Google WAP Proxy/1.0)",
type: "P"
},
%{
comment: "",
description: "Nokodo public beta search robot (67.18.222.xx)",
id: "id_n_s_1051",
link1: "http://www.nokodo.com/",
link2: "",
name: "NokodoBot/1.x (+http://nokodo.com/bot.htm)",
type: "R"
},
%{
comment: "",
description: "Burf.com UK Search Engine robot",
id: "id_n_s_1052",
link1: "http://www.burf.com/",
link2: "",
name: "Norbert the Spider(Burf.com)",
type: "R"
},
%{
comment: "194.224.199.xx",
description: "noXtrum search robot (Spain)",
id: "id_n_s_1053",
link1: "http://www.noxtrum.com/",
link2: "",
name: "noxtrumbot/1.0 (crawler@noxtrum.com)",
type: "R"
},
%{
comment: "207.210.106.1xx",
description: "Noyona job search (preview)",
id: "id_n_s_040506_2",
link1: "http://www.noyona.com/index.pl",
link2: "",
name: "noyona_0_1",
type: "R"
},
%{
comment: "s. also - aipbot/1.0 (aipbot; http://www.aipbot.com... - NPBot ...",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_n_s_1054",
link1: "http://www.nameprotect.com/",
link2: "",
name: "NP/0.1 (NP; http://www.nameprotect.com; npbot@nameprotect.com)",
type: "R"
},
%{
comment: "",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_n_s_1553",
link1: "http://www.nameprotect.com/",
link2: "",
name: "NPBot (http://www.nameprotect.com/botinfo.html)",
type: "R"
},
%{
comment: "",
description: "Nameprotect copyright search robot (24.177.134.x)",
id: "id_n_s_1552",
link1: "http://www.nameprotect.com/",
link2: "",
name: "NPBot-1/2.0",
type: "R"
},
%{
comment: "",
description: "Nsauditor Network Security Auditor",
id: "id_n_s_291205_3",
link1: "http://www.nsauditor.com/",
link2: "",
name: "Nsauditor/1.x",
type: "S"
},
%{
comment: "",
description: "NetShow Media Player = Windows Media Player 10",
id: "id_n_s_1055",
link1: "",
link2: "",
name: "NSPlayer/10.0.0.xxxx WMFSDK/10.0",
type: "B"
},
%{
comment: "",
description: "Nsyght social search application",
id: "id_n_s_281207_2",
link1: "http://search.nsyght.com/",
link2: "",
name: "nsyght.com/Nutch-1.0-dev (nsyght.com; Nsyght.com)",
type: "R"
},
%{
comment: "",
description: "Nsyght social search application",
id: "id_n_s_161007_1",
link1: "http://search.nsyght.com/",
link2: "",
name: "nsyght.com/Nutch-x.x (nsyght.com; search.nsyght.com)",
type: "R"
},
%{
comment: "",
description: "NTT Directory robot",
id: "id_n_s_1056",
link1: "http://navi.ocn.ne.jp/",
link2: "",
name: "nttdirectory_robot/0.9 (super-robot@super.navi.ocn.ne.jp)",
type: "R"
},
%{
comment: "",
description: "Nucleus CMS SiteList link managing plugin",
id: "id_n_s_180206_1",
link1: "http://wakka.xiffy.nl/sitelist",
link2: "",
name: "Nucleus SiteList LinkChecker/1.1",
type: "C"
},
%{
comment: "",
description: "nuSearch spider (84.9.136.xxx)",
id: "id_n_s_1058",
link1: "http://www.nusearch.com/",
link2: "",
name:
"nuSearch Spider <a href='http://www.nusearch.com'>www.nusearch.com</a> (compatible; MSIE 4.01)",
type: "R"
},
%{
comment: "",
description: "nuSearch spider (84.9.136.xxx)",
id: "id_n_s_1057",
link1: "http://www.nusearch.com/",
link2: "",
name: "NuSearch Spider (compatible; MSIE 6.0)",
type: "R"
},
%{
comment: "",
description: "nuSearch spider (84.9.136.xxx)",
id: "id_n_s_1059",
link1: "http://www.nusearch.com/",
link2: "",
name: "NuSearch Spider www.nusearch.com",
type: "R"
},
%{
comment: "",
description: "Nutch open source robot",
id: "id_n_s_1060",
link1: "http://www.nutch.org/docs/bot.html",
link2: "",
name: "Nutch",
type: "R"
},
%{
comment: "",
description: "Picapage search for handheld devices using Nutch",
id: "id_n_s_211107_1",
link1: "http://picapage.biz/",
link2: "",
name: "Nutch crawler/Nutch-0.9 (picapage.com; admin@picapage.com)",
type: "R"
},
%{
comment: "",
description: "Ayell Euronet business directory robot using Nutch",
id: "id_n_s_230408_1",
link1: "http://www.ayell.eu/",
link2: "",
name: "Nutch/Nutch-0.9 (Eurobot; http://www.ayell.eu )",
type: "R"
},
%{
comment:
"uses also: Mozilla/5.0 (X11; U; Linux i686; en-US; rv:1.7.5) Gecko/20041107 Firefox/1.0",
description: "Netsweeper content filtering engine (66.207.120.2xx) powered by Nutch",
id: "id_n_s_120406_1",
link1: "http://www.netsweeper.com/",
link2: "",
name:
"NutchCVS/0.06-dev (Nutch; http://www.nutch.org/docs/en/bot.html; nutch-agent@lists.sourceforge.net)",
type: "P"
},
%{
comment: "",
description: "Nutch open source robot",
id: "id_n_s_1061",
link1: "http://www.nutch.org/docs/bot.html",
link2: "",
name:
"NutchCVS/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)",
type: "R"
},
%{
comment: "powered by Nutch",
description:
"Robot from University of Washington Computer Science & Engineering (128.208.6.2xx)",
id: "id_n_s_010406_1",
link1: "http://qbert.cs.washington.edu/",
link2: "",
name:
"NutchCVS/0.7.1 (Nutch running at UW; http://www.nutch.org/docs/en/bot.html; sycrawl@cs.washington.edu)",
type: "R"
},
%{
comment: "216.182.236.xx",
description: "Amazon Elastic Compute Cloud (Amazon EC2) robot",
id: "id_n_s_251006_2",
link1:
"http://www.amazon.com/b/ref=sc_fe_l_2/104-6713356-1433533?ie=UTF8&node=201590011&no=3435361&me=A36L942TSJ2AJA",
link2: "",
name:
"NutchEC2Test/Nutch-0.9-dev (Testing Nutch on Amazon EC2.; http://lucene.apache.org/nutch/bot.html; ec2test at lucene.com)",
type: "R"
},
%{
comment: "",
description: "Nutch open source robot",
id: "id_n_s_1062",
link1: "http://www.nutch.org/docs/bot.html",
link2: "",
name:
"NutchOrg/0.0x-dev (Nutch; http://www.nutch.org/docs/bot.html; nutch-agent@lists.sourceforge.net)",
type: "R"
},
%{
comment: "reads robots.txt",
description:
"Unknown robot using Nutch (maybe private crawling) via Cox network (70.187.130.25x)",
id: "id_n_s_210108_1",
link1: "http://lucene.apache.org/nutch/",
link2: "",
name: "nutchsearch/Nutch-0.9 (Nutch Search 1.0; herceg_novi at yahoo dot com)",
type: "R"
},
%{
comment: "128.208.3.1xx",
description: "Unknown crawler from University of Washington - Computer science",
id: "id_n_s_041106_1",
link1: "http://www.cs.washington.edu/",
link2: "",
name:
"NutchVinegarCrawl/Nutch-0.8.1 (Vinegar; http://www.cs.washington.edu; eytanadar at gmail dot com)",
type: "R"
},
%{
comment: "",
description: "Weblog bookwatch robot",
id: "id_n_s_1063",
link1: "http://www.onfocus.com/bookwatch/",
link2: "",
name: "obidos-bot (just looking for books.)",
type: "R"
},
%{
comment: "",
description: "Objects Search robot",
id: "id_n_s_1064",
link1: "http://www.objectssearch.com/",
link2: "",
name:
"ObjectsSearch/0.01-dev (ObjectsSearch;http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)",
type: "R"
},
%{
comment: "",
description: "Objects Search robot",
id: "id_n_s_1065",
link1: "http://www.objectssearch.com/",
link2: "",
name:
"ObjectsSearch/0.0x (ObjectsSearch; http://www.ObjectsSearch.com/bot.html; support@thesoftwareobjects.com)",
type: "R"
},
%{
comment: "",
description: "Cobion Germany Brand Protection Services robot",
id: "id_n_s_1066",
link1: "http://www.cobion.com/",
link2: "",
name: "oBot ((compatible;Win32))",
type: "R"
},
%{
comment: "",
description: "GlobalSpec Engineering Search robot (66.194.55.xxx)",
id: "id_n_s_1067",
link1: "http://www.globalspec.com/",
link2: "",
name: "Ocelli/1.x (http://www.globalspec.com/Ocelli)",
type: "R"
},
%{
comment: "",
description: "Octopus download manager",
id: "id_n_s_1068",
link1: "http://moskalyuk.com/octopus/",
link2: "",
name: "Octopus",
type: "D"
},
%{
comment: "",
description: "Octora blog or RSS information crawler - beta (66.228.114.xx)",
id: "id_n_s_230306_1",
link1: "http://www.octora.com/",
link2: "",
name: "Octora Beta - www.octora.com",
type: "R"
},
%{
comment: "66.228.114.xx",
description: "Octora RSS feed search",
id: "id_n_s_230606_4",
link1: "http://www.octora.com/",
link2: "",
name: "Octora Beta Bot - www.octora.com",
type: "R"
},
%{
comment: "",
description: "Meta Products Offlinebrowser",
id: "id_n_s_1069",
link1: "http://www.metaproducts.com/",
link2: "",
name: "Offline Explorer 1.*",
type: "B D"
},
%{
comment: "",
description: "Claymont robot / Internetseer Web Site Monitoring",
id: "id_n_s_1070",
link1: "http://www.claymont.com/",
link2: "",
name: "OliverPerry",
type: "R C"
},
%{
comment: "based on YottaCars... (see there)",
description: "OmniExplorer car & shopping search (64.62.175.xxx)",
id: "id_n_s_1071",
link1: "http://www.omni-explorer.com",
link2: "",
name:
"OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Internet CategorizerOmniExplorer http://www.omni-explorer.com/ car & shopping search (64.62.175.xxx)",
type: "R"
},
%{
comment: "based on YottaCars... (see there)",
description: "OmniExplorer car & shopping search (64.62.175.xxx)",
id: "id_n_s_1072",
link1: "http://www.omni-explorer.com",
link2: "",
name: "OmniExplorer_Bot/1.0x (+http://www.omni-explorer.com) Job Crawler",
type: "R"
},
%{
comment: "based on YottaCars... (see there)",
description: "OmniExplorer car & shopping search (64.62.175.xxx)",
id: "id_n_s_1073",
link1: "http://www.omni-explorer.com",
link2: "",
name: "OmniExplorer_Bot/1.1x (+http://www.omni-explorer.com) Torrent Crawler",
type: "R"
},
%{
comment: "based on YottaCars... (see there)",
description: "OmniExplorer car & shopping search (64.62.175.xxx)",
id: "id_n_s_1074",
link1: "http://www.omni-explorer.com",
link2: "",
name: "OmniExplorer_Bot/x.xx (+http://www.omni-explorer.com) WorldIndexer",
type: "R"
},
%{
comment: "85.176.108.2xx",
description: "onsearch.de German web directory link checking ",
id: "id_n_s_290106_3",
link1: "http://www.onsearch.de/",
link2: "",
name: "onCHECK Linkchecker von www.scientec.de fuer www.onsinn.de",
type: "C"
},
%{
comment: "85.176.108.2xx",
description: "onsearch.de German web directory link checking ",
id: "id_n_s_290106_2",
link1: "http://www.onsearch.de/",
link2: "",
name: "onCHECK-Robot, www.onsearch.de",
type: "C"
},
%{
comment: "s. also - Mozilla/5.0 (compatible; OnetSzukaj/5.0....",
description: "onet.pl Szukaj (Search) robot (213.180.128.1xx)",
id: "id_n_s_1075",
link1: "http://szukaj.onet.pl/",
link2: "",
name: "Onet.pl SA- http://szukaj.onet.pl",
type: "R"
},
%{
comment: "",
description: "Dead-Links.com link validation spider",
id: "id_n_s_1076",
link1: "http://www.dead-links.com/",
link2: "",
name: "online link validator (http://www.dead-links.com/)",
type: "C"
},
%{
comment: "",
description: "Online24 shopping portal (Germany) link checking",
id: "id_n_s_040206_3",
link1: "http://www.online24.de/",
link2: "",
name: "Online24-Bot (Version: 1.0x, powered by www.online24.de)",
type: "C"
},
%{
comment: "",
description: "OntoSpider - Dutch robot for a research project. (195.11.244.xx)",
id: "id_n_s_1077",
link1: "http://ontospider.i-n.info",
link2: "",
name: "OntoSpider/1.0 libwww-perl/5.65",
type: "R"
},
%{
comment: "67.215.230.xx",
description: "SeetooZ search crawler",
id: "id_n_s_030110_6",
link1: "http://www.setooz.com/",
link2: "",
name: "OOZBOT/0.20 ( http://www.setooz.com/oozbot.html ; agentname at setooz dot_com )",
type: "R"
},
%{
comment: "(80.237.209.xx)",
description: "OpenAcoon open source search engine (used by Acoon search)",
id: "id_g_m_280508_4",
link1: "http://www.openacoon.de/",
link2: "http://www.acoon.de/",
name: "OpenAcoon v4.0.x (www.openacoon.de)",
type: "R"
},
%{
comment: "",
description: "Openfind.com.tw robot",
id: "id_n_s_1078",
link1: "http://www.openfind.com.tw/",
link2: "",
name:
"Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)",
type: "R"
},
%{
comment: "",
description: "Openfind.com.tw robot",
id: "id_n_s_1079",
link1: "http://www.openfind.com.tw/",
link2: "",
name:
"Openfind data gatherer- Openbot/3.0+(robot-response@openfind.com.tw;+http://www.openfind.com.tw/robot.html)",
type: "R"
},
%{
comment: "",
description: "Openfind.com.tw robot",
id: "id_n_s_1080",
link1: "http://www.openfind.com.tw/",
link2: "",
name: "Openfind Robot/1.1A2",
type: "R"
},
%{
comment: "216.182.236.1xx",
description: "open i search robot - search engine in development",
id: "id_n_s_250107_2",
link1: "http://www.openisearch.com/",
link2: "",
name: "OpenISearch/1.x (www.openisearch.com)",
type: "R"
},
%{
comment: "",
description: "Opentagger social bookmarking system",
id: "id_n_s_291105_4",
link1: "http://www.opentagger.com/",
link2: "",
name: "OpenTaggerBot (http://www.opentagger.com/opentaggerbot.htm)",
type: "R"
},
%{
comment: "",
description: "OpenText crawler",
id: "id_n_s_1081",
link1: "http://www.opentext.net/",
link2: "",
name: "OpenTextSiteCrawler/2.9.2",
type: "R"
},
%{
comment: "",
description: "OpenWebSpider - Open Source web search engine",
id: "id_n_s_310806_1",
link1: "http://www.openwebspider.org/",
link2: "",
name: "OpenWebSpider/0.x.x (http://www.openwebspider.org)",
type: "R"
},
%{
comment: "",
description: "OpenWebSpider - Open Source web search engine",
id: "id_n_s_1082",
link1: "http://www.openwebspider.org/",
link2: "",
name: "OpenWebSpider/x",
type: "R"
},
%{
comment: "",
description: "Opera 5.0 Linux",
id: "id_n_s_1083",
link1: "",
link2: "",
name: "Opera/5.0 (Linux 2.0.38 i386; U) [en]",
type: "B"
},
%{
comment: "",
description: "Opera 5.11 faked WinME referer",
id: "id_n_s_1084",
link1: "",
link2: "",
name: "Opera/5.11 (Windows ME; U) [ru]",
type: "B"
},
%{
comment: "",
description: "Opera 5.12 Win98",
id: "id_n_s_1085",
link1: "",
link2: "",
name: "Opera/5.12 (Windows 98; U) [en]",
type: "B"
},
%{
comment: "see also: - MSIE-5.13 (larbin@.....) - WinampMPEG/2.00 larbin@....",
description: "unknown robot from gw.ocg-corp.com (209.126.176.x)",
id: "id_n_s_1086",
link1: "",
link2: "",
name: "Opera/6.01 (larbin@unspecified.mail)",
type: ""
},
%{
comment: "",
description: "Opera 6.x- Mandrake Linux",
id: "id_n_s_1087",
link1: "",
link2: "",
name: "Opera/6.x (Linux 2.4.8-26mdk i686; U) [en]",
type: "B"
},
%{
comment: "",
description: "Opera 6.x WinNT",
id: "id_n_s_1088",
link1: "",
link2: "",
name: "Opera/6.x (Windows NT 4.0; U) [de]",
type: "B"
},
%{
comment: "",
description: "Opera 7.x WinXP",
id: "id_n_s_1089",
link1: "",
link2: "",
name: "Opera/7.x (Windows NT 5.1; U) [en]",
type: "B"
},
%{
comment: "",
description: "Opera 8.x (Beta) WinXP",
id: "id_n_s_1090",
link1: "",
link2: "",
name: "Opera/8.xx (Windows NT 5.1; U; en)",
type: "B"
},
%{
comment: "",
description: "Opera 9 (Beta) Browser",
id: "id_n_s_141105_2",
link1: "http://snapshot.opera.com/",
link2: "",
name: "Opera/9.0 (Windows NT 5.1; U; en)",
type: "B"
},
%{
comment: "",
description: "Opera 9 (final)",
id: "id_n_s_250606_1",
link1: "http://www.opera.com/",
link2: "",
name: "Opera/9.00 (Windows NT 5.1; U; de)",
type: "B"
},
%{
comment: "",
description: "Opera browser 9.6x on WinXP (Presto = Operas rendering engine)",
id: "id_n_s_201008_1",
link1: "http://my.opera.com/ODIN/blog/a-look-under-the-hood-of-opera-9-6",
link2: "",
name: "Opera/9.60 (Windows NT 5.1; U; de) Presto/2.1.1",
type: "B"
},
%{
comment: "",
description: "Opidoo Search Belgium robot (62.4.83.xxx)",
id: "id_n_s_1091",
link1: "http://www.opidoo.com/",
link2: "",
name: "OpidooBOT (larbin2.6.3@unspecified.mail)",
type: "R"
},
%{
comment: "",
description: "Open Wave Phone Simulator SDK",
id: "id_n_s_080208_1",
link1: "http://developer.openwave.com/dvl/tools_and_sdk/phone_simulator/",
link2: "",
name: "OPWV-SDK UP.Browser/7.0.2.3.119 (GUI) MMP/2.0 Push/PO",
type: "B"
},
%{
comment: "",
description: "Oracle Application Server cache",
id: "id_n_s_190406_2",
link1: "http://www.oracle.com/appserver/index.html",
link2: "",
name: "Oracle Application Server Web Cache 10g",
type: "P"
},
%{
comment: "",
description: "Oracle interMedia Text - Text and web documents indexing",
id: "id_n_s_1092",
link1: "http://www.oracle.com/technology//products/text/index.html",
link2: "",
name: "Oracle iMTCrawler",
type: "D"
},
%{
comment: "",
description: "Oracle Search",
id: "id_n_s_1093",
link1: "http://www.oracle.com/",
link2: "",
name: "Oracle Ultra Search",
type: "R"
},
%{
comment: "",
description: "Orangeslicer semantic search (Beta) Germany (193.201.52.1xx)",
id: "id_n_s_220306_1",
link1: "http://www.orangeslicer.com/",
link2: "",
name: "OrangeSpider",
type: "R"
},
%{
comment: "",
description: "Orbiter - DailyOrbit search spider",
id: "id_n_s_1094",
link1: "http://www.dailyorbit.com/",
link2: "",
name: "Orbiter/T-2.0 (+http://www.dailyorbit.com/bot.htm)",
type: "R"
},
%{
comment: "",
description: "Orca browser - based on Gecko",
id: "id_n_s_150206_1",
link1: "http://www.orcabrowser.com",
link2: "",
name: "Orca Browser (http://www.orcabrowser.com)",
type: "B"
},
%{
comment: "Spyware proxy service",
description: "Marketscore (was Netsetter) internet accelerator",
id: "id_n_s_251205_1",
link1: "http://www.marketscore.com/Home.aspx",
link2: "",
name: "OSSProxy 1.3.305.321 (Build 305.321 Win32 en-us)(Dec 21 2005 16:30:54)",
type: "P"
},
%{
comment: "",
description: "Unknown robot from Chinanet (220.181.8.xxx)",
id: "id_n_s_141105_1",
link1: "",
link2: "",
name: "OutfoxBot/0.x (For internet experiments; http://; outfox.agent@gmail.com)",
type: ""
},
%{
comment: "",
description: "Unknown robot from Chinanet (60.191.80.1)",
id: "id_n_s_221106_1",
link1: "",
link2: "",
name: "OutfoxMelonBot/0.5 (for internet experiments; http://; outfoxbot@gmail.com)",
type: ""
},
%{
comment: "",
description: "Overture/Fast/Alltheweb crawler (66.77.73.xxx)",
id: "id_n_s_1095",
link1: "http://www.alltheweb.com/",
link2: "",
name:
"Overture-WebCrawler/3.8/Fresh (atw-crawler at fast dot no; http://fast.no/support/crawler.asp)",
type: "R"
},
%{
comment: "",
description: "Unknown robot from 198.169.127.xx (innovationplace.com)",
id: "id_n_s_1096",
link1: "",
link2: "",
name: "OWR_Crawler 0.1",
type: ""
},
%{
comment: "87.139.106.xx",
description: "Ozelot - Flying Cat's search engine robot (Germany)",
id: "id_n_s_090906_1",
link1: "http://www.flying-cat.de/ozelot/",
link2: "",
name:
"ozelot/2.7.3 (Search engine indexer; www.flying-cat.de/ozelot; ozelot@flying-cat.de)",
type: "R"
},
%{
comment: "72.167.37.20x",
description: "PADLibrary.com - PAD file software robot for FindFiles.com",
id: "id_n_s_290108_2",
link1: "http://padlibrary.com/",
link2: "http://www.findfiles.com/",
name: "PADLibrary Spider",
type: "R"
},
%{
comment: "208.185.247.xx",
description: "Pagebites job search crawler",
id: "id_n_s_150207_3",
link1: "http://www.pagebites.com/",
link2: "",
name: "PageBitesHyperBot/600 (http://www.pagebites.com/)",
type: "R"
},
%{
comment: "209.9.228.1xx",
description: "Pagebull visual search engine",
id: "id_n_s_111206_1",
link1: "http://www.pagebull.com/",
link2: "",
name: "Pagebull http://www.pagebull.com/",
type: "R"
},
%{
comment: "70.85.129.12x",
description: "Pagestacker online bookmark service",
id: "id_n_s_051207_3",
link1: "http://www.pagestacker.com/",
link2: "",
name: "Pagestacker Bot",
type: "C"
},
%{
comment: "206.169.110.xx",
description: "Secure Computing SmartFilter Tools - malware crawler",
id: "id_n_s_290506_1",
link1: "http://www.securecomputing.com/PageVerifier.cfm",
link2: "",
name: "page_verifier (http://www.securecomputing.com/goto/pv)",
type: "R"
},
%{
comment: "",
description: "Downloadmanager ?",
id: "id_n_s_1097",
link1: "",
link2: "",
name: "PagmIEDownload",
type: "D"
},
%{
comment: "",
description: "CFC crawler used by Italian academic and research network (GARR)",
id: "id_n_s_1098",
link1: "http://www.garr.it/",
link2: "",
name: "parallelContextFocusCrawler1.1parallelContextFocusCrawler1.1",
type: "R"
},
%{
comment: "",
description: "http://www.ianett.com robot",
id: "id_n_s_1099",
link1: "http://www.ianett.com/",
link2: "",
name: "ParaSite/1.0b (http://www.ianett.com/parasite/)",
type: "R"
},
%{
comment: "",
description: "Patsearch (Germany) robot",
id: "id_n_s_1100",
link1: "http://www.herz-power.de/",
link2: "",
name: "Patwebbot (http://www.herz-power.de/technik.html)",
type: "R"
},
%{
comment: "",
description: "Pavuk web downloading program for Unix",
id: "id_n_s_1101",
link1: "http://www.idata.sk/%7Eondrej/pavuk/about.html",
link2: "",
name: "pavuk/0.9pl29b i686-pc-linux-gnu",
type: "D"
},
%{
comment: "- UA sometimes DSurf15a",
description: "Some site scanning tool via diff. IPs- i.e.: - cox.net (68.4.xxx.xxx)",
id: "id_n_s_1102",
link1: "",
link2: "",
name: "PBrowse 1.4b",
type: "S"
},
%{
comment: "",
description: "Post.sk / Eurotel.sk robot",
id: "id_n_s_1103",
link1: "",
link2: "",
name: "pd02_1.0.0 pd02_1.0.0@dzimi@post.sk",
type: "R"
},
%{
comment: "",
description: "Pear HTTP_Request PHP extension package",
id: "id_n_s_1104",
link1: "http://pear.php.net/",
link2: "",
name: "PEAR HTTP_Request class ( http://pear.php.net/ )",
type: ""
},
%{
comment: "",
description: "Peerbot - favicon search robot",
id: "id_n_s_1105",
link1: "http://www.peerbot.com/",
link2: "",
name: "PEERbot www.peerbot.com",
type: "R"
},
%{
comment: "",
description: "Unknown robot from 64.5.48.xxx (Plethoric.net)",
id: "id_n_s_1106",
link1: "",
link2: "",
name: "PeopleChat/Search_Engine",
type: ""
},
%{
comment: "s. DBrowse- PSurf etc.",
description: "Some site scanning tool via diff. IPs",
id: "id_n_s_1107",
link1: "",
link2: "",
name: "PEval 1.4b",
type: "S"
},
%{
comment: "",
description: "diff. IPs / services",
id: "id_n_s_1108",
link1: "",
link2: "",
name: "PHP/3.x.xx",
type: ""
},
%{
comment: "",
description: "diff. IPs / services",
id: "id_n_s_1109",
link1: "",
link2: "",
name: "PHP/4.0.4pl1",
type: ""
},
%{
comment: "in conjunction w. Weblink's Checker UA",
description: "diff. IPs / services- i.e.: -NTT/Verio Inc. link checker",
id: "id_n_s_1110",
link1: "http://www.verio.com/",
link2: "",
name: "PHP/4.0.6",
type: "C"
},
%{
comment: "",
description: "diff. IPs / services- i.e.: - Phenominet.com link checking",
id: "id_n_s_1111",
link1: "http://www.phenominet.com",
link2: "",
name: "PHP/4.1.1",
type: "C"
},
%{
comment: "Mixcat s. also Felix and Morris",
description:
"diff. IPs / services- i.e.: - 209.114.200.xx = MyNetCrawler link checking - 216.139.207.xxx = Mixcat crawler",
id: "id_n_s_1112",
link1: "http://mynetcrawler.com/",
link2: "http://mixcat.com",
name: "PHP/4.1.2",
type: ""
},
%{
comment: "",
description: "Pico Search robot",
id: "id_n_s_1113",
link1: "http://www.picosearch.com/",
link2: "",
name: "PicoSearch/1.0",
type: "R"
},
%{
comment: "",
description: "Piffany targeted search web spider",
id: "id_n_s_010506_3",
link1: "http://www.piffany.com/",
link2: "http://www.piffany.com/spider.html",
name: "Piffany_Web_Scraper_v0.x",
type: "R"
},
%{
comment: "",
description: "Piffany targeted search web spider",
id: "id_n_s_010506_2",
link1: "http://www.piffany.com/",
link2: "http://www.piffany.com/spider.html",
name: "Piffany_Web_Spider_v0.x",
type: "R"
},
%{
comment: "",
description:
"Whois Source domain name information robot (66.249.26.xx)- s.also: - SurveyBot",
id: "id_n_s_1114",
link1: "http://www.whois.sc/",
link2: "",
name: "PigeonBot1.0 BETA",
type: "R C"
},
%{
comment: "",
description: "PingALink website monitoring",
id: "id_n_s_1115",
link1: "http://www.pingalink.com/",
link2: "",
name: "PingALink Monitoring Services 1.0",
type: "R C"
},
%{
comment: "",
description: "PingALink website monitoring",
id: "id_n_s_1116",
link1: "http://www.pingalink.com/",
link2: "",
name: "PingALink Monitoring Services 1.0 (http://www.pingalink.com)",
type: "R C"
},
%{
comment: "66.98.148.xx",
description: "Pingdom web site monitoring",
id: "id_n_s_120607_1",
link1: "http://www.pingdom.com/",
link2: "",
name: "Pingdom GIGRIB (http://www.pingdom.com)",
type: "C"
},
%{
comment: "",
description: "pipeline search (DMOZ based) search robot (24.106.39. xxx)",
id: "id_n_s_1117",
link1: "http://www.pipeline-search.com/",
link2: "",
name:
"pipeLiner/0.3a (PipeLine Spider;http://www.pipeline-search.com/webmaster.html; webmaster'at'pipeline-search.com)",
type: "R"
},
%{
comment: "",
description: "pipeline search (DMOZ based) search robot (24.106.39. xxx)",
id: "id_n_s_1118",
link1: "http://www.pipeline-search.com/",
link2: "",
name: "pipeLiner/0.xx (PipeLine Spider; http://www.pipeline-search.com/webmaster.html)",
type: "R"
},
%{
comment: "now WebVac s. there",
description: "Pita crawler",
id: "id_n_s_1119",
link1: "http://www-diglib.stanford.edu/~testbed/doc2/WebBase/webbase-pages.html",
link2: "",
name: "Pita",
type: "R"
},
%{
comment: "",
description: "Private user-agent via Hurricane Electric Internet Services",
id: "id_n_s_1120",
link1: "http://www.he.net/",
link2: "",
name: "Pizilla++ ver 2.45",
type: "B ?"
},
%{
comment: "",
description: "Portaljuice spider",
id: "id_n_s_1121",
link1: "http://www.portaljuice.com/",
link2: "",
name: "PJspider/3.0 (pjspider@portaljuice.com; http://www.portaljuice.com)",
type: "R"
},
%{
comment: "",
description: "Plagger - pluggable RSS/Atom feed aggregator written in Perl",
id: "id_n_s_121106_1",
link1: "http://plagger.org/trac",
link2: "",
name: "Plagger/0.x.xx (http://plagger.org/)",
type: "B"
},
%{
comment: "",
description: "unknown ucsd.edu robot",
id: "id_n_s_1122",
link1: "",
link2: "",
name: "PlagiarBot/1.0",
type: "R"
},
%{
comment: "",
description: "Plantynet web filtering services - Blacklist DB robot",
id: "id_n_s_1123",
link1: "http://www.plantynet.com/",
link2: "",
name: "PlantyNet_WebRobot_V1.9 dhkang@plantynet.com",
type: "R P"
},
%{
comment: "Doesn't read robots.txt - Plinki.com's website has no content",
description: "Unknown UA from 66.220.23.2xx",
id: "id_n_s_120106_1",
link1: "http://www.plinki.com/",
link2: "",
name:
"plinki/0.1 (you got plinked! (thats a good thing..); http://www.plinki.com; crawl@plinki.com)",
type: ""
},
%{
comment: "66.179.81.1xx",
description: "Pluck RSS feed crawler",
id: "id_n_s_061206_2",
link1: "http://www.pluck.com/",
link2: "",
name:
"PluckFeedCrawler/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://www.pluck.com; 1 subscribers)",
type: "R"
},
%{
comment: "209.85.62.1xx",
description: "Pluggd Podcast search engine",
id: "id_n_s_140807_1",
link1: "http://www.pluggd.com/",
link2: "",
name:
"Pluggd/Nutch-0.9 (automated crawler http://www.pluggd.com;support at pluggd dot com)",
type: "R"
},
%{
comment: "",
description:
"Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan",
id: "id_n_s_1124",
link1: "http://www.vector.co.jp/soft/win95/net/se077067.html",
link2: "",
name: "Pockey-GetHTML/4.12.0 (Win32; GUI; ix86)",
type: "D"
},
%{
comment: "",
description:
"Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan",
id: "id_n_s_1125",
link1: "http://www.vector.co.jp/soft/win95/net/se077067.html",
link2: "",
name: "Pockey-GetHTML/x.xx",
type: "D"
},
%{
comment: "",
description:
"Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan",
id: "id_n_s_1126",
link1: "http://www.vector.co.jp/soft/win95/net/se077067.html",
link2: "",
name: "Pockey/x.x.x",
type: "D"
},
%{
comment: "",
description:
"Yutaka Endo's Pockey / GetHTML / GetHTMLW - some downloading tool from Japan",
id: "id_n_s_1127",
link1: "http://www.vector.co.jp/soft/win95/net/se077067.html",
link2: "",
name: "Pockey7.x.x(WIN32GUI)",
type: "D"
},
%{
comment: "",
description: "HTTP user-agent for POE (portable networking framework for Perl )",
id: "id_n_s_1128",
link1: "http://search.cpan.org/dist/POE-Component-Client-HTTP/HTTP.pm",
link2: "",
name: "POE-Component-Client-HTTP/0.64 (perl; N; POE; en; rv:0.640000)",
type: ""
},
%{
comment:
"appears also as LWP::Simple/5.803 - Mozilla/4.76 [en] (Win98; U) - Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)",
description:
"ThePlanet/jaja-jak-globusy.com Google Adsense refferer spam bot from 70.85.116.* / 70.84.128.xxx / 70.85.193.xxx",
id: "id_n_s_291105_2",
link1: "http://spamhuntress.com/wiki/Manila_Industries",
link2: "",
name: "Poirot",
type: "S"
},
%{
comment: "",
description: "Polybot webcrawler",
id: "id_n_s_1129",
link1: "http://cis.poly.edu/polybot/",
link2: "",
name: "polybot 1.0 (http://cis.poly.edu/polybot/)",
type: "R"
},
%{
comment: "",
description: "Dir.com / Iliad French recherche robot",
id: "id_n_s_1130",
link1: "http://www.iliad.fr/",
link2: "",
name: "Pompos/1.x http://dir.com/pompos.html",
type: "R"
},
%{
comment: "",
description: "Iliad / Free French recherche robot",
id: "id_n_s_1131",
link1: "http://www.iliad.fr/",
link2: "",
name: "Pompos/1.x pompos@iliad.fr",
type: "R"
},
%{
comment: "",
description: "Popdex - web site popularity crawler",
id: "id_n_s_1132",
link1: "http://www.popdex.com/",
link2: "",
name: "Popdexter/1.0",
type: "R"
},
%{
comment: "s. also - Wells Search II",
description: "Unknown spam bot / harvester (63.223.10.***)",
id: "id_n_s_1133",
link1: "",
link2: "",
name: "Port Huron Labs",
type: "S"
},
%{
comment: "",
description: "PortalB (now Alacra search) spider",
id: "id_n_s_1134",
link1: "http://www.portalb.com/alacra/index.htm",
link2: "",
name: "PortalBSpider/2.0 (spider@portalb.com)",
type: "R"
},
%{
comment: "",
description: "portalmmm IMode mobile browser",
id: "id_n_s_080706_2",
link1: "",
link2: "",
name: "portalmmm/2.0 S500i(c20;TB)",
type: "B"
},
%{
comment: "",
description: "Yahoo (66.94.237.1xx / 216.109.121.xx) favorites tracking robot",
id: "id_n_s_1135",
link1: "",
link2: "",
name: "PostFavorites",
type: "C"
},
%{
comment: "",
description: "Potbot : A simple IRC bot written in Perl",
id: "id_n_s_1136",
link1: "http://sourceforge.net/projects/potbot/",
link2: "",
name: "potbot 1.0",
type: "R"
},
%{
comment: "",
description: "Project Rialto - data mining development project",
id: "id_n_s_050408_2",
link1: "http://projectrialto.com/index.html",
link2: "",
name: "PRCrawler/Nutch-0.9 (data mining development project; crawler@projectrialto.com)",
type: "R"
},
%{
comment: "",
description: "CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements",
id: "id_n_s_1137",
link1: "http://cups.cs.cmu.edu/",
link2: "http://privacybird.com/",
name: "PrivacyFinder Cache Bot v1.0",
type: "R"
},
%{
comment: "",
description: "CUPS robot for AT&T Privacy Bird Privacy Preferences (P3P) enhancements",
id: "id_n_s_111205_2",
link1: "http://cups.cs.cmu.edu/",
link2: "http://privacybird.com/",
name: "PrivacyFinder/1.1",
type: "R"
},
%{
comment: "s.also (Privoxy/1.0)",
description: "Privoxy web proxy",
id: "id_n_s_1138",
link1: "http://www.privoxy.org/",
link2: "",
name: "Privoxy/3.0 (Anonymous)",
type: "P"
},
%{
comment: "",
description:
"Some site scanning tool from diff. IPs- i.e.: - 67.99.33.x (lightningcon.broadwing.net)",
id: "id_n_s_1139",
link1: "",
link2: "",
name: "Production Bot 0116B",
type: "S"
},
%{
comment: "",
description: "Some site scanning tool from diff. IPs- i.e.: - 216.232.64.xx (telus.net)",
id: "id_n_s_1140",
link1: "",
link2: "",
name: "Production Bot 2016B",
type: "S"
},
%{
comment: "",
description:
"Some site scanning tool from diff. IPs- i.e.: - 141.154.181.xxx (east.verizon.net)",
id: "id_n_s_1141",
link1: "",
link2: "",
name: "Production Bot DOT 3016B",
type: "S"
},
%{
comment: "- see here: http://www.kloth.net/internet/badbots-2004.php",
description: "Some spam bot",
id: "id_n_s_1142",
link1: "http://www.kloth.net/internet/badbots-2004.php",
link2: "",
name: "Program Shareware 1.0.2",
type: "S"
},
%{
comment: "",
description: "unknown",
id: "id_n_s_1143",
link1: "",
link2: "",
name: "Progressive Download",
type: ""
},
%{
comment: "",
description: "unknown",
id: "id_n_s_1144",
link1: "",
link2: "",
name: "Progressive Download HTTP check",
type: ""
},
%{
comment: "",
description: "XP5 robot",
id: "id_n_s_1145",
link1: "http://marty.anstey.ca/projects/robots/index.html",
link2: "",
name: "Project XP5 [2.03.07-111203]",
type: "R"
},
%{
comment: "",
description: "Answerchase PROve Answerbot",
id: "id_n_s_1146",
link1: "http://www.answerchase.com/",
link2: "",
name: "PROve AnswerBot 4.0",
type: "R"
},
%{
comment: "",
description: "ProWebguide robot",
id: "id_n_s_1147",
link1: "http://www.prowebguide.com/",
link2: "",
name: "ProWebGuide Link Checker (http://www.prowebguide.com)",
type: "R"
},
%{
comment: "",
description: "Picsearch robot (62.119.21.13x)",
id: "id_n_s_1148",
link1: "http://www.picsearch.com/",
link2: "",
name: "psbot/0.1 (+http://www.picsearch.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Some site scanning tool via diff. IPs- i.e.: QWest Net",
id: "id_n_s_1149",
link1: "",
link2: "",
name: "PSurf15a 11",
type: "S"
},
%{
comment: "",
description:
"Some site scanning tool via diff. IPs- i.e.: Optonline net (24.191.xxx.xxx)",
id: "id_n_s_1150",
link1: "",
link2: "",
name: "PSurf15a 51",
type: "S"
},
%{
comment: "UA sometimes SSurf15a 11 or random letters like RXMYRCJ",
description:
"Some site scanning tool via diff. IPs- i.e.: - choiceone.net (216.153.xxx.xxx) - attbi.com (12.250.xxx.xxx) - optonline.net (24.191.xxx.xxx)",
id: "id_n_s_1151",
link1: "",
link2: "",
name: "PSurf15a VA",
type: "S"
},
%{
comment: "no active website",
description:
"Unknown website grabbing / ripping for unknown purposes from 208.66.195.x - Digitalinfinity.org Russia",
id: "id_n_s_160606_1",
link1: "",
link2: "",
name: "psycheclone",
type: "S"
},
%{
comment: "",
description:
"Some robot from Stanford University (171.64.75.xxx = PubCrawl.Stanford.EDU)",
id: "id_n_s_1152",
link1: "",
link2: "",
name: "PubCrawl (pubcrawl.stanford.edu)",
type: "R"
},
%{
comment: "",
description: "Parallel URL Fetcher downloading tool",
id: "id_n_s_1153",
link1: "http://puf.sourceforge.net/",
link2: "",
name: "puf/0.91beta6a (Linux 2.2.18; i686)",
type: "D"
},
%{
comment: "",
description: "Parallel URL Fetcher downloading tool",
id: "id_n_s_1154",
link1: "http://puf.sourceforge.net/",
link2: "",
name: "puf/0.93.2a (Linux 2.4.18; i686)",
type: "D"
},
%{
comment: "s. also RufusBot",
description:
"WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)",
id: "id_n_s_130407_1",
link1: "http://www.webaroo.com/index",
link2: "http://www.webaroo.com/company/site-owners",
name: "pulseBot (pulse Web Miner)",
type: "R"
},
%{
comment: "",
description: "PureSight Internet content filter",
id: "id_n_s_1155",
link1: "http://www.puresight.com/Products/PureSightHomeDescription.shtml",
link2: "",
name: "PureSight",
type: "P"
},
%{
comment: "",
description: "Puxa Rapido download manager",
id: "id_n_s_1156",
link1: "http://www.puxarapido.com.br/",
link2: "",
name: "PuxaRapido v1.0",
type: "D"
},
%{
comment: "62.149.236.2xx",
description: "ProgramacionWeb.net PWeBot link checking (Argentina)",
id: "id_n_s_230907_2",
link1: "http://www.programacionweb.net/robot-en.php",
link2: "http://www.programacionweb.net/",
name: "PWeBot/1.2 Inspector (http://www.programacionweb.net/robot.php)",
type: "R"
},
%{
comment: "",
description: "Fast Search robot (using PycURL Python component- s. below)",
id: "id_n_s_1157",
link1: "http://www.fastsearch.net/",
link2: "http://pycurl.sourceforge.net/",
name: "PycURL",
type: "R"
},
%{
comment: "",
description: "PycURL - Python interface to libcurl",
id: "id_n_s_060107_1",
link1: "http://pycurl.sourceforge.net/",
link2: "",
name: "PycURL/7.xx.x",
type: "D"
},
%{
comment: "s. also nabot- dloader- NaverBot & Cowbot",
description: "Python URL fetcher - robot used by Naver Japan/Korea",
id: "id_n_s_1158",
link1: "http://www.indyproject.org/",
link2: "http://www.python.org/",
name: "Python-urllib/1.1x",
type: "R"
},
%{
comment: "",
description: "Python URL fetcher - robot used by Google",
id: "id_n_s_1159",
link1: "http://labs.google.com",
link2: "http://www.python.org/",
name: "Python-urllib/2.0a1",
type: "R"
},
%{
comment: "",
description: "Qango.com Web Directory robot",
id: "id_n_s_1160",
link1: "http://www.qango.com/",
link2: "",
name: "Qango.com Web Directory (http://www.qango.com/)",
type: "R"
},
%{
comment: "83.33.209.10x",
description:
"QEAVis: Quantitative Evaluation of Academic Websites Visibility using Nutch",
id: "id_n_s_170408_1",
link1: "http://nlp.uned.es/qeavis/",
link2: "",
name:
"QEAVis Agent/Nutch-0.9 (Quantitative Evaluation of Academic Websites Visibility; http://nlp.uned.es/qeavis",
type: "R"
},
%{
comment: "",
description: "Quepasa!com (Latin American search) robot",
id: "id_n_s_1161",
link1: "http://www.quepasa.com/",
link2: "",
name: "QPCreep Test Rig ( We are not indexing- just testing )",
type: "R"
},
%{
comment: "",
description: "Quepasa!com (Latin American search) robot",
id: "id_n_s_1162",
link1: "http://www.quepasa.com/",
link2: "",
name: "QuepasaCreep ( crawler@quepasacorp.com )",
type: "R"
},
%{
comment: "",
description: "Quepasa!com (Latin American search) robot",
id: "id_n_s_1163",
link1: "http://www.quepasa.com/",
link2: "",
name: "QuepasaCreep v0.9.1x",
type: "R"
},
%{
comment: "",
description: "QueryN Metasearch robot",
id: "id_n_s_1164",
link1: "http://www.queryn.com/queryn/",
link2: "",
name: "QueryN Metasearch",
type: "R"
},
%{
comment: "",
description: "Blacktrees Quicksilver helper application for Mac",
id: "id_n_s_230108_2",
link1: "http://docs.blacktree.com/quicksilver/what_is_quicksilver",
link2: "",
name: "Quicksilver (Blacktree,MacOSX)",
type: "B"
},
%{
comment: "",
description: "Quicktime for Macintosh",
id: "id_n_s_230606_3",
link1: "",
link2: "",
name: "QuickTime\\xaa.7.0.4 (qtver=7.0.4;cpu=PPC;os=Mac 10.3.9)",
type: "B"
},
%{
comment: "85.158.204.2xx",
description: "Qweerybot for the Qweery search engine (in development) - Netherland",
id: "id_n_s_060107_4",
link1: "http://qweerybot.qweery.nl/",
link2: "",
name: "QweeryBot/3.01 ( http://qweerybot.qweery.nl)",
type: "R"
},
%{
comment: "85.158.204.2xx",
description: "Qweerybot for the Qweery search engine (in development) - Netherland",
id: "id_n_s_060107_3",
link1: "http://qweerybot.qweery.nl/",
link2: "",
name: "Qweery_robot.txt_CheckBot/3.01 (http://qweerybot.qweery.com)",
type: "R"
},
%{
comment: "",
description: "Radian6 RSS feed comment crawler",
id: "id_n_s_160208_1",
link1: "http://www.radian6.com/cms/index.php",
link2: "http://www.radian6.com/crawler/",
name: "R6_CommentReader_(www.radian6.com/crawler)",
type: "R"
},
%{
comment: "",
description: "Radian6 Rss feed crawler",
id: "id_n_s_160208_2",
link1: "http://www.radian6.com/cms/index.php",
link2: "http://www.radian6.com/crawler/",
name: "R6_FeedFetcher_(www.radian6.com/crawler)",
type: "R"
},
%{
comment: "",
description: "gigaBaz - the brainbot (Germany) robot",
id: "id_n_s_1165",
link1: "http://brainbot.com//site3",
link2: "",
name: "rabaz (rabaz at gigabaz dot com)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE is not me; DAUMOA ...",
description: "DAUMOA - Daum search Korea robot (211.115.109.xxx)",
id: "id_n_s_1166",
link1: "http://www.daum.net/",
link2: "",
name: "RaBot/1.0 Agent-admin/phortse@hanmail.net",
type: "R"
},
%{
comment: " - site is dead",
description: "Bot Provider for the All Womans Bot Service?",
id: "id_n_s_1167",
link1: "http://bservice.org/bots/",
link2: "",
name: "Rainbot1.1",
type: ""
},
%{
comment: "",
description: "Intersearch.de (was www.intersearch.de) robot (Germany)",
id: "id_n_s_1168",
link1: "",
link2: "",
name: "ramBot xtreme x.x",
type: "R"
},
%{
comment: "",
description: "giveRAMP Search Engine robot (64.69.43.1xx)",
id: "id_n_s_160406_2",
link1: "http://www.giveramp.com/",
link2: "",
name:
"RAMPyBot - www.giveRAMP.com/0.1 (RAMPyBot - www.giveRAMP.com; http://www.giveramp.com/bot.html; support@giveRAMP.com)",
type: "R"
},
%{
comment: "powered by Nutch",
description: "giveRAMP Search Engine robot (64.69.43.1xx)",
id: "id_n_s_260206_1",
link1: "http://www.giveramp.com/",
link2: "http://lucene.apache.org/nutch/",
name:
"RAMPyBot/0.8-dev (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
type: "R"
},
%{
comment: "",
description: "Rank Exec reciprocal link checking",
id: "id_n_s_1169",
link1: "http://www.rankexec.com/",
link2: "",
name: "Rank Exec (rankexec.com) Reciprocal Link Manager 1.x/bot",
type: "C"
},
%{
comment: "",
description: "Rankiva website popularity robot",
id: "id_n_s_180408_5",
link1: "http://www.rankiva.com/",
link2: "",
name: "Rankivabot/3.2 (www.rankiva.com; 3.2; vzmxikn)",
type: "R"
},
%{
comment: "",
description: "Innova/IBM Rational SiteCheck - Rational robot",
id: "id_n_s_1170",
link1: "http://www.rational.com.ar/defaultenglish.html",
link2: "",
name: "Rational SiteCheck (Windows NT)",
type: "R"
},
%{
comment: "199.46.198.xxx",
description:
"Unknown spider from Raytheon Company - maybe Raytheon High Speed Guard proxy",
id: "id_n_s_290708_2",
link1: "http://www.raytheon.com/",
link2: "",
name: "RAYSPIDER/Nutch-0.9",
type: "P"
},
%{
comment: "70.85.24.xx",
description: "Read A Blog - RSS feed and blog search engine",
id: "id_n_s_230207_3",
link1: "http://www.readablog.com/",
link2: "",
name: "ReadABlog Spider (compatible; 1.1; feed update; www.readablog.com)",
type: "C"
},
%{
comment: "",
description: "RealDownload download manager",
id: "id_n_s_1171",
link1: "http://service.real.com/help/faq/rdown4/rdownfaqa01.html",
link2: "",
name: "RealDownload/4.0.0.4x",
type: "D"
},
%{
comment: "",
description: "The REAP Web Crawler for the REAP project",
id: "id_n_s_100408_3",
link1: "http://reap.cs.cmu.edu/REAP-crawler/",
link2: "http://reap.cs.cmu.edu/",
name:
"REAP-crawler Nutch/Nutch-1.0-dev (Reap Project; http://reap.cs.cmu.edu/REAP-crawler/; Reap Project)",
type: "C"
},
%{
comment: "",
description: "Reaper robot for SiteSearch",
id: "id_n_s_1172",
link1: "http://marty.anstey.ca/projects/robots/reaper.html",
link2: "",
name: "Reaper [2.03.10-031204] (http://www.sitesearch.ca/reaper/)",
type: "R"
},
%{
comment: "",
description: "Reaper robot for SiteSearch",
id: "id_n_s_1173",
link1: "http://marty.anstey.ca/projects/robots/reaper.html",
link2: "",
name: "Reaper/2.0x (+http://www.sitesearch.ca/reaper)",
type: "R"
},
%{
comment: "",
description: "REBOL messaging language for distributed Internet apps",
id: "id_n_s_1174",
link1: "http://www.rebol.com/",
link2: "",
name: "REBOL Core 2.x.x.x.x",
type: ""
},
%{
comment: "",
description: "REBOL/View - machine independent internet client application",
id: "id_n_s_250307_1",
link1: "http://www.rebol.com/prod-view.html",
link2: "",
name: "REBOL View 1.x.x.x.x",
type: "B"
},
%{
comment: "",
description: "Rebusnet software site - link / submission checking",
id: "id_n_s_1175",
link1: "http://www.rebusnet.biz",
link2: "",
name: "RebusnetBot (+http://www.rebusnet.biz)",
type: "R C"
},
%{
comment: "",
description: "Rebusnet software site - link / submission checking",
id: "id_n_s_1176",
link1: "http://www.rebusnet.biz",
link2: "",
name: "RebusnetPADBot/1.5x (+http://www.rebusnet.biz)",
type: "R C"
},
%{
comment: "",
description: "Online reciprocal link checker",
id: "id_n_s_171205_1",
link1: "http://www.recip-links.com/",
link2: "",
name: "reciprocal links checker (http://www.recip-links.com/)",
type: "C"
},
%{
comment: "220.226.198.xx",
description: "rediff.com search link checking",
id: "id_n_s_110307_2",
link1: "http://www.rediff.com/",
link2: "",
name: "RedBot/redbot-1.0 (Rediff.com Crawler; redbot at rediff dot com)",
type: "C"
},
%{
comment: "",
description: "RedCarpet crawler for Pronto price comparison search(66.179.107.1xx)",
id: "id_n_s_130106_1",
link1: "http://www.redcarpet-inc.com/robots.html",
link2: "http://www.pronto.com/",
name: "RedCarpet/1.2 (http://www.redcarpet-inc.com/robots.html)",
type: "R"
},
%{
comment: "Based on Nutch",
description: "Der Bot for telegenetic.net's security related search (65.220.67.2xx)",
id: "id_n_s_171205_2",
link1: "http://www.telegenetic.net/bot.html",
link2: "",
name:
"RedCell/0.1 (InfoSec Search Bot (Coming Soon); http://www.telegenetic.net/bot.html; lhall@telegenetic.net)",
type: "R"
},
%{
comment: "Based on Nutch",
description: "Der Bot for telegenetic.net's security related search (65.220.67.2xx)",
id: "id_n_s_040106_1",
link1: "http://www.telegenetic.net/bot.html",
link2: "",
name: "RedCell/0.1 (RedCell; telegenetic.net/bot.html; lhall_at_telegenetic.net)",
type: "R"
},
%{
comment: "",
description: "RedKernel Softwares robot",
id: "id_n_s_1177",
link1: "http://www.redkernel-softwares.com/",
link2: "",
name: "RedKernel WWW-Spider 2/0 (+http://www-spider.redkernel-softwares.com/)",
type: "R"
},
%{
comment: "",
description: "REL Link Checker Lite free version of Web Link Validator",
id: "id_n_s_1178",
link1: "http://www.relsoftware.com/rlc/",
link2: "",
name: "REL Link Checker Lite x.x",
type: "C"
},
%{
comment: "",
description: "unknown",
id: "id_n_s_1179",
link1: "",
link2: "",
name: "RepoMonkey Bait & Tackle/v1.01",
type: ""
},
%{
comment: "",
description: "Rewebber proxy service",
id: "id_n_s_1180",
link1: "http://www.rewebber.com/",
link2: "",
name: "Rewebber/1.2 libwww-perl/5.41",
type: "P"
},
%{
comment: "",
description: "Applied Semantics Auto-Categorizer for QWestDex Direct",
id: "id_n_s_1181",
link1: "http://www.dotcomdirectory.com",
link2: "",
name: "rico/0.1",
type: "R"
},
%{
comment: "",
description: "RixBot Rebol Indexer for the RIX - Rebol related search (195.204.121.xx)",
id: "id_n_s_241105_2",
link1: "http://babelserver.org/rix",
link2: "",
name: "RixBot (http://babelserver.org/rix)",
type: "R"
},
%{
comment: "",
description: "StreamBox VCR user agent",
id: "id_n_s_070406_2",
link1:
"http://all-streaming-media.com/streaming-media-faq/faq-streambox-vcr-download-problems.htm",
link2: "",
name: "RMA/1.0 (compatible; RealMedia)",
type: "D"
},
%{
comment: "",
description: "Real Media server acting as client",
id: "id_n_s_1182",
link1: "http://service.real.com/help/library/whitepapers/wpaper.html",
link2: "",
name: "RMA/1.0 (compatible; RealMedia)",
type: "B P"
},
%{
comment: "",
description: "Canadian Content search crawler",
id: "id_n_s_061206_4",
link1: "http://www.canadiancontent.net/",
link2: "",
name: "RoboCrawl (http://www.canadiancontent.net)",
type: "R"
},
%{
comment: "",
description: "Canadian Content Search (207.44.220.xx) robot",
id: "id_n_s_1183",
link1: "http://www.canadiancontent.net/",
link2: "",
name: "RoboCrawl (www.canadiancontent.net)",
type: "R"
},
%{
comment: "",
description: "FindPal Australia metasearch robot (61.68.139.xx)",
id: "id_n_s_1184",
link1: "http://www.findpal.com/",
link2: "",
name: "RoboPal (http://www.findpal.com/)",
type: "R"
},
%{
comment: "",
description: "PopJapanSearch robot",
id: "id_n_s_1187",
link1: "http://www.pj-search.com/",
link2: "",
name: "Robot/www.pj-search.com",
type: "R"
},
%{
comment: "",
description: "Experimental robot using Wget via attbi.net",
id: "id_n_s_1185",
link1: "",
link2: "",
name: "Robot: NutchCrawler- Owner: wdavies@acm.org",
type: "R"
},
%{
comment: "",
description: "Supersnooper robot",
id: "id_n_s_1186",
link1: "http://www.Supersnooper.com/",
link2: "",
name: "Robot@SuperSnooper.Com",
type: "R"
},
%{
comment: "",
description: "Netscape Directory / DMOZ Open Directory link crawler",
id: "id_n_s_1188",
link1: "http://directory.mozilla.org/",
link2: "",
name: "Robozilla/1.0",
type: "R"
},
%{
comment: "",
description: "ROME - Open source Java tools for RSS and Atom feeds",
id: "id_n_s_220208_1",
link1: "https://rome.dev.java.net/",
link2: "",
name: "Rome Client (http://tinyurl.com/64t5n) Ver: 0.9",
type: "B"
},
%{
comment: "",
description: "Qualigo.de robot",
id: "id_n_s_1189",
link1: "http://www.qualigo.de/",
link2: "",
name: "Rotondo/3.1 libwww/5.3.1",
type: "R"
},
%{
comment: "Java1.4.0",
description: "different IPs using the HTTPClient library (mostly link checking)",
id: "id_n_s_1190",
link1: "http://www.innovation.ch/java/HTTPClient/",
link2: "",
name: "RPT-HTTPClient/0.3-x",
type: "C"
},
%{
comment: "s. Larbin...",
description: "Metacarta.com (66.28.xx.xxx) robot",
id: "id_n_s_1191",
link1: "http://www.metacarta.com",
link2: "",
name: "RRC (crawler_admin@bigfoot.com)",
type: "R"
},
%{
comment: "",
description: "RSS Bandit RSS/Atom reader for .NET framework",
id: "id_n_s_250707_5",
link1: "http://www.rssbandit.org/",
link2: "",
name:
"RssBandit/1.5.0.10 (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; http://www.rssbandit.org) (.NET CLR 1.1.4322.2407; WinNT 5.1.2600.0; )",
type: "B"
},
%{
comment: "209.216.63.xx",
description: "RSS Micro Search - RSS feed search engine",
id: "id_n_s_230607_3",
link1: "http://www.rssmicro.com/",
link2: "",
name: "RSSMicro.com RSS/Atom Feed Robot",
type: "R"
},
%{
comment: "",
description: "RSSOwl embedded RSS feed reader",
id: "id_n_s_080307_2",
link1: "http://www.rssowl.org/",
link2: "",
name: "RSSOwl/1.2.3 2006-11-26 (Windows; U; zhtw)",
type: "B"
},
%{
comment: "",
description: "RSSOwl embedded RSS feed reader",
id: "id_n_s_060108_1",
link1: "http://www.rssowl.org/",
link2: "",
name: "RSSOwl/1.2.4 Preview Release 2007-04-15 (Windows; U; zhtw)",
type: "B"
},
%{
comment: "",
description: "Ykoon RssReader news feed reader",
id: "id_n_s_181006_3",
link1: "http://www.rssreader.com/",
link2: "",
name: "RssReader/1.0.xx.x (http://www.rssreader.com) Microsoft Windows NT 5.1.2600.0",
type: "B"
},
%{
comment: "",
description:
"Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com",
id: "id_n_s_1192",
link1: "",
link2: "",
name: "RSurf15a 41",
type: "S"
},
%{
comment: "",
description:
"Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com",
id: "id_n_s_1193",
link1: "",
link2: "",
name: "RSurf15a 51",
type: "S"
},
%{
comment: "",
description:
"Some site scanning tool via diff. IPs- i.e.: - dslx.net (208.35.1x.xxx) - Home.com",
id: "id_n_s_1194",
link1: "",
link2: "",
name: "RSurf15a 81",
type: "S"
},
%{
comment: "based on XFN relationship lookup engine",
description: "rubhub blog spider",
id: "id_n_s_080206_2",
link1: "http://rubhub.com/main/",
link2: "http://gmpg.org/xfn/more",
name: "Rubbot/1.0 (+http://rubhub.com/)",
type: "C"
},
%{
comment: "s. also pulseBot",
description:
"WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)",
id: "id_n_s_191105_1",
link1: "http://www.webaroo.com/index",
link2: "http://www.webaroo.com/company/site-owners",
name: "RufusBot (Rufus Web Miner; http://64.124.122.252/feedback.html)",
type: "R"
},
%{
comment: "s. also pulseBot",
description:
"WebarooBot - Webaroo web site search / theme based downloading tool (64.124.122.2xx)",
id: "id_n_s_020407_1",
link1: "http://www.webaroo.com/index",
link2: "http://www.webaroo.com/company/site-owners",
name: "RufusBot (Rufus Web Miner; http://www.webaroo.com/rooSiteOwners.html)",
type: "R"
},
%{
comment: "",
description: "unknown robot from rumours.jp (202.214.69.xxx)",
id: "id_n_s_1195",
link1: "",
link2: "",
name: "Rumours-Agent",
type: ""
},
%{
comment: "",
description: "RX (Reflexive Search) Bar for IE",
id: "id_n_s_1196",
link1: "http://www.searchenginebar.com/",
link2: "",
name: "RX Bar",
type: "B"
},
%{
comment: "80.108.7.xx",
description: "Search & Links directory spider",
id: "id_n_s_160506_1",
link1: "http://search.hirners.com/",
link2: "",
name: "S&L Spider (http://search.hirners.com/)",
type: "C"
},
%{
comment: "",
description: "SEO-Tools.net link checking ?",
id: "id_n_s_1197",
link1: "http://www.seo-tools.net/",
link2: "",
name: "S.T.A.L.K.E.R. (http://www.seo-tools.net/en/bot.aspx)",
type: "C"
},
%{
comment: "",
description: "SafariBookmarkChecker for Mac OS X",
id: "id_n_s_1198",
link1: "http://www.coriolis.ch/",
link2: "",
name: "SafariBookmarkChecker (+http://www.coriolis.ch/)",
type: "C"
},
%{
comment: "202.20.190.xx",
description: "sait robot - unknown robot from Samsung International Korea",
id: "id_n_s_061107_1",
link1: "http://samsungnetworks.co.kr/eng/index.jsp",
link2: "",
name: "sait/Nutch-0.9 (SAIT Research; http://www.samsung.com)",
type: "R"
},
%{
comment: "",
description: "Sandcrawler robot from Microsoft (131.107.0.xx)",
id: "id_n_s_191105_2",
link1: "",
link2: "",
name: "SandCrawler - Compatibility Testing",
type: "R"
},
%{
comment: "",
description:
"Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute",
id: "id_n_s_170109_3",
link1: "http://boston.lti.cs.cmu.edu/crawler/",
link2: "",
name:
"SapphireWebCrawler/1.0 (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)",
type: "R"
},
%{
comment: "",
description:
"Sapphire Web Crawler from Carnegie Mellon University's Language Technologies Institute",
id: "id_n_s_170109_4",
link1: "http://boston.lti.cs.cmu.edu/crawler/",
link2: "",
name:
"SapphireWebCrawler/Nutch-1.0-dev (Sapphire Web Crawler using Nutch; http://boston.lti.cs.cmu.edu/crawler/; mhoy@cs.cmu.edu)",
type: "R"
},
%{
comment: "",
description: "WebSavvy Directory robot",
id: "id_n_s_021205_4",
link1: "http://www.websavvy.cc/bot.php",
link2: "",
name: "savvybot/0.2",
type: "R"
},
%{
comment: "",
description: "SiteSell SBIder Nutch based crawler",
id: "id_n_s_1199",
link1: "http://www.sitesell.com/",
link2: "",
name:
"SBIder/0.7 (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)",
type: "R"
},
%{
comment: "",
description: "SiteSell SBIder Nutch based crawler",
id: "id_n_s_030106_2",
link1: "http://www.sitesell.com/",
link2: "",
name:
"SBIder/0.8-dev (SBIder; http://www.sitesell.com/sbider.html; http://support.sitesell.com/contact-support.html)",
type: "R"
},
%{
comment: "",
description: "Softbyte Labs Black Widow web site ripper",
id: "id_n_s_1200",
link1: "http://sbl.net/",
link2: "",
name: "SBL-BOT (http://sbl.net)",
type: "D B"
},
%{
comment: "",
description: "ScanWeb - regular expression based web page searching tool",
id: "id_n_s_1201",
link1: "http://eserver.host.sk/",
link2: "",
name: "ScanWeb",
type: "R"
},
%{
comment: "209.216.243.xx",
description: "ScholarUniverse - Scholarly experts search robot",
id: "id_n_s_301006_1",
link1: "http://www.scholaruniverse.com/index.jsp",
link2: "",
name:
"ScholarUniverse/0.8 (Nutch;+http://scholaruniverse.com/bot.jsp; fetch-agent@scholaruniverse.com)",
type: "R"
},
%{
comment: "",
description: "URL Spider Pro (USP) used by German Schwarzmann GmbH",
id: "id_n_s_1202",
link1: "http://www.schwarzmann.biz/",
link2: "",
name: "schwarzmann.biz-Spider_for_paddel.org+(http://www.innerprise.net/usp-spider.asp)",
type: "R"
},
%{
comment: "",
description: "1X Web Browser",
id: "id_n_s_1203",
link1: "http://www.scitrav.com/",
link2: "",
name: "Science Traveller International 1X/1.0",
type: "B"
},
%{
comment: "s. also Mozilla/3.0 (compatible; ScollSpider ...",
description: "WebWobot UK search engine robot (82.43.129.2xx)",
id: "id_n_s_190407_1",
link1: "http://www.webwobot.com/",
link2: "",
name: "ScollSpider/2.0 (+http://www.webwobot.com/ScollSpider.php)",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1206",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.0.EU",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1207",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.0.FS",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1208",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.0.HD",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1209",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.0.VNS",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1210",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.0QI",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1211",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1212",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.BT",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1213",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.DIL",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1214",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.EX",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1215",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.JT",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1216",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.NIV",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1217",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.SF0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1218",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.2.snippet",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1219",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-3.3dev",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1220",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-ARS-1.1",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1221",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-ARS-1.1-ih",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1222",
link1: "http://www.altavista.com/",
link2: "",
name: "scooter-venus-3.0.vns",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1223",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-W3-1.0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1224",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter-W3.1.2",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1225",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/1.0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1226",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/1.0 scooter@pa.dec.com",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1227",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/1.1 (custom)",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1228",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/2.0 G.R.A.B. V1.1.0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1229",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/2.0 G.R.A.B. X2.0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1230",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/3.3",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1232",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/3.3.QA.pczukor",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1233",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/3.3.vscooter",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1231",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter/3.3_SF",
type: "R"
},
%{
comment: "",
description: "Altavista using Mercator robot",
id: "id_n_s_1234",
link1: "http://www.altavista.com/",
link2: "http://www.research.compaq.com/SRC/mercator/",
name: "Scooter2_Mercator_x-x.0",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1204",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter_bh0-3.0.3",
type: "R"
},
%{
comment: "",
description: "Altavista robot",
id: "id_n_s_1205",
link1: "http://www.altavista.com/",
link2: "",
name: "Scooter_trk3-3.0.3",
type: "R"
},
%{
comment: "",
description: "Scope Navigator mobile browser (Japan)",
id: "id_n_s_190306_3",
link1: "http://www.programmer.co.jp/scope.shtml",
link2: "",
name: "Scope (Mars+)",
type: "B"
},
%{
comment: "",
description: "Some nec.com robot using Research Republic ScoutAbout Research Tool",
id: "id_n_s_1235",
link1: "http://www.researchrepublic.com/",
link2: "",
name: "ScoutAbout",
type: "R"
},
%{
comment: "66.230.171.17x",
description: "Ant.com search robot",
id: "id_n_s_051207_4",
link1: "http://www.ant.com/",
link2: "",
name: "ScoutAnt/0.1; +http://www.ant.com/what_is_ant.com/",
type: "R"
},
%{
comment: "",
description: "ScoutMaster information retrieval software",
id: "id_n_s_271105_3",
link1: "http://www.scoutmaster.de/",
link2: "",
name: "scoutmaster",
type: "R"
},
%{
comment: "s.also Mozilla/5.0 (compatible; Scrubby/2.2 ...",
description: "Scrub the web robot (66.93.156.xx)",
id: "id_n_s_1236",
link1: "http://www.scrubtheweb.com/",
link2: "",
name: "Scrubby/2.x (http://www.scrubtheweb.com/)",
type: "R"
},
%{
comment: "s.also Mozilla/5.0 (compatible; Scrubby/2.2 ...",
description: "Scrub the web robot (66.93.156.xx)",
id: "id_n_s_030308_3",
link1: "http://www.scrubtheweb.com/",
link2: "",
name: "Scrubby/3.0 (+http://www.scrubtheweb.com/help/technology.html)",
type: "R"
},
%{
comment: "",
description: "URL Search+ search software",
id: "id_n_s_1240",
link1: "http://srchplus.chat.ru/index.htm",
link2: "",
name: "Search+",
type: "R"
},
%{
comment: "",
description: "Xtreem Search Engine Studio - SE software",
id: "id_n_s_110606_3",
link1: "http://www.xtreeme.com/search-engine-studio/",
link2: "",
name: "Search-Engine-Studio",
type: "R"
},
%{
comment: "",
description: "Search.ch robot",
id: "id_n_s_1237",
link1: "http://www.search.ch/",
link2: "",
name: "search.ch V1.4",
type: "R"
},
%{
comment: "",
description: "Search.ch robot",
id: "id_n_s_1238",
link1: "http://www.search.ch/",
link2: "",
name: "search.ch V1.4.2 (spiderman@search.ch; http://www.search.ch)",
type: "R"
},
%{
comment: "",
description: "Enterprise Search web indexing / site searching tool",
id: "id_n_s_1239",
link1: "http://www.innerprise.net/es-bi.asp",
link2: "",
name: "Search/1.0 (http://www.innerprise.net/es-spider.asp)",
type: "R"
},
%{
comment: "",
description: "Unknown robot / website grabber from Chinatelecom (219.142.78.xxx)",
id: "id_n_s_1241",
link1: "",
link2: "",
name: "searchbot admin@google.com",
type: "S"
},
%{
comment: "",
description: "SearchByUSA robot (69.150.7.xxx)",
id: "id_n_s_1242",
link1: "http://www.searchbyusa.com/",
link2: "",
name:
"SearchByUsa/2 (SearchByUsa; http://www.SearchByUsa.com/bot.html; info@SearchByUsa.com)",
type: "R"
},
%{
comment: "85.25.131.1xx",
description: "Searchday (Germany) search robot",
id: "id_n_s_231006_1",
link1: "http://www.searchday.de/",
link2: "",
name: "SearchdayBot",
type: "R"
},
%{
comment: "",
description: "Searchexpress spider",
id: "id_n_s_1243",
link1: "http://www.searchexpress.com/",
link2: "",
name: "SearchExpress Spider0.99",
type: "R"
},
%{
comment: "",
description: "Searchguild forum & directory robot (81.3.75.xxx)",
id: "id_n_s_1245",
link1: "http://searchguild.com/",
link2: "",
name: "SearchGuild/DMOZ/Experiment (searchguild@gmail.com)",
type: "R"
},
%{
comment: "",
description: "Searchguild forum & directory robot (81.3.75.xxx)",
id: "id_n_s_1244",
link1: "http://searchguild.com/",
link2: "",
name: "SearchGuild_DMOZ_Experiment (chris@searchguild.com)",
type: "R"
},
%{
comment: "",
description: "Searchit robot (69.93.107.xx)",
id: "id_n_s_1246",
link1: "http://www.searchit-now.co.uk",
link2: "",
name: "Searchit-Now Robot/2.2 (+http://www.searchit-now.co.uk)",
type: "R"
},
%{
comment: "64.202.100.",
description: "Searchmee! Search Engine (prototype) robot by findanisp.com",
id: "id_n_s_220906_3",
link1: "http://www.searchmee.com/",
link2: "",
name: "Searchmee! Spider v0.98a",
type: "R"
},
%{
comment: "",
description: "SearchSight search robot",
id: "id_n_s_100506_1",
link1: "http://searchsight.com/",
link2: "",
name: "SearchSight/2.0 (http://SearchSight.com/)",
type: "R"
},
%{
comment: "",
description: "SearchSpider robot",
id: "id_n_s_1247",
link1: "http://www.searchspider.com/",
link2: "",
name: "SearchSpider.com/1.1",
type: "R"
},
%{
comment: "",
description: "SearchSpider robot",
id: "id_n_s_1248",
link1: "http://www.searchspider.com/",
link2: "",
name:
"Searchspider/1.2 (SearchSpider; http://www.searchspider.com; webmaster@searchspider.com)",
type: "R"
},
%{
comment: "",
description: "Janas (Ideare.com / Tiscali.it) robot",
id: "id_n_s_1249",
link1: "http://www.ideare.com/",
link2: "http://www.tiscali.it",
name: "SearchTone2.0 - IDEARE",
type: "R"
},
%{
comment: "195.27.215.xx",
description: "seekport. beta search (Germany) robot",
id: "id_n_s_1250",
link1: "http://www.seekbot.net/",
link2: "",
name: "Seekbot/1.0 (http://www.seekbot.net/bot.html) HTTPFetcher/0.3",
type: "R"
},
%{
comment: "195.27.215.xx",
description: "seekport. beta search (Germany) robot",
id: "id_n_s_1251",
link1: "http://www.seekbot.net/",
link2: "",
name: "Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.0 (XDF)",
type: "R"
},
%{
comment: "195.27.215.xx",
description: "seekport. beta search (Germany) robot",
id: "id_n_s_1252",
link1: "http://www.seekbot.net/",
link2: "",
name: "Seekbot/1.0 (http://www.seekbot.net/bot.html) RobotsTxtFetcher/1.2",
type: "R"
},
%{
comment: "12.199.64.xx",
description: "Lookseek search robot / link checking",
id: "id_n_s_1253",
link1: "http://www.lookseek.com/",
link2: "",
name: "Seeker.lookseek.com",
type: "R"
},
%{
comment: "",
description: "semaforo.net web filtering software",
id: "id_n_s_011006_3",
link1: "http://www.semaforo.net/en/default.htm",
link2: "",
name: "semaforo.net",
type: "P"
},
%{
comment: "212.114.209.2xx",
description: "Semager.de (was NG-Search) semantic search - Germany",
id: "id_n_s_020807_2",
link1: "http://www.semager.de/",
link2: "http://www.semager.de/blog/semager-bots/",
name: "Semager/1.1 (http://www.semager.de/blog/semager-bots/)",
type: "R"
},
%{
comment: "212.114.209.2xx",
description: "Semager.de (was NG-Search) semantic search - Germany",
id: "id_n_s_230507_2",
link1: "http://www.semager.de/",
link2: "http://www.semager.de/blog/semager-bots/",
name: "Semager/1.x (http://www.semager.de)",
type: "R"
},
%{
comment: "",
description: "Semantic Discovery domain checking tool",
id: "id_n_s_1254",
link1: "http://www.semanticdiscovery.com/products.html",
link2: "",
name: "semanticdiscovery/0.x",
type: "R C"
},
%{
comment: "",
description: "Sensis Australia search robot",
id: "id_n_s_1255",
link1: "http://www.sensis.com.au/",
link2: "",
name: "Sensis Web Crawler (search_comments\\at\\sensis\\dot\\com\\dot\\au)",
type: "R"
},
%{
comment: "",
description: "Sensis Australia search robot",
id: "id_n_s_1256",
link1: "http://www.sensis.com.au/",
link2: "",
name: "Sensis.com.au Web Crawler (search_comments\\at\\sensis\\dot\\com\\dot\\au)",
type: "R"
},
%{
comment: "212.80.76.xx",
description: "Seznam Search (Czech Republic) robot",
id: "id_n_s_1257",
link1: "http://www.seznam.cz/",
link2: "",
name: "SeznamBot/1.0",
type: "R"
},
%{
comment: "212.80.76.xx",
description: "Seznam Search (Czech Republic) robot",
id: "id_n_s_1258",
link1: "http://www.seznam.cz/",
link2: "",
name: "SeznamBot/1.0 (+http://fulltext.seznam.cz/)",
type: "R"
},
%{
comment: "212.80.76.xx",
description: "Seznam Search (Czech Republic) robot",
id: "id_n_s_080907_2",
link1: "http://www.seznam.cz/",
link2: "",
name: "SeznamBot/2.0-test (+http://fulltext.sblog.cz/)",
type: "R"
},
%{
comment: "67.228.100.1xx / 67.228.102.2xx",
description:
"Unknown robot from Shablast.com - Website has no content - Ignores robots.txt",
id: "id_n_s_280208_2",
link1: "http://shablast.com/",
link2: "",
name: "ShablastBot 1.0",
type: "S"
},
%{
comment: "",
description: "Shareaza P2P peer-to-peer download client",
id: "id_n_s_1259",
link1: "http://www.shareaza.com/",
link2: "",
name: "Shareaza v1.x.x.xx",
type: "D B"
},
%{
comment: "",
description: "SharewarePlaza File Check Bot - link checking",
id: "id_n_s_1260",
link1: "http://www.sharewareplaza.com/",
link2: "",
name: "SharewarePlazaFileCheckBot/1.0+(+http://www.SharewarePlaza.com)",
type: "R C"
},
%{
comment: "s. also Shim-Crawler ...",
description:
"Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)",
id: "id_n_s_1261",
link1: "http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html",
link2: "http://www.kototoi.org/index.html",
name: "Shim Crawler",
type: "R"
},
%{
comment: "s. also Shim Crawler",
description:
"Chikayama-Taura Lab Shim-Crawler used for The Kototoi Project (Japan) - (133.11.36.xx)",
id: "id_n_s_240106_2",
link1: "http://www.logos.ic.i.u-tokyo.ac.jp/crawler/index.en.html",
link2: "http://www.kototoi.org/index.html",
name:
"Shim-Crawler(Mozilla-compatible; http://www.logos.ic.i.u-tokyo.ac.jp/crawler/; crawl@logos.ic.i.u-tokyo.ac.jp)",
type: "R"
},
%{
comment: "4.78.166.1xx",
description: "ShopWiki shopping search based on LittleWiki search",
id: "id_n_s_131205_1",
link1: "http://www.shopwiki.com/",
link2: "http://dev.littlewiki.com/wiki/Home",
name: "ShopWiki/1.0 ( +http://www.shopwiki.com/)",
type: "R"
},
%{
comment: "4.78.166.1xx",
description: "ShopWiki shopping search based on LittleWiki search",
id: "id_n_s_250706_1",
link1: "http://www.shopwiki.com/",
link2: "http://dev.littlewiki.com/wiki/Home",
name: "ShopWiki/1.0 ( +http://www.shopwiki.com/wiki/Help:Bot)",
type: "R"
},
%{
comment: "",
description: "Shoula Search Engine crawler",
id: "id_n_s_1262",
link1: "http://www.shoula.com/",
link2: "",
name: "Shoula.com Crawler 2.0",
type: "R"
},
%{
comment: "",
description: "Siets Crawler - Web based site crawling application",
id: "id_n_s_230107_1",
link1: "http://www.siets.biz/products/crawler/",
link2: "",
name: "SietsCrawler/1.1 (+http://www.siets.biz)",
type: "R"
},
%{
comment: "",
description: "Sigram's Nutch robot - crawler testing",
id: "id_n_s_070308_1",
link1: "http://www.sigram.com/bot.html",
link2: "",
name:
"Sigram/Nutch-1.0-dev (Test agent for Nutch development; http://www.sigram.com/bot.html; bot at sigram dot com)",
type: "R"
},
%{
comment: "62.68.196.xx",
description: "Siigle search (Turkey) robot",
id: "id_n_s_050906_1",
link1: "http://www.siigle.com/",
link2: "",
name: "Siigle Orumcex v.001 Turkey (http://www.siigle.com)",
type: "R"
},
%{
comment: "s. also Slider_Search...",
description: "Slider Search directory robot (194.213.194.2xx)",
id: "id_n_s_171006_1",
link1: "http://www.slider.com/index.html",
link2: "",
name: "silk/1.0",
type: "R"
},
%{
comment: "s. also Slider_Search...",
description: "Slider Search directory robot (194.213.194.2xx)",
id: "id_n_s_281205_1",
link1: "http://www.slider.com/index.html",
link2: "",
name: "silk/1.0 (+http://www.slider.com/silk.htm)/3.7",
type: "R"
},
%{
comment: "",
description: "SimpleFavPanel - IE newsfeed panel plugin",
id: "id_n_s_131206_2",
link1:
"http://www.egrath.net/index.php?ExplorerBarPlus%2F%A5%D1%A5%CD%A5%EB%B0%EC%CD%F7%2FSimpleFavPanel",
link2: "",
name: "SimpleFavPanel/1.2",
type: "B"
},
%{
comment: "s. also Argus",
description: "Simpy bookmarking and personal search engine",
id: "id_n_s_1263",
link1: "http://www.simpy.com/",
link2: "",
name: "Simpy 1.x; http://www.simpy.com/",
type: "R C"
},
%{
comment: "s. also Argus",
description: "Simpy bookmarking and personal search engine",
id: "id_n_s_1264",
link1: "http://www.simpy.com/",
link2: "",
name: "Simpy/1.x (Simpy; http://www.simpy.com/?ref=bot; feedback at simpy dot com)",
type: "R C"
},
%{
comment: "88.255.173.xx",
description: "Sirketçe search - Turkey",
id: "id_n_s_180707_2",
link1: "http://www.sirketce.com/",
link2: "",
name: "Sirketcebot/v.01 (http://www.sirketce.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "SiteBar online bookmark manager",
id: "id_n_s_070207_3",
link1: "http://sitebar.org/",
link2: "",
name: "SiteBar/3.x.x (Bookmark Server; http://sitebar.org/)",
type: "C"
},
%{
comment: "",
description: "SiteBar bookmark server",
id: "id_n_s_1265",
link1: "http://sitebar.sourceforge.net/",
link2: "",
name: "SiteBar/x.x",
type: "C"
},
%{
comment: "",
description: "SiteBar bookmark server",
id: "id_n_s_1266",
link1: "http://sitebar.sourceforge.net/",
link2: "",
name: "SiteBar/x.x.x (Bookmark Server; http://sitebar.org/)",
type: "C"
},
%{
comment: "",
description: "Internetseer Web Site Monitoring / Claymont robot",
id: "id_n_s_1267",
link1: "http://www.internetseer.com/",
link2: "http://www.claymont.com/",
name: "sitecheck.internetseer.com",
type: "R C"
},
%{
comment: "",
description: "Internetseer Web Site Monitoring",
id: "id_n_s_1268",
link1: "http://www.internetseer.com/",
link2: "",
name: "sitecheck.internetseer.com (For more info see: http://sitecheck.internetseer.com)",
type: "R C"
},
%{
comment: "",
description: "SiteRecon website monitoring spider at xx minute intervals",
id: "id_n_s_1269",
link1: "http://www.siterecon.com/",
link2: "",
name: "SiteRecon+(xx)",
type: "R C"
},
%{
comment: "",
description: "PC Magazin web site downloadmanager",
id: "id_n_s_1270",
link1: "http://www.zdnet.com/pcmag/pctech/content/17/04/ut1704.001.html",
link2: "",
name: "SiteSnagger",
type: "D"
},
%{
comment: "",
description: "Site Spider robot (66.249.17.xx)",
id: "id_n_s_1271",
link1: "http://www.SiteSpider.com/",
link2: "",
name: "SiteSpider +(http://www.SiteSpider.com/)",
type: "R"
},
%{
comment: "",
description: "SiteSucker Mac website downloading tool",
id: "id_n_s_021205_3",
link1: "http://www.sitesucker.us/",
link2: "",
name: "SiteSucker/1.x.x",
type: "D"
},
%{
comment: "",
description: "SiteTagger.com bookmark organizer",
id: "id_n_s_140306_2",
link1: "http://www.sitetagger.com/",
link2: "",
name: "SiteTaggerBot (http://www.sitetagger.com/bot.htm)",
type: "C"
},
%{
comment: "69.64.67.xx",
description: "SiteTruth - Automatic site legitimacy rating system",
id: "id_n_s_030407_1",
link1: "http://www.sitetruth.com/",
link2: "",
name: "SiteTruth.com site rating system",
type: "R"
},
%{
comment: "",
description: "Webwasher.com (217.146.159.xx) internet filter",
id: "id_n_s_1272",
link1: "http://www.webwasher.com/",
link2: "",
name: "SiteWinder",
type: "B P"
},
%{
comment: "",
description: "Xtreeme SiteXpert sitemap & search engine builder",
id: "id_n_s_1273",
link1: "http://www.xtreeme.com/sitexpert/index.php",
link2: "",
name: "SiteXpert",
type: "R"
},
%{
comment: "",
description: "Skaffe.com directory link checker",
id: "id_n_s_1274",
link1: "http://www.skaffe.com/",
link2: "",
name: "Skampy/0.9.x (http://www.skaffe.com/skampy-info.html)",
type: "R"
},
%{
comment: "",
description: "Skaffe.com directory link checker",
id: "id_n_s_1275",
link1: "http://www.skaffe.com/",
link2: "",
name: "Skimpy/0.x (http://www.skaffe.com/skampy-info.html)",
type: "R"
},
%{
comment: "63.133.162.xx",
description: "Visvo distributed website crawler based on Nutch",
id: "id_n_s_090706_1",
link1: "http://www.visvo.com/bot.html",
link2: "",
name: "Skywalker/0.1 (Skywalker; anonymous; anonymous)",
type: "R"
},
%{
comment: "",
description: "Only.com robot",
id: "id_n_s_1276",
link1: "http://www.only.com/",
link2: "",
name: "Slarp/0.1",
type: "R"
},
%{
comment: "",
description: "Sleipnir - Japanese Explorer based browser & search bar",
id: "id_n_s_1277",
link1: "http://www20.pos.to/~sleipnir/software/sleipnir/index.html",
link2: "",
name: "Sleipnir",
type: "B"
},
%{
comment: "",
description: "Sleipnir - Japanese Explorer based browser & search bar",
id: "id_n_s_1278",
link1: "http://www20.pos.to/~sleipnir/software/sleipnir/index.html",
link2: "",
name: "Sleipnir Version 1.xx",
type: "B"
},
%{
comment: "",
description: "Sleipnir - Japanese Explorer based browser & search bar",
id: "id_n_s_170207_5",
link1: "http://www20.pos.to/~sleipnir/software/sleipnir/index.html",
link2: "",
name: "Sleipnir Version2.x",
type: "B"
},
%{
comment: "",
description: "Sleipnir - Japanese Explorer based browser & search bar",
id: "id_n_s_260706_1",
link1: "http://www20.pos.to/~sleipnir/software/sleipnir/index.html",
link2: "",
name: "Sleipnir/2.xx",
type: "B"
},
%{
comment: "s. also silk/1.0...",
description: "Slider Search directory robot (194.213.194.2xx)",
id: "id_n_s_1279",
link1: "http://www.slider.com/index.html",
link2: "",
name: "Slider_Search_v1-de",
type: "R"
},
%{
comment: "",
description:
"Slim Browser (IE based browser) - uses this user agent for favicon.ico only",
id: "id_n_s_1280",
link1: "http://www.flashpeak.com/sbrowser/",
link2: "",
name: "SlimBrowser",
type: "B"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos-NBCi) robot",
id: "id_n_s_1281",
link1: "http://www.inktomi.com/slurp.html",
link2: "",
name: "Slurp/2.0 (slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos-NBCi) robot",
id: "id_n_s_1282",
link1: "http://www.inktomi.com/slurp.html",
link2: "",
name: "Slurp/2.0-KiteWeekly (slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "",
description: "Inktomi (Hotbot-Lycos-NBCi) robot",
id: "id_n_s_1283",
link1: "http://www.inktomi.com/slurp.html",
link2: "",
name: "Slurp/si (slurp@inktomi.com; http://www.inktomi.com/slurp.html)",
type: "R"
},
%{
comment: "s. also Mozilla/3.0 (Slurp/.....",
description: "Inktomi (Hotbot-Lycos-NBCi) robot - 72.30.61.xx(x)",
id: "id_n_s_240806_1",
link1: "http://www.inktomi.com/",
link2: "",
name: "Slurpy Verifier/1.0",
type: "R"
},
%{
comment: "",
description: "Slysearch robot (now Turnitin robot)",
id: "id_n_s_1284",
link1: "http://www.slysearch.com/",
link2: "",
name: "SlySearch (slysearch@slysearch.com)",
type: "R"
},
%{
comment: "",
description: "Slysearch robot (now Turnitin robot)",
id: "id_n_s_1285",
link1: "http://www.slysearch.com/",
link2: "",
name: "SlySearch/1.0 http://www.plagiarism.org/crawler/robotinfo.html",
type: "R"
},
%{
comment: "",
description: "Slysearch robot (now Turnitin robot)",
id: "id_n_s_1286",
link1: "http://www.slysearch.com/",
link2: "",
name: "SlySearch/1.x http://www.slysearch.com",
type: "R"
},
%{
comment: "",
description: "Netzip/Smartdownload download manager",
id: "id_n_s_1287",
link1: "http://www.netzip.com/",
link2: "",
name: "SmartDownload/1.2.67 (Win32; Jan 12 1999)",
type: "D"
},
%{
comment: "",
description: "Netzip/Smartdownload download manager",
id: "id_n_s_1288",
link1: "http://www.netzip.com/",
link2: "",
name: "SmartDownload/1.2.77 (Win32; Feb 1 2000)",
type: "D"
},
%{
comment: "",
description: "Netzip/Smartdownload download manager",
id: "id_n_s_1289",
link1: "http://www.netzip.com/",
link2: "",
name: "SmartDownload/1.2.77 (Win32; Jun 19 2001)",
type: "D"
},
%{
comment: "",
description: "Loop Improvements NRS Enterprise search (69.44.155.xx[x])",
id: "id_n_s_1290",
link1: "http://www.loopimprovements.com/",
link2: "http://demo.loopimprovements.com/demo/",
name: "smartwit.com",
type: "R"
},
%{
comment: "64.71.152.xx",
description:
"SmiffyDCMetaSpider - Robot to check the retro-adding of Dublin Core metadata",
id: "id_n_s_020307_2",
link1: "http://www.smiffysplace.com",
link2: "http://www.smiffysplace.com/smiffydcmetaspider",
name: "SmiffyDCMetaSpider/1.0",
type: "R"
},
%{
comment: "see Snoopy",
description: "Snoopy PHP-client",
id: "id_n_s_1291",
link1: "http://sourceforge.net/projects/snoopy/",
link2: "",
name: "sna-0.0.1 (mikemuzio@msn.com)",
type: ""
},
%{
comment: "see Snoopy",
description: "Snoopy PHP-client",
id: "id_n_s_1292",
link1: "http://sourceforge.net/projects/snoopy/",
link2: "",
name: "sna-0.0.1 mikeelliott@hotmail.com",
type: ""
},
%{
comment: "Gets only the robots.txt - Not from Snap.com / Idealab (63.251.211.xxx)",
description: "Unknown bot from bb2.net (66.234.139.xxx) also as Snapbot/1.0",
id: "id_n_s_080106_1",
link1: "http://www.kloth.net/internet/badbots.php",
link2: "",
name: "snap.com beta crawler v0",
type: "S"
},
%{
comment: "Not from Snap.com / Idealab (63.251.211.xxx)",
description: "Unknown bot from bb2.net (66.234.139.xxx) - also as snap.com",
id: "id_n_s_250506_1",
link1: "http://www.kloth.net/internet/badbots.php",
link2: "",
name: "Snapbot/1.0",
type: "S"
},
%{
comment: "38.98.19.6x",
description: "Unknown bot from Psinet / Cogentco - not from Snap.com",
id: "id_n_s_250408_1",
link1: "",
link2: "",
name: "Snapbot/1.0 (Snap Shots, +http://www.snap.com)",
type: "S"
},
%{
comment: "205.138.199.1xx / 209.85.36.x",
description: "My UrlTrends online web ranking service",
id: "id_n_s_270906_2",
link1: "http://www.urltrends.com/",
link2: "",
name: "Snappy/1.1 ( http://www.urltrends.com/ )",
type: "C"
},
%{
comment: "",
description: "Snarfer RSS reader",
id: "id_n_s_100707_1",
link1: "http://www.snarfware.com/",
link2: "",
name: "Snarfer/0.x.x (http://www.snarfware.com/)",
type: "B"
},
%{
comment: "",
description: "Unknown robot from 217.229.156.xx (T-Online Germany)",
id: "id_n_s_1293",
link1: "",
link2: "",
name: "SnoopRob/x.x",
type: ""
},
%{
comment: "s. also sna-x.x.x",
description: "Snoopy PHP-client",
id: "id_n_s_1294",
link1: "http://sourceforge.net/projects/snoopy/",
link2: "",
name: "Snoopy v1.xx",
type: ""
},
%{
comment: "s. also sna-x.x.x",
description: "Snoopy PHP-client",
id: "id_n_s_1295",
link1: "http://sourceforge.net/projects/snoopy/",
link2: "",
name:
"Snoopy v1.xx- : User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; MyIE2)",
type: ""
},
%{
comment: "s. also sna-x.x.x",
description: "Snoopy PHP-client",
id: "id_n_s_1296",
link1: "http://sourceforge.net/projects/snoopy/",
link2: "",
name: "Snoopy_v0.xx",
type: ""
},
%{
comment: "",
description: "Snyke.com France robot",
id: "id_n_s_1297",
link1: "http://www.snyke.com/",
link2: "",
name: "SnykeBot/0.6 (http://www.snyke.com)",
type: "R"
},
%{
comment: "",
description: "Link crawler for the social sciences",
id: "id_n_s_250706_2",
link1: "http://socscibot.wlv.ac.uk/",
link2: "",
name: "SocSciBot ()",
type: "R"
},
%{
comment: "",
description: "NetFront browser on Softbank mobile phone",
id: "id_n_s_170407_1",
link1: "http://www.access-company.com/products/netfrontmobile/browser/index.html",
link2: "http://mb.softbank.jp/mb/en/product/",
name:
"SoftBank/1.0/812SH/SHJ001 Browser/NetFront/3.3 Profile/MIDP-2.0 Configuration/CLDC-1.1",
type: "B"
},
%{
comment: "",
description: "Soft Hypermarket link checking",
id: "id_n_s_1298",
link1: "http://www.softhypermarket.com/",
link2: "",
name: "SoftHypermarketFileCheckBot/1.0+(+http://www.softhypermaket.com)",
type: "R"
},
%{
comment: "72.9.97.xx",
description: "Softizer.com software directory link checking",
id: "id_n_s_1299",
link1: "http://www.softizer.com/",
link2: "",
name: "Softizerbot (http://www.softizer.com)",
type: "C"
},
%{
comment: "s. also sohu agent & Sogou web spider",
description: "Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot",
id: "id_n_s_090208_1",
link1: "",
link2: "",
name: "sogou develop spider",
type: "S"
},
%{
comment: "s. also sohu agent , Sogou web spider & sogou develop spider",
description: "Unknown UA from Chinanet (220.181.18.xx) faking Sogou search robot",
id: "id_n_s_011207_2",
link1: "",
link2: "",
name: "Sogou Orion spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)",
type: "S"
},
%{
comment: "s. also sohu agent , Sogou web spider & sogou develop spider",
description: "Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot",
id: "id_n_s_150106_1",
link1: "",
link2: "",
name: "sogou spider",
type: "S"
},
%{
comment: "s. also sohu agent , sogou spider & sogou develop spider",
description: "Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot",
id: "id_n_s_280407_1",
link1: "",
link2: "",
name: "Sogou web spider/3.0(+http://www.sogou.com/docs/help/webmasters.htm#07)",
type: "S"
},
%{
comment: "s. also sogou spider , sogou spider & sogou develop spider",
description: "Unknown UA from Chinanet (220.181.26.1xx) faking Sogou search robot",
id: "id_n_s_291105_1",
link1: "",
link2: "",
name: "sohu agent",
type: "S"
},
%{
comment:
"this UA also comes from 220.181.26.xxx (not Sohus IP range) as spam bot - s.also sohu agent",
description: "Sohu (Search Fox) search robot China (61.135.131.xxx)",
id: "id_n_s_1300",
link1: "http://www.sohu.com/",
link2: "",
name: "sohu-search",
type: "R"
},
%{
comment: "",
description: "SOSO search (China) spider",
id: "id_n_s_160308_3",
link1: "http://www.soso.com/",
link2: "http://help.soso.com/webspider.htm",
name: "Sosospider+(+http://help.soso.com/webspider.htm)",
type: "R"
},
%{
comment: "",
description: "Default Proxomitron (discontinued) filtering proxy user agent identifier",
id: "id_n_s_1301",
link1: "http://duke.usask.ca/~macphed/prox/",
link2: "",
name: "Space Bison/0.02 [fu] (Win67; X; SK)",
type: "P B"
},
%{
comment: "",
description: "Speed Download (Mac) download manager",
id: "id_n_s_1302",
link1: "http://www.yazsoft.com/",
link2: "",
name: "SpeedDownload/1.x",
type: "D"
},
%{
comment: "",
description: "Speedfind.de robot",
id: "id_n_s_1303",
link1: "http://www.speedfind.de/",
link2: "",
name: "speedfind ramBot xtreme 8.1",
type: "R"
},
%{
comment: "62.13.25.2xx",
description: "Entireweb search robot",
id: "id_n_s_1304",
link1: "http://www.entireweb.com/",
link2: "",
name: "Speedy Spider (Beta/x.x; speedy@entireweb.com)",
type: "R"
},
%{
comment: "62.13.25.2xx",
description: "Entireweb search spider",
id: "id_n_s_070906_1",
link1: "http://www.entireweb.com/",
link2: "",
name:
"Speedy Spider (Entireweb; Beta/1.0; http://www.entireweb.com/about/search_tech/speedyspider/)",
type: "R"
},
%{
comment: "62.13.25.2xx",
description: "Entireweb search robot",
id: "id_n_s_1305",
link1: "http://www.entireweb.com/",
link2: "",
name: "Speedy_Spider (http://www.entireweb.com)",
type: "R"
},
%{
comment: "64.40.11[7-8].[x]xx",
description: "Sphere blog and news search robot",
id: "id_n_s_050208_4",
link1: "http://www.sphere.com/",
link2: "",
name: "Sphere Scout&v4.0 - scout at sphere dot com",
type: "R"
},
%{
comment: "",
description: "Sphider - a lightweight search engine in PHP",
id: "id_n_s_040106_3",
link1: "http://www.cs.ioc.ee/~ando/sphider/",
link2: "",
name: "Sphider",
type: "R"
},
%{
comment: "in conjunction with LWP::Simple/5.53",
description: "Only.com robot",
id: "id_n_s_1306",
link1: "http://www.only.com/",
link2: "",
name: "Spida/0.1",
type: "R"
},
%{
comment: "",
description: "Search-Info ODP/DMOZ spider",
id: "id_n_s_1307",
link1: "http://search-info.com/",
link2: "",
name: "Spider-Sleek/2.0 (+http://search-info.com/linktous.html)",
type: "R"
},
%{
comment: " - site unreachable",
description: "Batsch robot",
id: "id_n_s_1308",
link1: "http://www.batsch.com",
link2: "",
name: "spider.batsch.com",
type: "R"
},
%{
comment: "",
description: "TerraNautic spider for Schnellsuchen touristic search (Germany)",
id: "id_n_s_110206_4",
link1: "http://www.terranautic.net/",
link2: "http://www.schnellsuchen.com/",
name: "Spider.TerraNautic.net - v:1.04",
type: "C"
},
%{
comment: "",
description: "Yellopet spider",
id: "id_n_s_1309",
link1: "http://www.yellopet.com/",
link2: "",
name: "spider.yellopet.com - www.yellopet.com",
type: "R"
},
%{
comment: "",
description: "Maxbot .gov .mil .edu indexing robot",
id: "id_n_s_1310",
link1: "http://www.maxbot.com/",
link2: "",
name: "Spider/maxbot.com admin@maxbot.com",
type: "R"
},
%{
comment: "",
description: "Unknown robot from CPE at Kasetsart University (158.108.35.xxx)",
id: "id_n_s_1311",
link1: "http://www.cpe.ku.ac.th/",
link2: "",
name: "SpiderKU/0.x",
type: "R"
},
%{
comment: "",
description: "Yahoo Search user agent or spider (202.165.102.xxx)",
id: "id_n_s_1312",
link1: "http://search.yahoo.com/",
link2: "",
name: "SpiderMan",
type: "R"
},
%{
comment: "",
description: "SpiderMonkey Canada robot",
id: "id_n_s_1313",
link1: "http://spidermonkey.ca/",
link2: "",
name: "SpiderMonkey/7.0x (SpiderMonkey.ca info at http://spidermonkey.ca/sm.shtml)",
type: "R"
},
%{
comment: "",
description: "Spider.de robot",
id: "id_n_s_1314",
link1: "http://www.spider.de/",
link2: "",
name: "Spinne/2.0",
type: "R"
},
%{
comment: "",
description: "Medkatalog (medical catalogue) Austria robot",
id: "id_n_s_1315",
link1: "http://www.medkatalog.com/",
link2: "",
name: "Spinne/2.0 med",
type: "R"
},
%{
comment: "",
description: "Medkatalog (medical catalogue) Austria robot",
id: "id_n_s_1316",
link1: "http://www.medkatalog.com/",
link2: "",
name: "Spinne/2.0 med_AH",
type: "R"
},
%{
comment: "72.44.62.1xx",
description: "Spock - people search application - via Amazon web services",
id: "id_n_s_180707_3",
link1: "http://www.spock.com/crawler",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name: "Spock Crawler (http://www.spock.com/crawler)",
type: "R"
},
%{
comment: "",
description: "Sportsuchmaschine (German sports related search) link checking / robot",
id: "id_n_s_1317",
link1: "http://www.sportsuchmaschine.de/",
link2: "",
name: "sportsuchmaschine.de-Robot (Version: 1.02- powered by www.sportsuchmaschine.de)",
type: "R"
},
%{
comment: "powered by Nutch",
description: "Sproose personalized search (38.100.225.xx)",
id: "id_n_s_040306_1",
link1: "http://www.sproose.com/",
link2: "http://lucene.apache.org/nutch/",
name:
"sproose/0.1-alpha (sproose crawler; http://www.sproose.com/bot.html; crawler@sproose.com)",
type: "R"
},
%{
comment: "product is discontinued",
description: "SQ Webscanner Mac download manager",
id: "id_n_s_1318",
link1: "http://macinsearch.com/users/webscanner/",
link2: "",
name: "SQ Webscanner",
type: "D"
},
%{
comment: "",
description: "Simple page-prefetch for Squid web proxy",
id: "id_n_s_1319",
link1: "http://packages.debian.org/stable/web/squid-prefetch",
link2: "",
name: "Squid-Prefetch",
type: "P"
},
%{
comment: "s.also SquidClamAV_Redirector 1.x.x",
description: "Squidclam is a replacement for SquidClamAV-Redirector",
id: "id_n_s_171105_2",
link1: "http://sourceforge.net/projects/squidclam",
link2: "",
name: "squidclam",
type: "P"
},
%{
comment: "s.also squidclam",
description: "SCAVR - Squid helper script for scanning download URLs for viruses",
id: "id_n_s_1320",
link1: "http://www.jackal-net.at/tiki-read_article.php?articleId=1",
link2: "",
name: "SquidClamAV_Redirector 1.x.x",
type: "P"
},
%{
comment: "",
description: "AOL Search / Pacific Internet Exchange robot",
id: "id_n_s_1321",
link1: "http://www.aol.com/",
link2: "",
name: "Sqworm/2.9.81-BETA (beta_release; 20011102-760; i686-pc-linux-gnu)",
type: "R"
},
%{
comment: "",
description:
"diff. IPs / services i.e.: - Inria.fr robot - Websense (Internet filtering) robot",
id: "id_n_s_1322",
link1: "http://www.inria.fr/",
link2: "http://www.websense.com/",
name: "Sqworm/2.9.85-BETA (beta_release; 20011115-775; i686-pc-linux-gnu)",
type: "R"
},
%{
comment: "",
description: "Time Warner Telecom user robot ?",
id: "id_n_s_1323",
link1: "",
link2: "",
name: "Sqworm/2.9.89-BETA (beta_release; 20020130-839; i686-pc-linux-gnu) ",
type: ""
},
%{
comment: "see also - PSurf15a VA or random letters like - AWSCBA - URVUSLNAM",
description:
"Some site scanning tool via diff. IPs i.e.: - choiceone.net (216.153.xxx.xxx) - epix.net (216.108.198.xx)",
id: "id_n_s_1324",
link1: "",
link2: "",
name: "SSurf15a 11 ",
type: "S"
},
%{
comment: "",
description: "Rambler search (Russia) robot (81.19.6x.xx)",
id: "id_n_s_1325",
link1: "http://www.rambler.ru",
link2: "",
name: "StackRambler/x.x ",
type: "R"
},
%{
comment: "",
description: "Stamina download manager",
id: "id_n_s_1326",
link1: "http://www.wildbits.com/stamina/",
link2: "",
name: "Stamina/1.4",
type: "D"
},
%{
comment: "",
description: "Star Downloader download manager",
id: "id_n_s_1327",
link1: "http://www.stardownloader.com/",
link2: "",
name: "Star Downloader",
type: "D"
},
%{
comment: "",
description: "Star Downloader download manager",
id: "id_n_s_140106_3",
link1: "http://www.stardownloader.com/",
link2: "",
name: "StarDownloader/1.xx",
type: "D"
},
%{
comment: "66.92.186.xxx",
description: "Experimental search engine spider from 66.92.186.xxx",
id: "id_n_s_1328",
link1: "",
link2: "",
name: "stat statcrawler@gmail.com",
type: "R"
},
%{
comment: "",
description: "Steeler crawler",
id: "id_n_s_1329",
link1: "http://www.tkl.iis.u-tokyo.ac.jp/~crawler/",
link2: "",
name: "Steeler/1.x (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)",
type: "R"
},
%{
comment: "157.82.156.xx[x]",
description: "Steeler - University of Tokyo web crawler",
id: "id_n_s_031107_5",
link1: "http://www.tkl.iis.u-tokyo.ac.jp/~crawler/crawler.html.en",
link2: "",
name: "Steeler/3.3 (http://www.tkl.iis.u-tokyo.ac.jp/~crawler/)",
type: "R"
},
%{
comment: "",
description: "Strategic Board blog & news search robot",
id: "id_n_s_060106_1",
link1: "http://www.strategicboard.com/",
link2: "",
name: "Strategic Board Bot (+http://www.strategicboard.com)",
type: "R"
},
%{
comment: "62.0.99.2xx",
description: "Strategic Board blogs and news aggregator robot",
id: "id_n_s_140906_2",
link1: "http://www.strategicboard.com/",
link2: "",
name: "Strategic Board Bot (+http://www.strategicboard.com)",
type: "R"
},
%{
comment: "",
description: "Surfsafely submission verifier",
id: "id_n_s_1330",
link1: "http://www.surfsafely.com/",
link2: "",
name: "Submission Spider at surfsafely.com",
type: "R"
},
%{
comment: "",
description: "Suchbaer.de (Germany) search robot",
id: "id_n_s_210106_4",
link1: "http://www.suchbaer.de/",
link2: "",
name: "suchbaer.de",
type: "R"
},
%{
comment: "",
description: "Suchbaer.de (Germany) search robot",
id: "id_n_s_010206_3",
link1: "http://www.suchbaer.de/",
link2: "",
name: "suchbaer.de (CrawlerAgent v0.103)",
type: "R"
},
%{
comment: "",
description: "Suchbot Germany robot",
id: "id_n_s_1331",
link1: "http://www.suchbot.de/",
link2: "",
name: "suchbot",
type: "R"
},
%{
comment: "",
description: "Suchknecht Austria robot",
id: "id_n_s_1332",
link1: "http://www.suchknecht.at/",
link2: "",
name: "Suchknecht.at-Robot",
type: "R"
},
%{
comment: "",
description: "suchpad search Germany robot (213.239.194.xx)",
id: "id_n_s_120206_1",
link1: "http://www.suchpad.de/",
link2: "",
name: "suchpadbot/1.0 (+http://www.suchpad.de)",
type: "R"
},
%{
comment: "",
description: "Sunrise XP handheld news / website reader and converter",
id: "id_n_s_160107_2",
link1: "http://sourceforge.net/projects/sunrisexp",
link2: "",
name: "Sunrise XP/2.x",
type: "B"
},
%{
comment: "",
description: "Sunrise XP web sites and newsfeeds converter and handheld reader",
id: "id_n_s_230406_4",
link1: "http://www.sunrisexp.com/",
link2: "",
name: "Sunrise/0.42g (Windows XP)",
type: "B"
},
%{
comment: "",
description: "SuperBot website copier",
id: "id_n_s_1333",
link1: "http://www.sparkleware.com/superbot/index.html",
link2: "",
name: "SuperBot/x.x (Win32)",
type: "D"
},
%{
comment: "",
description: "SuperBot website copier",
id: "id_n_s_260108_2",
link1: "http://www.sparkleware.com/superbot/index.html",
link2: "",
name: "SuperBot/x.x.x.xx (Windows XP)",
type: "D"
},
%{
comment: "",
description: "Ubbi Superdownloads (Brazil) link checking",
id: "id_n_s_1334",
link1: "http://superdownloads.ubbi.com.br/",
link2: "",
name: "Superdownloads Spiderman",
type: "C"
},
%{
comment: "",
description: "SurfControl Web Filtering",
id: "id_n_s_1335",
link1: "http://www.surfcontrol.com/",
link2: "",
name: "SURF ",
type: "P"
},
%{
comment: "",
description: "Wanadoo Rechereche robot",
id: "id_n_s_1336",
link1: "http://www.wanadoo.fr/qqo/",
link2: "",
name: "SurferF3 1/0",
type: "R"
},
%{
comment: "",
description: "Maskbit Surfmaster bookmark tool",
id: "id_n_s_1337",
link1: "http://www.maskbit.com/surfmaster.htm",
link2: "",
name: "SurfMaster",
type: "C"
},
%{
comment: "s.also: PigeonBot",
description: "Whois Source domain name information robot (66.249.26.xx)",
id: "id_n_s_1338",
link1: "http://www.whois.sc/",
link2: "",
name: "SurveyBot/2.2 <a href='http://www.whois.sc'>Whois Source</a>",
type: "R C"
},
%{
comment: "s.also: PigeonBot",
description: "Whois Source domain name information robot (66.249.26.xx)",
id: "id_n_s_1339",
link1: "http://www.whois.sc/",
link2: "",
name: "SurveyBot/2.3 (Whois Source)",
type: "R C"
},
%{
comment: "",
description: "Yokogao Search Engine robot (Kanazawa University)",
id: "id_n_s_1340",
link1: "http://web.kanazawa-u.ac.jp/esearch.html",
link2: "",
name: "suzuran",
type: "R"
},
%{
comment: "",
description: "HP Secure Web Browser for OpenVMS",
id: "id_n_s_1341",
link1: "http://h71000.www7.hp.com/openvms/products/ips/cswb/cswb.html",
link2: "",
name: "SWB/V1.4 (HP)",
type: "B"
},
%{
comment: "",
description: "unknown",
id: "id_n_s_1342",
link1: "",
link2: "",
name: "swbot/0.9c libwww/5.3.1",
type: ""
},
%{
comment: "",
description: "Swooglebot Swoogle's semantic web crawler",
id: "id_n_s_1343",
link1: "http://swoogle.umbc.edu",
link2: "",
name: "Swooglebot/2.0. (+http://swoogle.umbc.edu/swooglebot.htm)",
type: "R"
},
%{
comment: "",
description:
"SWSBot - SmartWareSoft (85.186.255.xx) software search engine created for Playfuls.com",
id: "id_n_s_060106_2",
link1: "http://www.smartwaresoft.com/swsbot12.html",
link2: "http://www.playfuls.com/",
name: "SWSBot-Images/1.2 http://www.smartwaresoft.com/swsbot12.html",
type: "R"
},
%{
comment: "s.also <http://www.sygol.com/>",
description: "Sygol Search (Italy) robot",
id: "id_n_s_300106_2",
link1: "http://www.sygol.com/",
link2: "",
name: "SygolBot http://www.sygol.net",
type: "R"
},
%{
comment: "",
description: "Sylera browser (Japan)",
id: "id_n_s_1344",
link1: "http://tabbrowser.ktplan.jp/valinor/sylera.html",
link2: "",
name: "Sylera/1.2.x",
type: "B"
},
%{
comment: "",
description: "Mindspring.com user robot",
id: "id_n_s_1345",
link1: "http://www.mindspring.com/",
link2: "",
name: "SyncBot",
type: ""
},
%{
comment: "",
description: "SyncIT link validation",
id: "id_n_s_1346",
link1: "http://www.bookmarksync.com/",
link2: "",
name: "SyncIT/x.x",
type: "C"
},
%{
comment: "",
description: "Syndirella desktop information aggregator (beta)",
id: "id_n_s_140906_1",
link1: "http://www.yole.ru/projects/syndirella/",
link2: "",
name: "Syndirella/0.91pre",
type: "B"
},
%{
comment: "",
description: "Synomia (France) robot",
id: "id_n_s_1347",
link1: "http://www.synomia.fr/",
link2: "",
name: "SynoBot",
type: "R"
},
%{
comment: "",
description: "Syntryx Solution Suite - domain / keyword crawler (216.7.179.xx)",
id: "id_n_s_150406_1",
link1: "http://www.syntryx.com/",
link2: "",
name: "Syntryx ANT Scout Chassis Pheromone; Mozilla/4.0 compatible crawler",
type: "R"
},
%{
comment: "",
description: "Szukacz.pl (Polish search) robot",
id: "id_n_s_1348",
link1: "http://www.szukacz.pl/",
link2: "",
name: "Szukacz/1.x",
type: "R"
},
%{
comment: "",
description: "Szukacz.pl (Polish search) robot",
id: "id_n_s_1349",
link1: "http://www.szukacz.pl/",
link2: "",
name: "Szukacz/1.x (robot; www.szukacz.pl/jakdzialarobot.html; szukacz@proszynski.pl)",
type: "R"
},
%{
comment: "",
description: "German T-Online browser & internet suite ",
id: "id_t_z_220106_2",
link1: "http://service.t-online.de/c/06/52/67/652672.html",
link2: "",
name: "T-Online Browser",
type: "B"
},
%{
comment: "74.115.102.1xx",
description: "tags2dir.com directory index",
id: "id_t_z_070807_1",
link1: "http://tags2dir.com/directory/",
link2: "",
name: "tags2dir.com/0.8 (+http://tags2dir.com/directory/)",
type: "R"
},
%{
comment: "",
description: "TAGword DMOZ survey - ODP link checking robot",
id: "id_t_z_1350",
link1: "http://tagword.com/dmoz_survey.php",
link2: "",
name: "Tagword (http://tagword.com/dmoz_survey.php)",
type: "R"
},
%{
comment: "",
description: "Tagyu - del.icio.us bookmark collection online tag generator",
id: "id_t_z_271105_2",
link1: "http://www.tagyu.com/",
link2: "http://del.icio.us/",
name: "Tagyu Agent/1.0",
type: ""
},
%{
comment: "",
description: "Daumsoft Talkro IR robot",
id: "id_t_z_1351",
link1: "http://www.daumsoft.com/",
link2: "",
name:
"Talkro Web-Shot/1.0 (E-mail: webshot@daumsoft.com- Home: http://222.122.15.190/webshot)",
type: "R"
},
%{
comment: "",
description:
"Texas A&M University - Dept. of Computer Science crawler (server or link checking ?)",
id: "id_t_z_1352",
link1: "http://www.cs.tamu.edu/",
link2: "",
name: "TAMU_CS_IRL_CRAWLER/1.0",
type: "R C"
},
%{
comment: "",
description: "Targetblaster user link validation ?",
id: "id_t_z_1353",
link1: "http://www.targetblaster.com/",
link2: "",
name: "targetblaster.com/0.9k",
type: "R C"
},
%{
comment: "72.36.160.xxx",
description: "Target Your News - user submitted links",
id: "id_t_z_230706_2",
link1: "http://targetyournews.com/",
link2: "",
name: "TargetYourNews.com bot",
type: "C"
},
%{
comment: "134.226.1.xx",
description: "Trinity College Dublin (Ireland) TCDBOT",
id: "id_t_z_201006_1",
link1: "http://www.tcd.ie/",
link2: "",
name:
"TCDBOT/Nutch-0.8 (PhD student research;http://www.tcd.ie; mcgettrs at t c d dot IE)",
type: "R"
},
%{
comment: "",
description: "HTTP header for transfer encoding used as user agent name ?",
id: "id_t_z_1354",
link1: "",
link2: "",
name: "TE",
type: ""
},
%{
comment: "",
description: "WinInet Internet client app.",
id: "id_t_z_1355",
link1: "http://www.winsoft.sk/wininet.htm",
link2: "",
name: "TeamSoft WinInet Component",
type: ""
},
%{
comment: "",
description:
"Tecomac Gmbh (Germany) crawler software - now Arexera Information Technologies",
id: "id_t_z_1356",
link1: "http://www.arexera.de/",
link2: "",
name: "TECOMAC-Crawler/0.x",
type: "R"
},
%{
comment: "",
description: "Tecomi (Germany) beta / test robot (84.201.65.xxx)",
id: "id_t_z_1357",
link1: "http://www.tecomi.com/Suchmaschine",
link2: "",
name: "Tecomi Bot (http://www.tecomi.com/bot.htm)",
type: "R"
},
%{
comment: "67.202.26.1xx",
description:
"Teemer crawler for NetSeer search (beta) via Amazon Web Services - see also NetSeer/Nutch",
id: "id_t_z_101107_2",
link1: "http://www.netseer.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name:
"Teemer (NetSeer, Inc. is a Los Angeles based Internet startup company.; http://www.netseer.com/crawler.html; crawler@netseer.com)",
type: "R"
},
%{
comment: "",
description: "Teleport (website) downloading tool",
id: "id_t_z_1358",
link1: "http://www.tenmax.com/teleport/pro/home.htm",
link2: "",
name: "Teleport Pro/1.2x(.1xxx)",
type: "D"
},
%{
comment: "",
description: "Teoma crawler (65.214.36.xx[x])",
id: "id_t_z_1359",
link1: "http://www.teoma.com/",
link2: "",
name: "Teoma MP",
type: "R"
},
%{
comment: "",
description: "Teoma crawler (65.214.36.xx[x])",
id: "id_t_z_1361",
link1: "http://www.teoma.com/",
link2: "",
name: "teomaagent crawler-admin@teoma.com",
type: "R"
},
%{
comment: "",
description: "Teoma crawler (65.214.36.xx[x])",
id: "id_t_z_1362",
link1: "http://www.teoma.com/",
link2: "",
name: "teomaagent1 [crawler-admin@teoma.com]",
type: "R"
},
%{
comment: "",
description: "Teoma crawler (65.214.36.xx[x])",
id: "id_t_z_1360",
link1: "http://www.teoma.com/",
link2: "",
name: "teoma_agent1",
type: "R"
},
%{
comment: "",
description: "Teradex Directory robot",
id: "id_t_z_1363",
link1: "http://directory.teradex.com/",
link2: "",
name: "Teradex Mapper; mapper@teradex.com; http://www.teradex.com",
type: "R"
},
%{
comment: "",
description: "Teragram multilingual text & data processing software",
id: "id_t_z_010406_4",
link1: "http://www.teragram.com/",
link2: "",
name: "TeragramCrawler",
type: "D ?"
},
%{
comment: "88.198.44.2xx",
description: "Terraminds blog search (Germany)",
id: "id_t_z_150807_2",
link1: "http://www.terraminds.de/",
link2: "",
name: "terraminds-bot/1.0 (support@terraminds.de)",
type: "R"
},
%{
comment: "209.128.80.1xx",
description: "Terrawiz Indian Search Engine robot",
id: "id_t_z_220406_1",
link1: "http://www.terrawiz.com/",
link2: "",
name: "TerrawizBot/1.0 (+http://www.terrawiz.com/bot.html)",
type: "R"
},
%{
comment: "",
description: "Noceans Information Portfolio Manager (66.35.69.x)",
id: "id_t_z_1364",
link1: "http://www.noceans.com/",
link2: "",
name: "Test spider",
type: "R"
},
%{
comment: "204.228.230.xx",
description: "Balihoo - Search Engine for Advertising Media",
id: "id_t_z_160507_1",
link1: "http://balihoo.com/",
link2: "",
name:
"TestCrawler/Nutch-0.9 (Testing Crawler for Research ; http://balihoo.com/index.aspx; tgautier at balihoo dot com)",
type: "R"
},
%{
comment: "in conjunction with lwp-trivial/1.35",
description: "Expert HTML online source viewer",
id: "id_t_z_1365",
link1: "http://www.expert-html.net - site is offline",
link2: "",
name: "The Expert HTML Source Viewer (http://www.expert-html.com)",
type: "D B"
},
%{
comment: "67.202.27.19x",
description: "The Rarest Words - Linguistic experiment crawler via Amazon Web Services",
id: "id_t_z_281207_3",
link1: "http://therarestwords.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name: "TheRarestParser/0.2a (http://therarestwords.com/)",
type: "R"
},
%{
comment: "",
description: "TheSuBot robot (Germany) for an unknown theme based search engine",
id: "id_t_z_1366",
link1: "http://www.thesubot.de/",
link2: "",
name: "TheSuBot/0.1 (www.thesubot.de)",
type: "R"
},
%{
comment: "212.112.238.xx",
description: "ThumbShots website thumbnail service (Germany) robot",
id: "id_t_z_171106_1",
link1: "http://www.thumbshots.de/",
link2: "",
name: "thumbshots-de-Bot (Version: 1.02, powered by www.thumbshots.de)",
type: "D"
},
%{
comment: "",
description: "ThumbShots.de (Germany) robot",
id: "id_t_z_1367",
link1: "http://www.thumbshots.de/",
link2: "",
name: "thumbshots-de-Bot (Version: 1.02- powered by www.thumbshots.de)",
type: "R"
},
%{
comment: "",
description: "Breaking Blogs timbo bot blog robot",
id: "id_t_z_250206_1",
link1: "http://www.breakingblogs.com/",
link2: "",
name: "timboBot/0.9 http://www.breakingblogs.com/timbo_bot.html",
type: "R"
},
%{
comment: "s. also EldoS ...",
description: "TimelyWeb web page monitoring tool",
id: "id_t_z_140106_4",
link1: "http://www.eldos.org/timelyweb/timelyweb.html",
link2: "",
name: "http://www.timelyweb.com/",
type: "C"
},
%{
comment: "",
description: "TinEye crawler for an open image search project",
id: "id_t_z_180408_6",
link1: "http://tineye.com/crawler.html",
link2: "",
name: "TinEye/1.1 (http://tineye.com/crawler.html)",
type: "R"
},
%{
comment: "see this document: http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps",
description: "Tivra spider from AT&T Labs Research",
id: "id_t_z_1368",
link1: "http://trec.nist.gov/pubs/trec9/papers/att-trec9.ps",
link2: "",
name: "tivraSpider/1.0 (crawler@tivra.com)",
type: "R"
},
%{
comment: "",
description: "Tjgroup spider",
id: "id_t_z_1369",
link1: "http://www.tjgroup.com/",
link2: "",
name: "TJG/Spider",
type: "R"
},
%{
comment: "Possibly used by Bit Torrent Search ",
description: "TJvHttpGrabber (JEDI Visual Component Library)",
id: "id_t_z_1370",
link1: "http://homepages.borland.com/jedi/jedihelp/item.php?Id=22015",
link2: "http://www.btsearch.net/",
name: "TJvMultiHttpGrabber Component",
type: ""
},
%{
comment: "",
description: "Tkensaku Search (Japan) robot from 210.239.46.xxx (www.tken.com)",
id: "id_t_z_1371",
link1: "http://www.tkensaku.com/q.html",
link2: "",
name: "Tkensaku/x.x(http://www.tkensaku.com/q.html)",
type: "R"
},
%{
comment: "",
description: "Unknown robot from 195.68.98.xx (coltfrance.com)",
id: "id_t_z_1372",
link1: "",
link2: "",
name: "toCrawl/UrlDispatcher",
type: ""
},
%{
comment: "88.153.148.xx",
description: "Topodia search engine and personal information assistant (in development)",
id: "id_t_z_200207_1",
link1: "http://www.topodia.com/",
link2: "",
name:
"Topodia/1.2-dev (Topodia - Crawler for HTTP content indexing; http://www.topodia.com/; support@topodia.com)",
type: "R"
},
%{
comment: "193.17.73.1xx",
description: "Topos search (Russia) robot",
id: "id_t_z_160506_2",
link1: "http://www.topos.com.ua/",
link2: "",
name: "TOPOS robot/1.1 (http://www.topos.com.ua/)",
type: "C"
},
%{
comment: "87.230.5.2xx",
description: "Traazi! search (Germany) robot",
id: "id_t_z_050806_2",
link1: "http://www.traazi.de/",
link2: "",
name: "traazibot/testengine (+http://www.traazi.de)",
type: "R"
},
%{
comment: "",
description: "Trailfire web collection and annotating system",
id: "id_t_z_041007_2",
link1: "http://www.trailfire.com/",
link2: "",
name:
"Trailfire-bot/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
type: "C"
},
%{
comment: "",
description: "Trailfire web collection and annotating system",
id: "id_t_z_081207_2",
link1: "http://www.trailfire.com/",
link2: "",
name:
"Trailfire-bot/0.7.1 (Trailfire page content analyzer; http://trailfire.com; info@trailfire.com)",
type: "C"
},
%{
comment: "",
description: "Trailfire web collection and annotating system",
id: "id_t_z_260807_2",
link1: "http://www.trailfire.com/",
link2: "",
name:
"Trailfire/0.7.1 (Nutch; http://lucene.apache.org/nutch/bot.html; nutch-agent@lucene.apache.org)",
type: "C"
},
%{
comment: "",
description: "Trampelpfad Webkatalog spider",
id: "id_t_z_1376",
link1: "http://www2.trampelpfad.de/",
link2: "",
name: "Trampelpfad-Spider",
type: "R"
},
%{
comment: "",
description: "Trampelpfad Webkatalog spider",
id: "id_t_z_1377",
link1: "http://www2.trampelpfad.de/",
link2: "",
name: "Trampelpfad-Spider-v0.1",
type: "R"
},
%{
comment: "",
description: "Tricos meta tag validation",
id: "id_t_z_1378",
link1: "http://www.tricos.us/metaone.php",
link2: "",
name: "tricosMetaCheck 1.2216-08-1999 (http://www.tricos.com/metacheck)",
type: "C"
},
%{
comment: "- s. DBrowse- Dsurf etc.",
description: "some bad user agent",
id: "id_t_z_1379",
link1: "",
link2: "",
name: "TSurf15a 11",
type: "S"
},
%{
comment: "",
description: "Tulip Chain browser / link checker for Dmoz.org directory",
id: "id_t_z_1380",
link1: "http://ostermiller.org/tulipchain/",
link2: "",
name:
"TulipChain/5.x (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://java.sun.com/) Linux/2.4.17",
type: "B C R"
},
%{
comment: "",
description: "Tulip Chain browser / link checker for Dmoz.org directory",
id: "id_t_z_1381",
link1: "http://ostermiller.org/tulipchain/",
link2: "",
name:
"TulipChain/5.xx (http://ostermiller.org/tulipchain/) Java/1.x.1_0x (http://apple.com/) Mac_OS_X/10.2.8",
type: "B C R"
},
%{
comment: "72.32.6.15x",
description: "Tumblr Tumblelogs RSS and news syndication crawler",
id: "id_t_z_101107_3",
link1: "http://www.tumblr.com/",
link2: "",
name: "Tumblr/1.0 RSS syndication (+http://www.tumblr.com/) (support@tumblr.com)",
type: "R"
},
%{
comment: "64.140.49.xx",
description:
"Turnitin (ex SlySearch) robot for helping educational institutions prevent plagiarism",
id: "id_t_z_1382",
link1: "http://www.turnitin.com/robot/crawlerinfo.html",
link2: "",
name: "TurnitinBot/x.x (http://www.turnitin.com/robot/crawlerinfo.html)",
type: "R"
},
%{
comment: "",
description: "TurnPike Emporium Directory (207.67.198.x) link checking",
id: "id_t_z_1383",
link1: "http://www.turnpike.net/directory.phtml",
link2: "",
name: "Turnpike Emporium LinkChecker/0.1",
type: "R"
},
%{
comment: "",
description: "TutorGig tutorial search robot",
id: "id_t_z_1384",
link1: "http://www.tutorgig.com/crawler/",
link2: "",
name: "TutorGig/1.5 (+http://www.tutorgig.com/crawler)",
type: "R"
},
%{
comment: "",
description: "TutorGig tutorial search robot",
id: "id_t_z_1385",
link1: "http://www.tutorgig.com/crawler/",
link2: "",
name: "Tutorial Crawler 1.4 (http://www.tutorgig.com/crawler)",
type: "R"
},
%{
comment: "64.62.136.xxx",
description: "Twiceler experimental web crawler",
id: "id_t_z_1386",
link1: "http://www.cuill.com/",
link2: "",
name: "Twiceler www.cuill.com/robots.html",
type: "R"
},
%{
comment: "64.62.136.xxx",
description: "Twiceler experimental web crawler",
id: "id_t_z_290407_1",
link1: "http://www.cuill.com/",
link2: "",
name: "Twiceler-0.9 http://www.cuill.com/twiceler/robot.html",
type: "R"
},
%{
comment: "",
description: "File downloading component from Twisted Python",
id: "id_t_z_291105_5",
link1: "http://twistedmatrix.com/",
link2: "",
name: "Twisted PageGetter",
type: "D"
},
%{
comment: "75.101.135.[x]xx",
description: "Twitt(url)y URL tracking service for Twitter via Amazon Web Services",
id: "id_t_z_140508_5",
link1: "http://twitturly.com/",
link2: "http://twitter.com/",
name: "Twitturly / v0.x",
type: "C"
},
%{
comment: "",
description: "Twotrees content filter",
id: "id_t_z_1387",
link1: "http://www.twotrees.com/",
link2: "",
name: "Twotrees Reactive Filter V2.0",
type: "P"
},
%{
comment: "204.123.46.xx[x]",
description: "Tycoon - Hewlett-Packards distributed cluster solution robot",
id: "id_t_z_221207_2",
link1: "http://tycoon.hpl.hp.com/",
link2: "",
name: "Tycoon Agent/Nutch-1.0-dev",
type: "R"
},
%{
comment: "",
description: "Tygo Search robot",
id: "id_t_z_1388",
link1: "http://www.tygo.com/",
link2: "",
name: "TygoBot",
type: "R"
},
%{
comment: "",
description: "Tygo Search robot",
id: "id_t_z_1389",
link1: "http://www.tygo.com/",
link2: "",
name: "TygoProwler",
type: "R"
},
%{
comment: "",
description: "UCMore - IE navigation and search plugin",
id: "id_t_z_1390",
link1: "http://www.ucmore.com/",
link2: "",
name: "UCmore",
type: "B"
},
%{
comment: "",
description: "UCMore - IE navigation and search plugin",
id: "id_t_z_1391",
link1: "http://www.ucmore.com/",
link2: "",
name: "UCMore Crawler App",
type: "B"
},
%{
comment: "",
description: "Ucweb mobile browser",
id: "id_t_z_290208_1",
link1: "http://www.ucweb.com/English/product.shtml",
link2: "",
name: "UCWEB5.1",
type: "B"
},
%{
comment: "",
description: "user agent - maybe UdmSearch (see UdmSearch) ?",
id: "id_t_z_1392",
link1: "",
link2: "",
name: "UDM",
type: ""
},
%{
comment: "",
description: "UdmSearch / MySearch (now mnoGoSeach) offline browser/search client",
id: "id_t_z_1393",
link1: "http://mnogosearch.org/",
link2: "",
name: "UdmSearch/3.1.x",
type: "R B"
},
%{
comment: "",
description: "University of Iowa Crawler- possibly MySpiders",
id: "id_t_z_1394",
link1: "http://myspiders.biz.uiowa.edu/",
link2: "",
name: "UIowaCrawler/1.0",
type: "R"
},
%{
comment: "s. also Mackster",
description: "UKWizz search robot",
id: "id_t_z_231106_1",
link1: "http://www.ukwizz.com",
link2: "",
name: "UKWizz/Nutch-0.8.1 (UKWizz Nutch crawler; http://www.ukwizz.com/)",
type: "R"
},
%{
comment: "",
description: "Infoseek robot",
id: "id_t_z_1395",
link1: "http://www.infoseek.com/",
link2: "",
name: "Ultraseek",
type: "R"
},
%{
comment: "",
description: "Unknown mail harvester/spambot from 80.58.13.xxx (proxycache.rima-tde.net)",
id: "id_t_z_1396",
link1: "http://www.honeypot.be/",
link2: "",
name: "Under the Rainbow 2.2",
type: "S"
},
%{
comment: "203.161.71.17x",
description: "DNS Right - Online DNS tools",
id: "id_a_f_140308_1",
link1: "http://www.dnsright.com/",
link2: "",
name: "unknownght.com Web Server IIS vs Apache Survey. See Results at www.DNSRight.com",
type: "C"
},
%{
comment: "",
description: "Unknown robot from University of Toronto (128.100.5.1xx)",
id: "id_t_z_1397",
link1: "",
link2: "",
name: "UofTDB_experiment (leehyun@cs.toronto.edu)",
type: "R"
},
%{
comment: "",
description: "Mobile phone browser",
id: "id_t_z_1398",
link1: "",
link2: "",
name: "UP.Browser/3.01-IG01 UP.Link/3.2.3.4",
type: "B"
},
%{
comment: "38.119.96.1xx",
description: "Updated! search robot",
id: "id_t_z_050806_1",
link1: "http://www.updated.com/",
link2: "",
name: "updated/0.1-alpha (updated crawler; http://www.updated.com; crawler@updated.com)",
type: "R"
},
%{
comment: "38.119.96.1xx",
description: "Updated! search robot",
id: "id_t_z_1399",
link1: "http://www.updated.com/",
link2: "",
name: "updated/0.1beta (updated.com; http://www.updated.com; crawler@updated.om)",
type: "R"
},
%{
comment: "",
description: "Handspring (PalmOS powered cellphone) Treo Blazer browser",
id: "id_t_z_1400",
link1: "",
link2: "",
name: "UPG1 UP/4.0 (compatible; Blazer 1.0)",
type: "B"
},
%{
comment: "",
description: "UptimeBot.com online link popularity check",
id: "id_t_z_1401",
link1: "http://www.uptimebot.com/",
link2: "",
name: "Uptimebot",
type: "R"
},
%{
comment: "",
description: "UptimeBot.com online link popularity check",
id: "id_t_z_1402",
link1: "http://www.uptimebot.com/",
link2: "",
name: "UptimeBot(www.uptimebot.com)",
type: "R"
},
%{
comment: "",
description:
"URI::Fetch - client for fetching HTTP pages and syndication feeds (RSS Atom)",
id: "id_t_z_160706_2",
link1: "http://search.cpan.org/dist/URI-Fetch/",
link2: "",
name: "URI::Fetch/0.06",
type: "D"
},
%{
comment: "",
description: "Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool",
id: "id_t_z_1403",
link1: "http://www.innerprise.net/",
link2: "",
name: "URL Spider Pro/x.xx (innerprise.net)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (Compatible); URLBase 6",
description: "URLBase - Internet shortcut manager",
id: "id_t_z_121106_2",
link1: "http://www.terriadev.com/products/urlbase/",
link2: "",
name: "URLBase/6.x",
type: "C"
},
%{
comment: "",
description: "URLBlaze file sharing link toolkit",
id: "id_t_z_1406",
link1: "http://www.urlblaze.net/",
link2: "",
name: "URLBlaze",
type: "C"
},
%{
comment: "70.165.48.16x",
description: "://URLFAN news crawler",
id: "id_t_z_011108_4",
link1: "http://www.urlfan.com/",
link2: "",
name: "urlfan-bot/1.0; +http://www.urlfan.com/site/bot/350.html",
type: "R"
},
%{
comment: "",
description: "URLGetFile downloading tool",
id: "id_t_z_1407",
link1: "http://shazron.com/freeware/java-utils/",
link2: "",
name: "URLGetFile",
type: "D"
},
%{
comment: "",
description: "Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool",
id: "id_t_z_1404",
link1: "http://www.innerprise.net/",
link2: "",
name: "URL_Spider_Pro/x.x",
type: "R"
},
%{
comment: "",
description: "Innerprise URL Spider Pro (now ES.NET) web indexing / site searching tool",
id: "id_t_z_1405",
link1: "http://www.innerprise.net/",
link2: "",
name: "URL_Spider_Pro/x.x+(http://www.innerprise.net/usp-spider.asp)",
type: "R"
},
%{
comment: "208.65.71.xx",
description: "BoardReader search favicon fetcher",
id: "id_t_z_291006_1",
link1: "http://www.boardreader.com/",
link2: "http://www.internetadsales.com/modules/news/article.php?storyid=4050",
name: "User-Agent: BoardReader Favicon Fetcher /1.0 info@boardreader.com",
type: "D"
},
%{
comment: "208.65.71.xx",
description: "BoardReader search image fetcher",
id: "id_t_z_081206_1",
link1: "http://www.boardreader.com/",
link2: "http://www.internetadsales.com/modules/news/article.php?storyid=4050",
name: "User-Agent: BoardReader Image Fetcher /1.0 info@boardreader.com",
type: "D"
},
%{
comment: "",
description: "ljpic.com - LiveJournal picture feed search",
id: "id_t_z_060206_2",
link1: "http://www.ljpic.com/",
link2: "",
name: "User-Agent: LjSEEK Picture-Bot /1.0 contact@ljseek.com",
type: "C"
},
%{
comment: "",
description: "FileHeap download manager",
id: "id_t_z_1408",
link1: "http://www.fileheap.com",
link2: "",
name: "User-Agent: FileHeap! file downloader (http://www.fileheap.com)",
type: "D"
},
%{
comment: "",
description: "Malformed UA header from some guestbook/forum spammer",
id: "id_t_z_270306_2",
link1: "",
link2: "",
name: "User-Agent: Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1)",
type: "S"
},
%{
comment: "",
description: "Skizzle search robot",
id: "id_t_z_1409",
link1: "http://www.skizzle.com/",
link2: "",
name:
"User-Agent: Mozilla/4.0 (SKIZZLE! Distributed Internet Spider v1.0 - www.SKIZZLE.com)",
type: "R"
},
%{
comment: "",
description:
"unknown robot (reads robots.txt) or sitegrabber. From different IPs- ie.: 62.98.8.xx (wind.it)",
id: "id_t_z_1410",
link1: "",
link2: "",
name: "user-agent=Mozilla/3.01Gold",
type: "R D ?"
},
%{
comment: "",
description:
"University of Sydney NLP Spider for research in Natural Language Processing ",
id: "id_t_z_1411",
link1: "http://www.it.usyd.edu.au/~vinci/bot.html",
link2: "",
name: "USyd-NLP-Spider (http://www.it.usyd.edu.au/~vinci/bot.html)",
type: "R"
},
%{
comment: "",
description: "Web Thief Site Grabber",
id: "id_t_z_1412",
link1: "http://www.utilmind.com/scripts/webthief.html",
link2: "",
name: "UtilMind HTTPGet",
type: "D"
},
%{
comment: "",
description: "WebWasher ad filter",
id: "id_t_z_1413",
link1: "http://www.webwasher.com/",
link2: "",
name: "Utopia WebWasher 3.0",
type: "P B"
},
%{
comment: "",
description: "uTorrent BitTorrent client",
id: "id_t_z_100406_1",
link1: "http://www.utorrent.com/",
link2: "",
name: "uTorrent/1500",
type: "D"
},
%{
comment: "67.78.34.1[6-7][0-9] - 70.112.211.2x",
description: "Unknown bad behaving bot via Road Runner - see link",
id: "id_t_z_060108_2",
link1: "http://mikesblog.americasdebate.com/2007/06/06/vadixbot-look-out/",
link2: "",
name: "VadixBot",
type: "S"
},
%{
comment: "",
description: "WiseGuys WAP pages robot",
id: "id_t_z_050406_4",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name:
"Vagabondo-WAP/2.0 (webcrawler at wise-guys dot nl; http://webagent.wise-guys.nl/)/1.0 Profile",
type: "R"
},
%{
comment: "s. also Mozilla/3.0 (Vagabondo...",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_t_z_1414",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name: "Vagabondo/1.x MT (webagent@wise-guys.nl)",
type: "R"
},
%{
comment: "s. also Mozilla/3.0 (Vagabondo...",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_t_z_1415",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name: "Vagabondo/2.0 MT",
type: "R"
},
%{
comment: "s. also Mozilla/3.0 (Vagabondo...",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_t_z_1416",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name: "Vagabondo/2.0 MT (webagent at wise-guys dot nl)",
type: "R"
},
%{
comment: "s. also Mozilla/3.0 (Vagabondo...",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_t_z_1417",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name: "Vagabondo/2.0 MT (webagent@NOSPAMwise-guys.nl)",
type: "R"
},
%{
comment: "s.also - Mozilla/3.0 (Vagabondo...",
description: "WiseGuys robot Netherland - 82.94.216.2",
id: "id_t_z_021205_2",
link1: "http://www.wise-guys.nl/Contact/index.php?botselected=webagents&lang=uk",
link2: "",
name: "Vagabondo/3.0 (webagent at wise-guys dot nl)",
type: "R"
},
%{
comment: "",
description: "Open Directory link checking from Vakes",
id: "id_t_z_1418",
link1: "http://www.vakes.com/",
link2: "",
name: "Vakes/0.01 (Vakes; http://www.vakes.com/; search@vakes.com)",
type: "R"
},
%{
comment: "",
description: "unknown level3.net (63.214.172.xxx) robot",
id: "id_t_z_1420",
link1: "",
link2: "",
name: "VayalaCreep-v0.0.1 (haploid@haploid.com)",
type: ""
},
%{
comment: "",
description: "unknown level3.net (63.214.172.xxx) robot",
id: "id_t_z_1419",
link1: "",
link2: "",
name: "Vayala|Creep-v0.0.1 (codepoet@wildties.com)",
type: ""
},
%{
comment: "",
description: "iNet Grabber - Internet content grabber",
id: "id_t_z_1421",
link1: "http://www.aldostools.com/igrabber.html",
link2: "",
name: "vb wininet",
type: "D"
},
%{
comment: "",
description: "Versus Project robot - Comparing methods for near-uniform URL sampling",
id: "id_t_z_1422",
link1: "http://versus.integis.ch/",
link2: "",
name: "versus 0.2 (+http://versus.integis.ch)",
type: "R"
},
%{
comment: "",
description: "Unknown robot from EPFL University Switzerland (128.178.155.xxx)",
id: "id_t_z_1423",
link1: "http://www.epfl.ch/Eindex.html",
link2: "",
name: "versus crawler eda.baykan@epfl.ch",
type: "R"
},
%{
comment: "",
description: "Verticrawl - Semantic search engine solution (French)",
id: "id_t_z_120408_1",
link1: "http://www.verticrawl.com/fr/homepage.php",
link2: "",
name: "Verticrawlbot",
type: "C"
},
%{
comment: "",
description: "VeryGoodSearch.com link submission checking",
id: "id_t_z_1424",
link1: "http://www.verygoodsearch.com/",
link2: "",
name: "VeryGoodSearch.com.DaddyLongLegs",
type: "R"
},
%{
comment: "213.247.50.xx",
description: "Verzamelgids NL link checking robot",
id: "id_t_z_1425",
link1: "http://www.verzamelgids.nl/",
link2: "",
name: "verzamelgids.nl - Networking4all Bot/x.x",
type: "R"
},
%{
comment: "213.247.50.xx",
description: "Verzamelgids NL link checking robot",
id: "id_t_z_181006_2",
link1: "http://www.verzamelgids.nl/",
link2: "",
name: "Verzamelgids/2.2 (http://www.verzamelgids.nl)",
type: "R"
},
%{
comment: "217.144.236.x",
description: "Unknown robot from Yahoo Norway",
id: "id_t_z_030406_1",
link1: "http://no.yahoo.com/",
link2: "",
name: "Vespa Crawler",
type: "R"
},
%{
comment: "",
description: "Sidewinder G2 anti-virus and anti-spyware protection",
id: "id_t_z_190206_1",
link1: "http://www.securecomputing.com/sg2_antivirus.cfm?menu=solutions",
link2: "",
name: "virus_detector (virus_harvester@securecomputing.com)",
type: "D"
},
%{
comment: "63.133.162..xx",
description: "Visbot crawler for a search software under development",
id: "id_t_z_140407_1",
link1: "http://www.visvo.com/bot.html",
link2: "",
name: "VisBot/2.0 (Visvo.com Crawler; http://www.visvo.com/bot.html; bot@visvo.com)",
type: "R"
},
%{
comment: "",
description: "Some IE toolbar made with Visicom Media Dynamic Toolbar software",
id: "id_t_z_1426",
link1: "http://www.dynamictoolbar.com/en/products/toolbar/",
link2: "",
name: "Visicom Toolbar",
type: "B"
},
%{
comment: "",
description:
"Vision research lab's Cortina - content based image retrieval (128.111.60.xx)",
id: "id_t_z_1427",
link1: "http://vision.ece.ucsb.edu/multimedia/cortina.html",
link2: "",
name: "Vision Research Lab image spider at vision.ece.ucsb.edu",
type: "R"
},
%{
comment: "",
description: "VLC - Cross-platform media player and streaming server",
id: "id_t_z_160906_1",
link1: "http://www.videolan.org/vlc/",
link2: "",
name: "VLC media player - version 0.8.5 Janus - (c) 1996-2006 the VideoLAN team",
type: "B"
},
%{
comment: "202.83.221.2xx",
description: "VM - Vertical Search Engine (China)",
id: "id_t_z_140806_1",
link1: "http://www.verticalmatch.com/",
link2: "",
name: "VMBot/0.x.x (VMBot; http://www.VerticalMatch.com/; vmbot@tradedot.com)",
type: "R"
},
%{
comment: "",
description: "Vortex Web Indexing Robot for a study on internet link distribution",
id: "id_t_z_020106_1",
link1: "http://marty.anstey.ca/projects/robots/vortex/",
link2: "",
name: "Vortex/2.2 (+http://marty.anstey.ca/robots/vortex/)",
type: "R"
},
%{
comment: "s. also - cfetch/1.x - carleson/1.x",
description:
"Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)",
id: "id_t_z_041207_1",
link1: "http://www.kosmix.com/",
link2: "",
name: "voyager-hc/1.0",
type: "R"
},
%{
comment: "s. also - cfetch/1.x - carleson/1.x",
description:
"Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)",
id: "id_t_z_231105_1",
link1: "http://www.kosmix.com/",
link2: "",
name: "voyager/1.0",
type: "R"
},
%{
comment: "s. also - cfetch/1.x - carleson/1.x",
description:
"Kosmix health, auto and travel search crawler (204.14.48.x / 38.113.234.xxx)",
id: "id_t_z_301108_3",
link1: "http://www.kosmix.com/",
link2: "",
name: "voyager/2.0 (http://www.kosmix.com/html/crawler.html)",
type: "R"
},
%{
comment: "",
description: "Vivisimo search crawler (206.210.89.xxx)",
id: "id_t_z_171105_3",
link1: "http://www.vivisimo.com/",
link2: "",
name: "VSE/1.0 (testcrawler@hotmail.com)",
type: "R"
},
%{
comment: "",
description: "Vivisimo search crawler (206.210.89.xxx)",
id: "id_t_z_171105_4",
link1: "http://www.vivisimo.com/",
link2: "",
name: "VSE/1.0 (testcrawler@vivisimo.com)",
type: "R"
},
%{
comment: "",
description: "Verity vspider indexing software",
id: "id_t_z_1428",
link1: "http://www.verity.com/",
link2: "",
name: "vspider",
type: "R"
},
%{
comment: "",
description: "Verity vspider indexing software",
id: "id_t_z_1429",
link1: "http://www.verity.com/",
link2: "",
name: "vspider/3.x",
type: "R"
},
%{
comment: "192.17.240.xx",
description:
"VWBot - MetaQuerier Crawler for the MetaQuerier project at the University of Illinois",
id: "id_t_z_130707_1",
link1: "http://vwbot.cs.uiuc.edu/",
link2: "http://metaquerier.cs.uiuc.edu/",
name:
"VWBOT/Nutch-0.9-dev (VWBOT Nutch Crawler; http://vwbot.cs.uiuc.edu;+vwbot@cs.uiuc.edu",
type: "R"
},
%{
comment: "",
description: "W3C Link Checker",
id: "id_t_z_1431",
link1: "http://validator.w3.org/checklink",
link2: "",
name: "W3C-checklink/3.x.x.x libwww-perl/5.xx",
type: "C"
},
%{
comment: "",
description: "W3C Link Checker",
id: "id_t_z_1432",
link1: "http://validator.w3.org/checklink",
link2: "",
name: "W3C-checklink/4.x [4.xx] libwww-perl/5.xxx",
type: "C"
},
%{
comment: "",
description: "WebCon - the Libwww command line tool",
id: "id_t_z_080806_1",
link1: "http://www.w3.org/ComLine/",
link2: "",
name: "W3C-WebCon/5.x.x libwww/5.x.x",
type: "D"
},
%{
comment: "",
description: "W3C Line Mode (character based Web browser)",
id: "id_t_z_1433",
link1: "http://www.w3.org/LineMode/",
link2: "",
name: "W3CLineMode/5.4.0 libwww/5.x.x",
type: "B"
},
%{
comment: "",
description: "Unknown link checking using Libwww via Korea Telecom (221.148.44.xxx)",
id: "id_t_z_1434",
link1: "http://www.w3.org/Library/",
link2: "",
name: "W3CRobot/5.4.0 libwww/5.4.0",
type: "C"
},
%{
comment: "",
description: "W3C HTML-Code Validator",
id: "id_t_z_1430",
link1: "http://validator.w3.org/",
link2: "",
name: "W3C_Validator/1.xxx libwww-perl/5.xx",
type: "C"
},
%{
comment: "",
description: "w3m Linux pager / text-based browser",
id: "id_t_z_1435",
link1: "http://w3m.sourceforge.net/",
link2: "",
name: "w3m/0.x.xx",
type: "B"
},
%{
comment: "",
description: "W3 Site Search (Germany) search engine solution",
id: "id_t_z_1436",
link1: "http://www.w3sitesearch.de/",
link2: "",
name: "W3SiteSearch Crawler_v1.1 http://www.w3sitesearch.de",
type: "R"
},
%{
comment: "202.51.14.1xx",
description: "Wadain (Japan) Blog / RSS search crawler",
id: "id_t_z_061206_3",
link1: "http://wadaino.jp/",
link2: "",
name: "wadaino.jp-crawler 0.2 (http://wadaino.jp/)",
type: "R"
},
%{
comment: "",
description: "Wanna-Be text mode browser",
id: "id_t_z_1437",
link1: "http://mindstory.com/wb2/",
link2: "",
name: "WannaBe (Macintosh; PPC)",
type: "B"
},
%{
comment: "Site is dead",
description: "WapOnWindows WAP browser for PCs",
id: "id_t_z_270906_1",
link1: "http://www.waponwindows.com/",
link2: "",
name: "WapOnWindows 1.0",
type: "B"
},
%{
comment: "",
description: "Watchfire WebXM intranet solution",
id: "id_t_z_250206_2",
link1: "http://www.watchfire.com/products/webxm/default.aspx",
link2: "",
name: "Watchfire WebXM 1.0",
type: "P"
},
%{
comment: "",
description:
"WAVcheck - Simple Vendor Discovery Tool for detecting client-side tags from web analytics vendors",
id: "id_t_z_200706_1",
link1: "http://www.webbanalys.se/apps/WAVcheck/",
link2: "",
name: "WAVcheck 1.0.x (http://www.webbanalys.se/apps/WAVcheck/)",
type: "C"
},
%{
comment: "",
description: "Wavefire local search community engine (64.141.15.1xx)",
id: "id_t_z_110106_1",
link1: "http://www.wavefire.com/",
link2: "",
name: "Wavefire/0.8-dev (Wavefire; http://www.wavefire.com; info@wavefire.com)",
type: "R"
},
%{
comment: "",
description: "Waypath blog discovery engine robot",
id: "id_t_z_110206_5",
link1: "http://www.waypath.com/",
link2: "",
name: "Waypath development crawler - info at waypath dot com",
type: "R"
},
%{
comment: "",
description: "Waypath blog discovery engine robot",
id: "id_t_z_110206_6",
link1: "http://www.waypath.com/",
link2: "",
name: "Waypath Scout v2.x - info at waypath dot com",
type: "R"
},
%{
comment: "",
description: "WDG HTML-code validator",
id: "id_t_z_1438",
link1: "http://www.htmlhelp.tne.co.uk/tools/validator/",
link2: "",
name: "WDG_Validator/1.1",
type: "C"
},
%{
comment: "",
description: "Datafire.com's Web Image Collector (graphics downloading tool)",
id: "id_t_z_1439",
link1: "http://www.datafire.com/",
link2: "",
name: "Web Image Collector",
type: "D"
},
%{
comment: "",
description: "Relsoft link checking software",
id: "id_t_z_1440",
link1: "http://www.relsoftware.com/",
link2: "",
name: "Web Link Validator 1.5",
type: "C"
},
%{
comment: "",
description: "RankMeter ranking software",
id: "id_t_z_1441",
link1: "http://www.searchutilities.com/",
link2: "",
name: "Web Snooper",
type: "R"
},
%{
comment: "",
description: "Web-bekannt German web directory link checking",
id: "id_t_z_010206_2",
link1: "http://www.web-bekannt.de/",
link2: "",
name: "web-bekannt (Version: 1.02, powered by www.internetservice-franken.de)",
type: "C"
},
%{
comment: "",
description: "Web-bekannt German web directory link checking",
id: "id_t_z_010206_1",
link1: "http://www.web-bekannt.de/",
link2: "",
name: "web-bekannt (Version: 1.02, powered by www.web-bekannt.de)",
type: "C"
},
%{
comment: "",
description:
"Unkown link or server checking from Würzburg University Germany (132.187.10.xx)",
id: "id_t_z_1442",
link1: "http://informatik.uni-wuerzburg.de/",
link2: "",
name: "Web-Bot V1.03",
type: "R C"
},
%{
comment: "no active website",
description: "Unknown robot from 69.50.233.x (nectartech.com)",
id: "id_t_z_1443",
link1: "",
link2: "",
name: "Web-Robot/5.0 (en-US; web-robot.com/policy.html) Web-Robot Crawler/2.0.3",
type: ""
},
%{
comment: "",
description: "Web2Express / Web2x - Open data searching tool",
id: "id_t_z_010107_2",
link1: "http://search.web2express.org/search/search.html",
link2: "",
name:
"web2express.org/Nutch-0.9-dev (leveled playing field; http://web2express.org/; info at web2express.org)",
type: "R"
},
%{
comment: "",
description: "WebAlta search Russia crawler (85.21.201.xx)",
id: "id_t_z_050206_1",
link1: "http://www.webalta.ru/",
link2: "",
name: "WebAlta Crawler/1.2.1 (http://www.webalta.ru/bot.html)",
type: "R"
},
%{
comment: "64.124.122.2xx",
description: "WebarooBot / RufusBot from webaroo offline search service",
id: "id_t_z_250806_1",
link1: "http://www.webaroo.com/",
link2: "http://www.webaroo.com/company/site-owners",
name: "WebarooBot (Webaroo Bot; http://64.124.122.252/feedback.html)",
type: "R"
},
%{
comment: "64.124.122.2xx",
description: "WebarooBot / RufusBot from webaroo offline search service",
id: "id_t_z_210407_1",
link1: "http://www.webaroo.com/",
link2: "http://www.webaroo.com/company/site-owners",
name: "WebarooBot (Webaroo Bot; http://www.webaroo.com/rooSiteOwners.html)",
type: "R"
},
%{
comment: "",
description: "Yanasoft WebAuto website copier / downloading tool",
id: "id_t_z_1444",
link1: "http://www.yanasoft.co.jp/webauto.html",
link2: "",
name: "WebAuto/3.4xxx (WinNT; I)",
type: "D"
},
%{
comment: "",
description: "Web Bandit personal search software",
id: "id_t_z_1445",
link1: "http://softwaresolutions.net/webbandit/",
link2: "",
name: "webbandit/4.xx.0",
type: "R"
},
%{
comment: "",
description: "Amansoft WebBug web server protocol test",
id: "id_t_z_140106_2",
link1: "http://www.cyberspyder.com/webbug.html",
link2: "",
name: "WebBug/5.x",
type: "C"
},
%{
comment: "",
description: "WebClipping.com - online news monitoring service",
id: "id_t_z_1446",
link1: "http://www.webclipping.com",
link2: "",
name: "Webclipping.com",
type: "R"
},
%{
comment: "s. also collage.cgi/1.xx",
description: "WebCollage Syndicator graphics crawler/collector",
id: "id_t_z_1447",
link1: "http://www.webcollage.com/",
link2: "",
name: "webcollage/1.xx",
type: "R D"
},
%{
comment: "",
description: "Quarterdecks WebCompass search tool",
id: "id_t_z_1448",
link1: "",
link2: "",
name: "WebCompass 2.0",
type: "R"
},
%{
comment: "",
description: "WebCopier offline browser",
id: "id_t_z_1449",
link1: "http://www.maximumsoft.com/",
link2: "",
name: "WebCopier vx.x",
type: "D B"
},
%{
comment: "",
description: "WebCopier offline browser",
id: "id_t_z_1450",
link1: "http://www.maximumsoft.com/",
link2: "",
name: "WebCopier vx.xa",
type: "D B"
},
%{
comment: "193.60.130.xx",
description: "WebCorp linguistic search engine (UK)",
id: "id_t_z_210506_1",
link1: "http://webcorp.uce.ac.uk/",
link2: "",
name: "WebCorp/1.0",
type: "R"
},
%{
comment: "",
description: "Webcrawl Search robot (64.40.105.xxx)",
id: "id_t_z_1451",
link1: "http://www.webcrawl.net/",
link2: "",
name: "webcrawl.net",
type: "R"
},
%{
comment: "",
description: "Unix/Linux Web Downloader",
id: "id_t_z_1452",
link1: "http://www.krasu.ru/soft/chuchelo/",
link2: "",
name: "WebDownloader for X x.xx",
type: "D"
},
%{
comment: "",
description: "Unknown robot from china-netcom.com",
id: "id_t_z_1453",
link1: "",
link2: "",
name: "Webdup/0.9",
type: ""
},
%{
comment: "",
description: "WingFlyer WebFetch website downloading tool",
id: "id_t_z_1454",
link1: "http://www.wingflyer.com/",
link2: "",
name: "WebFetch",
type: "D B"
},
%{
comment: "",
description: "webfetch - command line tool to fetch files via HTTP",
id: "id_t_z_1455",
link1: "http://tony.aiu.to/sa/webfetch/",
link2: "",
name: "webfetch/5.x.x",
type: "D"
},
%{
comment: "",
description: "Verso NetSpective WebFilter",
id: "id_t_z_310806_2",
link1: "http://www.verso.com/enterprise/netspective/webfilter.asp",
link2: "",
name: "WebFilter Robot 1.0",
type: "P"
},
%{
comment: "",
description: "Telemate.net NetSpective WebFilter",
id: "id_t_z_1456",
link1: "http://www.telemate.net/",
link2: "",
name: "WebFilter Robot 1.x",
type: "P"
},
%{
comment: "",
description: "Webfind search robot",
id: "id_t_z_1457",
link1: "http://www.web-find.com/",
link2: "",
name: "WebFindBot(http://www.web-find.com)",
type: "R"
},
%{
comment: "",
description: "Webglimpse search engine software",
id: "id_t_z_1458",
link1: "http://www.webglimpse.net/",
link2: "",
name: "Webglimpse 2.xx.x (http://webglimpse.net)",
type: "R"
},
%{
comment: "",
description: "webGobbler - Online random image generator",
id: "id_t_z_150306_2",
link1: "http://sebsauvage.net/webgobbler/",
link2: "",
name: "webGobbler/1.x.x",
type: "R D"
},
%{
comment: "",
description: "fake ?",
id: "id_t_z_1459",
link1: "",
link2: "",
name: "webhack",
type: ""
},
%{
comment: "212.204.217.1xx",
description: "herbert.groot.jebbink.nl Web Images collage generator",
id: "id_t_z_290807_2",
link1: "http://herbert.groot.jebbink.nl/",
link2: "",
name: "WebImages 0.3 ( http://herbert.groot.jebbink.nl/?app=WebImages )",
type: "D"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 6.0; Windows 98; support@illumit.com...",
description: "WebLight web analyzer & link checker",
id: "id_t_z_280306_2",
link1: "http://www.illumit.com/Products/weblight/",
link2: "",
name: "WebLight/4.x.x (support@illumit.com; http://www.illumit.com/Products/weblight/)",
type: "C"
},
%{
comment: "sometimes in conjunction w. PHP/4.0.6",
description: "WebLink's link management system for HTTP- FTP and Mail hyperlinks",
id: "id_t_z_1460",
link1: "http://www.harlequin.ch/technologien/tools/weblinks.php",
link2: "",
name: "Weblink's checker/",
type: "C"
},
%{
comment: "",
description: "Los Alamos National Laboratoy weblog research project",
id: "id_t_z_140307_1",
link1: "http://www.user-agents.org/agents/weblogattitude.shtml",
link2: "http://www.lanl.gov/",
name: "Weblog Attitude Diffusion 1.0",
type: "R"
},
%{
comment: "139.18.38.1xx",
description:
"Unknown robot from Leipzig University (Germany) faculty for computer science",
id: "id_t_z_230606_1",
link1: "http://rvs.informatik.uni-leipzig.de/",
link2: "",
name: "webmeasurement-bot, http://rvs.informatik.uni-leipzig.de",
type: "R"
},
%{
comment: "",
description: "WebMiner bulk file downloader",
id: "id_t_z_1461",
link1: "http://tribolic.com/webminer/",
link2: "",
name: "WebMiner/x.x [en] (Win98; I)",
type: "D"
},
%{
comment: "",
description: "WeBoX (Japan) - Browser and web collector",
id: "id_t_z_1462",
link1: "http://www-nishio.ise.eng.osaka-u.ac.jp/~nakamura/webox/",
link2: "",
name: "WeBoX/0.xx",
type: "B D"
},
%{
comment: "",
description: "WebPix - picture downloading tool",
id: "id_t_z_1463",
link1: "http://www.netwu.com/webpix/",
link2: "",
name: "WebPix 1.0 (www.netwu.com)",
type: "D"
},
%{
comment: "",
description: "Caesius WebQL - Custom robot/agent generator / web extraction software",
id: "id_t_z_1464",
link1: "http://www.caesius.com/",
link2: "",
name: "WebQL",
type: "B D"
},
%{
comment: "",
description: "WebRACE - HTTP retrieval- annotation and caching engine",
id: "id_t_z_1465",
link1: "http://www.cs.ucy.ac.cy/Projects/eRACE/webrace.html",
link2: "",
name: "WebRACE/1.1 (University of Cyprus- Distributed Crawler)",
type: "P"
},
%{
comment: "62.75.202.1xx",
description: "WebRankSpider experimental web crawler",
id: "id_t_z_130907_1",
link1: "http://ulm191.server4you.de/crawler/",
link2: "",
name: "WebRankSpider/1.37 (+http://ulm191.server4you.de/crawler/)",
type: "R"
},
%{
comment: "",
description: "Webreaper download manager",
id: "id_t_z_1468",
link1: "http://www.webreaper.net/",
link2: "",
name: "WebReaper vx.x - www.webreaper.net",
type: "D"
},
%{
comment: "",
description: "Webreaper download manager",
id: "id_t_z_1466",
link1: "http://www.webreaper.net/",
link2: "",
name: "WebReaper [info@webreaper.net]",
type: "D"
},
%{
comment: "",
description: "Webreaper download manager",
id: "id_t_z_1467",
link1: "http://www.webreaper.net/",
link2: "",
name: "WebReaper [webreaper@webreaper.net]",
type: "D"
},
%{
comment: "",
description: "Websearch Australia robot",
id: "id_t_z_1469",
link1: "http://WebSearch.COM.AU/",
link2: "",
name:
"WebSearch.COM.AU/3.0.1 (The Australian Search Engine; http://WebSearch.COM.AU; Search@WebSearch.COM.AU)",
type: "R"
},
%{
comment: "",
description: "Dortmund University WebSearchBench - Open source search software",
id: "id_t_z_1470",
link1: "http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de",
link2: "",
name: "WebSearchBench WebCrawler v0.1(Experimental)",
type: "R"
},
%{
comment: "",
description: "Dortmund University WebSearchBench - Open source search software",
id: "id_t_z_1471",
link1: "http://websearchbench.cs.uni-dortmund.de/websearch/about.html.de",
link2: "",
name:
"WebSearchBench WebCrawler V1.0 (Beta)- Prof. Dr.-Ing. Christoph Lindemann- Universität Dortmund- cl@cs.uni-dortmund.de- http://websearchbench.cs.uni-dortmund.de/",
type: "R"
},
%{
comment: "",
description: "Web site downloading tool and offline browser (Japan)",
id: "id_t_z_260806_2",
link1: "http://www.umechando.com/webex/",
link2: "",
name: "Website Explorer/0.9.x.x",
type: "D"
},
%{
comment: "",
description: "Website eXtractor web site downloading tool",
id: "id_t_z_1472",
link1: "http://www.asona.org/",
link2: "http://www.internet-soft.com/",
name: "Website eXtractor",
type: "D"
},
%{
comment: "216.89.111.x",
description: "Sootle web directory Website Worth ranking tool",
id: "id_t_z_090606_1",
link1: "http://directory.sootle.com/website-worth/",
link2: "",
name: "WebsiteWorth v1.0",
type: "R"
},
%{
comment: "",
description: "Webspinne.de robot",
id: "id_t_z_1473",
link1: "http://www.webspinne.de/",
link2: "",
name: "Webspinne/1.0 webmaster@webspinne.de",
type: "R"
},
%{
comment: "",
description: "Websquash.com Search Engine robot / link checking",
id: "id_t_z_1474",
link1: "http://www.websquash.com/",
link2: "",
name: "Websquash.com (Add url robot)",
type: "R"
},
%{
comment: "",
description: "WebStat - Java statistical computing environment for the web",
id: "id_t_z_1475",
link1: "http://www.math.psu.edu/babcock/webstat/version1.0/",
link2: "",
name: "WebStat/1.0 (Unix; beta; 20040314)",
type: "R"
},
%{
comment: "24.99.22.xx",
description: "Webster - Rev. Healeys web crawler",
id: "id_t_z_091006_2",
link1: "http://webster.healeys.net/",
link2: "http://webster.healeys.net/search.php",
name: "Webster v0.3 ( http://webster.healeys.net/ )",
type: "R"
},
%{
comment: "",
description: "Websters Webmaster Archive (Germany) submission / pad checking",
id: "id_t_z_1476",
link1: "http://webster.de/",
link2: "",
name: "webster-internet.de pad browser",
type: "C B"
},
%{
comment: "",
description: "WebStripper download manager",
id: "id_t_z_1477",
link1: "http://webstripper.net/index.html",
link2: "http://www.netidea.it",
name: "WebStripper/2.xx",
type: "D"
},
%{
comment: "",
description: "WebTrafficExpress IBM server software",
id: "id_t_z_1478",
link1: "",
link2: "",
name: "WebTrafficExpress/x.0",
type: "P"
},
%{
comment: "",
description: "Web Trends link analyzer",
id: "id_t_z_1479",
link1: "http://www.netiq.com/webtrends/default.asp",
link2: "",
name: "WebTrends/3.0 (WinNT)",
type: "C"
},
%{
comment: "ex Pita- s. there",
description: "The Stanford WebBase Project crawler",
id: "id_t_z_1480",
link1: "http://www-diglib.stanford.edu/~testbed/doc2/WebBase/",
link2: "",
name: "WebVac (webmaster@pita.stanford.edu)",
type: "R"
},
%{
comment: "",
description: "webval - Python link checking tool",
id: "id_t_z_1481",
link1: "http://www.alcyone.com/pyos/webval/",
link2: "",
name: "WebVal/1.0",
type: "C"
},
%{
comment: "",
description: "Webverzeichnis.de (Germany) directory robot",
id: "id_t_z_171205_3",
link1: "http://www.webverzeichnis.de/",
link2: "",
name: "Webverzeichnis.de - Telefon: 01908 / 26005",
type: "R"
},
%{
comment: "Looking for excluded directories in robots.txt",
description: "Web Vulnerability Crawler",
id: "id_t_z_060306_1",
link1: "http://webvulncrawl.blogspot.com/2005/12/what-am-i-doing.html",
link2: "",
name: "WebVulnCrawl.unknown/1.0 libwww-perl/5.803",
type: "S"
},
%{
comment: "",
description: "Studio Net.Idea's Web Watcher Monitor robot",
id: "id_t_z_1482",
link1: "http://www.web-watcher.com/web-watcher-monitor.html",
link2: "",
name: "WebWatcherMonitor/2.01",
type: "R C"
},
%{
comment: "",
description: "WebZip offline browser",
id: "id_t_z_1483",
link1: "http://www.spidersoft.com/",
link2: "",
name: "WebZIP/x.x (http://www.spidersoft.com)",
type: "B D"
},
%{
comment: "s.also - Port Huron Labs",
description: "Unknown spam bot / harvester (62.163.**.** / 62.194.**.*)",
id: "id_t_z_1484",
link1: "",
link2: "",
name: "Wells Search II",
type: "S"
},
%{
comment: "",
description: "Some spam bot- see link",
id: "id_t_z_1485",
link1: "http://www.kloth.net/internet/badbots-2004.php",
link2: "",
name: "WEP Search 00",
type: "S"
},
%{
comment: "",
description: "wwIPStuff - Internet client tools for Visual FoxPro",
id: "id_t_z_230606_2",
link1: "http://www.west-wind.com/wwipstuff.asp",
link2: "",
name: "West Wind Internet Protocols 4.xx",
type: "B D"
},
%{
comment: "s. also: - http://www.almaden.ibm.com/cs/crawler - FocusedSampler",
description: "IBM's Almaden Research robot (Clever search project)",
id: "id_t_z_1486",
link1: "http://www.almaden.ibm.com/cs/k53/clever.html",
link2: "",
name: "WFARC",
type: "R"
},
%{
comment: "",
description: "GNU wget - file downloader",
id: "id_t_z_1488",
link1: "http://www.gnu.org/software/wget/wget.html",
link2: "",
name: "Wget/1.x(.x)GNU wget http://www.gnu.org/software/wget/wget.html - file downloader",
type: "D"
},
%{
comment: "",
description: "GNU wget - file downloader",
id: "id_t_z_1489",
link1: "http://www.gnu.org/software/wget/wget.html",
link2: "",
name: "Wget/1.x+cvs-stable (Red Hat modified)",
type: "D"
},
%{
comment: "",
description: "GNU wget - file downloader",
id: "id_t_z_1487",
link1: "http://www.gnu.org/software/wget/wget.html",
link2: "",
name: "Wget/1.x.x+cvs",
type: "D"
},
%{
comment: "",
description: "Whatsup Gold network monitor",
id: "id_t_z_1490",
link1: "http://www.ipswitch.com/products/network-management.html",
link2: "",
name: "Whatsup/x.x",
type: "C"
},
%{
comment: "166.90.205.x",
description: "WhatUSeek / Chubba robot",
id: "id_t_z_1491",
link1: "http://www.whatuseek.com/",
link2: "",
name: "whatUseek_winona/3.0",
type: "R"
},
%{
comment: "",
description: "WhizBang! Labs (closed since May 2002) information extraction robot",
id: "id_t_z_1492",
link1: "",
link2: "",
name: "WhizBang! Lab",
type: "R"
},
%{
comment: "- in conjunction w. dlman",
description: "some download agent",
id: "id_t_z_1493",
link1: "",
link2: "",
name: "Wildsoft Surfer",
type: "D"
},
%{
comment: "",
description: "Twotrees crawler",
id: "id_t_z_1494",
link1: "http://www.twotrees.com/",
link2: "",
name: "Willow Internet Crawler by Twotrees V2.1",
type: "R"
},
%{
comment: "see also: - Opera/6.01 (larbin@.....) - MSIE-5.13 larbin@....",
description: "unknown robot from gw.ocg-corp.com (209.126.176.x)",
id: "id_t_z_1495",
link1: "",
link2: "",
name: "WinampMPEG/2.00 (larbin@unspecified.mail)",
type: ""
},
%{
comment: "",
description: "Super Affiliate Tracker agent by Wincer Song",
id: "id_t_z_1496",
link1: "http://www.superaffiliatetracker.com/index.htm",
link2: "",
name: "WincerSong Agent v1.0",
type: ""
},
%{
comment: "",
description: "Windows Media Player 10",
id: "id_t_z_191105_3",
link1: "",
link2: "",
name: "Windows-Media-Player/10.00.00.xxxx",
type: "B"
},
%{
comment: "Domain is for sale",
description: "Nicksoft WinGet download manager",
id: "id_t_z_160107_1",
link1: "",
link2: "",
name: "WinGet 1.1",
type: "D"
},
%{
comment: "",
description: "Example code for a WinHTTP C++ library crawler",
id: "id_t_z_060406_1",
link1: "http://www.codeguru.com/cpp/i-n/internet/http/article.php/c6237/",
link2: "http://www.microsoft.com/msdownload/platformsdk/sdkupdate/update.htm",
name: "WinHTTP Example/1.0",
type: "R"
},
%{
comment: "",
description: "Wink beta search robot (64.13.136.x)",
id: "id_t_z_260506_1",
link1: "http://www.wink.com/",
link2: "",
name:
"WinkBot/0.06 (Wink.com search engine web crawler; http://www.wink.com/Wink:WinkBot; winkbot@wink.com)",
type: "R"
},
%{
comment: "",
description: "WinPodder - Podcast player and RSS reader",
id: "id_t_z_010607_1",
link1: "http://winpodder.com/",
link2: "",
name: "WinPodder (http://winpodder.com)",
type: "B"
},
%{
comment: "",
description: "WinWap - Windows PC WAP browser",
id: "id_t_z_251105_1",
link1: "http://www.winwap.com/products_2_1.php",
link2: "",
name: "WinWAP/3.x (3.x.x.xx; Win32) (Google WAP Proxy/1.0)",
type: "B"
},
%{
comment: "",
description: "Yammba web directory (Germany) link checking",
id: "id_t_z_111206_2",
link1: "http://www.yammba.com/",
link2: "",
name:
"Wir sind die Borg (Version: 1.03, Sie wurden Assimiliert +http://www.yammba.com/suchmaschine/bot.html)",
type: "C"
},
%{
comment: "146.48.82.xx",
description: "WIRE crawler used by the University of Pisa - Italy",
id: "id_t_z_130506_2",
link1: "http://www.cwr.cl/projects/WIRE/",
link2: "http://www.unipi.it/english/index.htm",
name: "WIRE/0.11 (Linux; i686; Bot,Robot,Spider,Crawler,aromano@cli.di.unipi.it)",
type: "R"
},
%{
comment: "Used by different IPs for different purposes",
description: "WIRE - Web information retrieval environment crawler",
id: "id_t_z_1497",
link1: "http://www.cwr.cl/projects/WIRE/",
link2: "",
name: "WIRE/0.x (Linux; i686; Bot,Robot,Spider,Crawler)",
type: "R"
},
%{
comment: "",
description: "Korea Wisenut robot",
id: "id_t_z_1498",
link1: "http://www.koreawisenut.com/",
link2: "",
name: "WISEbot/1.0 (WISEbot@koreawisenut.com; http://wisebot.koreawisenut.com)",
type: "R"
},
%{
comment: "",
description: "Wisewire domain checker (Discontinued)",
id: "id_t_z_1499",
link1: "http://www.wisewire.com/",
link2: "",
name: "WiseWire-Spider2",
type: "R C"
},
%{
comment: "133.51.22.xx",
description: "WISH academic research project for link checking",
id: "id_t_z_110107_2",
link1: "http://wish.slis.tsukuba.ac.jp/",
link2: "",
name: "wish-project (http://wish.slis.tsukuba.ac.jp/)",
type: "C"
},
%{
comment: "",
description: "Wordchamp web page vocabulary / translation robot",
id: "id_t_z_1500",
link1: "http://www.wordchamp.com/",
link2: "",
name: "WordChampBot",
type: "B D"
},
%{
comment: "",
description: "WordPress personal Blog publishing platform",
id: "id_t_z_301105_1",
link1: "http://wordpress.org/",
link2: "",
name: "WordPress/x.x.x.x PHP/4.x.xx",
type: "B"
},
%{
comment: "137.82.84.xx",
description:
"WORIO (beta) search for computer scientists and programmers using Heritrix open-source crawler",
id: "id_t_z_100207_1",
link1: "http://www.worio.com/",
link2: "http://www.archive.org/",
name: "worio heritrix bot (+http://worio.com/)",
type: "R"
},
%{
comment: "67.202.45.2xx",
description:
"WORIO (beta) search for computer scientists and programmers via Amazon Web Services",
id: "id_t_z_291007_1",
link1: "http://www.worio.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name: "woriobot ( http://www.worio.com/)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; SpeedySpider ....",
description: "Entireweb Search robot (62.13.25.xxx)",
id: "id_t_z_1501",
link1: "http://www.entireweb.com/",
link2: "",
name: "WorldLight",
type: "R"
},
%{
comment: "",
description: "unknown link checking (from 4.18.57.126) ?",
id: "id_t_z_1502",
link1: "",
link2: "",
name: "WorQmada/1.0",
type: "C"
},
%{
comment: "",
description: "Wotbox spider",
id: "id_t_z_1503",
link1: "http://www.wotbox.com/",
link2: "",
name: "Wotbox/alpha0.6 (bot@wotbox.com; http://www.wotbox.com)",
type: "R"
},
%{
comment: "",
description: "Wotbox spider",
id: "id_t_z_1504",
link1: "http://www.wotbox.com/",
link2: "",
name: "Wotbox/alpha0.x.x (bot@wotbox.com; http://www.wotbox.com) Java/1.4.1_02",
type: "R"
},
%{
comment: "",
description: "WebSearchBench crawler from Dortmund University- Germany",
id: "id_t_z_1505",
link1: "http://websearchbench.cs.uni-dortmund.de/",
link2: "",
name: "WSB WebCrawler V1.0 (Beta)- cl@cs.uni-dortmund.de",
type: "R"
},
%{
comment: "",
description: "WebSearchBench crawler from Dortmund University- Germany",
id: "id_t_z_1506",
link1: "http://websearchbench.cs.uni-dortmund.de/",
link2: "",
name: "WSB, http://websearchbench.cs.uni-dortmund.de",
type: "R"
},
%{
comment: "",
description: "WUME Lab's web crawler (128.180.121.xxx)",
id: "id_t_z_1507",
link1: "http://wume.cse.lehigh.edu/~xiq204/crawler/",
link2: "",
name: "wume_crawler/1.1 (http://wume.cse.lehigh.edu/~xiq204/crawler/)",
type: "R"
},
%{
comment: "",
description: "Wusage log-file analysis",
id: "id_t_z_1508",
link1: "http://www.boutell.com/wusage/",
link2: "",
name: "Wusage/x.0@boutell.com",
type: "R C"
},
%{
comment: "",
description: "WWLib - Wolverhampton Univerity Web Library for classifying web documents",
id: "id_t_z_120106_2",
link1: "http://www.scit.wlv.ac.uk/wwlib/",
link2: "",
name: "Wwlib/Linux",
type: "R"
},
%{
comment: "",
description: "WWSBOT web server version checker",
id: "id_t_z_1509",
link1: "http://www.analyzer.nu/Perl/WWSBOT.html",
link2: "",
name: "WWSBOT 1.x [--- http://www.analyzer.nu ---]",
type: "C"
},
%{
comment: "",
description: "Perl web page fetching module",
id: "id_t_z_170506_2",
link1: "http://search.cpan.org/dist/WWW-Mechanize/",
link2: "",
name: "WWW-Mechanize/1.1x",
type: "D"
},
%{
comment: "",
description: "Arianna robot",
id: "id_t_z_1510",
link1: "http://arianna.libero.it/",
link2: "",
name: "www.arianna.it",
type: "R"
},
%{
comment: "",
description: "Business-Socket.com link checking ?",
id: "id_t_z_1511",
link1: "http://www.business-socket.com",
link2: "",
name: "www.business-socket.com registry verify/1.x",
type: "C"
},
%{
comment: "85.13.252.x",
description: "The DoWeb UK Business directory link checking",
id: "id_t_z_221006_2",
link1: "http://www.doweb.co.uk/action_home+page.htm",
link2: "",
name: "www.doweb.co.uk crawler",
type: "C"
},
%{
comment: "",
description: "www4mail - web navigation & database search by e-mail",
id: "id_t_z_1512",
link1: "http://www4mail.org/",
link2: "",
name: "www4mail/2.x libwww-FM/2.14 (Unix; I)",
type: ""
},
%{
comment: "",
description: "WWWC Updating check of Web pages. (Japanese only)",
id: "id_t_z_1513",
link1: "http://www.nakka.com/soft/index_eng.html",
link2: "",
name: "WWWC/1.0x",
type: "C"
},
%{
comment: "",
description: "World Wide Weasel Germany robot",
id: "id_t_z_1514",
link1: "http://wwweasel.de/",
link2: "",
name: "WWWeasel Robot v1.00 (http://wwweasel.de)",
type: "R"
},
%{
comment: "",
description: "WWWoffle download manager",
id: "id_t_z_1515",
link1: "http://www.gedanken.demon.co.uk/wwwoffle/",
link2: "",
name: "WWWOFFLE/2.x",
type: "D"
},
%{
comment: "129.187.254.xxx",
description: "Unknown robot from CIS at Munich University",
id: "id_t_z_1516",
link1: "http://www.cis.uni-muenchen.de/",
link2: "",
name: "wwwster/1.x (Beta- mailto:gue@cis.uni-muenchen.de)",
type: "R"
},
%{
comment: "",
description: "wxDownload Fast (wxDFast) open source download manager",
id: "id_t_z_050208_5",
link1: "http://dfast.sourceforge.net/index.html",
link2: "",
name: "wxDownload Fast",
type: "D"
},
%{
comment: "",
description: "Arexera (Germany) crawler software",
id: "id_t_z_1517",
link1: "http://www.arexera.de/de/products/crawler.php",
link2: "",
name: "X-Crawler ",
type: "R"
},
%{
comment: "",
description: "Xaldon WebSpider offline browser",
id: "id_t_z_1518",
link1: "http://www.xaldon.de/produkte_webspider.html",
link2: "",
name: "Xaldon WebSpider",
type: "B D"
},
%{
comment: "",
description: "Xenu link checker",
id: "id_t_z_1519",
link1: "http://home.snafu.de/tilman/xenulink.html",
link2: "",
name: "Xenu Link Sleuth 1.xx",
type: "C"
},
%{
comment: "",
description: "Xenu link checker",
id: "id_t_z_1520",
link1: "http://home.snafu.de/tilman/xenulink.html",
link2: "",
name: "Xenu's Link Sleuth 1.x[a-z]",
type: "C"
},
%{
comment: "",
description: "XerKa text mining and information retrieval software",
id: "id_t_z_270706_2",
link1: "http://www.diana-teknologia.com/www1/english/xerka.htm",
link2: "",
name: "Xerka WebBot v1.0.0 [UPVOpenDir]",
type: "D"
},
%{
comment: "",
description: "xine - free Linux / OS/2 multimedia player",
id: "id_t_z_250106_2",
link1: "http://xinehq.de/",
link2: "",
name: "xine/1.0",
type: "B"
},
%{
comment: "",
description: "XIRQ search (beta) robot (70.86.206.1xx)",
id: "id_t_z_141205_3",
link1: "http://www.xirq.com/",
link2: "",
name: "xirq/0.1-beta (xirq; http://www.xirq.com; xirq@xirq.com)",
type: "R"
},
%{
comment: "",
description: "GPath / XMLSlurp - Expression language for tree structured data",
id: "id_t_z_160806_1",
link1: "http://groovy.codehaus.org/GPath",
link2: "",
name: "XMLSlurp/0.1 libwww-perl/5.805",
type: ""
},
%{
comment: "",
description: "Metamark URL Shorten Service",
id: "id_t_z_070506_1",
link1: "http://metamark.net/",
link2: "",
name: "XRL/2.00b1 (Linux; i686; en-us) (+http://metamark.net/about)",
type: "P"
},
%{
comment: "",
description: "Xylix Retrieval System software",
id: "id_t_z_200308_3",
link1: "http://www.xylixsoftware.ch/retrievalsystem.php",
link2: "",
name: "Xylix",
type: "C"
},
%{
comment: "",
description: "Inria Crawler",
id: "id_t_z_1521",
link1: "http://www.inria.fr/",
link2: "",
name: "xyro_(xcrawler@cosmos.inria.fr)",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; Y!J...",
description: "Yahoo Search Japan robot (211.14.8.2xx)",
id: "id_t_z_081205_1",
link1: "http://www.yahoo.co.jp/",
link2: "",
name: "Y!J-BSC/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)",
type: "R"
},
%{
comment: "s. also DoCoMo/2.0/SO502i (compatible; Y!J-SRD/1.0 ...",
description: "Yahoo Search Japan robot (203.216.197.xxx)",
id: "id_t_z_271006_2",
link1: "http://www.yahoo.co.jp/",
link2: "",
name: "Y!J-SRD/1.0",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; Y!J...",
description: "Yahoo Search Japan robot (211.14.8.2xx)",
id: "id_t_z_240106_3",
link1: "http://www.yahoo.co.jp/",
link2: "",
name: "Y!J/1.0 (http://help.yahoo.co.jp/help/jp/search/indexing/indexing-15.html)",
type: "R"
},
%{
comment: "217.12.4.xx",
description: "Yahoo picture service for mobiles",
id: "id_t_z_220206_2",
link1: "",
link2: "",
name: "Y!OASIS/TEST no-ad Mozilla/4.08 [en] (X11; I; FreeBSD 2.2.8-STABLE i386)",
type: "P"
},
%{
comment: " s. YTunnelPro",
description: "Y!TunnelPro - Yahoo! Messenger companion user agent",
id: "id_t_z_1522",
link1: "http://www.ytunnelpro.com/",
link2: "",
name: "Y!TunnelPro",
type: "B"
},
%{
comment: "",
description: "Yacy distributed P2P web search engine robot",
id: "id_t_z_121205_1",
link1: "http://www.yacy.net/",
link2: "",
name:
"yacy (www.yacy.net; v20040602; i386 Linux 2.4.26-gentoo-r13; java 1.4.2_06; MET/en)",
type: "R"
},
%{
comment: "",
description: "Yacy distributed P2P web search engine robot",
id: "id_t_z_260306_4",
link1: "http://www.yacy.net/",
link2: "",
name: "yacybot (x86 Windows XP 5.1; java 1.5.0_06; Europe/de) yacy.net",
type: "R"
},
%{
comment: "",
description: "(Yahoo) Pipes interactive data aggregator robot",
id: "id_t_z_300707_2",
link1: "http://pipes.yahoo.com/pipes/",
link2: "",
name: "Yahoo Pipes 1.0",
type: "R"
},
%{
comment: "s. also Mozilla/4.0",
description: "Yahoo Mindset: Intent-driven Search (66.228.182.1xx)",
id: "id_t_z_100406_2",
link1: "http://mindset.research.yahoo.com/",
link2: "",
name: "Yahoo! Mindset",
type: "R"
},
%{
comment: "",
description: "Yahoo blog indexing robot (209.191.83.1xx)",
id: "id_t_z_040106_2",
link1: "http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html",
link2: "",
name:
"Yahoo-Blogs/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )",
type: "R"
},
%{
comment: "",
description: "Yahoo multimedia crawler (206.190.43.xx)",
id: "id_t_z_1523",
link1: "",
link2: "",
name:
"Yahoo-MMAudVid/1.0 (mms dash mmaudvidcrawler dash support at yahoo dash inc dot com)",
type: "R"
},
%{
comment: "",
description: "Yahoo multimedia crawler",
id: "id_t_z_080108_2",
link1: "",
link2: "",
name:
"Yahoo-MMAudVid/2.0(mms dash mm aud vid crawler dash support at yahoo dash inc.com ;Mozilla 4.0 compatible; MSIE 7.0;Windows NT 5.0; .NET CLR 2.0)",
type: "R"
},
%{
comment: "see also FAST-WebCrawler/3.x Multimedia...",
description: "Yahoo multimedia crawler via Fastsearch.net (66.77.73.xx)",
id: "id_t_z_1524",
link1: "",
link2: "",
name: "Yahoo-MMCrawler/3.x (mm dash crawler at trd dot overture dot com)",
type: "R"
},
%{
comment: "216.145.49.xx",
description: "Yahoo Search robot",
id: "id_t_z_110806_1",
link1: "",
link2: "",
name: "Yahoo-Test/4.0",
type: "R"
},
%{
comment: "",
description: "Yahoo crawler via Overture (66.77.73.3x)",
id: "id_t_z_1525",
link1: "",
link2: "",
name:
"Yahoo-VerticalCrawler-FormerWebCrawler/3.9 crawler at trd dot overture dot com; http://www.alltheweb.com/help/webmaster/crawler",
type: "R"
},
%{
comment: "",
description: "Yahoo Publisher Network RSS crawler",
id: "id_t_z_010906_2",
link1: "http://publisher.yahoo.com/rssguide",
link2: "",
name:
"YahooFeedSeeker/2.0 (compatible; Mozilla 4.0; MSIE 5.5; http://publisher.yahoo.com/rssguide)",
type: "R"
},
%{
comment: "",
description: "Yahoo Product Search crawler ( 68.142.195..x)",
id: "id_t_z_1526",
link1: "",
link2: "",
name:
"YahooSeeker-Testing/v3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/)",
type: "R"
},
%{
comment: "",
description: "Yahoo Product Search crawler ( 66.196.93.x)",
id: "id_t_z_1527",
link1: "",
link2: "",
name:
"YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)",
type: "R"
},
%{
comment: "",
description: "Yahoo Product Search crawler ( 66.196.93.x)",
id: "id_t_z_1528",
link1: "",
link2: "",
name:
"YahooSeeker/1.0 (compatible; Mozilla 4.0; MSIE 5.5; http://search.yahoo.com/yahooseeker.html)",
type: "R"
},
%{
comment: "",
description: "Yahoo Product Search crawler ( 66.196.93.x)",
id: "id_t_z_1529",
link1: "",
link2: "",
name:
"YahooSeeker/1.1 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/shop/merchant/)",
type: "R"
},
%{
comment: "",
description: "Yahoo Product Search crawler ( 68.142.195..x)",
id: "id_t_z_1530",
link1: "",
link2: "",
name:
"YahooSeeker/bsv3.9 (compatible; Mozilla 4.0; MSIE 5.5; http://help.yahoo.com/help/us/ysearch/crawling/crawling-02.html )",
type: "R"
},
%{
comment: "64.157.137.xxx",
description: "Yahoo robot",
id: "id_t_z_1531",
link1: "",
link2: "",
name:
"YahooSeeker/CafeKelsa-dev (compatible; Konqueror/3.2; FreeBSD ;cafekelsa-dev-webmaster@yahoo-inc.com )",
type: "R"
},
%{
comment: "s. also Mozilla/4.0 (compatible; MSIE 5.0; YANDEX)",
description: "Yandex Search Russia link checking (213.180.206.2xx)",
id: "id_t_z_231106_2",
link1: "http://www.yandex.ru",
link2: "",
name: "Yandex/1.01.001 (compatible; Win16; I)",
type: "R"
},
%{
comment: "91.205.124.x",
description: "Yanga search robot by Gigabase (Russian Federation)",
id: "id_t_z_301108_2",
link1: "http://www.yanga.co.uk/",
link2: "",
name: "Yanga WorldSearch Bot v1.1/beta (http://www.yanga.co.uk/)",
type: "R"
},
%{
comment: "217.71.121.xx",
description: "Yarienavoir search (Belgium) robot",
id: "id_t_z_1532",
link1: "http://www.yarienavoir.net/",
link2: "",
name: "yarienavoir.net/0.2",
type: "R"
},
%{
comment: "uses also a blank UA field",
description: "1noon.com search Korea robot (222.231.21.xxx)",
id: "id_t_z_300506_1",
link1: "http://www.1noon.com/",
link2: "",
name: "Yeti",
type: "R"
},
%{
comment: "uses also a blank UA field",
description: "1noon.com search Korea robot (222.231.21.xxx)",
id: "id_t_z_040407_1",
link1: "http://www.1noon.com/",
link2: "",
name: "Yeti/0.01 (nhn/1noon, yetibot@naver.com, check robots.txt daily and follows it)",
type: "R"
},
%{
comment: "61.247.222.xx",
description: "Naver search (Korea) robot",
id: "id_t_z_301108_1",
link1: "http://www.naver.com/",
link2: "",
name: "Yeti/1.0 (NHN Corp.; http://help.naver.com/robots/)",
type: "R"
},
%{
comment: "141.30.193.x[x]",
description: "yggdrasil spider for GoPubMed biorelated search engine",
id: "id_t_z_290407_2",
link1: "http://www.biotec.tu-dresden.de/schroeder",
link2: "http://gopubmed.biotec.tu-dresden.de/",
name:
"yggdrasil/Nutch-0.9 (yggdrasil biorelated search engine; www dot biotec dot tu minus dresden do de slash schroeder; heiko dot dietze at biotec dot tu minus dresden dot de)",
type: "R"
},
%{
comment: "60.191.80.xx",
description: "Yodao search (China)",
id: "id_t_z_211206_3",
link1: "http://www.yodao.com/",
link2: "",
name: "YodaoBot/1.0 (http://www.yodao.com/help/webmaster/spider/; )",
type: "R"
},
%{
comment:
"s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoono/1.0 web-crawler ..",
description: "Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)",
id: "id_t_z_110308_1",
link1: "http://www.yoono.com/",
link2: "",
name: "yoofind/yoofind-0.1-dev (yoono webcrawler; http://www.yoono.com ; MyEmail)",
type: "R"
},
%{
comment: "",
description: "Yoogli search (under development) agent",
id: "id_t_z_210106_3",
link1: "http://www.yoogli.com/",
link2: "",
name: "yoogliFetchAgent/0.1",
type: "R"
},
%{
comment:
"s. also Mozilla/5.0 (compatible; Yoono; http://www.yoono.com/) - yoofind/yoofind ..",
description: "Yoono - community based search (193.110.140.xxx / 194.0.179.[x]xx)",
id: "id_t_z_120606_1",
link1: "http://www.yoono.com/",
link2: "",
name: "yoono/1.0 web-crawler/1.0",
type: "R"
},
%{
comment: "s. also OmniExplorer_Bot",
description: "YottaCars bot - YottaCar car search engine ( 64.62.175.xxx)",
id: "id_t_z_1533",
link1: "http://www.yottacars.com/",
link2: "",
name: "YottaCars_Bot/4.12 (+http://www.yottacars.com) Car Search Engine ",
type: "R"
},
%{
comment: "s. also OmniExplorer_Bot",
description: "YottaShopping bot - YottaShopping search engine ( 64.62.175.xxx) ",
id: "id_t_z_1534",
link1: "http://www.yottashopping.com/",
link2: "",
name: "YottaShopping_Bot/4.12 (+http://www.yottashopping.com) Shopping Search Engine",
type: "R"
},
%{
comment: "s. Y!TunnelPro",
description: "Y!TunnelPro - Yahoo! Messenger companion user agent",
id: "id_t_z_1535",
link1: "http://www.ytunnelpro.com/",
link2: "",
name: "YTunnelPro",
type: "B"
},
%{
comment: "",
description: "Z-Add online link checker",
id: "id_t_z_1536",
link1: "http://w3.z-add.co.uk/linkcheck/",
link2: "",
name: "Z-Add Link Checker (http://w3.z-add.co.uk/linkcheck/)",
type: "C"
},
%{
comment: "",
description: "Zao crawler for Kototoi Project",
id: "id_t_z_1537",
link1: "http://www.kototoi.org/zao/",
link2: "",
name: "Zao-Crawler",
type: "R"
},
%{
comment: "",
description: "Zao crawler for Kototoi Project",
id: "id_t_z_1538",
link1: "http://www.kototoi.org/zao/",
link2: "",
name: "Zao-Crawler 0.2b",
type: "R"
},
%{
comment: "",
description: "Zao crawler for Kototoi Project",
id: "id_t_z_1539",
link1: "http://www.kototoi.org/zao/",
link2: "",
name: "Zao/0.1 (http://www.kototoi.org/zao/)",
type: "R"
},
%{
comment: "",
description: "Zeus Internet Marketing Robot based on Webster Pro component",
id: "id_t_z_1540",
link1: "http://cyber-robotics.com/",
link2: "http://www.homepagesw.com/",
name: "ZBot/1.00 (icaulfield@zeus.com)",
type: "R"
},
%{
comment: "212.227.109.1xx",
description: "Zearchit German search / directory",
id: "id_t_z_111205_5",
link1: "http://www.zearchit.de/",
link2: "",
name: "Zearchit",
type: "R"
},
%{
comment: "213.251.135.xx",
description: "Ze.bz Moteur de Recherche robot",
id: "id_t_z_130106_2",
link1: "http://www.ze.bz/",
link2: "",
name: "ZeBot_lseek.net (bot@ze.bz)",
type: "R"
},
%{
comment: "213.251.135.xx",
description: "Ze.bz Moteur de Recherche robot",
id: "id_t_z_1541",
link1: "http://www.ze.bz/",
link2: "",
name: "ZeBot_www.ze.bz (ze.bz@hotmail.com)",
type: "R"
},
%{
comment: "24.62.50.1xx",
description: "ZedZo Search (beta) robot",
id: "id_t_z_130806_2",
link1: "http://www.zedzo.com/",
link2: "",
name: "zedzo.digest/0.1 (http://www.zedzo.com/)",
type: "R"
},
%{
comment: "",
description: "Zend PHP frameworks Zend_Http_Client component",
id: "id_t_z_210807_2",
link1: "http://framework.zend.com/manual/en/zend.http.html",
link2: "",
name: "Zend_Http_Client",
type: "D"
},
%{
comment: "67.202.34.xxx",
description:
"Powerset Natural Language Search crawler (under development) using Heritrix via Amazon Web Services",
id: "id_t_z_290208_2",
link1: "http://www.powerset.com/",
link2: "http://www.amazon.com/gp/browse.html?node=3435361",
name:
"zermelo Mozilla/5.0 compatible; heritrix/1.12.1 (+http://www.powerset.com) [email:crawl@powerset.com,email:paul@page-store.com]",
type: "R"
},
%{
comment: "138.88.147.xxx",
description: "Zerx search robot ?",
id: "id_t_z_1542",
link1: "http://www.zerx.com/",
link2: "",
name: "zerxbot/Version 0.6 libwww-perl/5.79",
type: "R"
},
%{
comment: "",
description: "Zeus Internet Marketing Robot (based on Webster Pro)",
id: "id_t_z_1543",
link1: "http://cyber-robotics.com/",
link2: "",
name: "Zeus ThemeSite Viewer Webster Pro V2.9 Win32",
type: "R"
},
%{
comment: "",
description: "Zeus Internet Marketing Robot (based on Webster Pro)",
id: "id_t_z_1544",
link1: "http://cyber-robotics.com/",
link2: "",
name: "Zeus xxxxx Webster Pro V2.9 Win32",
type: "R"
},
%{
comment: "powered by Nutch",
description: "Zeusbot robot for building the Ulsysseek.com index",
id: "id_t_z_281105_1",
link1: "http://www.zeusbot.com/",
link2: "http://www.ulysseek.com/",
name:
"Zeusbot/0.07 (Ulysseek's web-crawling robot; http://www.zeusbot.com; agent@zeusbot.com)",
type: "R"
},
%{
comment: "",
description: "Unknown agent (server- or link checking ?) from 198.173.158.xx",
id: "id_t_z_1545",
link1: "",
link2: "",
name: "Ziggy -- The Clown From Hell!!",
type: "C"
},
%{
comment: "",
description: "Zipp.net web search robot",
id: "id_t_z_1546",
link1: "http://www.zippp.net/",
link2: "",
name: "ZipppBot/0.xx (ZipppBot; http://www.zippp.net; webmaster@zippp.net)",
type: "R"
},
%{
comment: "",
description: "Zipp.net web search robot",
id: "id_t_z_1547",
link1: "http://www.zippp.net/",
link2: "",
name: "ZIPPPCVS/0.xx (ZipppBot/.xx;http://www.zippp.net; webmaster@zippp.net)",
type: "R"
},
%{
comment: "",
description: "Zippyfinder robot",
id: "id_t_z_1548",
link1: "http://www.zippyfinder.com/",
link2: "",
name: "Zippy v2.0 - Zippyfinder.com",
type: "R"
},
%{
comment: "",
description: "Microsoft Zoo Tycoon 2 game client",
id: "id_t_z_1549",
link1: "http://www.zootycoon.com",
link2: "",
name: "Zoo Tycoon 2 Client -- http://www.zootycoon.com",
type: "B"
},
%{
comment: "",
description: "Zoom Search Engine software spider",
id: "id_t_z_1550",
link1: "http://www.wrensoft.com/",
link2: "",
name: "ZoomSpider - wrensoft.com",
type: "R"
},
%{
comment: "R",
description: " collecting for machine learning; http://zscho.de/ )",
id: "id_t_z_160110_1",
link1: "141.65.161.xx",
link2: "http://www.zscho.de/",
name: "Zscho.de Crawler/Nutch-1.0-Zscho.de-semantic_patch (Zscho.de Crawler",
type: "Zscho search crawler (Germany)"
},
%{
comment: "",
description: "zspider robot for a new search engine",
id: "id_t_z_280306_1",
link1: "http://feedback.redkolibri.com/",
link2: "",
name: "zspider/0.9-dev http://feedback.redkolibri.com/",
type: "R"
},
%{
comment: "",
description: "Wisenut robot",
id: "id_t_z_1551",
link1: "http://www.wisenutbot.com/",
link2: "",
name: "ZyBorg/1.0 (ZyBorg@WISEnut.com; http://www.WISEnut.com)",
type: "R"
},
%{
comment: "",
description: "FM Scene soccer fan pages plugin",
id: "id_new_190610_1",
link1: "http://www.fmscene.de",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (FM Scene 4.6.1)",
type: "L"
},
%{
comment: "",
description: "PrevX security plugin",
id: "id_new_190610_2",
link1: "http://www.prevx.com",
link2: "",
name:
"Mozilla/5.0 (Windows; U; Windows NT 5.1; de; rv:1.9.2.3) Gecko/20100401 Firefox/3.6.3 (.NET CLR 3.5.30729) (Prevx 3.0.5)",
type: ""
}
]
end
# Literal data behind most_common/0. Kept as a module attribute so the
# function body stays a one-liner; element order is significant to callers
# that index into the list, so do not sort or deduplicate it.
@most_common_agents [
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (X11; Linux x86_64; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/15.6 Safari/605.1.15",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36 Edg/104.0.1293.47",
  "Mozilla/5.0 (X11; Ubuntu; Linux x86_64; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (Windows NT 10.0; rv:91.0) Gecko/20100101 Firefox/91.0",
  "Mozilla/5.0 (X11; Linux x86_64; rv:91.0) Gecko/20100101 Firefox/91.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36 Edg/104.0.1293.54",
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/15.5 Safari/605.1.15",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.5060.134 Safari/537.36 OPR/89.0.4447.83",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:101.0) Gecko/20100101 Firefox/101.0",
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.0.0 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64; rv:102.0) Gecko/20100101 Firefox/102.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_2) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.88 Safari/537.36",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:102.0) Gecko/20100101 Firefox/102.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10.15; rv:104.0) Gecko/20100101 Firefox/104.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36 Edg/104.0.1293.54",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.5005.167 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:102.0) Gecko/20100101 Firefox/102.0",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:91.0) Gecko/20100101 Firefox/91.0",
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/78.0.3904.108 Safari/537.36",
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:103.0) Gecko/20100101 Firefox/103.0",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/106.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Android 10; Mobile; rv:104.0) Gecko/104.0 Firefox/104.0",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_6) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.72 Safari/537.36",
  "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/15.3 Safari/605.1.15",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.5005.134 YaBrowser/22.7.1.806 Yowser/2.5 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.5005.148 YaBrowser/22.7.2.899 Yowser/2.5 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/102.0.5005.63 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.5060.114 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.79 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.83 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/58.0.3029.110 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/99.0.4844.51 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:104.0) Gecko/20100101 Firefox/104.0",
  "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:105.0) Gecko/20100101 Firefox/105.0",
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.81 Safari/537.36",
  "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36",
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.0.0 Safari/537.36",
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:100.0) Gecko/20100101 Firefox/100.0",
  "Mozilla/5.0 (Windows NT 6.1; Win64; x64; rv:102.0) Gecko/20100101 Firefox/102.0",
  "Mozilla/5.0 (Windows NT 6.3; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.0.0 Safari/537.36",
  "Mozilla/5.0 (X11; Fedora; Linux x86_64; rv:100.0) Gecko/20100101 Firefox/100.0",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/103.0.5060.134 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/104.0.5112.79 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) HeadlessChrome/96.0.4664.45 Safari/537.36",
  "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/15.0 Safari/605.1.15",
  "Mozilla/5.0 (X11; Linux x86_64; rv:105.0) Gecko/20100101 Firefox/105.0",
  "Mozilla/5.0 (X11; Linux x86_64; rv:78.0) Gecko/20100101 Firefox/78.0",
  "Mozilla/5.0 (X11; Linux x86_64; rv:99.0) Gecko/20100101 Firefox/99.0"
]

@doc """
Returns a fixed list of 66 complete browser `User-Agent` header strings.

Every entry starts with `Mozilla/5.0 (` and identifies a Chrome, Firefox,
Safari, Edge, Opera, Yandex Browser or HeadlessChrome build on Windows,
macOS, Linux or Android. The list contains no duplicates and is returned
in the same order on every call.

NOTE(review): the function name suggests these are the most frequently
observed agents, presumably in ranking order - the source of that ranking
is not visible in this file, so confirm before relying on it.
"""
@spec most_common() :: [String.t()]
def most_common, do: @most_common_agents
end