ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 394
Committed: Wed Dec 30 14:39:27 2020 UTC (3 years, 11 months ago) by joku
File size: 159415 byte(s)
Log Message:
update Copyright 

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 joku 394 * Copyright (C) 2001-2021, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192\.comAgent" => "" // dot escaped so it only matches a literal "."
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array(
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www\.ackerm\.com" => "" // dots escaped so they only match a literal "."
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293     "^NutchEC2Test" => ""
294     ),
295     "uri" => "http://www.amazon.com/"
296     ),
297     "amidalla" => array(
298     "icon" => "amidalla",
299     "title" => "Amidalla",
300     "rule" => array(
301     "^amibot" => ""
302     ),
303     "uri" => ""
304     ),
305     "amfibi" => array(
306     "icon" => "amfibi",
307     "title" => "Amfibi",
308     "rule" => array(
309     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310     "Amfibibot" => ""
311     ),
312     "uri" => ""
313     ),
314     "amphetadesk" => array(
315     "icon" => "robot",
316     "title" => "AmphetaDesk",
317     "rule" => array(
318     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319     ),
320     "uri" => ""
321     ),
322     "amphetameme" => array(
323     "icon" => "robot",
324     "title" => "Amphetameme",
325     "rule" => array(
326     "amphetameme[ \-]?crawler" => ""
327     ),
328     "uri" => ""
329     ),
330     "annomille" => array(
331     "icon" => "robot",
332     "title" => "AnnoMille",
333     "rule" => array(
334     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335     ),
336     "uri" => "http://www.annomille.it"
337     ),
338     "anonymouse" => array(
339     "icon" => "anonymouse",
340     "title" => "Anonymouse.org",
341     "rule" => array(
342     "http://Anonymouse\.org" => "" // dot escaped so it only matches a literal "."
343     ),
344     "uri" => "http://anonymouse.org"
345     ),
346     "ansearch" => array(
347     "icon" => "robot",
348     "title" => "Ansearch",
349     "rule" => array(
350     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351     ),
352     "uri" => ""
353     ),
354     "answerchase" => array(
355     "icon" => "answerchase",
356     "title" => "AnswerChase",
357     "rule" => array(
358     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359     ),
360     "uri" => "http://www.answerchase.com/"
361     ),
362     "antibot" => array(
363     "icon" => "robot",
364 matthys 205 "title" => "Antibot",
365 joku 63 "rule" => array(
366     "antibot-V([0-9.]{1,10})" => "\\1"
367     ),
368     "uri" => ""
369     ),
370     "aonde" => array(
371     "icon" => "aonde",
372     "title" => "Aonde",
373     "rule" => array(
374     "^AONDE-Spider" => ""
375     ),
376     "uri" => ""
377     ),
378     "aonline" => array(
379     "icon" => "robot",
380     "title" => "A-Online.at",
381     "rule" => array(
382     "^A-Online Search" => ""
383     ),
384     "uri" => "http://www.a-online.at/"
385     ),
386     "aol" => array(
387     "icon" => "aol",
388     "title" => "AOLserver",
389     "rule" => array(
390     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391     "^AOLserver" => ""
392     ),
393     "uri" => ""
394     ),
395     "apachebench" => array(
396     "icon" => "robot",
397     "title" => "ApacheBench",
398     "rule" => array(
399     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => ""
402     ),
403     "apassion4jazz" => array(
404     "icon" => "robot",
405     "title" => "Passion 4 Jazz",
406     "rule" => array(
407     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410     ),
411     "apexoo" => array(
412     "icon" => "robot",
413     "title" => "Apexoo",
414     "rule" => array(
415     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apexoo.com/"
418     ),
419     "apnoti" => array(
420     "icon" => "apnoti",
421 matthys 205 "title" => "Apnoti",
422 joku 63 "rule" => array(
423     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424     ),
425     "uri" => "http://www.apnoti.com/"
426     ),
427     "aport" => array(
428     "icon" => "aport",
429     "title" => "Aport",
430     "rule" => array(
431     "^Aport" => ""
432     ),
433     "uri" => ""
434     ),
435     "appie" => array(
436     "icon" => "walhello",
437     "title" => "Walhello",
438     "rule" => array(
439     "appie[ /]([0-9.]{1,10})" => "\\1"
440     ),
441     "uri" => ""
442     ),
443 matthys 389 "apple" => array(
444     "icon" => "apple",
445     "title" => "Apple",
446     "rule" => array(
447     "Applebot[ /]([0-9.]{1,10})" => "\\1"
448     ),
449     "uri" => "http://www.apple.com/go/applebot"
450     ),
451    
452 joku 63 "arachmo" => array(
453     "icon" => "arachmo",
454     "title" => "Arachmo",
455     "rule" => array(
456     "compatible; Arachmo" => ""
457     ),
458     "uri" => ""
459     ),
460     "arexera" => array(
461     "icon" => "arexera",
462     "title" => "Arexera",
463     "rule" => array(
464     "^X-Crawler" => "",
465     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
466     ),
467     "uri" => "http://www.arexera.de/"
468     ),
469     "arianna" => array(
470     "icon" => "arianna",
471     "title" => "Arianna",
472     "rule" => array(
473     "^www\.arianna\.it" => "" // dots escaped so they only match a literal "."
474     ),
475     "uri" => "http://www.arianna.it/"
476     ),
477     "artface" => array(
478     "icon" => "robot",
479     "title" => "Artface",
480     "rule" => array(
481     "^ArtfaceBot" => ""
482     ),
483     "uri" => ""
484     ),
485     "artviper" => array(
486     "icon" => "artviper",
487     "title" => "artViper",
488     "rule" => array(
489     "artViper" => ""
490     ),
491     "uri" => "http://www.artviper.net/"
492     ),
493     "asinfo" => array(
494     "icon" => "robot",
495     "title" => "Any Search Info",
496     "rule" => array(
497     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
498     ),
499     "uri" => "http://search-info.com/"
500     ),
501     "ask" => array(
502     "icon" => "askjeeves",
503     "title" => "Ask Jeeves",
504     "rule" => array(
505     "Ask[ \-]?Jeeves" => "",
506     "teomaagent" => ""
507     ),
508     "uri" => ""
509     ),
510     "askaboutoil" => array(
511     "icon" => "robot",
512     "title" => "AskAboutOil", // title names the bot identified by this entry's own rule and uri
513     "rule" => array(
514     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
515     ),
516     "uri" => "http://askaboutoil.com/"
517     ),
518     "asked" => array(
519     "icon" => "robot",
520 matthys 205 "title" => "AskEd!",
521 joku 63 "rule" => array(
522     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
523     ),
524     "uri" => "http://asked.jp"
525     ),
526     "aspseek" => array(
527     "icon" => "robot",
528     "title" => "ASPseek",
529     "rule" => array(
530     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
531     ),
532     "uri" => ""
533     ),
534     "atlocal" => array(
535     "icon" => "robot",
536     "title" => "At Local",
537     "rule" => array(
538     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
539     ),
540     "uri" => "http://www.atlocal.com/"
541     ),
542     "atomz" => array(
543     "icon" => "atomz",
544     "title" => "Atomz",
545     "rule" => array(
546     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
547     ),
548     "uri" => ""
549     ),
550 matthys 345 "avira" => array(
551     "icon" => "avira",
552     "title" => "Avira SafeSearch",
553     "rule" => array(
554     "^SafeSearch microdata crawler" => ""
555     ),
556     "uri" => "https://safesearch.avira.com"
557     ),
558 joku 63 "axel" => array(
559     "icon" => "robot",
560     "title" => "Axel",
561     "rule" => array(
562     "^axel" => ""
563     ),
564     "uri" => ""
565     ),
566     "axmo" => array(
567     "icon" => "axmo",
568     "title" => "Axmo",
569     "rule" => array(
570     "AxmoRobot" => ""
571     ),
572     "uri" => ""
573     ),
574     "answerbus" => array(
575     "icon" => "answerbus",
576     "title" => "AnswerBus",
577     "rule" => array(
578     "answerbus" => ""
579     ),
580     "uri" => ""
581     ),
582     "automapit" => array(
583     "icon" => "robot",
584     "title" => "AutoMapIt",
585     "rule" => array(
586     "AutoMapIt[ /](Bot)?" => ""
587     ),
588     "uri" => "http://www.automapit.com/bot.html"
589     ),
590     "augurnfind" => array(
591     "icon" => "robot",
592     "title" => "Augurnfind",
593     "rule" => array(
594     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
595     ),
596     "uri" => ""
597     ),
598     "awasu" => array(
599     "icon" => "awasu",
600     "title" => "Awasu",
601     "rule" => array(
602     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
603     ),
604     "uri" => ""
605     ),
606     "axxus" => array(
607     "icon" => "axxus",
608     "title" => "axxus.de",
609     "rule" => array(
610     "whoiam" => ""
611     ),
612     "uri" => "http://www.axxus.de/"
613     ),
614     "ayell" => array(
615     "icon" => "ayell",
616     "title" => "Ayell",
617     "rule" => array(
618     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
619     ),
620     "uri" => "http://eurobot.ayell.eu"
621     ),
622     "babaloo" => array(
623     "icon" => "babaloo",
624     "title" => "Babaloo",
625     "rule" => array(
626     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
627     ),
628     "uri" => "http://www.babaloo.si"
629     ),
630     "babe" => array(
631     "icon" => "robot",
632     "title" => "ba.be",
633     "rule" => array(
634     "BACS http://www\.ba\.be" => "" // dots escaped so they only match a literal "."
635     ),
636     "uri" => "http://www.ba.be/"
637     ),
638     "baidu" => array(
639     "icon" => "baidu",
640     "title" => "Baidu",
641     "rule" => array(
642     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
643     "Baiduspider" => ""
644     ),
645     "uri" => "http://www.baidu.com/search/spider.html"
646     ),
647     "bananatree" => array(
648     "icon" => "robot",
649     "title" => "BananaTree",
650     "rule" => array(
651     "www\.thebananatree\.org" => ""
652     ),
653     "uri" => "http://www.thebananatree.org/"
654     ),
655     "bdcindexer" => array(
656     "icon" => "robot",
657     "title" => "bdcindexer",
658     "rule" => array(
659     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
660     ),
661     "uri" => "http://www.business.com/"
662     ),
663     "bdfetch" => array(
664     "icon" => "robot",
665     "title" => "BDFetch",
666     "rule" => array(
667     "^BDFetch" => ""
668     ),
669     "uri" => ""
670     ),
671     "bdncentral" => array(
672     "icon" => "robot",
673     "title" => "Bdncentral",
674     "rule" => array(
675     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
676     ),
677     "uri" => "http://www.bdncentral.com/robot.html"
678     ),
679     "beammachine" => array(
680     "icon" => "robot",
681     "title" => "BeamMachine",
682     "rule" => array(
683     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
684     ),
685     "uri" => "http://www.beammachine.net/"
686     ),
687     "become" => array(
688     "icon" => "become",
689     "title" => "Become",
690     "rule" => array(
691     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
692     "(BecomeBot|Exabot)@exava\.com\)$" => ""
693     ),
694     "uri" => "http://www.become.com/"
695     ),
696     "beebware" => array(
697     "icon" => "robot",
698     "title" => "Beebware",
699     "rule" => array(
700     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // pattern has a single capture group, so the digits-and-dots match is \1
701     ),
702     "uri" => ""
703     ),
704     "bigbrother" => array(
705     "icon" => "robot",
706     "title" => "Big Brother",
707     "rule" => array(
708     "^Big Brother" => ""
709     ),
710     "uri" => "http://pauillac.inria.fr/~fpottier/"
711     ),
712     "bigclique" => array(
713     "icon" => "robot",
714     "title" => "BigClique",
715     "rule" => array(
716     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
717     ),
718     "uri" => "http://www.bigclique.com"
719     ),
720     "biglotron" => array(
721     "icon" => "robot",
722     "title" => "Biglotron",
723     "rule" => array(
724     "^BIGLOTRON" => ""
725     ),
726     "uri" => "http://www.bigclique.com"
727     ),
728     "bigsearch" => array(
729     "icon" => "bigsearch",
730     "title" => "Bigsearch",
731     "rule" => array(
732     "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped so it only matches a literal "."
733     ),
734     "uri" => ""
735     ),
736     "bilbo" => array(
737     "icon" => "robot",
738     "title" => "Bilbo",
739     "rule" => array(
740     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
741     ),
742     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
743     ),
744     "bilgi" => array(
745     "icon" => "bilgi",
746     "title" => "Bilgi",
747     "rule" => array(
748     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta"; the digits-and-dots match is group 2
749     ),
750     "uri" => "http://www.bilgi.com/"
751     ),
752     "bitacle" => array(
753     "icon" => "bitacle",
754     "title" => "Bitacle",
755     "rule" => array(
756     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
757     ),
758     "uri" => "http://bitacle.org/"
759     ),
760     "bitbeamer" => array(
761     "icon" => "bitbeamer",
762     "title" => "BitBeamer",
763     "rule" => array(
764     "BitBeamer/([0-9.]{1,10})" => "\\1"
765     ),
766     "uri" => ""
767     ),
768     "biz360" => array(
769     "icon" => "biz360",
770     "title" => "Biz360",
771     "rule" => array(
772     "^Biz360 spider" => ""
773     ),
774     "uri" => ""
775     ),
776     "backlinktest" => array(
777     "icon" => "backlinktest",
778     "title" => "BacklinkCrawler",
779     "rule" => array(
780     "BacklinkCrawler" => ""
781     ),
782     "uri" => "http://www.backlinktest.com/crawler.html"
783     ),
784     "blaizbee" => array(
785     "icon" => "blaiz-bee",
786     "title" => "Blaiz-Bee",
787     "rule" => array(
788     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // emit the captured digits-and-dots group, like the other capturing rules
789     ),
790     "uri" => ""
791     ),
792     "blogbeat" => array(
793     "icon" => "robot",
794     "title" => "BlogBeat",
795     "rule" => array(
796     "BlogBeat/?([0-9.]{1,10})" => "\\1",
797     ),
798     "uri" => "http://www.blogbeat.nl"
799     ),
800     "blogbotde" => array(
801     "icon" => "robot",
802     "title" => "blogbot.de",
803     "rule" => array(
804     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
805     ),
806     "uri" => "http://blogbot.de/"
807     ),
808     "blogcensus" => array(
809     "icon" => "blogcensus",
810     "title" => "Blogcensus",
811     "rule" => array(
812     "^Blogcensus" => "",
813     ),
814     "uri" => "http://blogcensus.de/bot/"
815     ),
816     "blogdex" => array(
817     "icon" => "robot",
818     "title" => "Blogdex",
819     "rule" => array(
820     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
821     ),
822     "uri" => ""
823     ),
824     "blogg" => array(
825     "icon" => "blogg",
826     "title" => "Blogg",
827     "rule" => array(
828     "^blogg\.de" => ""
829     ),
830     "uri" => ""
831     ),
832     "blogland" => array(
833     "icon" => "robot",
834     "title" => "BlogLand",
835     "rule" => array(
836     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
837     ),
838     "uri" => ""
839     ),
840     "bloglines" => array(
841     "icon" => "bloglines",
842     "title" => "Bloglines",
843     "rule" => array(
844     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
845     "Bloglines" => ""
846     ),
847     "uri" => ""
848     ),
849     "blogmap" => array(
850     "icon" => "robot",
851     "title" => "Blogmap",
852     "rule" => array(
853     "blogmap" => ""
854     ),
855     "uri" => ""
856     ),
857     "blogosphere" => array(
858     "icon" => "robot",
859     "title" => "Blogosphere",
860     "rule" => array(
861     "Blogosphere" => ""
862     ),
863     "uri" => ""
864     ),
865     "blogpeople" => array(
866     "icon" => "robot",
867     "title" => "BlogPeople",
868     "rule" => array(
869     "BlogPeople" => ""
870     ),
871     "uri" => ""
872     ),
873     "blogpulse" => array(
874     "icon" => "blogpulse",
875     "title" => "Blogpulse",
876     "rule" => array(
877     "Blogpulse" => ""
878     ),
879     "uri" => ""
880     ),
881     "blogranking" => array(
882     "icon" => "blogranking",
883     "title" => "BlogRanking",
884     "rule" => array(
885     "^BlogRanking(/RSS checker)?" => ""
886     ),
887     "uri" => ""
888     ),
889     "blogs" => array(
890     "icon" => "blogs",
891     "title" => "Blo.gs",
892     "rule" => array(
893     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
894     "blo\.gs" => ""
895     ),
896     "uri" => ""
897     ),
898     "blogshares" => array(
899     "icon" => "blogshares",
900     "title" => "BlogShares",
901     "rule" => array(
902     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
903     "(^| |\()Blogshares(\.com| |\))" => ""
904     ),
905     "uri" => ""
906     ),
907     "blogslife" => array(
908     "icon" => "robot",
909     "title" => "BlogsLife",
910     "rule" => array(
911     "Blogslive" => ""
912     ),
913     "uri" => ""
914     ),
915     "blogsnow" => array(
916     "icon" => "blogsnow",
917     "title" => "BlogsNow",
918     "rule" => array(
919     "blogsnowbot" => "",
920     "BlogsNow" => ""
921     ),
922     "uri" => ""
923     ),
924     "blogstreet" => array(
925     "icon" => "blogstreet",
926     "title" => "BlogStreet",
927     "rule" => array(
928     "^BlogStreetBot" => ""
929     ),
930     "uri" => ""
931     ),
932     "blogsurf" => array(
933     "icon" => "robot",
934     "title" => "BlogSurf",
935     "rule" => array(
936     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
937     ),
938     "uri" => ""
939     ),
940     "blogtick" => array(
941     "icon" => "robot",
942     "title" => "BlogTick",
943     "rule" => array(
944     "BlogTickServer" => ""
945     ),
946     "uri" => ""
947     ),
948     "blogwatcher" => array(
949     "icon" => "blogwatcher",
950     "title" => "Blogwatcher",
951     "rule" => array(
952     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
953     ),
954     "uri" => ""
955     ),
956     "blogwise" => array(
957     "icon" => "blogwise",
958     "title" => "Blogwise",
959     "rule" => array(
960     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
961     ),
962     "uri" => ""
963     ),
964     "boardreader" => array(
965     "icon" => "boardreader",
966     "title" => "BoardReader",
967     "rule" => array(
968     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
969     ),
970     "uri" => "http://www.boardreader.com"
971     ),
972     "bobby" => array(
973     "icon" => "bobby",
974     "title" => "Bobby",
975     "rule" => array(
976     "bobby[ /]([0-9.]{1,10})" => "\\1"
977     ),
978     "uri" => ""
979     ),
980     "boitho" => array(
981     "icon" => "robot",
982     "title" => "Boitho",
983     "rule" => array(
984     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
985     ),
986     "uri" => ""
987     ),
988     "booch" => array(
989     "icon" => "robot",
990     "title" => "Booch",
991     "rule" => array(
992     "^booch[_ /]([0-9.]{1,10})" => "\\1"
993     ),
994     "uri" => ""
995     ),
996     "book" => array(
997     "icon" => "book",
998     "title" => "Bookmark",
999     "rule" => array(
1000     "http://www\.bookmark\.ne\.jp" => ""
1001     ),
1002     "uri" => ""
1003     ),
1004     "bookdog" => array(
1005     "icon" => "bookdog",
1006     "title" => "Bookdog",
1007     "rule" => array(
1008     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1009     ),
1010     "uri" => ""
1011     ),
1012     "bordermanager" => array(
1013     "icon" => "bordermanager",
1014     "title" => "Border Manager",
1015     "rule" => array(
1016     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1017     ),
1018     "uri" => ""
1019     ),
1020     "botonparade" => array(
1021     "icon" => "botonparade",
1022     "title" => "Bot on Parade",
1023     "rule" => array(
1024     "BotOnParade" => ""
1025     ),
1026     "uri" => "http://www.bots-on-para.de/bot.html"
1027     ),
1028     "botje" => array(
1029     "icon" => "botje",
1030     "title" => "Botje",
1031     "rule" => array(
1032     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1033     ),
1034     "uri" => "http://www.botje.com/"
1035     ),
1036     "bottomfeeder" => array(
1037     "icon" => "bottomfeeder",
1038     "title" => "BottomFeeder",
1039     "rule" => array(
1040     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1041     ),
1042     "uri" => ""
1043     ),
1044     "browseremulator" => array(
1045     "icon" => "browseremulator",
1046     "title" => "BrowserEmulator",
1047     "rule" => array(
1048     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1049     ),
1050     "uri" => "http://www.dejavu.org/emulator.htm"
1051     ),
1052     "browsershots" => array(
1053     "icon" => "browsershots",
1054     "title" => "Browsershots",
1055     "rule" => array(
1056     "Browsershots URL Check" => ""
1057     ),
1058     "uri" => "http://browsershots.org"
1059     ),
1060     "browserspy" => array(
1061     "icon" => "robot",
1062     "title" => "BrowserSpy",
1063     "rule" => array(
1064     "BrowserSpy" => ""
1065     ),
1066     "uri" => ""
1067     ),
1068     "bruinbot" => array(
1069     "icon" => "robot",
1070     "title" => "BruinBot",
1071     "rule" => array(
1072     "BruinBot" => ""
1073     ),
1074     "uri" => ""
1075     ),
1076     "bruno" => array(
1077     "icon" => "robot",
1078     "title" => "Bruno",
1079     "rule" => array(
1080     "^Bruno" => ""
1081     ),
1082     "uri" => ""
1083     ),
1084     "btbot" => array(
1085     "icon" => "btbot",
1086     "title" => "BitTorrent",
1087     "rule" => array(
1088     "BTbot/([0-9.]{1,10})" => "\\1"
1089     ),
1090     "uri" => ""
1091     ),
1092 joku 380 "bubing" => array(
1093     "icon" => "robot",
1094     "title" => "BUbiNG",
1095     "rule" => array(
1096     "BUbiNG" => ""
1097     ),
1098     "uri" => "http://law.di.unimi.it/BUbiNG.html"
1099     ),
1100 joku 63 "builtwith" => array(
1101     "icon" => "builtwith",
1102     "title" => "BuiltWith",
1103     "rule" => array(
1104     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1105     ),
1106     "uri" => "http://builtwith.com/bot.html"
1107     ),
1108     "bulkfeeds" => array(
1109     "icon" => "robot",
1110     "title" => "Bulkfeeds",
1111     "rule" => array(
1112     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1113     ),
1114     "uri" => ""
1115     ),
1116     "burf" => array(
1117     "icon" => "burf",
1118     "title" => "Burf.com",
1119     "rule" => array(
1120     "^Norbert the Spider" => ""
1121     ),
1122     "uri" => "http://www.burf.com/"
1123     ),
1124     "butch" => array(
1125     "icon" => "robot",
1126     "title" => "Butch",
1127     "rule" => array(
1128     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1129     ),
1130     "uri" => ""
1131     ),
1132     "buzzlogic" => array(
1133     "icon" => "buzzlogic",
1134     "title" => "Buzzlogic",
1135     "rule" => array(
1136     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1137     ),
1138     "uri" => "http://www.buzzlogic.com"
1139     ),
1140     "catchbot" => array(
1141     "icon" => "catchbot",
1142     "title" => "CatchBot",
1143     "rule" => array(
1144     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.catchbot.com"
1147     ),
1148     "camdiscover" => array(
1149     "icon" => "robot",
1150     "title" => "Camdiscover",
1151     "rule" => array(
1152     "^Camcrawler" => ""
1153     ),
1154     "uri" => ""
1155     ),
1156     "cazoodle" => array(
1157     "icon" => "cazoodle",
1158     "title" => "Cazoodle",
1159     "rule" => array(
1160     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1161     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1162     ),
1163     "uri" => "http://www.cazoodle.com/cazoodlebot"
1164     ),
1165     "ccbot" => array(
1166     "icon" => "robot",
1167     "title" => "ccBot",
1168     "rule" => array(
1169     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1170     ),
1171     "uri" => "http://www.commoncrawl.org/bot.html"
1172     ),
1173     "ccgcrawl" => array(
1174     "icon" => "robot",
1175     "title" => "CCGCrawl",
1176     "rule" => array(
1177     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1178     ),
1179     "uri" => "http://www.myworkbase.com/bot.html"
1180     ),
1181     "cerberian" => array(
1182     "icon" => "robot",
1183     "title" => "Cerberian Drtrs",
1184     "rule" => array(
1185     "^Cerberian Drtrs" => ""
1186     ),
1187     "uri" => ""
1188     ),
1189     "cfnetwork" => array(
1190     "icon" => "robot",
1191     "title" => "CFNetwork", // own display name; previously duplicated the "cerberian" entry's title
1192     "rule" => array(
1193     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1" // \\1 = the dotted number captured after the name
1194     ),
1195     "uri" => "http://www.cfnetwork.be/"
1196     ),
1197     "charlotte" => array(
1198     "icon" => "charlotte",
1199     "title" => "Charlotte",
1200     "rule" => array(
1201     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1202     ),
1203     "uri" => ""
1204     ),
1205     "cirilizator" => array(
1206     "icon" => "cirilizator",
1207     "title" => "Cirilizator",
1208     "rule" => array(
1209     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1210     ),
1211     "uri" => ""
1212     ),
1213     "claria" => array(
1214     "icon" => "robot",
1215     "title" => "Claria",
1216     "rule" => array(
1217     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1218     "(Claria|Diamond)(Bot)" => ""
1219     ),
1220     "uri" => ""
1221     ),
1222     "claymont" => array(
1223     "icon" => "claymont",
1224     "title" => "Claymont",
1225     "rule" => array(
1226     "claymont\.com" => "",
1227     "OliverPerry" => ""
1228     ),
1229     "uri" => "http://www.claymont.com"
1230     ),
1231 joku 377 "clipinc" => array(
1232     "icon" => "clipinc",
1233     "title" => "ClipInc",
1234     "rule" => array(
1235     "ClipInc" => ""
1236     ),
1237     "uri" => "http://tobit.software"
1238     ),
1239 joku 63 "clush" => array(
1240     "icon" => "clush",
1241     "title" => "Clush",
1242     "rule" => array(
1243     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1244     ),
1245     "uri" => ""
1246     ),
1247     "cmsworldmap" => array(
1248     "icon" => "cmsworldmap",
1249     "title" => "CMS World Map",
1250     "rule" => array(
1251     "cmsworldmap" => ""
1252     ),
1253     "uri" => "http://www.cmsworldmap.com/"
1254     ),
1255     "cobion" => array(
1256     "icon" => "robot",
1257     "title" => "Cobion",
1258     "rule" => array(
1259     " (QXW03018|obot)\)" => ""
1260     ),
1261     "uri" => ""
1262     ),
1263     "coccoc" => array(
1264 matthys 287 "icon" => "coccoc",
1265 matthys 209 "title" => "Coccoc",
1266 joku 63 "rule" => array(
1267     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1268     ),
1269 matthys 287 "uri" => "http://help.coccoc.com"
1270 joku 63 ),
1271     "coldfusion" => array(
1272     "icon" => "coldfusion",
1273     "title" => "ColdFusion",
1274     "rule" => array(
1275     "^coldfusion" => ""
1276     ),
1277     "uri" => ""
1278     ),
1279     "combine" => array(
1280     "icon" => "robot",
1281     "title" => "Combine",
1282     "rule" => array(
1283     "Combine[ /]([0-9.]{1,10})" => "\\1"
1284     ),
1285     "uri" => ""
1286     ),
1287     "combot" => array(
1288     "icon" => "robot",
1289     "title" => "comBot",
1290     "rule" => array(
1291     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1292     ),
1293     "uri" => ""
1294     ),
1295     "comet" => array(
1296     "icon" => "comet",
1297     "title" => "Comet",
1298     "rule" => array(
1299     "cometsearch@cometsystems" => ""
1300     ),
1301     "uri" => ""
1302     ),
1303     "commerobo" => array(
1304     "icon" => "robot",
1305     "title" => "Commerobo",
1306     "rule" => array(
1307     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1308     ),
1309     "uri" => ""
1310     ),
1311     "comrite" => array(
1312     "icon" => "robot",
1313     "title" => "ComRite",
1314     "rule" => array(
1315     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1316     ),
1317     "uri" => "http://www.comrite.com/"
1318     ),
1319     "convera" => array(
1320     "icon" => "convera",
1321     "title" => "Convera",
1322     "rule" => array(
1323     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1324     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1325     ),
1326     "uri" => ""
1327     ),
1328     "coolbot" => array(
1329     "icon" => "robot",
1330     "title" => "CoolBot",
1331     "rule" => array(
1332     "^CoolBot" => ""
1333     ),
1334     "uri" => ""
1335     ),
1336     "cosmix" => array(
1337     "icon" => "robot",
1338     "title" => "Cosmix",
1339     "rule" => array(
1340     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1341     ),
1342     "uri" => ""
1343     ),
1344     "cosmos" => array(
1345     "icon" => "robot",
1346     "title" => "Cosmos",
1347     "rule" => array(
1348     "^cosmos" => ""
1349     ),
1350     "uri" => ""
1351     ),
1352     "cosmoty" => array(
1353     "icon" => "robot",
1354     "title" => "Cosmoty",
1355     "rule" => array(
1356     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1357     ),
1358     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1359     ),
1360     "covario" => array(
1361     "icon" => "covario",
1362     "title" => "Covario",
1363     "rule" => array(
1364     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1365     ),
1366     "uri" => "http://www.covario.com/ids/"
1367     ),
1368     "creativecommons" => array(
1369     "icon" => "creativecommons",
1370     "title" => "Creative Commons",
1371     "rule" => array(
1372     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1373     ),
1374     "uri" => ""
1375     ),
1376     "cscrawler" => array(
1377     "icon" => "robot",
1378     "title" => "CsCrawler",
1379     "rule" => array(
1380     "CsCrawler" => ""
1381     ),
1382     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1383     ),
1384 joku 111 "jigsaw" => array(
1385     "icon" => "jigsaw",
1386     "title" => "Jigsaw",
1387     "rule" => array(
1388     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1389     ),
1390     "uri" => "http://jigsaw.w3.org/css-validator/"
1391     ),
1392 joku 63 "csscheck" => array(
1393     "icon" => "w3c",
1394     "title" => "W3C CSS Validator",
1395     "rule" => array(
1396     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1397     ),
1398     "uri" => "http://jigsaw.w3.org/css-validator/"
1399     ),
1400     "custo" => array(
1401     "icon" => "robot",
1402     "title" => "Custo",
1403     "rule" => array(
1404     "Custo[ /]([0-9.]{1,10})" => "\\1"
1405     ),
1406     "uri" => ""
1407     ),
1408     "cybernavi" => array(
1409     "icon" => "robot",
1410     "title" => "CyberNavi",
1411     "rule" => array(
1412     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1413     ),
1414     "uri" => ""
1415     ),
1416     "cyberpatrol" => array(
1417     "icon" => "cyberpatrol",
1418     "title" => "CyberPatrol",
1419     "rule" => array(
1420     "^CyberPatrol" => ""
1421     ),
1422     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1423     ),
1424     "cyberz" => array(
1425     "icon" => "cyberz",
1426     "title" => "Cyberz",
1427     "rule" => array(
1428     "Cyberz Communication Agent" => ""
1429     ),
1430     "uri" => ""
1431     ),
1432     "cydral" => array(
1433     "icon" => "robot",
1434     "title" => "Cydral",
1435     "rule" => array(
1436     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1437     ),
1438     "uri" => ""
1439     ),
1440     "cynthia" => array(
1441     "icon" => "cynthia",
1442     "title" => "Cynthia Says",
1443     "rule" => array(
1444     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1445     ),
1446     "uri" => ""
1447     ),
1448     "d4x" => array(
1449     "icon" => "d4x",
1450     "title" => "Downloader for X",
1451     "rule" => array(
1452     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1453     ),
1454     "uri" => ""
1455     ),
1456     "da" => array(
1457     "icon" => "da",
1458     "title" => "DA",
1459     "rule" => array(
1460     "^DA[ /]([0-9.]{1,10})" => "\\1"
1461     ),
1462     "uri" => ""
1463     ),
1464     "daum" => array(
1465     "icon" => "daum",
1466     "title" => "DAUM",
1467     "rule" => array(
1468     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1469 joku 379 "Daum[ /]([0-9.]{1,10})" => "\\1",
1470 joku 63 "DAUM Web Robot" => "",
1471 joku 339 "daum\.net" => "", // dot escaped so only the literal host name matches
1472 joku 63 "Daum Communications Corp" => "",
1473     "EDI[ /]([0-9.]{1,10})" => "\\1",
1474     "Edacious.*Intelligent Web Robot" => "",
1475     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1476     ),
1477     "uri" => "http://ws.daum.net/"
1478     ),
1479     "daypop" => array(
1480     "icon" => "robot",
1481     "title" => "Daypop",
1482     "rule" => array(
1483     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1484     ),
1485     "uri" => ""
1486     ),
1487     "delfi" => array(
1488     "icon" => "delfi",
1489     "title" => "Delfi",
1490     "rule" => array(
1491     "crawl at delfi dot lt" => ""
1492     ),
1493     "uri" => ""
1494     ),
1495     "depspid" => array(
1496     "icon" => "depspid",
1497     "title" => "DepSpid",
1498     "rule" => array(
1499     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1500     ),
1501     "uri" => ""
1502     ),
1503     "devonagent" => array(
1504     "icon" => "devonagent",
1505     "title" => "DEVONagent",
1506     "rule" => array(
1507     "DEVONtech" => ""
1508     ),
1509     "uri" => ""
1510     ),
1511     "diffbot" => array(
1512     "icon" => "diffbot",
1513     "title" => "Diffbot",
1514     "rule" => array(
1515     " Diffbot" => ""
1516     ),
1517     "uri" => "http://www.diffbot.com"
1518     ),
1519     "diribot" => array(
1520     "icon" => "diribot",
1521     "title" => "Diri",
1522     "rule" => array(
1523     "diribot" => ""
1524     ),
1525     "uri" => "http://www.diri.bg"
1526     ),
1527     "directhit" => array(
1528     "icon" => "robot",
1529     "title" => "Direct Hit",
1530     "rule" => array(
1531     "EZResult -- Internet Search Engine" => ""
1532     ),
1533     "uri" => "http://www.directhit.com"
1534     ),
1535     "disco" => array(
1536     "icon" => "disco",
1537 matthys 209 "title" => "Disco",
1538 joku 63 "rule" => array(
1539     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1540     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1541     "disco-crawl@discoveryengine.com" => ""
1542     ),
1543     "uri" => "http://www.discoveryengine.com/"
1544     ),
1545     "discopump" => array(
1546     "icon" => "robot",
1547     "title" => "DISCo Pump",
1548     "rule" => array(
1549     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1550     ),
1551     "uri" => ""
1552     ),
1553     "dkimreputation" => array(
1554     "icon" => "dkimreputation",
1555     "title" => "DKIM Reputation",
1556     "rule" => array(
1557     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1558     ),
1559     "uri" => "http://www.dkim-reputation.org"
1560     ),
1561     "dnsdigger" => array(
1562     "icon" => "dnsdigger",
1563     "title" => "DNS-Digger",
1564     "rule" => array(
1565     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1566     ),
1567     "uri" => "http://www.dnsdigger.com"
1568     ),
1569     "dnsvalidation" => array(
1570     "icon" => "dnsvalidation",
1571     "title" => "DNS Validation",
1572     "rule" => array(
1573     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1574     ),
1575     "uri" => "http://www.dnsvalidation.com/"
1576     ),
1577     "doctorhtml" => array(
1578     "icon" => "robot",
1579     "title" => "DoctorHTML",
1580     "rule" => array(
1581     "Doctor[ \-]?HTML" => ""
1582     ),
1583     "uri" => ""
1584     ),
1585     "dolphin" => array(
1586     "icon" => "dolphin",
1587     "title" => "Dolphin",
1588     "rule" => array(
1589     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1590     ),
1591     "uri" => "http://telehouse.ru/crawler.html"
1592     ),
1593     "domaindatei" => array(
1594     "icon" => "robot",
1595     "title" => "Domaindatei",
1596     "rule" => array(
1597     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1598     ),
1599     "uri" => ""
1600     ),
1601     "dontbuylists" => array(
1602     "icon" => "dontbuylists",
1603     "title" => "Dontbuylists",
1604     "rule" => array(
1605     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1606     ),
1607     "uri" => "http://www.dontbuylists.com"
1608     ),
1609     "dotbot" => array(
1610     "icon" => "robot",
1611     "title" => "DotBot",
1612     "rule" => array(
1613     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1614     ),
1615     "uri" => "http://www.dotnetdotcom.org"
1616     ),
1617     "doweb" => array(
1618     "icon" => "doweb",
1619     "title" => "DoWeb",
1620     "rule" => array(
1621     "^www\.doweb\.co\.uk" => "" // dots escaped: match the literal host name at the start of the agent string
1622     ),
1623     "uri" => "http://www.doweb.co.uk/"
1624     ),
1625     "downforeveryoneorjustme" => array(
1626     "icon" => "downforeveryoneorjustme",
1627     "title" => "Down for everyone or just me",
1628     "rule" => array(
1629     "downforeveryoneorjustme" => ""
1630     ),
1631     "uri" => "http://www.downforeveryoneorjustme.com"
1632     ),
1633     "downloadninja" => array(
1634     "icon" => "robot",
1635     "title" => "Download Ninja",
1636     "rule" => array(
1637     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1638     ),
1639     "uri" => ""
1640     ),
1641     "drupal" => array(
1642     "icon" => "drupal",
1643     "title" => "Drupal",
1644     "rule" => array(
1645     "^Drupal" => ""
1646     ),
1647     "uri" => ""
1648     ),
1649     "dsns" => array(
1650     "icon" => "robot",
1651     "title" => "DSNS Scanner",
1652     "rule" => array(
1653     "^DSNS" => ""
1654     ),
1655     "uri" => ""
1656     ),
1657     "dtsagent" => array(
1658     "icon" => "robot",
1659     "title" => "DTS Agent",
1660     "rule" => array(
1661     "DTS Agent" => ""
1662     ),
1663     "uri" => ""
1664     ),
1665 matthys 342 "duckduckgo" => array(
1666     "icon" => "duckduckgo",
1667     "title" => "DuckDuckGo",
1668     "rule" => array(
1669     "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1"
1670     ),
1671     "uri" => "http://duckduckgo.com"
1672     ),
1673 joku 63 "earthcom" => array(
1674     "icon" => "earthcom",
1675     "title" => "Earthcom",
1676     "rule" => array(
1677     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1678     ),
1679     "uri" => ""
1680     ),
1681     "ebay" => array(
1682     "icon" => "ebay",
1683     "title" => "eBay",
1684     "rule" => array(
1685     "eBay Relevance Ad Crawler" => ""
1686     ),
1687     "uri" => ""
1688     ),
1689     "echo" => array(
1690     "icon" => "robot",
1691     "title" => "Echo.com",
1692     "rule" => array(
1693     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1694     ),
1695     "uri" => "http://www.echo.com/"
1696     ),
1697     "eert" => array(
1698     "icon" => "robot",
1699 matthys 209 "title" => "Eert",
1700 joku 63 "rule" => array(
1701     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1702     ),
1703     "uri" => "http://bot.eert.net"
1704     ),
1705     "eknip" => array(
1706     "icon" => "eknip",
1707     "title" => "E-Knip",
1708     "rule" => array(
1709     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1710     ),
1711     "uri" => ""
1712     ),
1713     "zoominfo" => array(
1714     "icon" => "zoominfo",
1715 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1716 joku 63 "rule" => array(
1717     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1718     ),
1719     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1720     ),
1721     "emeraldshield" => array(
1722     "icon" => "emeraldshield",
1723     "title" => "EmeraldShield",
1724     "rule" => array(
1725     "^EmeraldShield" => ""
1726     ),
1727     "uri" => ""
1728     ),
1729     "empas" => array(
1730     "icon" => "empas",
1731     "title" => "Empas",
1732     "rule" => array(
1733     "DigExt; empas\)$" => "",
1734     "^EMPAS[_\-]ROBOT" => ""
1735     ),
1736     "uri" => ""
1737     ),
1738     "entireweb" => array(
1739     "icon" => "entireweb",
1740     "title" => "Entireweb",
1741     "rule" => array(
1742     "Speedy[ ]?Spider" => ""
1743     ),
1744     "uri" => ""
1745     ),
1746     "envolk" => array(
1747     "icon" => "envolk",
1748     "title" => "Envolk",
1749     "rule" => array(
1750     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1751     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1752     ),
1753     "uri" => ""
1754     ),
1755     "esnet" => array(
1756     "icon" => "robot",
1757     "title" => "ES.NET",
1758     "rule" => array(
1759     "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped: "ES.NET" is a literal name, not "any character"
1760     ),
1761     "uri" => ""
1762     ),
1763     "estyle" => array(
1764     "icon" => "estyle",
1765     "title" => "eStyle Search",
1766     "rule" => array(
1767     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1768     ),
1769     "uri" => ""
1770     ),
1771     "eurip" => array(
1772     "icon" => "robot",
1773     "title" => "Eurip",
1774     "rule" => array(
1775     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1776     ),
1777     "uri" => "http://www.eurip.com"
1778     ),
1779     "eurodirectory" => array(
1780     "icon" => "robot",
1781     "title" => "Euro Directory",
1782     "rule" => array(
1783     "www\.euro-directory\.com" => ""
1784     ),
1785     "uri" => "http://www.euro-directory.com/"
1786     ),
1787     "euroseek" => array(
1788     "icon" => "euroseek",
1789     "title" => "EuroSeek",
1790     "rule" => array(
1791     "Arachnoidea" => ""
1792     ),
1793     "uri" => ""
1794     ),
1795     "evaal" => array(
1796     "icon" => "evaal",
1797     "title" => "Evaal",
1798     "rule" => array(
1799     "^EvaalSE" => ""
1800     ),
1801     "uri" => "http://www.evaal.com/"
1802     ),
1803     "eventax" => array(
1804     "icon" => "eventax",
1805     "title" => "Eventax",
1806     "rule" => array(
1807     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1808     ),
1809     "uri" => "http://www.eventax.de/"
1810     ),
1811     "everbee" => array(
1812     "icon" => "everbee",
1813     "title" => "Everbee",
1814     "rule" => array(
1815     "EverbeeCrawler" => ""
1816     ),
1817     "uri" => ""
1818     ),
1819     "everest" => array(
1820     "icon" => "everest",
1821     "title" => "Everest",
1822     "rule" => array(
1823     "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // "Inc." ends in a literal dot, so it is escaped
1824     ),
1825     "uri" => ""
1826     ),
1827     "exabot" => array(
1828     "icon" => "exabot",
1829     "title" => "ExaBot",
1830     "rule" => array(
1831     "^NG[ /]([0-9.]{1,10})" => "\\1",
1832     "Exabot/([0-9.]{1,10})" => "\\1",
1833     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1834     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1835     "ExaBot-Thumbnails" => ""
1836     ),
1837     "uri" => "http://www.exabot.com/go/robot"
1838     ),
1839     "exactseek" => array(
1840     "icon" => "exactseek",
1841     "title" => "ExactSeek",
1842     "rule" => array(
1843     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1844     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1845     ),
1846     "uri" => "http://www.exactseek.com/"
1847     ),
1848     "excite" => array(
1849     "icon" => "excite",
1850     "title" => "Excite",
1851     "rule" => array(
1852     "Architext[ \-]?Spider" => ""
1853     ),
1854     "uri" => ""
1855     ),
1856     "execrawl" => array(
1857     "icon" => "robot",
1858     "title" => "Execrawl",
1859     "rule" => array(
1860     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1861     "Execrawl" => ""
1862     ),
1863     "uri" => ""
1864     ),
1865     "expertmonitor" => array(
1866     "icon" => "robot",
1867     "title" => "ExpertMonitor",
1868     "rule" => array(
1869     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1870     ),
1871     "uri" => ""
1872     ),
1873     "explorerrss" => array(
1874     "icon" => "robot",
1875     "title" => "Explorer RSS",
1876     "rule" => array(
1877     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1878     ),
1879     "uri" => ""
1880     ),
1881     "ezooms" => array(
1882     "icon" => "robot",
1883     "title" => "Ezooms",
1884     "rule" => array(
1885     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1886     ),
1887     "uri" => ""
1888     ),
1889     "facebook" => array(
1890     "icon" => "facebook",
1891     "title" => "Facebook",
1892     "rule" => array(
1893     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1894     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1895     "^facebook" => ""
1896     ),
1897     "uri" => "http://www.facebook.com/"
1898     ),
1899     "fast" => array(
1900     "icon" => "fast",
1901     "title" => "Fast",
1902     "rule" => array(
1903     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1904     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1905     "^Fast Crawler" => "",
1906     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1907     ),
1908     "uri" => "http://www.alltheweb.com/"
1909     ),
1910     "fastbuzz" => array(
1911     "icon" => "fastbuzz",
1912     "title" => "Fastbuzz",
1913     "rule" => array(
1914     "^fastbuzz\.com" => ""
1915     ),
1916     "uri" => ""
1917     ),
1918     "favorg" => array(
1919     "icon" => "robot",
1920     "title" => "FavOrg",
1921     "rule" => array(
1922     "^FavOrg" => ""
1923     ),
1924     "uri" => ""
1925     ),
1926     "favorstar" => array(
1927     "icon" => "favorstar",
1928 matthys 209 "title" => "Favorstar",
1929 joku 63 "rule" => array(
1930     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1931     ),
1932     "uri" => "http://favorstar.com/bot.html"
1933     ),
1934     "faxo" => array(
1935     "icon" => "robot",
1936     "title" => "Faxo",
1937     "rule" => array(
1938     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1939     ),
1940     "uri" => "http://www.faxo.com/"
1941     ),
1942     "fdse" => array(
1943     "icon" => "robot",
1944     "title" => "FDSE Robot",
1945     "rule" => array(
1946     "FDSE[ \-]?robot" => ""
1947     ),
1948     "uri" => ""
1949     ),
1950     "feedback" => array(
1951     "icon" => "robot",
1952     "title" => "FeedBack",
1953     "rule" => array(
1954     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1955     ),
1956     "uri" => ""
1957     ),
1958     "feedburner" => array(
1959     "icon" => "feedburner",
1960     "title" => "FeedBurner",
1961     "rule" => array(
1962     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1963     ),
1964     "uri" => ""
1965     ),
1966     "feeddemon" => array(
1967     "icon" => "feeddemon",
1968     "title" => "FeedDemon",
1969     "rule" => array(
1970     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1971     ),
1972     "uri" => ""
1973     ),
1974     "feedfind" => array(
1975     "icon" => "feedfind",
1976     "title" => "FeedFind",
1977     "rule" => array(
1978     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1979     ),
1980     "uri" => ""
1981     ),
1982     "feedonfeeds" => array(
1983     "icon" => "robot",
1984     "title" => "Feed On Feeds",
1985     "rule" => array(
1986     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1987     ),
1988     "uri" => ""
1989     ),
1990     "feedparser" => array(
1991     "icon" => "robot",
1992     "title" => "Feedparser",
1993     "rule" => array(
1994     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1995     "FeedParser" => ""
1996     ),
1997     "uri" => ""
1998     ),
1999     "feedreader" => array(
2000     "icon" => "feedreader",
2001     "title" => "Feedreader",
2002     "rule" => array(
2003     "^Feedreader" => ""
2004     ),
2005     "uri" => ""
2006     ),
2007     "feedserver" => array(
2008     "icon" => "robot",
2009     "title" => "FeedServer",
2010     "rule" => array(
2011     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
2012     ),
2013     "uri" => ""
2014     ),
2015     "feedster" => array(
2016     "icon" => "feedster",
2017     "title" => "Feedster",
2018     "rule" => array(
2019     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2020     ),
2021     "uri" => ""
2022     ),
2023     "feedvalidator" => array(
2024     "icon" => "feedvalidator",
2025     "title" => "Feed Validator",
2026     "rule" => array(
2027     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2028     ),
2029     "uri" => ""
2030     ),
2031     "fdm" => array(
2032     "icon" => "robot",
2033     "title" => "Free Download Manager",
2034     "rule" => array(
2035     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2036     ),
2037     "uri" => ""
2038     ),
2039     "filangy" => array(
2040     "icon" => "robot",
2041     "title" => "Filangy",
2042     "rule" => array(
2043     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2044     ),
2045     "uri" => "http://www.filangy.com/"
2046     ),
2047     "findanisp" => array(
2048     "icon" => "robot",
2049     "title" => "FindAnISP",
2050     "rule" => array(
2051     "FindAnISP" => ""
2052     ),
2053     "uri" => "http://www.findanisp.com/"
2054     ),
2055     "findengines" => array(
2056     "icon" => "findengines",
2057     "title" => "FindEngines",
2058     "rule" => array(
2059     "FindEngines! Bot" => ""
2060     ),
2061     "uri" => ""
2062     ),
2063     "findexa" => array(
2064     "icon" => "findexa",
2065     "title" => "Findexa",
2066     "rule" => array(
2067     "Findexa Crawler" => ""
2068     ),
2069     "uri" => ""
2070     ),
2071     "findlinks" => array(
2072     "icon" => "findlinks",
2073     "title" => "FindLinks",
2074     "rule" => array(
2075     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2076     "^FindLinks" => ""
2077     ),
2078     "uri" => ""
2079     ),
2080     "findoor" => array(
2081     "icon" => "findoor",
2082 matthys 209 "title" => "Findoor",
2083 joku 63 "rule" => array(
2084     "^findoor(-Bot)?" => "" // no version is captured: group 1 is only the optional "-Bot" suffix
2085     ),
2086     "uri" => ""
2087     ),
2088     "firefly" => array(
2089     "icon" => "firefly",
2090     "title" => "Firefly",
2091     "rule" => array(
2092     "Firefly" => ""
2093     ),
2094     "uri" => ""
2095     ),
2096     "flashget" => array(
2097     "icon" => "flashget",
2098     "title" => "FlashGet",
2099     "rule" => array(
2100     "^FlashGet" => ""
2101     ),
2102     "uri" => ""
2103     ),
2104     "flatland" => array(
2105     "icon" => "flatland",
2106     "title" => "Flatland",
2107     "rule" => array(
2108     "^flatlandbot" => ""
2109     ),
2110     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2111     ),
2112     "flickbot" => array(
2113     "icon" => "flickbot",
2114     "title" => "FlickBot",
2115     "rule" => array(
2116     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2117     ),
2118     "uri" => ""
2119     ),
2120     "flightdeckreports" => array(
2121     "icon" => "flightdeckreports",
2122     "title" => "Flight Deck Reports",
2123     "rule" => array(
2124     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2125     ),
2126     "uri" => "http://www.flightdeckreports.com/"
2127     ),
2128     "forex" => array(
2129     "icon" => "robot",
2130     "title" => "Forex",
2131     "rule" => array(
2132     "^Forex Trading Network Organization" => ""
2133     ),
2134     "uri" => "http://www.netforex.org/"
2135     ),
2136     "freshmeat" => array(
2137     "icon" => "freshmeat",
2138 matthys 209 "title" => "Freshmeat",
2139 joku 63 "rule" => array(
2140     "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2141     "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped: literal host name
2142     ),
2143     "uri" => "http://www.freshmeat.net/"
2144     ),
2145     "friend" => array(
2146     "icon" => "friend",
2147     "title" => "Friend",
2148     "rule" => array(
2149     "www\.friend\.fr" => ""
2150     ),
2151     "uri" => "http://www.friend.fr/"
2152     ),
2153     "frontier" => array(
2154     "icon" => "frontier",
2155     "title" => "Frontier",
2156     "rule" => array(
2157     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2158     ),
2159     "uri" => ""
2160     ),
2161     "fyberspider" => array(
2162     "icon" => "robot",
2163     "title" => "FyberSpider",
2164     "rule" => array(
2165     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2166     ),
2167     "uri" => "http://www.fyberspider.com/"
2168     ),
2169     "gaisbot" => array(
2170     "icon" => "gais",
2171     "title" => "Gaisbot",
2172     "rule" => array(
2173     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2174     ),
2175     "uri" => ""
2176     ),
2177     "galaxy" => array(
2178     "icon" => "galaxy",
2179     "title" => "Galaxy",
2180     "rule" => array(
2181     "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2182     "www\.galaxy\.com" => "" // dots escaped so only the literal host name matches
2183     ),
2184     "uri" => "http://www.galaxy.com/"
2185     ),
2186     "gamespy" => array(
2187     "icon" => "gamespy",
2188     "title" => "GameSpy",
2189     "rule" => array(
2190     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2191     ),
2192     "uri" => ""
2193     ),
2194     "garlik" => array(
2195     "icon" => "garlik",
2196     "title" => "Garlik",
2197     "rule" => array(
2198     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2199     ),
2200     "uri" => "http://garlik.com/"
2201     ),
2202     "gdesktop" => array(
2203     "icon" => "gdesktop",
2204     "title" => "Google Desktop",
2205     "rule" => array(
2206     "compatible; Google Desktop" => ""
2207     ),
2208     "uri" => ""
2209     ),
2210     "genome" => array(
2211     "icon" => "robot",
2212     "title" => "Genome Machine",
2213     "rule" => array(
2214     "Genome[ \-]?Machine" => ""
2215     ),
2216     "uri" => ""
2217     ),
2218     "geohash" => array(
2219     "icon" => "geohash",
2220     "title" => "Geohash",
2221     "rule" => array(
2222     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2223     ),
2224     "uri" => "http://geohash.org/"
2225     ),
2226     "geona" => array(
2227     "icon" => "robot",
2228     "title" => "Geona",
2229     "rule" => array(
2230     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2231     ),
2232     "uri" => ""
2233     ),
2234     "geoblog" => array(
2235     "icon" => "robot",
2236     "title" => "The World as a Blog",
2237     "rule" => array(
2238     "The World as a Blog" => ""
2239     ),
2240     "uri" => ""
2241     ),
2242     "geourl" => array(
2243     "icon" => "geourl",
2244     "title" => "GeoUrl",
2245     "rule" => array(
2246     "geourl[ /]([0-9.]{1,10})" => "\\1",
2247     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2248     ),
2249     "uri" => ""
2250     ),
2251     "getnetwise" => array(
2252     "icon" => "robot",
2253     "title" => "GetNetWise",
2254     "rule" => array(
2255     " Crayon Crawler" => ""
2256     ),
2257     "uri" => ""
2258     ),
2259     "getright" => array(
2260     "icon" => "getright",
2261     "title" => "GetRight",
2262     "rule" => array(
2263     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2264     ),
2265     "uri" => ""
2266     ),
2267     "getsmart" => array(
2268     "icon" => "getsmart",
2269     "title" => "GetSmart",
2270     "rule" => array(
2271     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2272     ),
2273     "uri" => ""
2274     ),
2275     "gigabot" => array(
2276     "icon" => "gigablast",
2277     "title" => "Gigablast",
2278     "rule" => array(
2279     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2280     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2281 joku 336 "GigablastOpenSource" => ""
2282 joku 63 ),
2283     "uri" => ""
2284 matthys 328 ),
2285     "gimme" => array(
2286     "icon" => "gimme",
2287     "title" => "gimmeUSA",
2288     "rule" => array(
2289     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2290     ),
2291     "uri" => "http://gimme60.com"
2292 joku 63 ),
2293 matthys 328 "ginger" => array(
2294     "icon" => "ginger",
2295     "title" => "GingerCrawler",
2296     "rule" => array(
2297     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2298     ),
2299     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2300     ),
2301 joku 63 "girafabot" => array(
2302     "icon" => "girafa",
2303     "title" => "Girafa",
2304     "rule" => array(
2305     "Girafabot" => ""
2306     ),
2307     "uri" => ""
2308     ),
2309     "globalspec" => array(
2310     "icon" => "globalspec",
2311     "title" => "GlobalSpec",
2312     "rule" => array(
2313     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2314     ),
2315     "uri" => ""
2316     ),
2317     "glucose" => array(
2318     "icon" => "glucose",
2319     "title" => "Glucose",
2320     "rule" => array(
2321     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2322     ),
2323     "uri" => ""
2324     ),
2325     "gnomit" => array(
2326     "icon" => "gnomit",
2327     "title" => "Gnomit",
2328     "rule" => array(
2329     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2330     ),
2331     "uri" => "http://www.gnomit.com/",
2332     ),
2333     "goforit" => array(
2334     "icon" => "goforit",
2335     "title" => "GoForIt",
2336     "rule" => array(
2337     "^GoForIt\.com" => "",
2338     "^GOFORITBOT" => ""
2339     ),
2340     "uri" => ""
2341     ),
2342     "goguides" => array(
2343     "icon" => "robot",
2344     "title" => "GoGuides",
2345     "rule" => array(
2346     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2347     ),
2348     "uri" => "http://www.goguides.org/"
2349     ),
2350     // Needs to be before google for correct detection
2351     "mediapartners" => array(
2352     "icon" => "google",
2353     "title" => "Mediapartners",
2354     "rule" => array (
2355     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2356     "Mediapartners-Google" => ""
2357     ),
2358     "uri" => ""
2359     ),
2360     "google" => array(
2361     "icon" => "google",
2362     "title" => "Google",
2363     "rule" => array (
2364     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2365     "Googl(e|ebot)(-Image)?/" => "",
2366     "^gsa-crawler" => "",
2367     "Google Web Preview" => ""
2368     ),
2369     "uri" => "http://www.google.com/"
2370     ),
2371     "googlesitemaps" => array(
2372     "icon" => "google",
2373     "title" => "Google-Sitemaps",
2374     "rule" => array (
2375     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2376     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2377     "Googl(e|ebot)(-Sitemaps)?/" => ""
2378     ),
2379     "uri" => ""
2380     ),
2381     "googlemobile" => array(
2382     "icon" => "google",
2383     "title" => "Google-Mobile",
2384     "rule" => array (
2385     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2386     "Googl(e|ebot)(-Mobile)?/" => ""
2387     ),
2388     "uri" => ""
2389     ),
2390     "googleads" => array(
2391     "icon" => "google",
2392     "title" => "Google-AdsBot",
2393     "rule" => array (
2394     "^AdsBot-Google" => "",
2395     ),
2396     "uri" => ""
2397     ),
2398     "googlefeeds" => array(
2399     "icon" => "google",
2400     "title" => "Google-Feedfetcher",
2401     "rule" => array (
2402     "^Feedfetcher-Google" => "",
2403     ),
2404     "uri" => ""
2405     ),
2406     "googlverification" => array(
2407     "icon" => "google",
2408     "title" => "Google-Site-Verification",
2409     "rule" => array (
2410     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2411     ),
2412     "uri" => ""
2413     ),
2414 matthys 207 // Needs to be AFTER Google detection
2415     "goo" => array(
2416     "icon" => "goo",
2417     "title" => "Goo",
2418     "rule" => array (
2419     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2420     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2421     ),
2422     "uri" => ""
2423     ),
2424 joku 63 "goongee" => array(
2425     "icon" => "robot",
2426     "title" => "GoonGee",
2427     "rule" => array (
2428     "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // the version is this pattern's only capture group
2429     ),
2430     "uri" => "http://www.goongee.com/"
2431     ),
2432     "gpost" => array(
2433     "icon" => "gpost",
2434     "title" => "GPost",
2435     "rule" => array(
2436     "^GPostbot" => ""
2437     ),
2438     "uri" => ""
2439     ),
2440 matthys 309 "grapeshot" => array(
2441     "icon" => "grapeshot",
2442     "title" => "Grapeshot",
2443     "rule" => array(
2444     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2445     ),
2446     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2447     ),
2448 joku 63 "gregarius" => array(
2449     "icon" => "robot",
2450     "title" => "Gregarius",
2451     "rule" => array(
2452     "^Gregarius[/ ]([0-9.]{1,10})" => ""
2453     ),
2454     "uri" => ""
2455     ),
2456     "grub" => array(
2457     "icon" => "grub",
2458     "title" => "Grub",
2459     "rule" => array(
2460     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2461     "grub crawler" => "",
2462     "grub[/ ]([0-9.]{1,10})" => "\\1",
2463     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2464     ),
2465     "uri" => "http://www.grub.org/"
2466     ),
2467     "gulliver" => array(
2468     "icon" => "robot",
2469     "title" => "Gulliver",
2470     "rule" => array(
2471     "Gulliver" => ""
2472     ),
2473     "uri" => ""
2474     ),
2475     "guruji" => array(
2476     "icon" => "guruji",
2477     "title" => "Guruji",
2478     "rule" => array(
2479     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2480     ),
2481     "uri" => "http://www.guruji.com/"
2482     ),
2483     "gush" => array(
2484     "icon" => "robot",
2485     "title" => "Gush",
2486     "rule" => array(
2487     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2488     ),
2489     "uri" => ""
2490     ),
2491     "gziptester" => array(
2492     "icon" => "robot",
2493     "title" => "Gzip Tester",
2494     "rule" => array(
2495     "g(id)?zip[ \-]?test(er)?" => ""
2496     ),
2497     "uri" => ""
2498     ),
2499     "hanzoweb" => array(
2500     "icon" => "hanzoweb",
2501     "title" => "Hanzoweb",
2502     "rule" => array(
2503     "^Hanzoweb" => ""
2504     ),
2505     "uri" => ""
2506     ),
2507     "harbot" => array(
2508     "icon" => "harbot",
2509     "title" => "Harbot",
2510     "rule" => array(
2511     "^Harbot GateStation" => ""
2512     ),
2513     "uri" => ""
2514     ),
2515     "hatena" => array(
2516     "icon" => "hatena",
2517     "title" => "Hatena",
2518     "rule" => array(
2519     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2520     ),
2521     "uri" => ""
2522     ),
2523     "htmlparser" => array(
2524     "icon" => "htmlparser",
2525     "title" => "HTMLParser",
2526     "rule" => array(
2527     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2528     ),
2529     "uri" => "http://htmlparser.sourceforge.net/"
2530     ),
2531     "helix" => array(
2532     "icon" => "helix",
2533     "title" => "Helix", // Helix crawler (see uri); Heritrix has its own entry
2534     "rule" => array(
2535     "^helix[ /]([0-9.]{1,10})" => "\\1"
2536     ),
2537     "uri" => "http://www.sitesearch.ca/helix/"
2538     ),
2539     "heritrix" => array(
2540     "icon" => "heritrix",
2541     "title" => "Heritrix",
2542     "rule" => array(
2543     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2544     "archive.org_bot" => "",
2545     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2546     ),
2547     "uri" => "http://archive.org"
2548     ),
2549     "hiddenmarket" => array(
2550     "icon" => "robot",
2551     "title" => "HiddenMarket",
2552     "rule" => array(
2553     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2554     ),
2555     "uri" => ""
2556     ),
2557     "honda" => array(
2558     "icon" => "robot",
2559     "title" => "Honda",
2560     "rule" => array(
2561     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2562     ),
2563     "uri" => "http://www.honda-search.com"
2564     ),
2565     "hoowwwer" => array(
2566     "icon" => "hoowwwer",
2567     "title" => "HooWWWer",
2568     "rule" => array(
2569     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2570     ),
2571     "uri" => ""
2572     ),
2573     "hotzonu" => array(
2574     "icon" => "hotzonu",
2575     "title" => "Hotzonu",
2576     "rule" => array(
2577     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2578     ),
2579     "uri" => ""
2580     ),
2581     "houxou" => array(
2582     "icon" => "robot",
2583     "title" => "Houxou",
2584     "rule" => array(
2585     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2586     "HouxouCrawler" => ""
2587     ),
2588     "uri" => ""
2589     ),
2590     "htdig" => array(
2591     "icon" => "htdig",
2592     "title" => "ht://Dig",
2593     "rule" => array(
2594     "htdig[ /]([0-9.]{1,10})" => "\\1",
2595     "htdig" => "" // fallback without a version: no capture group to reference
2596     ),
2597     "uri" => ""
2598     ),
2599     "html2jpg" => array(
2600     "icon" => "html2jpg",
2601     "title" => "HTML2JPG",
2602     "rule" => array(
2603     "^HTML2JPG" => ""
2604     ),
2605     "uri" => ""
2606     ),
2607     "httperf" => array(
2608     "icon" => "robot",
2609     "title" => "HTTPerf",
2610     "rule" => array(
2611     "httperf[ /]([0-9.]{1,10})" => "\\1"
2612     ),
2613     "uri" => ""
2614     ),
2615     "httpunit" => array(
2616     "icon" => "httpunit",
2617     "title" => "HttpUnit",
2618     "rule" => array(
2619     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2620     ),
2621     "uri" => ""
2622     ),
2623     "httrack" => array(
2624     "icon" => "httrack",
2625     "title" => "HTTrack",
2626     "rule" => array(
2627     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2628     ),
2629     "uri" => ""
2630     ),
2631     "huaweisymantec" => array(
2632     "icon" => "huaweisymantec",
2633     "title" => "HuaweiSymantec",
2634     "rule" => array(
2635     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2636     ),
2637     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2638     ),
2639     "hungary" => array(
2640     "icon" => "hungary",
2641     "title" => "Hungary",
2642     "rule" => array(
2643     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2644     ),
2645     "uri" => ""
2646     ),
2647 joku 261 "i18n" => array(
2648     "icon" => "w3c",
2649     "title" => "W3C I18n Checker",
2650     "rule" => array(
2651     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2652 joku 169 ),
2653 joku 261 "uri" => "http://validator.w3.org/services"
2654     ),
2655 joku 63 "iakke" => array(
2656     "icon" => "iakke",
2657 matthys 209 "title" => "Iakké",
2658 joku 63 "rule" => array(
2659     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2660     ),
2661     "uri" => "http://fr.iakke.com/"
2662     ),
2663     "iask" => array(
2664     "icon" => "iask",
2665     "title" => "IAsk",
2666     "rule" => array(
2667     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2668     "^iaskspider" => ""
2669     ),
2670     "uri" => "http://iask.com"
2671     ),
2672     "icc" => array(
2673     "icon" => "icc",
2674     "title" => "ICC-Crawler",
2675     "rule" => array(
2676     "^ICC-Crawler" => ""
2677     ),
2678     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2679     ),
2680     "icerocket" => array(
2681     "icon" => "icerocket",
2682     "title" => "Icerocket",
2683     "rule" => array(
2684     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2685     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2686     ),
2687     "uri" => ""
2688     ),
2689     "icjobs" => array(
2690     "icon" => "icjobs",
2691     "title" => "iCjobs",
2692     "rule" => array(
2693     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2694     ),
2695     "uri" => "http://www.icjobs.de/"
2696     ),
2697     "icra" => array(
2698     "icon" => "icra",
2699     "title" => "ICRA",
2700     "rule" => array(
2701     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2702     ),
2703     "uri" => "http://www.icra.org"
2704     ),
2705     "iknow" => array(
2706     "icon" => "robot",
2707     "title" => "I know",
2708     "rule" => array(
2709     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2710     ),
2711     "uri" => ""
2712     ),
2713     "ilial" => array(
2714     "icon" => "robot",
2715     "title" => "Ilial",
2716     "rule" => array(
2717     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2718     ),
2719     "uri" => ""
2720     ),
2721     "ilocal" => array(
2722     "icon" => "ilocal",
2723     "title" => "ilocal",
2724     "rule" => array(
2725     "^ilocal" => "",
2726     ),
2727     "uri" => "http://www.ilocal.nl"
2728     ),
2729     "ilse" => array(
2730     "icon" => "ilse",
2731     "title" => "Ilse",
2732     "rule" => array(
2733     "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot name, group 2 the version
2734     ),
2735     "uri" => "http://ilse.nl/"
2736     ),
2737     "iltrovatore" => array(
2738     "icon" => "iltrovatore",
2739     "title" => "IlTrovatore",
2740     "rule" => array(
2741     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2742     "Iltrovatore-Setaccio" => "",
2743     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2744     ),
2745     "uri" => ""
2746     ),
2747     "indylibrary" => array(
2748     "icon" => "robot",
2749     "title" => "Indy Library",
2750     "rule" => array(
2751     "Indy[ \-]?Library" => ""
2752     ),
2753     "uri" => ""
2754     ),
2755     "inela" => array(
2756     "icon" => "robot",
2757     "title" => "Inela",
2758     "rule" => array(
2759     "InelaBot[ /]([0-9.]{1,10})" => ""
2760     ),
2761     "uri" => "http://inelegant.org/bot"
2762     ),
2763     "ineturl" => array(
2764     "icon" => "robot",
2765     "title" => "InetURL",
2766     "rule" => array(
2767     "InetURL.?[ /]([0-9.]{1,10})" => ""
2768     ),
2769     "uri" => ""
2770     ),
2771     "infoart" => array(
2772     "icon" => "robot",
2773     "title" => "InfoArt",
2774     "rule" => array(
2775     "InfoArt crawler" => ""
2776     ),
2777     "uri" => ""
2778     ),
2779     "infomine" => array(
2780     "icon" => "infomine",
2781     "title" => "INFOMINE",
2782     "rule" => array(
2783     "^DataFountains/DMOZ" => "",
2784     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2785     ),
2786     "uri" => "http://infomine.ucr.edu/"
2787     ),
2788     "infoseek" => array(
2789     "icon" => "infoseek",
2790     "title" => "Infoseek",
2791     "rule" => array(
2792     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2793     "Infoseek" => ""
2794     ),
2795     "uri" => ""
2796     ),
2797     "inktomi" => array(
2798     "icon" => "inktomi",
2799     "title" => "Inktomi",
2800     "rule" => array(
2801     "slurp@inktomi\.com" => ""
2802     ),
2803     "uri" => ""
2804     ),
2805     "innerprise" => array(
2806     "icon" => "robot",
2807     "title" => "Innerprise",
2808     "rule" => array(
2809     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2810     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2811     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2812     ),
2813     "uri" => "http://www.innerprise.com/"
2814     ),
2815     "inria" => array(
2816     "icon" => "inria",
2817     "title" => "Inria",
2818     "rule" => array(
2819     "^xyro_" => ""
2820     ),
2821     "uri" => ""
2822     ),
2823     "insitor" => array(
2824     "icon" => "insitor",
2825     "title" => "Insitor",
2826     "rule" => array(
2827     "^Insitor(,|\.|naut)" => ""
2828     ),
2829     "uri" => "http://www.insitor.com/"
2830     ),
2831     "internetninja" => array(
2832     "icon" => "robot",
2833     "title" => "Internet Ninja",
2834     "rule" => array(
2835     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2836     ),
2837     "uri" => ""
2838     ),
2839     "internetseer" => array(
2840     "icon" => "internetseer",
2841     "title" => "InternetSeer",
2842     "rule" => array(
2843     "^InternetSeer\.com" => ""
2844     ),
2845     "uri" => ""
2846     ),
2847     "interseek" => array(
2848     "icon" => "interseek",
2849     "title" => "Interseek",
2850     "rule" => array(
2851     "Interseek.com" => ""
2852     ),
2853     "uri" => "http://www.interseek.com"
2854     ),
2855     "intravnews" => array(
2856     "icon" => "intravnews",
2857     "title" => "IntraVnews",
2858     "rule" => array(
2859     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2860     ),
2861     "uri" => "http://www.intravnews.com/"
2862     ),
2863     "ip2location" => array(
2864     "icon" => "ip2location",
2865     "title" => "IP2LocationBot",
2866     "rule" => array(
2867     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2868     ),
2869     "uri" => "http://www.ip2location.com"
2870     ),
2871     "ipworks" => array(
2872     "icon" => "ipworks",
2873     "title" => "IP*Works",
2874     "rule" => array(
2875     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2876     ),
2877     "uri" => "http://www.nsoftware.com/ipworks/"
2878     ),
2879     "irca" => array(
2880     "icon" => "robot",
2881     "title" => "Novell iChain Cool Solutions caching",
2882     "rule" => array(
2883 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2884     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2885 joku 63 ),
2886     "uri" => "http://www.icra.org"
2887     ),
2888     "irvine" => array(
2889     "icon" => "robot",
2890     "title" => "Irvine",
2891     "rule" => array(
2892     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2893     ),
2894     "uri" => ""
2895     ),
2896     "ips-agent" => array(
2897     "icon" => "robot",
2898 matthys 209 "title" => "IPS-agent",
2899 joku 63 "rule" => array(
2900     "ips-agent" => ""
2901     ),
2902     "uri" => ""
2903     ),
2904     "isara" => array(
2905     "icon" => "isara",
2906 matthys 209 "title" => "Isara",
2907 joku 63 "rule" => array(
2908     "Isara[ -]([0-9.]{1,10})" => "\\1"
2909     ),
2910     "uri" => "http://www.isara.org/"
2911     ),
2912     "isspider" => array(
2913     "icon" => "robot",
2914     "title" => "ISSpider",
2915     "rule" => array(
2916     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2917     ),
2918     "uri" => ""
2919     ),
2920     "it2media" => array(
2921     "icon" => "it2media",
2922     "title" => "IT2media",
2923     "rule" => array(
2924     "www.adressendeutschland.de" => ""
2925     ),
2926     "uri" => "http://www.adressendeutschland.de/"
2927     ),
2928     "ivia" => array(
2929     "icon" => "robot",
2930     "title" => "iVia",
2931     "rule" => array(
2932     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2933     ),
2934     "uri" => ""
2935     ),
2936     "jeteye" => array(
2937     "icon" => "jeteye",
2938     "title" => "Jeteye",
2939     "rule" => array(
2940     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2941     ),
2942     "uri" => ""
2943     ),
2944     "jobsde" => array(
2945     "icon" => "jobsde",
2946     "title" => "jobs.de",
2947     "rule" => array(
2948     "www\.jobs\.de" => "",
2949     "jobs.de-Robot" => ""
2950     ),
2951     "uri" => "http://www.jobs.de/"
2952     ),
2953     "jpluck" => array(
2954     "icon" => "robot",
2955     "title" => "Jpluck",
2956     "rule" => array(
2957     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2958     ),
2959     "uri" => ""
2960     ),
2961     "jxta" => array(
2962     "icon" => "robot",
2963     "title" => "Jxta",
2964     "rule" => array(
2965     "falcon[ /]([0-9.]{1,10})" => "\\1"
2966     ),
2967     "uri" => ""
2968     ),
2969     "jyte" => array(
2970     "icon" => "jyte",
2971     "title" => "Jyte",
2972     "rule" => array(
2973     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2974     ),
2975     "uri" => ""
2976     ),
2977     "jyxo" => array(
2978     "icon" => "jyxo",
2979     "title" => "Jyxo",
2980     "rule" => array(
2981     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2982     ),
2983     "uri" => ""
2984     ),
2985     "kalooga" => array(
2986     "icon" => "kalooga",
2987     "title" => "Kalooga",
2988     "rule" => array(
2989     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2990     "^kalooga" => "",
2991     "KaloogaBot" => ""
2992     ),
2993     "uri" => "http://www.kalooga.com"
2994     ),
2995     "keywen" => array(
2996     "icon" => "keywen",
2997     "title" => "Keywen",
2998     "rule" => array(
2999     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
3000     ),
3001     "uri" => ""
3002     ),
3003     "kilomonkey" => array(
3004     "icon" => "robot",
3005     "title" => "Kilomonkey",
3006     "rule" => array(
3007     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
3008     ),
3009     "uri" => "http://www.kilomonkey.com/notabot.txt"
3010     ),
3011     "kinja" => array(
3012     "icon" => "kinja",
3013     "title" => "Kinja",
3014     "rule" => array(
3015     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
3016     "^kinjabot" => ""
3017     ),
3018     "uri" => ""
3019     ),
3020     "kiwi" => array(
3021     "icon" => "robot",
3022     "title" => "KiwiStatus",
3023     "rule" => array(
3024     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3025     "KiwiStatus" => ""
3026     ),
3027     "uri" => "http://www.nzs.com/kiei-status/"
3028     ),
3029     "lachesis" => array(
3030     "icon" => "robot",
3031     "title" => "Lachesis",
3032     "rule" => array(
3033     "lachesis" => ""
3034     ),
3035     "uri" => ""
3036     ),
3037     "lanshan" => array(
3038     "icon" => "robot",
3039     "title" => "Lanshan", // own title; "Lachesis" belongs to the lachesis entry
3040     "rule" => array(
3041     "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
3042     ),
3043     "uri" => ""
3044     ),
3045     "lapozz" => array(
3046     "icon" => "lapozz",
3047     "title" => "Lapozz",
3048     "rule" => array(
3049     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3050     ),
3051     "uri" => ""
3052     ),
3053     "larbin" => array(
3054     "icon" => "robot",
3055     "title" => "Larbin",
3056     "rule" => array(
3057     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3058     ),
3059     "uri" => ""
3060     ),
3061     "laurion" => array(
3062     "icon" => "robot",
3063     "title" => "Laurion",
3064     "rule" => array(
3065     "^IPiumBot" => ""
3066     ),
3067     "uri" => "http://www.laurion.com/"
3068     ),
3069     "leechget" => array(
3070     "icon" => "leechget",
3071     "title" => "LeechGet",
3072     "rule" => array(
3073     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3074     ),
3075     "uri" => ""
3076     ),
3077     "linguaseek" => array(
3078     "icon" => "linguaseek",
3079     "title" => "Linguaseek",
3080     "rule" => array(
3081     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3082     ),
3083     "uri" => "http://www.linguaseek.com/"
3084     ),
3085     "linguee" => array(
3086     "icon" => "linguee",
3087     "title" => "Linguee",
3088     "rule" => array(
3089     "^Linguee Bot" => ""
3090     ),
3091     "uri" => "http://www.linguee.com/"
3092     ),
3093 matthys 355 "linkapedia" => array(
3094     "icon" => "linkapedia",
3095     "title" => "Linkapedia",
3096     "rule" => array(
3097     "^linkapedia" => ""
3098     ),
3099     "uri" => "http://www.linkapedia.com"
3100     ),
3101 matthys 346 "linkdex" => array(
3102     "icon" => "linkdex",
3103     "title" => "Linkdex",
3104     "rule" => array(
3105     "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3106     ),
3107     "uri" => "http://www.linkdex.com/bots/"
3108     ),
3109 matthys 366 "linkedin" => array(
3110     "icon" => "linkedin",
3111     "title" => "LinkedIn",
3112     "rule" => array(
3113     "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3114     ),
3115     "uri" => "http://www.linkedin.com"
3116     ),
3117 joku 63 "linkguard" => array(
3118     "icon" => "robot",
3119     "title" => "Linkguard",
3120     "rule" => array(
3121     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3122     ),
3123     "uri" => "http://www.linkguard.com/"
3124     ),
3125     "linklint" => array(
3126     "icon" => "linklint",
3127     "title" => "Linklint",
3128     "rule" => array(
3129     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3130     ),
3131     "uri" => "http://www.linklint.org/"
3132     ),
3133     "linkman" => array(
3134     "icon" => "linkman",
3135     "title" => "Linkman",
3136     "rule" => array(
3137     "\(compatible; Linkman\)" => ""
3138     ),
3139     "uri" => ""
3140     ),
3141     // Needs to be before linkcheck for correct detection
3142     "linkchecker" => array(
3143     "icon" => "w3c",
3144     "title" => "W3C Link Checker",
3145     "rule" => array(
3146     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3147     ),
3148     "uri" => "http://validator.w3.org/checklink"
3149     ),
3150     "linkcheck" => array(
3151     "icon" => "linkcheck",
3152     "title" => "Linkcheck",
3153     "rule" => array(
3154     "checklink[ /]([0-9.]{1,10})" => "\\1",
3155     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3156     "Adaxas Spider" => "",
3157     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3158     "NetMechanic V([0-9.]{1,10})" => "\\1",
3159     "^InfoLink" => "",
3160     "InternetLinkAgent" => "",
3161     "; SPENG\)" => "",
3162     "SharewarePlazaFileCheckBot" => "",
3163     "fileboost.net" => "",
3164     "^billbot" => ""
3165     ),
3166     "uri" => ""
3167     ),
3168     "linkru" => array(
3169     "icon" => "robot",
3170     "title" => "Link.RU",
3171     "rule" => array(
3172     "^Link.RU bot" => ""
3173     ),
3174     "uri" => ""
3175     ),
3176     "linkssql" => array(
3177     "icon" => "robot",
3178     "title" => "Links SQL",
3179     "rule" => array(
3180     "links sql" => ""
3181     ),
3182     "uri" => ""
3183     ),
3184     "linksweeper" => array(
3185     "icon" => "robot",
3186     "title" => "Link Sweeper",
3187     "rule" => array(
3188     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3189     ),
3190     "uri" => ""
3191     ),
3192     "linkwalker" => array(
3193     "icon" => "robot",
3194     "title" => "Link Walker",
3195     "rule" => array(
3196     "^LinkWalker" => ""
3197     ),
3198     "uri" => ""
3199     ),
3200     "lipperhey" => array(
3201     "icon" => "lipperhey",
3202     "title" => "Lipperhey",
3203     "rule" => array(
3204     "Lipperhey Spider" => ""
3205     ),
3206     "uri" => "http://www.lipperhey.com"
3207     ),
3208     "livedoor" => array(
3209     "icon" => "livedoor",
3210     "title" => "Livedoor",
3211     "rule" => array(
3212     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3213     ),
3214     "uri" => ""
3215     ),
3216     "livejournal" => array(
3217     "icon" => "livejournal",
3218     "title" => "Live Journal",
3219     "rule" => array(
3220     "^LiveJournal\.com" => ""
3221     ),
3222     "uri" => "http://www.livejournal.com"
3223     ),
3224     "ljpic" => array(
3225     "icon" => "ljpic",
3226     "title" => "ljpic",
3227     "rule" => array(
3228     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3229     ),
3230     "uri" => "http://www.ljpic.com"
3231     ),
3232     "lmspider" => array(
3233     "icon" => "robot",
3234     "title" => "Lmspider",
3235     "rule" => array(
3236     "^lmspider" => ""
3237     ),
3238     "uri" => ""
3239     ),
3240     "locators" => array(
3241     "icon" => "robot",
3242     "title" => "Locaters",
3243     "rule" => array(
3244     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3245     ),
3246     "uri" => ""
3247     ),
3248     "look" => array(
3249     "icon" => "look",
3250     "title" => "Look",
3251     "rule" => array(
3252     "www\.look\.com" => "",
3253     "Lookbot" => ""
3254     ),
3255     "uri" => ""
3256     ),
3257     "looksmart" => array(
3258     "icon" => "looksmart",
3259     "title" => "LookSmart",
3260     "rule" => array(
3261     "^Martini" => "",
3262     "^MantraAgent" => "",
3263     "FurlBot" => "",
3264     "looksmart-sv-fw" => ""
3265     ),
3266     "uri" => ""
3267     ),
3268     "loop" => array(
3269     "icon" => "loop",
3270     "title" => "LOOP",
3271     "rule" => array(
3272     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3273     ),
3274     "uri" => ""
3275     ),
3276     "lotkyll" => array(
3277     "icon" => "robot",
3278     "title" => "Lotkyll",
3279     "rule" => array(
3280     "Lotkyll" => ""
3281     ),
3282     "uri" => ""
3283     ),
3284 joku 335 "ltx71" => array(
3285     "icon" => "robot",
3286     "title" => "LTX71",
3287     "rule" => array(
3288     "ltx71" => ""
3289     ),
3290     "uri" => "http://ltx71.com/"
3291     ),
3292 joku 63 "lwp" => array(
3293     "icon" => "robot",
3294     "title" => "lwp",
3295     "rule" => array(
3296     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3297     ),
3298     "uri" => ""
3299     ),
3300     "lycos" => array(
3301     "icon" => "lycos",
3302     "title" => "Lycos",
3303     "rule" => array(
3304     "Lycos_Spider_" => ""
3305     ),
3306     "uri" => ""
3307     ),
3308     "magpierss" => array(
3309     "icon" => "rss",
3310     "title" => "MagpieRSS",
3311     "rule" => array(
3312     "MagpieRSS" => ""
3313     ),
3314     "uri" => "http://magpierss.sourceforge.net/"
3315     ),
3316     "mailru" => array(
3317     "icon" => "mailru",
3318 matthys 209 "title" => "Mail.Ru",
3319 joku 63 "rule" => array(
3320 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3321     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3322 joku 63 ),
3323 matthys 209 "uri" => "http://www.mail.ru/"
3324 joku 63 ),
3325     "mailsweeper" => array(
3326     "icon" => "robot",
3327     "title" => "Mail Sweeper",
3328     "rule" => array(
3329     "Mail[ \-]?Sweeper" => ""
3330     ),
3331     "uri" => ""
3332     ),
3333     "marvin" => array(
3334     "icon" => "robot",
3335     "title" => "Marvin",
3336     "rule" => array(
3337     "^Marvin" => ""
3338     ),
3339     "uri" => ""
3340     ),
3341     "matkurja" => array(
3342     "icon" => "matkurja",
3343     "title" => "Mat'Kurja",
3344     "rule" => array(
3345     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3346     ),
3347     "uri" => ""
3348     ),
3349     "mavicanet" => array(
3350     "icon" => "mavicanet",
3351     "title" => "Mavicanet",
3352     "rule" => array(
3353     "Mavicanet robot" => ""
3354     ),
3355     "uri" => ""
3356     ),
3357 matthys 292 "meanpath" => array(
3358     "icon" => "meanpath",
3359 matthys 290 "title" => "Meanpath",
3360 matthys 280 "rule" => array(
3361     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3362     ),
3363     "uri" => "http://www.meanpath.com/meanpathbot.html"
3364 matthys 275 ),
3365 matthys 280 "mediater" => array(
3366 joku 63 "icon" => "robot",
3367     "title" => "Mediater",
3368     "rule" => array (
3369     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3370 matthys 280 ),
3371     "uri" => ""
3372 joku 63 ),
3373 matthys 305 "memory" => array(
3374     "icon" => "memory",
3375     "title" => "internet Memory",
3376     "rule" => array (
3377     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3378     ),
3379     "uri" => "http://internetmemory.org/en/"
3380     ),
3381 joku 63 "mercator" => array(
3382     "icon" => "robot",
3383     "title" => "Mercator",
3384     "rule" => array(
3385     "Mercator" => ""
3386     ),
3387     "uri" => ""
3388     ),
3389     "metacarta" => array(
3390     "icon" => "robot",
3391     "title" => "Metacarta",
3392     "rule" => array(
3393     "^RRC \(crawler_admin@bigfoot.com\)" => "", // parentheses escaped so they match literally, as in the samualt9 rule
3394     "^flunky" => "",
3395     "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3396     ),
3397     "uri" => "http://www.metacarta.com"
3398     ),
3399     "metager" => array(
3400     "icon" => "metager",
3401     "title" => "MetaGer",
3402     "rule" => array(
3403     "MetaGer" => ""
3404     ),
3405     "uri" => ""
3406     ),
3407     "metamark" => array(
3408     "icon" => "robot",
3409     "title" => "Metamark",
3410     "rule" => array(
3411     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3412     ),
3413     "uri" => "http://metamark.net"
3414     ),
3415     "metamedic" => array(
3416     "icon" => "metamedic",
3417     "title" => "MetaMedic",
3418     "rule" => array(
3419     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3420     ),
3421     "uri" => ""
3422     ),
3423     "mirago" => array(
3424     "icon" => "mirago",
3425     "title" => "Mirago",
3426     "rule" => array(
3427     "Mirago" => ""
3428     ),
3429     "uri" => ""
3430     ),
3431     "misterwong" => array(
3432     "icon" => "misterwong",
3433     "title" => "Mister Wong",
3434     "rule" => array(
3435     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3436     ),
3437     "uri" => "http://www.mister-wong.de/"
3438     ),
3439     "miva" => array(
3440     "icon" => "miva",
3441     "title" => "Miva",
3442     "rule" => array(
3443     "AlgoFeedback@miva\.com" => ""
3444     ),
3445     "uri" => "http://www.miva.com/"
3446     ),
3447     "mj12" => array(
3448     "icon" => "mj12",
3449     "title" => "Majestic-12",
3450     "rule" => array(
3451     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3452     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3453     ),
3454     "uri" => "http://majestic12.co.uk/bot.php"
3455     ),
3456     "mlbot" => array(
3457     "icon" => "robot",
3458     "title" => "MLBot",
3459     "rule" => array(
3460     "^MLBot" => ""
3461     ),
3462     "uri" => "http://www.metadatalabs.com/mlbot"
3463     ),
3464     "mnogo" => array(
3465     "icon" => "mnogo",
3466     "title" => "mnoGoSearch",
3467     "rule" => array(
3468     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3469     ),
3470     "uri" => "http://www.mnogosearch.org/"
3471     ),
3472     "mobileok" => array(
3473     "icon" => "mobileok",
3474     "title" => "W3C mobileOK",
3475     "rule" => array(
3476     "^W3C-mobileOK" => ""
3477     ),
3478     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3479     ),
3480 matthys 296 "mojeek" => array(
3481     "icon" => "mojeek",
3482     "title" => "Mojeek",
3483 joku 63 "rule" => array(
3484     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3485     ),
3486 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3487 joku 63 ),
3488     "momspider" => array(
3489     "icon" => "robot",
3490     "title" => "MOM Spider",
3491     "rule" => array(
3492     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3493     ),
3494     "uri" => ""
3495     ),
3496     "moreover" => array(
3497     "icon" => "moreover",
3498     "title" => "Moreover",
3499     "rule" => array(
3500     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3501     ),
3502     "uri" => ""
3503     ),
3504     "movabletype" => array(
3505     "icon" => "movabletype",
3506     "title" => "Movable Type",
3507     "rule" => array(
3508     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3509     ),
3510     "uri" => ""
3511     ),
3512     "mozdex" => array(
3513     "icon" => "mozdex",
3514     "title" => "MozDex",
3515     "rule" => array(
3516     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3517     ),
3518     "uri" => ""
3519     ),
3520     "mqbot" => array(
3521     "icon" => "robot",
3522     "title" => "MQbot",
3523     "rule" => array(
3524     "MQbot" => ""
3525     ),
3526     "uri" => ""
3527     ),
3528     "msnbot" => array(
3529     "icon" => "bing",
3530 matthys 205 "title" => "Bing",
3531 joku 63 "rule" => array(
3532     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3533     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3534     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3535     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3536     ),
3537     "uri" => ""
3538     ),
3539     "msnbot-mobile" => array(
3540     "icon" => "msn",
3541     "title" => "MSN Mobile",
3542     "rule" => array(
3543     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3544     "MSNBOT_Mobile" => "",
3545     "MSMOBOT" => ""
3546     ),
3547     "uri" => ""
3548     ),
3549     "mslivebot" => array(
3550     "icon" => "livesearch",
3551     "title" => "MS Live Search",
3552     "rule" => array(
3553     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3554     ),
3555     "uri" => ""
3556     ),
3557     "msproxy" => array(
3558     "icon" => "robot",
3559     "title" => "MSProxy",
3560     "rule" => array(
3561     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3562     ),
3563     "uri" => ""
3564     ),
3565     "msrbot" => array(
3566     "icon" => "robot",
3567     "title" => "MSRBOT",
3568     "rule" => array(
3569     "^MSRBOT" => ""
3570     ),
3571     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3572     ),
3573     "mswebdav" => array(
3574     "icon" => "robot",
3575     "title" => "MS-WebDAV",
3576     "rule" => array(
3577     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3578     ),
3579     "uri" => ""
3580     ),
3581     "mticon" => array(
3582     "icon" => "robot",
3583     "title" => "MTIcon",
3584     "rule" => array(
3585     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3586     ),
3587     "uri" => ""
3588     ),
3589     "multipage-validator" => array(
3590     "icon" => "multipage-validator",
3591     "title" => "Multipage Validator",
3592     "rule" => array(
3593     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3594     ),
3595     "uri" => "http://www.validator.ca/"
3596     ),
3597     "myrss" => array(
3598     "icon" => "rss",
3599     "title" => "MyRSS",
3600     "rule" => array(
3601     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3602     ),
3603     "uri" => ""
3604     ),
3605     "multimap" => array(
3606     "icon" => "robot",
3607     "title" => "Multimap",
3608     "rule" => array(
3609     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3610     ),
3611     "uri" => ""
3612     ),
3613     "najdi" => array(
3614     "icon" => "najdi",
3615     "title" => "Najdi.si",
3616     "rule" => array(
3617     "Najdi.si" => ""
3618     ),
3619     "uri" => "http://www.najdi.si"
3620     ),
3621     "nameprotect" => array(
3622     "icon" => "nameprotect",
3623     "title" => "Name Protect",
3624     "rule" => array(
3625     "NPBot" => ""
3626     ),
3627     "uri" => ""
3628     ),
3629     "nationaldirectory" => array(
3630     "icon" => "robot",
3631     "title" => "National Directory",
3632     "rule" => array(
3633     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3634     ),
3635     "uri" => ""
3636     ),
3637     "natsumican" => array(
3638     "icon" => "robot",
3639     "title" => "Natsu Mican",
3640     "rule" => array(
3641     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3642     ),
3643     "uri" => ""
3644     ),
3645     "naverbot" => array(
3646     "icon" => "naverbot",
3647     "title" => "Naver",
3648     "rule" => array(
3649     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3650     "Naver(Bot)?" => "",
3651     "^nabot" => ""
3652     ),
3653     "uri" => ""
3654     ),
3655     "navisso" => array(
3656     "icon" => "navisso",
3657     "title" => "Navisso",
3658     "rule" => array(
3659     "Navisso(Bot)?" => ""
3660     ),
3661     "uri" => "http://www.navisso.com"
3662     ),
3663     "neofonie" => array(
3664     "icon" => "robot",
3665 matthys 205 "title" => "Neofonie",
3666 joku 63 "rule" => array(
3667     "www.neofonie.de" => ""
3668     ),
3669     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3670     ),
3671     "neomo" => array(
3672     "icon" => "robot",
3673     "title" => "Neomo",
3674     "rule" => array(
3675     "Francis[ /]([0-9.]{1,10})" => "\\1"
3676     ),
3677     "uri" => ""
3678     ),
3679     "nessus" => array(
3680     "icon" => "nessus",
3681     "title" => "Nessus",
3682     "rule" => array(
3683     "Nessus\)$" => ""
3684     ),
3685     "uri" => ""
3686     ),
3687 matthys 279 "nerdybot" => array(
3688 matthys 280 "icon" => "robot",
3689     "title" => "NerdyBot",
3690     "rule" => array(
3691     "NerdyBot" => ""
3692     ),
3693     "uri" => "http://nerdybot.com/"
3694 matthys 279 ),
3695 joku 63 "nerdbynature" => array(
3696     "icon" => "nerdbynature",
3697     "title" => "NerdByNature",
3698     "rule" => array(
3699     "NerdByNature.Bot" => ""
3700     ),
3701     "uri" => "http://www.nerdbynature.net/bot"
3702     ),
3703     "netants" => array(
3704     "icon" => "netants",
3705     "title" => "NetAnts",
3706     "rule" => array(
3707     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3708     ),
3709     "uri" => ""
3710     ),
3711     "netcraft" => array(
3712     "icon" => "netcraft",
3713     "title" => "Netcraft",
3714     "rule" => array(
3715     "netcraft" => ""
3716     ),
3717     "uri" => ""
3718     ),
3719     "netinfo" => array(
3720     "icon" => "netinfo",
3721     "title" => "Netinfo",
3722     "rule" => array(
3723     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3724     ),
3725     "uri" => "http://netinfo.bg/"
3726     ),
3727     "netluchs" => array(
3728     "icon" => "netluchs",
3729     "title" => "Netluchs",
3730     "rule" => array(
3731     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3732     ),
3733     "uri" => "http://www.netluchs.de/"
3734     ),
3735     "netmechanic" => array(
3736     "icon" => "netmechanic",
3737     "title" => "NetMechanic",
3738     "rule" => array(
3739     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3740     ),
3741     "uri" => ""
3742     ),
3743     "netnose" => array(
3744     "icon" => "netnose",
3745     "title" => "NetNose",
3746     "rule" => array(
3747     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3748     ),
3749     "uri" => ""
3750     ),
3751     "netoskop" => array(
3752     "icon" => "robot",
3753     "title" => "Netoskop",
3754     "rule" => array(
3755     "netoskop" => ""
3756     ),
3757     "uri" => ""
3758     ),
3759     "netpromoter" => array(
3760     "icon" => "netpromoter",
3761     "title" => "NetPromoter",
3762     "rule" => array(
3763     "NetPromoter Spider" => ""
3764     ),
3765     "uri" => "http://www.net-promoter.com/"
3766     ),
3767     "netprospector" => array( // robot entry: display icon/title, detection rule(s), homepage uri
3768     "icon" => "robot",
3769     "title" => "Netprospector",
3770     "rule" => array(
3771     "^netprospector" => "" // no capture group, hence an empty value
3772     ),
         "uri" => "" // every other entry in this table defines "uri"; keep the shape uniform
3773     ),
3774     "netpumper" => array(
3775     "icon" => "robot",
3776     "title" => "Netpumper",
3777     "rule" => array(
3778     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3779     ),
3780     "uri" => ""
3781     ),
3782     "netscapeproxy" => array(
3783     "icon" => "netscape",
3784     "title" => "Netscape Proxy",
3785     "rule" => array(
3786     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3787     ),
3788     "uri" => ""
3789     ),
3790     "netspective" => array(
3791     "icon" => "robot",
3792     "title" => "NetSpective",
3793     "rule" => array(
3794     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3795     ),
3796     "uri" => ""
3797     ),
3798     "netvibes" => array( // robot entry: display icon/title, detection rule(s), homepage uri
3799     "icon" => "netvibes",
3800     "title" => "Netvibes", // no leading blank, consistent with every other title in this table
3801     "rule" => array(
3802     "^Netvibes" => "" // pattern has no capture group, so there is nothing for "\\1" to reference
3803     ),
3804     "uri" => ""
3805     ),
3806     "newsfire" => array(
3807     "icon" => "newsfire",
3808     "title" => "NewsFire",
3809     "rule" => array(
3810     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3811     ),
3812     "uri" => ""
3813     ),
3814     "newsgator" => array(
3815     "icon" => "newsgator",
3816     "title" => "NewsGator",
3817     "rule" => array(
3818     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3819     ),
3820     "uri" => ""
3821     ),
3822     "newzcrawler" => array(
3823     "icon" => "newzcrawler",
3824     "title" => "NewzCrawler",
3825     "rule" => array(
3826     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3827     ),
3828     "uri" => ""
3829     ),
3830     "nextopia" => array( // robot entry: display icon/title, detection rule(s), homepage uri
3831     "icon" => "robot", // generic icon - TODO(review): switch to a dedicated icon if one is shipped
3832     "title" => "Nextopia", // must name the bot matched below, not the neighbouring NewzCrawler entry
3833     "rule" => array(
3834     "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1" // group 1 = version number
3835     ),
3836     "uri" => ""
3837     ),
3838     "ngsearch" => array(
3839     "icon" => "ngsearch",
3840     "title" => "NG Search",
3841     "rule" => array(
3842     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3843     ),
3844     "uri" => ""
3845     ),
3846     "nimble" => array(
3847     "icon" => "robot",
3848     "title" => "Nimble",
3849     "rule" => array(
3850     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3851     ),
3852     "uri" => ""
3853     ),
3854     "nmap" => array(
3855     "icon" => "nmap",
3856     "title" => "Nmap",
3857     "rule" => array(
3858     "Nmap Scripting Engine" => ""
3859     ),
3860     "uri" => "http://nmap.org/book/nse.html"
3861     ),
3862     "nusearch" => array(
3863     "icon" => "robot",
3864     "title" => "NuSearch",
3865     "rule" => array(
3866     "^nuSearch" => ""
3867     ),
3868     "uri" => "http://www.nusearch.com/"
3869     ),
3870     "noago" => array(
3871     "icon" => "noago",
3872     "title" => "Noago",
3873     "rule" => array(
3874     "Noago Spider" => ""
3875     ),
3876     "uri" => "http://www.noago.com/"
3877     ),
3878     "noviforum" => array(
3879     "icon" => "noviforum",
3880     "title" => "Noviforum",
3881     "rule" => array(
3882     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3883     ),
3884     "uri" => ""
3885     ),
3886     "noxtrum" => array(
3887     "icon" => "noxtrum",
3888     "title" => "noXtrum",
3889     "rule" => array(
3890     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3891     ),
3892     "uri" => ""
3893     ),
3894     "noyona" => array(
3895     "icon" => "robot",
3896     "title" => "Noyona",
3897     "rule" => array(
3898     "noyona.([0-9._]{1,10})" => "\\1"
3899     ),
3900     "uri" => "http://noyona.com/"
3901     ),
3902     "nsauditor" => array(
3903     "icon" => "nsauditor",
3904     "title" => "Nsauditor",
3905     "rule" => array(
3906     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3907     ),
3908     "uri" => "http://www.nsauditor.com/"
3909     ),
3910     "obidosbot" => array(
3911     "icon" => "robot",
3912     "title" => "Bookwatch",
3913     "rule" => array(
3914     "obidos[ \-]?bot" => ""
3915     ),
3916     "uri" => ""
3917     ),
3918     "objectssearch" => array(
3919     "icon" => "robot",
3920     "title" => "Objects Search",
3921     "rule" => array(
3922     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3923     ),
3924     "uri" => ""
3925     ),
3926     "obot" => array(
3927 matthys 297 "icon" => "ibm",
3928     "title" => "IBM (ONLY) Crawler",
3929 joku 63 "rule" => array(
3930 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3931 joku 63 ),
3932 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3933     // Previously from "ONLY Solutions GmbH" – that is what the "O" in oBot stands for
3934 joku 63 ),
3935     "ocawa" => array(
3936     "icon" => "ocawa",
3937     "title" => "Ocawa",
3938     "rule" => array(
3939     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3940     "Ocawa" => ""
3941     ),
3942     "uri" => "http://www.ocawa.com/"
3943     ),
3944     "octora" => array(
3945     "icon" => "octora",
3946     "title" => "Octora",
3947     "rule" => array(
3948     "^Octora (Beta)?" => ""
3949     ),
3950     "uri" => "http://www.octora.com/"
3951     ),
3952     "offlineexplorer" => array(
3953     "icon" => "robot",
3954     "title" => "OfflineExplorer",
3955     "rule" => array(
3956     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3957     ),
3958     "uri" => ""
3959     ),
3960     "omea" => array(
3961     "icon" => "omea",
3962     "title" => "Omea Reader",
3963     "rule" => array(
3964     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3965     ),
3966     "uri" => ""
3967     ),
3968     "onet" => array(
3969     "icon" => "onet",
3970     "title" => "Onet",
3971     "rule" => array(
3972     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3973     "Onet\.pl" => "",
3974     "inktomi.search.onet" => ""
3975     ),
3976     "uri" => "http://www.onet.pl"
3977     ),
3978     "online24" => array(
3979     "icon" => "robot",
3980 matthys 209 "title" => "Online24",
3981 joku 63 "rule" => array(
3982     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3983     ),
3984     "uri" => "http://www.online24.de"
3985     ),
3986     "onlinewebcheck" => array(
3987     "icon" => "csehtmlvalidator",
3988     "title" => "CSE HTML Validator",
3989     "rule" => array(
3990     "onlinewebcheck" => ""
3991     ),
3992     "uri" => "http://www.onlinewebcheck.com"
3993     ),
3994     "onsearch" => array(
3995     "icon" => "onsearch",
3996 matthys 209 "title" => "OnSearch",
3997 joku 63 "rule" => array(
3998     "^onCHECK-Robot" => ""
3999     ),
4000     "uri" => "http://www.onsearch.de"
4001     ),
4002     "onto" => array(
4003     "icon" => "robot",
4004     "title" => "OntoSpider",
4005     "rule" => array(
4006     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
4007     ),
4008     "uri" => "http://ontospider.i-n.info/"
4009     ),
4010     "openacoon" => array(
4011     "icon" => "robot",
4012     "title" => "OpenAcoon",
4013     "rule" => array(
4014     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
4015     ),
4016     "uri" => "http://www.openacoon.de/"
4017     ),
4018     "openfind" => array(
4019     "icon" => "openfind",
4020     "title" => "Openfind",
4021     "rule" => array(
4022     "openbot[ /]([0-9.]{1,10})" => "\\1",
4023     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4024     ),
4025     "uri" => ""
4026     ),
4027     "opentagger" => array(
4028     "icon" => "robot",
4029     "title" => "OpenTagger",
4030     "rule" => array(
4031     "^OpenTaggerBot" => ""
4032     ),
4033     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4034     ),
4035     "opentext" => array(
4036     "icon" => "opentext",
4037     "title" => "OpenText",
4038     "rule" => array(
4039     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4040     ),
4041     "uri" => "http://www.opentext.net/"
4042     ),
4043     "openweb" => array(
4044     "icon" => "robot",
4045     "title" => "OpenWebSpider",
4046     "rule" => array(
4047     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4048     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4049     ),
4050     "uri" => "http://www.openwebspider.org"
4051     ),
4052     "openx" => array(
4053     "icon" => "openx",
4054     "title" => "OpenX Spider",
4055     "rule" => array(
4056     "OpenX" => ""
4057     ),
4058     "uri" => "http://www.openx.org"
4059     ),
4060     "orange" => array(
4061     "icon" => "orange",
4062     "title" => "Orange",
4063     "rule" => array(
4064 joku 338 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4065     "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4066 joku 63 ),
4067     "uri" => "http://orange.com/"
4068     ),
4069     "organica" => array(
4070     "icon" => "robot",
4071     "title" => "Organica",
4072     "rule" => array(
4073     "crawler@organica\.us" => ""
4074     ),
4075     "uri" => ""
4076     ),
4077     "outfox" => array(
4078     "icon" => "robot",
4079     "title" => "Outfox Melon",
4080     "rule" => array(
4081     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4082     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4083     ),
4084     "uri" => ""
4085     ),
4086     "overture" => array(
4087     "icon" => "overture",
4088     "title" => "Overture",
4089     "rule" => array(
4090     "Overture[ \-]?WebCrawler" => ""
4091     ),
4092     "uri" => ""
4093     ),
4094 joku 337 "owler" => array(
4095     "icon" => "robot",
4096     "title" => "Owler",
4097     "rule" => array(
4098     "Owler[ /]([0-9.]{1,10})" => "\\1",
4099     "Owler" => ""
4100     ),
4101     "uri" => ""
4102     ),
4103 joku 63 "page2rss" => array(
4104     "icon" => "page2rss",
4105     "title" => "Page2RSS",
4106     "rule" => array(
4107     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4108     ),
4109     "uri" => "http://page2rss.com"
4110     ),
4111     "pagebytes" => array(
4112     "icon" => "robot",
4113     "title" => "PageBites",
4114     "rule" => array(
4115     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4116     ),
4117     "uri" => ""
4118     ),
4119 matthys 282 "pagesinventory" => array(
4120     "icon" => "pagesinventory",
4121     "title" => "PagesInventory",
4122     "rule" => array(
4123     "^PagesInventory" => ""
4124     ),
4125     "uri" => "http://www.pagesinventory.com"
4126     ),
4127 joku 63 "pagesjaunes" => array(
4128     "icon" => "pagesjaunes",
4129     "title" => "Pages Jaunes",
4130     "rule" => array(
4131     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4132     ),
4133     "uri" => "http://www.pagesjaunes.fr/"
4134     ),
4135     "pagevalet" => array(
4136     "icon" => "wdg",
4137     "title" => "WDG Page Valet",
4138     "rule" => array(
4139     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4140     ),
4141     "uri" => "http://www.htmlhelp.com/tools/validator/"
4142     ),
4143     "panopeabot" => array(
4144     "icon" => "robot",
4145     "title" => "PanopeaBot",
4146     "rule" => array(
4147     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4148     ),
4149     "uri" => ""
4150     ),
4151     "parchmenthill" => array(
4152     "icon" => "robot",
4153     "title" => "Parchment Hill",
4154     "rule" => array(
4155     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4156     ),
4157     "uri" => "http://www.parchmenthill.com/search.htm"
4158     ),
4159     "pascient" => array( // key and icon keep their historical spelling; they may be referenced elsewhere
4160     "icon" => "pascient",
4161     "title" => "Panscient", // spelling matches the domain used in the rule and uri below
4162     "rule" => array(
4163     "panscient.com" => ""
4164     ),
4165     "uri" => "http://www.panscient.com/"
4166     ),
4167     "peerbot" => array(
4168     "icon" => "peerbot",
4169     "title" => "Peerbot",
4170     "rule" => array(
4171     "^PEERbot" => ""
4172     ),
4173     "uri" => ""
4174     ),
4175 matthys 389 "petalbot" => array(
4176     "icon" => "huawei",
4177     "title" => "PetalBot", // Huawei Search - also called Aspiegel
4178     "rule" => array(
4179     "PetalBot" => "",
4180     "AspiegelBot" => ""
4181     ),
4182     "uri" => "https://aspiegel.com/petalbot"
4183     ),
4184 joku 63 "php" => array(
4185     "icon" => "php",
4186     "title" => "PHP",
4187     "rule" => array(
4188     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4189     ),
4190     "uri" => ""
4191     ),
4192     "phpcrawl" => array(
4193     "icon" => "robot",
4194     "title" => "PHPCrawl",
4195     "rule" => array(
4196     "^PHPCrawl" => ""
4197     ),
4198     "uri" => "http://phpcrawl.cuab.de/"
4199     ),
4200     "phpdig" => array(
4201     "icon" => "robot",
4202     "title" => "PhpDig",
4203     "rule" => array(
4204     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4205     ),
4206     "uri" => "http://www.finbot.com/"
4207     ),
4208     "phpversiontracker" => array(
4209     "icon" => "phpversiontracker",
4210     "title" => "PHP version tracker",
4211     "rule" => array(
4212     "^PHP version tracker" => ""
4213     ),
4214     "uri" => "http://www.nexen.net/phpversion/bot.php"
4215     ),
4216     "pictureofinternet" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4217     "icon" => "robot",
4218     "title" => "PictureOfInternet",
4219     "rule" => array(
4220     "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // group 1 = version; pass it on like the other versioned rules
4221     ),
4222     "uri" => ""
4223     ),
4224     "pingdom" => array(
4225     "icon" => "pingdom",
4226     "title" => "Pingdom",
4227     "rule" => array(
4228     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4229     "^Pingdom" => ""
4230     ),
4231     "uri" => "http://www.pingdom.com/"
4232     ),
4233     "pinseri" => array(
4234     "icon" => "pinseri",
4235     "title" => "Pinseri",
4236     "rule" => array(
4237     "www\.pinseri\.com/bloglist" => ""
4238     ),
4239     "uri" => ""
4240     ),
4241     "plagger" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4242     "icon" => "plagger",
4243     "title" => "Plagger",
4244     "rule" => array(
4245     "Plagger[ /]([0-9.]{1,10})" => "\\1" // group 1 = version number
4246     ),
4247     "uri" => "http://plagger.org/" // project is spelled "Plagger", as in the rule above
4248     ),
4249     "planet" => array(
4250     "icon" => "planet",
4251     "title" => "Planet",
4252     "rule" => array(
4253     "Planet[ /]([0-9.]{1,10})" => "\\1"
4254     ),
4255     "uri" => ""
4256     ),
4257     "plantynet" => array(
4258     "icon" => "robot",
4259     "title" => "PlantyNet",
4260     "rule" => array(
4261     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4262     ),
4263     "uri" => ""
4264     ),
4265     "pluck" => array(
4266     "icon" => "pluck",
4267     "title" => "Pluck",
4268     "rule" => array(
4269     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4270     ),
4271     "uri" => ""
4272     ),
4273     "plsearch" => array(
4274     "icon" => "plsearch",
4275     "title" => "PlanetSearch",
4276     "rule" => array(
4277     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4278     ),
4279     "uri" => ""
4280     ),
4281     "poe" => array(
4282     "icon" => "robot",
4283     "title" => "POE-Component",
4284     "rule" => array(
4285     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4286     ),
4287     "uri" => ""
4288     ),
4289     "pogodak" => array(
4290     "icon" => "pogodak",
4291     "title" => "Pogodak",
4292     "rule" => array(
4293     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4294     ),
4295     "uri" => ""
4296     ),
4297     "poodle" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4298     "icon" => "robot",
4299     "title" => "Poodle predictor",
4300     "rule" => array(
4301     "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is the "oo"/"ooo" spelling; the version is group 2
4302     "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no version follows
4303     ),
4304     "uri" => "http://www.gritechnologies.com/tools/spider.go"
4305     ),
4306     "pompos" => array(
4307     "icon" => "pompos",
4308     "title" => "Pompos",
4309     "rule" => array(
4310     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4311     ),
4312     "uri" => ""
4313     ),
4314     "popdex" => array(
4315     "icon" => "robot",
4316     "title" => "Popdexter",
4317     "rule" => array(
4318     "Popdexter" => ""
4319     ),
4320     "uri" => ""
4321     ),
4322     "postrank" => array(
4323     "icon" => "postrank",
4324     "title" => "PostRank",
4325     "rule" => array(
4326     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4327     ),
4328     "uri" => "http://www.postrank.com/"
4329     ),
4330     "powermarks" => array(
4331     "icon" => "robot",
4332     "title" => "Powermarks",
4333     "rule" => array(
4334     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4335     ),
4336     "uri" => ""
4337     ),
4338 matthys 366 "pinterest" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4339     "icon" => "pinterest",
4340 joku 63 "title" => "Pinterest", // must name the bot matched below, not the following PROBE! entry
4341     "rule" => array(
4342 matthys 366 "Pinterest[ /]([0-9.]{1,10})" => "\\1" // group 1 = version number
4343 joku 63 ),
4344 matthys 366 "uri" => "http://www.pinterest.com/"
4345 joku 63 ),
4346 matthys 366 "probe" => array(
4347     "icon" => "robot",
4348     "title" => "PROBE!",
4349     "rule" => array(
4350     "^PROBE!" => ""
4351     ),
4352     "uri" => ""
4353     ),
4354 joku 63 "projecthoneypot" => array(
4355     "icon" => "projecthoneypot",
4356     "title" => "Project Honeypot",
4357     "rule" => array(
4358     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4359     "projecthoneypot" => ""
4360     ),
4361     "uri" => "http://www.projecthoneypot.org"
4362     ),
4363     "proxycache" => array(
4364     "icon" => "robot",
4365     "title" => "Proxy Cache",
4366     "rule" => array(
4367     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4368     ),
4369     "uri" => ""
4370     ),
4371     "proxyhunter" => array(
4372     "icon" => "robot",
4373     "title" => "ProxyHunter",
4374     "rule" => array(
4375     "ProxyHunter" => ""
4376     ),
4377     "uri" => ""
4378     ),
4379     "psbot" => array(
4380     "icon" => "picsearch",
4381     "title" => "PicSearch",
4382     "rule" => array(
4383     "^psbot" => ""
4384     ),
4385     "uri" => ""
4386     ),
4387     "pubsub" => array(
4388     "icon" => "pubsub",
4389     "title" => "PubSub",
4390     "rule" => array(
4391     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4392     "^PubSub\.com" => ""
4393     ),
4394     "uri" => ""
4395     ),
4396 joku 330 "pubarch" => array(
4397 joku 334 "icon" => "robot",
4398 joku 330 "title" => "PubArchive",
4399     "rule" => array(
4400     "publiclibraryarchive.org" => ""
4401     ),
4402     "uri" => ""
4403     ),
4404 joku 63 "pukiwiki" => array(
4405     "icon" => "pukiwiki",
4406     "title" => "PukiWiki",
4407     "rule" => array(
4408     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4409     ),
4410     "uri" => ""
4411     ),
4412     "pwebotxy" => array(
4413     "icon" => "pwebotxy",
4414     "title" => "PWeBot/X.Y",
4415     "rule" => array(
4416     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4417     ),
4418     "uri" => "http://www.programacionweb.net/robot.php"
4419     ),
4420     "pxys" => array(
4421     "icon" => "robot",
4422     "title" => "PXYS",
4423     "rule" => array(
4424     "^pxys" => ""
4425     ),
4426     "uri" => ""
4427     ),
4428     "qango" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4429     "icon" => "qango",
4430     "title" => "Qango",
4431     "rule" => array(
4432     "^Qango.com" => ""
4433     ),
4434     "uri" => "http://www.qango.com/" // same domain the rule matches - NOTE(review): confirm the site address
4435     ),
4436     "qihoo" => array(
4437     "icon" => "qihoo",
4438     "title" => "Qihoo",
4439     "rule" => array(
4440     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4441     ),
4442     "uri" => "http://www.qihoo.com/"
4443     ),
4444     "qseero" => array(
4445     "icon" => "robot",
4446     "title" => "Qseero",
4447     "rule" => array(
4448     "Qseero v([0-9.]{1,10})" => "\\1"
4449     ),
4450     "uri" => "http://www.q0.com/"
4451     ),
4452     "quantcast" => array(
4453     "icon" => "robot",
4454     "title" => "Quantcast",
4455     "rule" => array(
4456     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4457     ),
4458     "uri" => "http://www.quantcast.com/"
4459     ),
4460     "quepasa" => array(
4461     "icon" => "quepasa",
4462     "title" => "Quepasa",
4463     "rule" => array(
4464     "Quepasa[ \-]?Creep" => ""
4465     ),
4466     "uri" => ""
4467     ),
4468     "questfinder" => array(
4469     "icon" => "robot",
4470     "title" => "QuestFinder",
4471     "rule" => array(
4472     "www\.questfinder\.com" => ""
4473     ),
4474     "uri" => ""
4475     ),
4476 matthys 351 "qwantify" => array(
4477     "icon" => "qwantify",
4478     "title" => "Qwantify",
4479     "rule" => array(
4480     "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4481     ),
4482     "uri" => "https://www.qwant.com/"
4483     ),
4484 joku 63 "qweery" => array(
4485     "icon" => "robot",
4486     "title" => "Qweery",
4487     "rule" => array(
4488     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4489     ),
4490     "uri" => "http://qweerybot.qweery.nl"
4491     ),
4492     "racaicrawler" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4493     "icon" => "robot",
4494     "title" => "RacaiCrawler",
4495     "rule" => array(
4496     "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1" // group 1 = version number
4497     ),
         "uri" => "" // every other entry in this table defines "uri"; keep the shape uniform
4498     ),
4499     "radian6" => array(
4500     "icon" => "robot",
4501     "title" => "Radian6",
4502     "rule" => array(
4503     "www\.radian6\.com" => ""
4504     ),
4505     "uri" => "http://www.radian6.com"
4506     ),
4507 joku 375 "radiofx" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4508     "icon" => "radiofx",
4509     "title" => "Radio.fx",
4510     "rule" => array(
4511     "Radio.fx" => ""
4512     ),
4513     "uri" => "https://de.tobit.software" // TLD is ".software"
4514     ),
4515 joku 63 "rambler" => array(
4516     "icon" => "rambler",
4517     "title" => "Rambler",
4518     "rule" => array(
4519     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4520     ),
4521     "uri" => ""
4522     ),
4523     "ramiba" => array( // robot entry: display icon/title, detection rule(s), homepage uri
4524     "icon" => "robot",
4525 matthys 209 "title" => "Ramiba",
4526 joku 63 "rule" => array(
4527     "^ramiba(-bot)?" => "" // the only group is the optional "-bot" suffix, not a version, so nothing to hand back
4528     ),
4529     "uri" => ""
4530     ),
4531     "rankur" => array(
4532     "icon" => "rankur",
4533     "title" => "Rankur",
4534     "rule" => array(
4535     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4536     ),
4537     "uri" => "http://rankur.com/",
4538     ),
4539 joku 261 "red" => array(
4540     "icon" => "red",
4541     "title" => "RED",
4542     "rule" => array(
4543     "RED[ /]([0-9.]{1,10})" => "\\1"
4544     ),
4545     "uri" => "http://redbot.org/"
4546 joku 181 ),
4547 joku 63 "rediff" => array(
4548     "icon" => "rediff",
4549 matthys 209 "title" => "Rediff",
4550 joku 63 "rule" => array(
4551     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4552     ),
4553     "uri" => "http://www.rediff.com",
4554     ),
4555     "repia" => array(
4556     "icon" => "robot",
4557     "title" => "Repia",
4558     "rule" => array(
4559     "webmaster@repia\.com" => ""
4560     ),
4561     "uri" => ""
4562     ),
4563     "robotgenius" => array(
4564     "icon" => "robot",
4565     "title" => "Robot Genius",
4566     "rule" => array(
4567     "^robotgenius" => ""
4568     ),
4569     "uri" => "http://robotgenius.net",
4570     ),
4571     "robozilla" => array(
4572     "icon" => "robot",
4573     "title" => "Robozilla",
4574     "rule" => array(
4575     "Robozilla" => ""
4576     ),
4577     "uri" => ""
4578     ),
4579 matthys 302 "rogerbot" => array(
4580 matthys 306 "icon" => "moz",
4581     "title" => "Moz Rogerbot",
4582 matthys 302 "rule" => array(
4583     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4584     ),
4585     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4586     ),
4587 joku 63 "rojo" => array(
4588     "icon" => "rojo",
4589     "title" => "Rojo",
4590     "rule" => array(
4591     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4592     ),
4593     "uri" => ""
4594     ),
4595     "rss-atom" => array(
4596     "icon" => "rss",
4597     "title" => "RSS / Atom",
4598     "rule" => array(
4599     "^Apple-PubSub" => "",
4600     "^AppleSyndication" => ""
4601     ),
4602     "uri" => ""
4603     ),
4604     "rssbot" => array(
4605     "icon" => "rss",
4606 matthys 209 "title" => "RSS-bot",
4607 joku 63 "rule" => array(
4608     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4609     ),
4610     "uri" => ""
4611     ),
4612     "rssbandit" => array(
4613     "icon" => "rssbandit",
4614     "title" => "RssBandit",
4615     "rule" => array(
4616     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4617     ),
4618     "uri" => ""
4619     ),
4620     "rssimages" => array(
4621     "icon" => "rss",
4622 matthys 209 "title" => "RssImages",
4623 joku 63 "rule" => array(
4624     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4625     ),
4626     "uri" => ""
4627     ),
4628     "rssmicro" => array(
4629     "icon" => "rssmicro",
4630     "title" => "RSSMicro",
4631     "rule" => array(
4632     "RSSMicro\.com" => ""
4633     ),
4634     "uri" => "http://www.rssmicro.com"
4635     ),
4636     "rssowl" => array(
4637     "icon" => "rssowl",
4638     "title" => "RSSOwl",
4639     "rule" => array(
4640     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4641     ),
4642     "uri" => ""
4643     ),
4644     "rssreader" => array(
4645     "icon" => "rss",
4646     "title" => "RssReader",
4647     "rule" => array(
4648     "RssReader[ /]([0-9.]{1,10})" => "\\1" // group 1 holds the version digits; was "" which discarded the capture
4649     ),
4650     "uri" => ""
4651     ),
4652     "rtgi" => array(
4653     "icon" => "rtgi",
4654 matthys 209 "title" => "Rtgi",
4655 joku 63 "rule" => array(
4656     "RTGI" => ""
4657     ),
4658     "uri" => "http://rtgi.fr/"
4659     ),
4660     "rufusbot" => array(
4661     "icon" => "robot",
4662     "title" => "RufusBot",
4663     "rule" => array(
4664     "RufusBot" => ""
4665     ),
4666     "uri" => ""
4667     ),
4668 matthys 304 "runet" => array(
4669     "icon" => "runet",
4670     "title" => "iTrack RuNet Crawler",
4671     "rule" => array(
4672     "Runet-Research-Crawler" => ""
4673     ),
4674     "uri" => "http://www.itrack.ru/research/cmsrate/"
4675     ),
4676 joku 63 "runnk" => array(
4677     "icon" => "robot",
4678     "title" => "Runnk",
4679     "rule" => array(
4680     "Runnk RSS finder" => ""
4681     ),
4682     "uri" => "http://www.runnk.com/il/law"
4683     ),
4684     "sagool" => array(
4685     "icon" => "robot",
4686     "title" => "Sagool",
4687     "rule" => array(
4688     "MaSagool" => ""
4689     ),
4690     "uri" => "http://sagool.jp/"
4691     ),
4692     "sanszbot" => array(
4693     "icon" => "robot",
4694     "title" => "Sansz",
4695     "rule" => array(
4696     "SanszBot" => ""
4697     ),
4698     "uri" => ""
4699     ),
4700     "saucereader" => array(
4701     "icon" => "saucereader",
4702     "title" => "Sauce Reader",
4703     "rule" => array(
4704     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4705     ),
4706     "uri" => ""
4707     ),
4708     "sbider" => array(
4709     "icon" => "sbider",
4710     "title" => "SBIder",
4711     "rule" => array(
4712     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4713     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4714     ),
4715     "uri" => ""
4716     ),
4717     "scirus" => array(
4718     "icon" => "robot",
4719     "title" => "Scirus",
4720     "rule" => array(
4721     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4722     ),
4723     "uri" => ""
4724     ),
4725     "scoutjet" => array(
4726     "icon" => "scoutjet",
4727     "title" => "ScoutJet",
4728     "rule" => array(
4729     "ScoutJet" => ""
4730     ),
4731     "uri" => "http://www.scoutjet.com/"
4732     ),
4733 joku 261 "scrapy" => array(
4734     "icon" => "scrapy",
4735     "title" => "Scrapy",
4736     "rule" => array(
4737     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4738     ),
4739     "uri" => "http://scrapy.org"
4740     ),
4741 joku 63 "scrubby" => array(
4742     "icon" => "scrubby",
4743     "title" => "Scrubby",
4744     "rule" => array(
4745     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4746     ),
4747     "uri" => ""
4748     ),
4749     "sdm" => array(
4750     "icon" => "sdm",
4751     "title" => "SUN Download Manager",
4752     "rule" => array(
4753     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4754     ),
4755     "uri" => ""
4756     ),
4757     "sealinks" => array(
4758     "icon" => "robot",
4759     "title" => "Sea Links",
4760     "rule" => array(
4761     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4762     ),
4763     "uri" => ""
4764     ),
4765     "search17" => array(
4766     "icon" => "robot",
4767     "title" => "Search 17",
4768     "rule" => array(
4769     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4770     ),
4771     "uri" => "http://www.search17.com/bot.php"
4772     ),
4773     "search2" => array(
4774     "icon" => "search2",
4775     "title" => "Search2.net",
4776     "rule" => array(
4777     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4778     ),
4779     "uri" => "http://search2.net/"
4780     ),
4781     "searchbot" => array(
4782     "icon" => "robot",
4783     "title" => "Searchbot",
4784     "rule" => array(
4785     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4786     ),
4787     "uri" => ""
4788     ),
4789     "searchch" => array(
4790     "icon" => "robot",
4791     "title" => "Search.ch",
4792     "rule" => array(
4793     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4794     ),
4795     "uri" => ""
4796     ),
4797     "searchengineworld" => array(
4798     "icon" => "robot",
4799     "title" => "SearchEngineWorld",
4800     "rule" => array(
4801     "searchengineworld" => ""
4802     ),
4803     "uri" => "http://www.searchengineworld.com/"
4804     ),
4805     "searchhippo" => array(
4806     "icon" => "searchhippo",
4807     "title" => "Searchhippo",
4808     "rule" => array(
4809     "searchhippo" => ""
4810     ),
4811     "uri" => "http://www.searchhippo.com/"
4812     ),
4813     "searchthruus" => array(
4814     "icon" => "robot",
4815     "title" => "SearchThruUs",
4816     "rule" => array(
4817     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4818     ),
4819     "uri" => ""
4820     ),
4821     "securecomputing" => array(
4822     "icon" => "robot",
4823     "title" => "Secure Computing",
4824     "rule" => array(
4825     "securecomputing" => ""
4826     ),
4827     "uri" => ""
4828     ),
4829     "seekport" => array(
4830     "icon" => "seekport",
4831     "title" => "Seekport",
4832     "rule" => array(
4833     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4834     ),
4835     "uri" => ""
4836     ),
4837     "semanticdiscovery" => array(
4838     "icon" => "robot",
4839     "title" => "Semantic Discovery",
4840     "rule" => array(
4841     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4842     ),
4843     "uri" => ""
4844     ),
4845 matthys 319 "semrush" => array(
4846     "icon" => "semrush",
4847     "title" => "SEMrush",
4848     "rule" => array(
4849     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4850     ),
4851     "uri" => "http://www.semrush.com/bot.html"
4852     ),
4853 joku 63 "sengine" => array(
4854     "icon" => "sengine",
4855     "title" => "Sengine",
4856     "rule" => array(
4857     "netEstate NE Crawler" => ""
4858     ),
4859     "uri" => "http://www.sengine.info/"
4860     ),
4861     "sensis" => array(
4862     "icon" => "sensis",
4863     "title" => "Sensis",
4864     "rule" => array(
4865     "^Sensis(.com.au)? Web Crawler" => ""
4866     ),
4867     "uri" => "http://sensis.com.au"
4868     ),
4869     "seokicks" => array(
4870     "icon" => "seokicks",
4871     "title" => "SEOkicks",
4872     "rule" => array(
4873     "SEOkicks-Robot" => ""
4874     ),
4875     "uri" => "http://www.seokicks.de/"
4876     ),
4877     "seoprofiler" => array(
4878     "icon" => "seoprofiler",
4879     "title" => "SEOprofiler",
4880     "rule" => array(
4881     "spbot[ /]([0-9.]{1,10})" => "\\1"
4882     ),
4883     "uri" => "http://www.seoprofiler.com/"
4884     ),
4885     "setooz" => array(
4886     "icon" => "setooz",
4887     "title" => "Setooz",
4888     "rule" => array(
4889     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4890     ),
4891     "uri" => "http://www.setooz.com/oozbot.html"
4892     ),
4893     "seznam" => array(
4894     "icon" => "seznam",
4895     "title" => "Seznam",
4896     "rule" => array(
4897     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4898     "Seznam" => ""
4899     ),
4900     "uri" => "http://www.seznam.cz"
4901     ),
4902     "sharpreader" => array(
4903     "icon" => "sharpreader",
4904     "title" => "SharpReader",
4905     "rule" => array(
4906     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4907     ),
4908     "uri" => ""
4909     ),
4910     "shelob" => array(
4911     "icon" => "shelob",
4912     "title" => "Shelob", // was "Sherlock Spider", which is the title of the separate "sherlockspider" entry
4913     "rule" => array(
4914     "^Shelob" => ""
4915     ),
4916     "uri" => "http://www.gmx.net"
4917     ),
4918     "sherlockspider" => array(
4919     "icon" => "robot",
4920     "title" => "Sherlock Spider",
4921     "rule" => array(
4922     "sherlock_spider" => ""
4923     ),
4924     "uri" => ""
4925     ),
4926     "shim" => array(
4927     "icon" => "robot",
4928     "title" => "Shim Crawler",
4929     "rule" => array(
4930     "shim[ \-]crawler" => ""
4931     ),
4932     "uri" => ""
4933     ),
4934     "shopwiki" => array(
4935     "icon" => "shopwiki",
4936     "title" => "ShopWiki",
4937     "rule" => array(
4938     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4939     ),
4940     "uri" => ""
4941     ),
4942     "shoula" => array(
4943     "icon" => "robot",
4944     "title" => "Shoula",
4945     "rule" => array(
4946     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4947     ),
4948     "uri" => "http://www.shoula.com"
4949     ),
4950     "siege" => array(
4951     "icon" => "robot",
4952     "title" => "Siege",
4953     "rule" => array(
4954     "Siege[ /]([0-9.]{1,10})" => "\\1"
4955     ),
4956     "uri" => ""
4957     ),
4958     "siets" => array(
4959     "icon" => "robot",
4960     "title" => "Siets",
4961     "rule" => array(
4962     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4963     ),
4964     "uri" => ""
4965     ),
4966     "simpy" => array(
4967     "icon" => "simpy",
4968     "title" => "Simpy",
4969     "rule" => array(
4970     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4971     ),
4972     "uri" => ""
4973     ),
4974     "singingfish" => array(
4975     "icon" => "singingfish",
4976     "title" => "SingingFish",
4977     "rule" => array(
4978     "asterias[ /]([0-9.]{1,10})" => "\\1",
4979     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4980     "asterias" => ""
4981     ),
4982     "uri" => ""
4983     ),
4984     "sirketce" => array(
4985     "icon" => "robot",
4986     "title" => "Sirketce",
4987     "rule" => array(
4988     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4989     ),
4990     "uri" => "http://www.sirketce.com/bot.html"
4991     ),
4992     "sirobot" => array(
4993     "icon" => "robot",
4994     "title" => "SiroBot",
4995     "rule" => array(
4996     "sirobot" => ""
4997     ),
4998     "uri" => ""
4999     ),
5000     "sistrix" => array(
5001     "icon" => "sistrix",
5002     "title" => "SISTRIX",
5003     "rule" => array(
5004     "SISTRIX Crawler" => ""
5005     ),
5006     "uri" => "http://crawler.sistrix.net/"
5007     ),
5008     "sitebar" => array(
5009     "icon" => "sitebar",
5010     "title" => "SiteBar",
5011     "rule" => array(
5012     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
5013     ),
5014     "uri" => ""
5015     ),
5016     "sitebot" => array(
5017     "icon" => "sitebot",
5018     "title" => "SiteBot",
5019     "rule" => array(
5020     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
5021     ),
5022     "uri" => "http://www.sitebot.org/robot/"
5023     ),
5024 matthys 273 "siteexplorer" => array(
5025     "icon" => "siteexplorer",
5026     "title" => "SiteExplorer",
5027     "rule" => array(
5028     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5029     ),
5030     "uri" => "http://siteexplorer.info/"
5031     ),
5032 joku 63 "sitesell" => array(
5033     "icon" => "sitesell",
5034     "title" => "SiteSell",
5035     "rule" => array(
5036     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
5037     ),
5038     "uri" => ""
5039     ),
5040     "sitespider" => array(
5041     "icon" => "robot",
5042     "title" => "SiteSpider",
5043     "rule" => array(
5044     "^SiteSpider" => ""
5045     ),
5046     "uri" => ""
5047     ),
5048     "sitesucker" => array(
5049     "icon" => "sitesucker",
5050     "title" => "SiteSucker",
5051     "rule" => array(
5052     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5053     ),
5054     "uri" => "http://www.sitesucker.us/"
5055     ),
5056     "sitidi" => array(
5057     "icon" => "robot",
5058     "title" => "SitiDi",
5059     "rule" => array(
5060     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5061     ),
5062     "uri" => ""
5063     ),
5064 joku 329 "sixy" => array(
5065     "icon" => "robot",
5066     "title" => "Sixy.ch",
5067     "rule" => array(
5068     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5069     ),
5070     "uri" => "http://sixy.ch"
5071     ),
5072 joku 63 "skaffe" => array(
5073     "icon" => "robot",
5074     "title" => "Skaffe",
5075     "rule" => array(
5076     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5077     ),
5078     "uri" => "http://www.skaffe.com"
5079     ),
5080     "skizzle" => array(
5081     "icon" => "skizzle",
5082     "title" => "Skizzle",
5083     "rule" => array(
5084     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5085     ),
5086     "uri" => "http://www.skizzle.com"
5087     ),
5088     "slider" => array(
5089     "icon" => "robot",
5090     "title" => "Slider",
5091     "rule" => array(
5092     "^Slider[ /]([0-9.]{1,10})" => "\\1"
5093     ),
5094     "uri" => ""
5095     ),
5096     "slugch" => array(
5097     "icon" => "robot",
5098 matthys 209 "title" => "Slugch",
5099 joku 63 "rule" => array(
5100     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5101     ),
5102     "uri" => ""
5103     ),
5104     "smartware" => array(
5105     "icon" => "robot",
5106     "title" => "SmartWareSoft",
5107     "rule" => array(
5108     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5109     ),
5110     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5111     ),
5112     "snookit" => array(
5113     "icon" => "snookit",
5114     "title" => "Snookit",
5115     "rule" => array(
5116     "^snookit" => ""
5117     ),
5118     "uri" => "http://www.snookit.com/"
5119     ),
5120     "snoopy" => array(
5121     "icon" => "robot",
5122     "title" => "Snoopy",
5123     "rule" => array(
5124     "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1", // [^0-9]* instead of greedy .+ so group 1 starts at the first digit rather than holding only the last character
5125     "sna-([0-9.]{1,10})" => "\\1"
5126     ),
5127     "uri" => "http://snoopy.sourceforge.net/"
5128     ),
5129     "snyke" => array(
5130     "icon" => "robot",
5131     "title" => "Snyke",
5132     "rule" => array(
5133     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5134     ),
5135     "uri" => "http://www.snyke.com"
5136     ),
5137     "socialradar" => array(
5138     "icon" => "socialradar",
5139     "title" => "Social Radar",
5140     "rule" => array(
5141     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5142     ),
5143     "uri" => "http://infegy.com/"
5144     ),
5145     "soegning" => array(
5146     "icon" => "soegning",
5147 matthys 209 "title" => "Søgning",
5148 joku 63 "rule" => array(
5149     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5150     ),
5151     "uri" => ""
5152     ),
5153     "soft411" => array(
5154     "icon" => "soft411",
5155     "title" => "Soft411",
5156     "rule" => array(
5157     "SOFT411 Directory" => ""
5158     ),
5159     "uri" => ""
5160     ),
5161     "sogou" => array(
5162     "icon" => "sogou",
5163     "title" => "Sogou",
5164     "rule" => array(
5165     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5166     ),
5167     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5168     ),
5169     "sohu" => array(
5170     "icon" => "robot",
5171     "title" => "Sohu",
5172     "rule" => array(
5173     "sohu[ \-](agent|search)" => ""
5174     ),
5175     "uri" => ""
5176     ),
5177     "somewhere" => array(
5178     "icon" => "robot",
5179 matthys 209 "title" => "Somewhere.com",
5180 joku 63 "rule" => array(
5181     "Mozilla\@somewhere\.com" => "" // pattern has no capture group, so there is no \\1 to reference
5182     ),
5183     "uri" => "http://www.somewhere.com/"
5184     ),
5185     "sopheus" => array(
5186     "icon" => "robot",
5187     "title" => "Sopheus",
5188     "rule" => array(
5189     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5190     ),
5191     "uri" => "http://www.thenetplanet.com"
5192     ),
5193     "soso" => array(
5194     "icon" => "soso",
5195     "title" => "Soso",
5196     "rule" => array(
5197     "^Soso(image)?spider" => ""
5198     ),
5199     "uri" => "http://help.soso.com/soso-image-spider.htm"
5200     ),
5201     "souppot" => array(
5202     "icon" => "robot",
5203     "title" => "SoupPot",
5204     "rule" => array(
5205     "SoupPotBot" => ""
5206     ),
5207     "uri" => ""
5208     ),
5209     "specificmedia" => array(
5210     "icon" => "specificmedia",
5211     "title" => "Specific Media",
5212     "rule" => array(
5213     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5214     ),
5215     "uri" => ""
5216     ),
5217     "sphider" => array(
5218     "icon" => "sphider",
5219     "title" => "Sphider",
5220     "rule" => array(
5221     "Sphider" => ""
5222     ),
5223     "uri" => "http://www.sphider.eu"
5224     ),
5225     "spinn3r" => array(
5226     "icon" => "robot",
5227     "title" => "Spinn3r",
5228     "rule" => array(
5229     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5230     ),
5231     "uri" => "http://spinn3r.com/robot"
5232     ),
5233     "sproose" => array(
5234     "icon" => "robot",
5235 matthys 209 "title" => "Sproose",
5236 joku 63 "rule" => array(
5237     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5238     ),
5239     "uri" => "http://www.sproose.com/bot.html"
5240     ),
5241     "spurlbot" => array(
5242     "icon" => "robot",
5243     "title" => "SpurlBot",
5244     "rule" => array(
5245     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5246     ),
5247     "uri" => ""
5248     ),
5249     "stardownloader" => array(
5250     "icon" => "stardownloader",
5251     "title" => "Star Downloader",
5252     "rule" => array(
5253     "^Star Downloader( Pro)?" => ""
5254     ),
5255     "uri" => ""
5256     ),
5257     "steeler" => array(
5258     "icon" => "robot",
5259     "title" => "Steeler",
5260     "rule" => array(
5261     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5262     ),
5263     "uri" => ""
5264     ),
5265     "strategicboard" => array(
5266     "icon" => "strategicboard",
5267     "title" => "Strategic Board",
5268     "rule" => array(
5269     "Strategic Board Bot" => ""
5270     ),
5271     "uri" => "http://www.strategicboard.com"
5272     ),
5273     "suchbaer" => array(
5274     "icon" => "robot",
5275 matthys 209 "title" => "Suchbaer.de",
5276 joku 63 "rule" => array(
5277     "^suchbaer\.de" => ""
5278     ),
5279     "uri" => "http://www.suchbaer.de/"
5280     ),
5281     "suchbot" => array(
5282     "icon" => "robot",
5283 matthys 209 "title" => "Suchbot",
5284 joku 63 "rule" => array(
5285     "^suchbot" => ""
5286     ),
5287     "uri" => ""
5288     ),
5289     "suchende" => array(
5290     "icon" => "suchende",
5291 matthys 209 "title" => "Suchen.de",
5292 joku 63 "rule" => array(
5293     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5294     "^gonzo/([0-9.]{1,10})" => "\\1"
5295     ),
5296     "uri" => "http://www.suchen.de/"
5297     ),
5298     "suchknecht" => array(
5299     "icon" => "robot",
5300     "title" => "Suchknecht",
5301     "rule" => array(
5302     "^Suchknecht.at-Robot" => ""
5303     ),
5304     "uri" => "http://www.suchknecht.at/"
5305     ),
5306     "suchpad" => array(
5307     "icon" => "robot",
5308 matthys 209 "title" => "Suchpad",
5309 joku 63 "rule" => array(
5310     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5311     ),
5312     "uri" => "http://www.suchpad.de"
5313     ),
5314     "sunrise" => array(
5315     "icon" => "sunrise",
5316     "title" => "Sunrise",
5317     "rule" => array(
5318     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5319     ),
5320     "uri" => ""
5321     ),
5322     "superbot" => array(
5323     "icon" => "superbot",
5324     "title" => "SuperBot",
5325     "rule" => array(
5326     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5327     ),
5328     "uri" => ""
5329     ),
5330     "surfcontrol" => array(
5331     "icon" => "robot",
5332     "title" => "SurfControl",
5333     "rule" => array(
5334     "SurfControl" => "",
5335     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5336     ),
5337     "uri" => ""
5338     ),
5339     "surfnet" => array(
5340     "icon" => "robot",
5341     "title" => "SURFnet",
5342     "rule" => array(
5343     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5344     ),
5345     "uri" => ""
5346     ),
5347     "surfsafely" => array(
5348     "icon" => "robot",
5349     "title" => "Surfsafely",
5350     "rule" => array(
5351     "Submission Spider at surfsafely.com" => ""
5352     ),
5353     "uri" => "http://www.surfsafely.com"
5354     ),
5355     "surphace" => array(
5356     "icon" => "spherescout",
5357     "title" => "Surphace",
5358     "rule" => array(
5359     "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; [^0-9]* instead of greedy .+ so group 1 starts at the first digit
5360     "Surphace.+v([0-9.]{1,10})" => "\\1"
5361     ),
5362     "uri" => "http://www.surphace.com"
5363     ),
5364     "surveybot" => array(
5365     "icon" => "surveybot",
5366     "title" => "Whois Survey",
5367     "rule" => array(
5368     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5369     ),
5370     "uri" => ""
5371     ),
5372     "swoogle" => array(
5373     "icon" => "robot",
5374     "title" => "Swoogle",
5375     "rule" => array(
5376     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5377     ),
5378     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5379     ),
5380     "swse" => array(
5381     "icon" => "robot",
5382     "title" => "SWSE",
5383     "rule" => array(
5384     "sw\.deri\.org" => ""
5385     ),
5386     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5387     ),
5388     "swish-e" => array(
5389     "icon" => "swish-e",
5390     "title" => "Swish-e",
5391     "rule" => array(
5392     "^swish-e" => ""
5393     ),
5394     "uri" => "http://swish-e.org/"
5395     ),
5396     "sygol" => array(
5397     "icon" => "sygol",
5398     "title" => "Sygol",
5399     "rule" => array(
5400     "www.sygol.(com|net)" => ""
5401     ),
5402     "uri" => "http://www.sygol.com"
5403     ),
5404     "syllabs" => array(
5405     "icon" => "syllabs",
5406     "title" => "Syllabs",
5407     "rule" => array(
5408     "Focal[-]([0-9.]{1,10})" => "\\1"
5409     ),
5410     "uri" => "http://www.syllabs.com/crawler.html"
5411     ),
5412     "synapse" => array(
5413     "icon" => "robot",
5414     "title" => "Synapse",
5415     "rule" => array(
5416     " Synapse\)" => ""
5417     ),
5418     "uri" => "http://ws.apache.org/synapse/"
5419     ),
5420     "sync2it" => array(
5421     "icon" => "robot",
5422 matthys 209 "title" => "Sync2it",
5423 joku 63 "rule" => array(
5424     "^\!Susie" => ""
5425     ),
5426     "uri" => "http://www.sync2it.com/bms/susie.php"
5427     ),
5428     "syncit" => array(
5429     "icon" => "robot",
5430 matthys 209 "title" => "Syncit",
5431 joku 63 "rule" => array(
5432     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5433     ),
5434     "uri" => "http://www.syncit.com/"
5435     ),
5436     "syndic8" => array(
5437     "icon" => "syndic8",
5438     "title" => "Syndic8",
5439     "rule" => array(
5440     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5441     ),
5442     "uri" => "http://www.syndic8.com/"
5443     ),
5444     "syndicatie" => array(
5445     "icon" => "robot",
5446     "title" => "Syndicatie.nl",
5447     "rule" => array(
5448     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5449     "Syndicatie\.nl robot;" => ""
5450     ),
5451     "uri" => ""
5452     ),
5453     "synomia" => array(
5454     "icon" => "robot",
5455     "title" => "Synomia",
5456     "rule" => array(
5457     "^SynoBot" => ""
5458     ),
5459     "uri" => ""
5460     ),
5461     "synoo" => array(
5462     "icon" => "robot",
5463     "title" => "SynooBot",
5464     "rule" => array(
5465     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5466     ),
5467     "uri" => ""
5468     ),
5469     "szukacz" => array(
5470     "icon" => "szukacz",
5471     "title" => "Szukacz",
5472     "rule" => array(
5473     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5474     ),
5475     "uri" => ""
5476     ),
5477     "tagoo" => array(
5478     "icon" => "tagoobot",
5479     "title" => "Tagoo",
5480     "rule" => array(
5481     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5482     ),
5483     "uri" => "http://www.tagoo.ru"
5484     ),
5485     "tagword" => array(
5486     "icon" => "tagword",
5487     "title" => "Tagword",
5488     "rule" => array(
5489     "^Tagword" => ""
5490     ),
5491     "uri" => "http://tagword.com/dmoz_survey.php"
5492     ),
5493     "trailfire" => array(
5494     "icon" => "trailfire",
5495     "title" => "Trailfire",
5496     "rule" => array(
5497     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5498     ),
5499     "uri" => "http://trailfire.com"
5500     ),
5501     "tamu" => array(
5502     "icon" => "tamu",
5503     "title" => "Tamu Crawler",
5504     "rule" => array(
5505     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5506     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5507     ),
5508     "uri" => "http://irl.cs.tamu.edu/crawler/"
5509     ),
5510     "taptubot" => array(
5511     "icon" => "taptubot",
5512     "title" => "Taptu",
5513     "rule" => array(
5514     "taptubot" => ""
5515     ),
5516     "uri" => "http://www.taptu.com/corp/taptubot"
5517     ),
5518     "targetseek" => array(
5519     "icon" => "robot",
5520     "title" => "TargetSeek",
5521     "rule" => array(
5522     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5523     ),
5524     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5525     ),
5526     "taw" => array(
5527     "icon" => "taw",
5528     "title" => "TAW",
5529     "rule" => array(
5530     "TAW[ /]([0-9.]{1,10})" => "\\1"
5531     ),
5532     "uri" => "http://www.tawdis.net"
5533     ),
5534     "tcd" => array(
5535     "icon" => "tcd",
5536     "title" => "Trinity College Dublin",
5537     "rule" => array(
5538     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5539     ),
5540     "uri" => "http://www.tcd.ie"
5541     ),
5542     "technorati" => array(
5543     "icon" => "technorati",
5544     "title" => "Technorati",
5545     "rule" => array(
5546     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5547     ),
5548     "uri" => ""
5549     ),
5550     "teleport" => array(
5551     "icon" => "teleport",
5552     "title" => "Teleport",
5553     "rule" => array(
5554     "Teleport[ \-]?Pro" => ""
5555     ),
5556     "uri" => ""
5557     ),
5558     "terrar" => array(
5559     "icon" => "robot",
5560     "title" => "Terrar",
5561     "rule" => array(
5562     "^Fresh Search :: Terrar" => ""
5563     ),
5564     "uri" => ""
5565     ),
5566     "theophrastus" => array(
5567     "icon" => "robot",
5568     "title" => "Theophrastus",
5569     "rule" => array(
5570     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5571     ),
5572     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5573     ),
5574     "thumbnailscz" => array(
5575     "icon" => "robot",
5576 matthys 209 "title" => "Thumbnails.cz",
5577 joku 63 "rule" => array(
5578     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5579     ),
5580     "uri" => ""
5581     ),
5582     "thumbshot" => array(
5583     "icon" => "robot",
5584 matthys 209 "title" => "Thumbshots",
5585 joku 63 "rule" => array(
5586     "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is the "Version: "/"v" prefix; the version digits are group 2
5587     "^thumbshots-de" => ""
5588     ),
5589     "uri" => "http://www.thumbshots.de"
5590     ),
5591     "thunderstone" => array(
5592     "icon" => "thunderstone",
5593     "title" => "Thunderstone",
5594     "rule" => array(
5595     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5596     "search.thunderstone.com" => ""
5597     ),
5598     "uri" => "http://search.thunderstone.com/"
5599     ),
5600     "timbobot" => array(
5601     "icon" => "robot",
5602 matthys 209 "title" => "TimboBot",
5603 joku 63 "rule" => array(
5604     "timboBot" => ""
5605     ),
5606     "uri" => ""
5607     ),
5608     "topsy" => array(
5609     "icon" => "topsy",
5610     "title" => "Topsy",
5611     "rule" => array(
5612     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5613     ),
5614     "uri" => "http://labs.topsy.com/butterfly.html"
5615     ),
5616     "trayce" => array(
5617     "icon" => "robot",
5618 matthys 209 "title" => "Trayce",
5619 joku 63 "rule" => array(
5620     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5621     ),
5622     "uri" => ""
5623     ),
5624     "tricus" => array(
5625     "icon" => "robot",
5626     "title" => "Tricus",
5627     "rule" => array(
5628     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5629     ),
5630     "uri" => ""
5631     ),
5632     "topicblogs" => array(
5633     "icon" => "robot",
5634     "title" => "Topicblogs",
5635     "rule" => array(
5636     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5637     ),
5638     "uri" => ""
5639     ),
5640     "touche" => array(
5641     "icon" => "touche",
5642 matthys 209 "title" => "Touché",
5643 joku 63 "rule" => array(
5644     "^Touche" => ""
5645     ),
5646     "uri" => "http://touche.com.ve"
5647     ),
5648     "tuezilla" => array(
5649     "icon" => "robot",
5650 matthys 209 "title" => "TÜzilla", // repaired double-encoded UTF-8: the U-umlaut had been stored as two characters
5651 joku 63 "rule" => array(
5652     "tuezilla.de" => ""
5653     ),
5654     "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5655     ),
5656     "turnitin" => array(
5657     "icon" => "turnitin",
5658     "title" => "Turnitin",
5659     "rule" => array(
5660     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5661     ),
5662     "uri" => ""
5663     ),
5664     "tutorgig" => array(
5665     "icon" => "robot",
5666     "title" => "TutorGig",
5667     "rule" => array(
5668     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5669     ),
5670     "uri" => ""
5671     ),
5672     "twiceler" => array(
5673     "icon" => "cuill",
5674 matthys 209 "title" => "Cuill",
5675 joku 63 "rule" => array(
5676     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5677     "Twiceler" => ""
5678     ),
5679     "uri" => "http://www.cuill.com/twiceler/robot.html"
5680     ),
5681     "twingly" => array(
5682     "icon" => "twingly",
5683     "title" => "Twingly",
5684     "rule" => array(
5685     "Twingly Recon" => ""
5686     ),
5687     "uri" => "http://www.twingly.com/"
5688     ),
5689 matthys 320 "twitter" => array(
5690     "icon" => "twitter",
5691     "title" => "Twitter",
5692     "rule" => array(
5693     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5694     ),
5695     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5696     ),
5697 joku 63 "typepad" => array(
5698     "icon" => "typepad",
5699     "title" => "TypePad",
5700     "rule" => array(
5701     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5702     ),
5703     "uri" => ""
5704     ),
5705     "udmsearch" => array(
5706     "icon" => "robot",
5707     "title" => "UdmSearch",
5708     "rule" => array(
5709     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5710     ),
5711     "uri" => ""
5712     ),
5713     "ukwizz" => array(
5714     "icon" => "ukwizz",
5715     "title" => "UKWizz",
5716     "rule" => array(
5717     "^Mackster.*ukwizz" => ""
5718     ),
5719     "uri" => "http://www.ukwizz.com"
5720     ),
5721     "ultraseek" => array(
5722     "icon" => "robot",
5723     "title" => "Ultraseek",
5724     "rule" => array(
5725     "Ultraseek" => ""
5726     ),
5727     "uri" => ""
5728     ),
5729     "ultraspider" => array(
5730     "icon" => "robot",
5731     "title" => "UltraSpider",
5732     "rule" => array(
5733     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5734     ),
5735     "uri" => "http://www.search.ch"
5736     ),
5737     "umai" => array(
5738     "icon" => "robot",
5739 matthys 209 "title" => "Umai",
5740 joku 63 "rule" => array(
5741     "umai[/ ]([0-9.]{1,10})" => "\\1"
5742     ),
5743     "uri" => ""
5744     ),
5745     "unchaos" => array(
5746     "icon" => "robot",
5747     "title" => "Unchaos",
5748     "rule" => array(
5749     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5750     "unchaos" => ""
5751     ),
5752     "uri" => ""
5753     ),
5754     "unido" => array(
5755     "icon" => "robot",
5756 matthys 209 "title" => "UNIdo",
5757 joku 63 "rule" => array(
5758     "^unido-bot" => ""
5759     ),
5760     "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5761     ),
5762     "updated" => array(
5763     "icon" => "robot",
5764     "title" => "Updated",
5765     "rule" => array(
5766     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5767     ),
5768     "uri" => ""
5769     ),
5770     "uptimebot" => array(
5771     "icon" => "robot",
5772     "title" => "UptimeBot",
5773     "rule" => array(
5774     "^UptimeBot" => ""
5775     ),
5776     "uri" => "http://www.uptimebot.com/"
5777     ),
5778     "urifetch" => array(
5779     "icon" => "robot",
5780     "title" => "URI::Fetch",
5781     "rule" => array(
5782     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5783     ),
5784     "uri" => ""
5785     ),
5786     "urlbase" => array(
5787     "icon" => "robot",
5788     "title" => "URLBase",
5789     "rule" => array(
5790     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5791     ),
5792     "uri" => ""
5793     ),
5794     "urlblaze" => array(
5795     "icon" => "robot",
5796     "title" => "URLBlaze",
5797     "rule" => array(
5798     "^URLBlaze" => ""
5799     ),
5800     "uri" => ""
5801     ),
5802     "urlcontr" => array(
5803     "icon" => "robot",
5804     "title" => "MS URL Control",
5805     "rule" => array(
5806     "Microsoft URL[ \-]?Control" => ""
5807     ),
5808     "uri" => ""
5809     ),
5810     "urlgetfile" => array(
5811     "icon" => "robot",
5812     "title" => "URLGetFile",
5813     "rule" => array(
5814     "^URLGetFile" => ""
5815     ),
5816     "uri" => ""
5817     ),
5818     "urlscope" => array(
5819     "icon" => "robot",
5820     "title" => "UrlScope",
5821     "rule" => array(
5822     "UrlScope" => ""
5823     ),
5824     "uri" => ""
5825     ),
5826     "urltrends" => array(
5827     "icon" => "urltrends",
5828 matthys 209 "title" => "UrlTrends",
5829 joku 63 "rule" => array(
5830     "Snappy/([0-9.]{1,10})" => "\\1",
5831     ),
5832     "uri" => ""
5833     ),
5834     "usww" => array(
5835     "icon" => "usww",
5836 matthys 209 "title" => "USWW",
5837 joku 63 "rule" => array(
5838     "usww\.com" => "",
5839     "Mozilla/5\.0 URL-Spider" => ""
5840     ),
5841     "uri" => "http://www.usww.com/"
5842     ),
5843     "usyd" => array(
5844     "icon" => "robot",
5845     "title" => "USyd-NLP-Spider",
5846     "rule" => array(
5847     "^USyd-NLP-Spider" => ""
5848     ),
5849     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5850     ),
5851     "vagabondo" => array(
5852     "icon" => "wiseguys",
5853     "title" => "WiseGuys",
5854     "rule" => array(
5855     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5856     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5857     ),
5858     "uri" => ""
5859     ),
5860     "unicorn" => array(
5861     "icon" => "w3c",
5862     "title" => "W3C Unicorn",
5863     "rule" => array(
5864     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5865     ),
5866     "uri" => "http://validator.w3.org/unicorn/"
5867     ),
5868     "validator" => array(
5869     "icon" => "w3c",
5870     "title" => "W3C Validator",
5871     "rule" => array(
5872     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5873     ),
5874     "uri" => "http://validator.w3.org/"
5875     ),
5876     "validator.nu" => array(
5877     "icon" => "validatornu",
5878     "title" => "Validator.nu",
5879     "rule" => array(
5880     "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5881     "^Validator.nu/LV" => ""
5882     ),
5883     "uri" => "http://validator.nu/"
5884     ),
5885     "verity" => array(
5886     "icon" => "robot",
5887     "title" => "Verity",
5888     "rule" => array(
5889     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5890     "^vspider" => ""
5891     ),
5892     "uri" => "http://www.verity.com/"
5893     ),
5894     "versionsproject" => array(
5895     "icon" => "robot",
5896     "title" => "Versions-project",
5897     "rule" => array(
5898     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5899     ),
5900     "uri" => "http://www.versions-project.org/"
5901     ),
5902     "verticalmatch" => array(
5903     "icon" => "robot",
5904     "title" => "VerticalMatch",
5905     "rule" => array(
5906     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5907     ),
5908     "uri" => "http://www.VerticalMatch.com/"
5909     ),
5910     "verzamelgids" => array(
5911     "icon" => "robot",
5912     "title" => "Verzamelgids",
5913     "rule" => array(
5914     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5915     ),
5916     "uri" => "http://www.verzamelgids.nl/"
5917     ),
5918     "vestris" => array(
5919     "icon" => "vestris",
5920     "title" => "Vestris",
5921     "rule" => array(
5922     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5923     ),
5924     "uri" => "http://alkaline.vestris.com/"
5925     ),
5926     "vindex" => array(
5927     "icon" => "vindex",
5928     "title" => "Vindex",
5929     "rule" => array(
5930     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5931     ),
5932     "uri" => ""
5933     ),
5934     "visvo" => array(
5935     "icon" => "robot",
5936     "title" => "Visvo",
5937     "rule" => array(
5938     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5939     ),
5940     "uri" => "http://www.visvo.com"
5941     ),
5942     "voila" => array(
5943     "icon" => "voila",
5944     "title" => "Voila",
5945     "rule" => array(
5946     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5947     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5948     ),
5949     "uri" => ""
5950     ),
5951     "vonna" => array(
5952     "icon" => "robot",
5953     "title" => "Vonna",
5954     "rule" => array(
5955     "Vonna.com b o t" => ""
5956     ),
5957     "uri" => ""
5958     ),
5959     "vortex" => array(
5960     "icon" => "robot",
5961     "title" => "Vortex",
5962     "rule" => array(
5963     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5964     ),
5965     "uri" => "http://marty.anstey.ca/robots/vortex/"
5966     ),
5967     "w3sitesearch" => array(
5968     "icon" => "w3sitesearch",
5969     "title" => "W3SiteSearch",
5970     "rule" => array(
5971     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5972     ),
5973     "uri" => "http://www.w3sitesearch.de"
5974     ),
5975     "wagger" => array(
5976     "icon" => "robot",
5977     "title" => "Wagger",
5978     "rule" => array(
5979     "^Waggr" => ""
5980     ),
5981     "uri" => "http://www.waggr.com/"
5982     ),
5983     "wanadoo" => array(
5984     "icon" => "robot",
5985     "title" => "Wanadoo",
5986     "rule" => array(
5987     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5988     ),
5989     "uri" => "http://www.wanadoo.fr/"
5990     ),
5991     "wapalizer" => array(
5992     "icon" => "robot",
5993     "title" => "Wapalizer",
5994     "rule" => array(
5995     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5996     ),
5997     "uri" => "http://www.wapdrive.com/"
5998     ),
5999     "watson" => array(
6000     "icon" => "addy",
6001     "title" => "Dr.Watson",
6002     "rule" => array(
6003     "Watson[ /]([0-9.]{1,10})" => "\\1",
6004     "watson\.addy\.com" => ""
6005     ),
6006     "uri" => ""
6007     ),
6008     "wavefire" => array(
6009     "icon" => "robot",
6010     "title" => "Wavefire",
6011     "rule" => array(
6012     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
6013     ),
6014     "uri" => ""
6015     ),
6016     "waypath" => array(
6017     "icon" => "waypath",
6018     "title" => "Waypath",
6019     "rule" => array(
6020     "Waypath[ \-]?Scout" => "",
6021     "Waypath (development )?crawler" => ""
6022     ),
6023     "uri" => ""
6024     ),
6025     "wauuu" => array(
6026     "icon" => "wauuu",
6027     "title" => "Wauuu",
6028     "rule" => array(
6029     "Wauuu[/ ]([0-9.]{1,10})" => "\\1"
6030     ),
6031     "uri" => "http://www.wauuu.com"
6032     ),
6033     "wdg" => array(
6034     "icon" => "wdg",
6035     "title" => "WDG Validator",
6036     "rule" => array(
6037     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6038     ),
6039     "uri" => "http://www.htmlhelp.com/tools/validator/"
6040     ),
6041     "webagogo" => array(
6042     "icon" => "webagogo",
6043     "title" => "Webagogo",
6044     "rule" => array(
6045     "^Webagogo" => ""
6046     ),
6047     "uri" => "http://www.webagogo.be/"
6048     ),
6049     "webalta" => array(
6050     "icon" => "webalta",
6051     "title" => "WebAlta",
6052     "rule" => array(
6053     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6054     ),
6055     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6056     ),
6057     "webdigity" => array(
6058     "icon" => "robot",
6059     "title" => "Webdigity Whois Service",
6060     "rule" => array(
6061     "^webdigity whois service" => ""
6062     ),
6063     "uri" => "http://www.webdigity.com/ws"
6064     ),
6065     "webelixir" => array(
6066     "icon" => "webelixir",
6067     "title" => "Webelixir",
6068     "rule" => array(
6069     "^webelixir" => ""
6070     ),
6071     "uri" => "http://www.webelixir.net/"
6072     ),
6073     "webbotru" => array(
6074     "icon" => "robot",
6075     "title" => "Webbot.ru",
6076     "rule" => array(
6077     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6078     ),
6079     "uri" => "http://www.webbot.ru/bot.html"
6080     ),
6081     "webcapture" => array(
6082     "icon" => "robot",
6083     "title" => "WebCapture",
6084     "rule" => array(
6085     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6086     ),
6087     "uri" => ""
6088     ),
6089     "webcollage" => array(
6090     "icon" => "robot",
6091     "title" => "Webcollage",
6092     "rule" => array(
6093     "webcollage" => ""
6094     ),
6095     "uri" => ""
6096     ),
6097     "webcopier" => array(
6098     "icon" => "webcopier",
6099     "title" => "WebCopier",
6100     "rule" => array(
6101     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6102     ),
6103     "uri" => ""
6104     ),
6105     "webcorp" => array(
6106     "icon" => "webcorp",
6107     "title" => "WebCorp",
6108     "rule" => array(
6109     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6110     ),
6111     "uri" => "http://www.webcorp.org.uk/"
6112     ),
6113     "webcrawl" => array(
6114     "icon" => "robot",
6115     "title" => "WebCrawl",
6116     "rule" => array(
6117     "webcrawl\.net" => ""
6118     ),
6119     "uri" => ""
6120     ),
6121     "webdownloader" => array(
6122     "icon" => "robot",
6123     "title" => "Web Downloader",
6124     "rule" => array(
6125     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6126     ),
6127     "uri" => ""
6128     ),
6129     "webfetch" => array(
6130     "icon" => "robot",
6131 matthys 209 "title" => "WebFetch",
6132 joku 63 "rule" => array(
6133     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6134     ),
6135     "uri" => ""
6136     ),
6137     "webfind" => array(
6138     "icon" => "robot",
6139 matthys 209 "title" => "WebFind",
6140 joku 63 "rule" => array(
6141     "^WebFindBot" => ""
6142     ),
6143     "uri" => "http://www.web-find.com"
6144     ),
6145     "webglimpse" => array(
6146     "icon" => "robot",
6147     "title" => "Webglimpse",
6148     "rule" => array(
6149     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6150     ),
6151     "uri" => "http://webglimpse.net"
6152     ),
6153     "webgobbler" => array(
6154     "icon" => "robot",
6155     "title" => "webGobbler",
6156     "rule" => array(
6157     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6158     ),
6159     "uri" => ""
6160     ),
6161     "webimages" => array(
6162     "icon" => "webimages",
6163     "title" => "WebImages",
6164     "rule" => array(
6165     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6166     ),
6167     "uri" => "http://herbert.groot.jebbink.nl/"
6168     ),
6169     "weblight" => array(
6170     "icon" => "robot",
6171     "title" => "WebLight",
6172     "rule" => array(
6173     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6174     ),
6175     "uri" => "http://www.illumit.com/Products/weblight/"
6176     ),
6177     "weblinks" => array(
6178     "icon" => "robot",
6179     "title" => "WebLink's",
6180     "rule" => array(
6181     "^Weblink.s checker" => ""
6182     ),
6183     "uri" => ""
6184     ),
6185     "webmeasurement" => array(
6186     "icon" => "robot",
6187     "title" => "Webmeasurement",
6188     "rule" => array(
6189     "^webmeasurement-bot" => ""
6190     ),
6191     "uri" => "http://rvs.informatik.uni-leipzig.de"
6192     ),
6193     "webminer" => array(
6194     "icon" => "robot",
6195     "title" => "WebMiner",
6196     "rule" => array(
6197     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6198     ),
6199     "uri" => ""
6200     ),
6201     "webmin" => array(
6202     "icon" => "webmin",
6203     "title" => "Webmin",
6204     "rule" => array(
6205     "^webmin" => ""
6206     ),
6207     "uri" => ""
6208     ),
6209     "webmon" => array(
6210     "icon" => "webmon",
6211     "title" => "Webmon",
6212     "rule" => array(
6213     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6214     ),
6215     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6216     ),
6217     "webox" => array(
6218     "icon" => "robot",
6219     "title" => "WeBoX",
6220     "rule" => array(
6221     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6222     ),
6223     "uri" => ""
6224     ),
6225     "webpatrol" => array(
6226     "icon" => "webpatrol",
6227     "title" => "WebPatrol",
6228     "rule" => array(
6229     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6230     ),
6231     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6232     ),
6233     "webpix" => array(
6234     "icon" => "webpix",
6235     "title" => "WebPix",
6236     "rule" => array(
6237     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6238     ),
6239     "uri" => ""
6240     ),
6241     "webrace" => array(
6242     "icon" => "robot",
6243     "title" => "WebRACE",
6244     "rule" => array(
6245     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6246     ),
6247     "uri" => ""
6248     ),
6249     "webreaper" => array(
6250     "icon" => "webreaper",
6251     "title" => "WebReaper",
6252     "rule" => array(
6253     "^WebReaper " => ""
6254     ),
6255     "uri" => "http://www.webreaper.net/"
6256     ),
6257     "webresult" => array(
6258     "icon" => "robot",
6259     "title" => "Webresult",
6260     "rule" => array(
6261     "Der webresult\.de Robot" => ""
6262     ),
6263     "uri" => ""
6264     ),
6265     "webring" => array(
6266     "icon" => "robot",
6267     "title" => "Webring Checker",
6268     "rule" => array(
6269     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6270     ),
6271     "uri" => ""
6272     ),
6273     "webripper" => array(
6274     "icon" => "webripper",
6275     "title" => "WebRipper",
6276     "rule" => array(
6277     "^WebRipper" => ""
6278     ),
6279     "uri" => "http://calluna-software.com"
6280     ),
6281     "webscaled" => array(
6282     "icon" => "webscaled",
6283     "title" => "Webscaled",
6284     "rule" => array(
6285     "Swarm" => ""
6286     ),
6287     "uri" => "http://webscaled.com/"
6288     ),
6289     "websearchau" => array(
6290     "icon" => "websearchau",
6291     "title" => "WebSearch.COM.AU",
6292     "rule" => array(
6293     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6294     ),
6295     "uri" => "http://WebSearch.com.au/"
6296     ),
6297     "websearchbench" => array(
6298     "icon" => "robot",
6299     "title" => "WebSearchBench",
6300     "rule" => array(
6301     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6302     ),
6303     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6304     ),
6305     "websense" => array(
6306     "icon" => "websense",
6307     "title" => "Websense",
6308     "rule" => array(
6309     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6310     ),
6311     "uri" => ""
6312     ),
6313     "websiteshadow" => array(
6314     "icon" => "websiteshadow",
6315     "title" => "Websiteshadow",
6316     "rule" => array(
6317     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6318     ),
6319     "uri" => "http://websiteshadow.com"
6320     ),
6321     "websiteworth" => array(
6322     "icon" => "robot",
6323     "title" => "WebsiteWorth",
6324     "rule" => array(
6325     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6326     ),
6327     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6328     ),
6329     "websquash" => array(
6330     "icon" => "websquash",
6331     "title" => "Websquash",
6332     "rule" => array(
6333     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6334     ),
6335     "uri" => ""
6336     ),
6337     "webstripper" => array(
6338     "icon" => "robot",
6339     "title" => "WebStripper",
6340     "rule" => array(
6341     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6342     ),
6343     "uri" => ""
6344     ),
6345     "webzip" => array(
6346     "icon" => "webzip",
6347     "title" => "WebZIP",
6348     "rule" => array(
6349     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6350     ),
6351     "uri" => ""
6352     ),
6353     "wep" => array(
6354     "icon" => "robot",
6355     "title" => "WEP Search",
6356     "rule" => array(
6357     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6358     ),
6359     "uri" => ""
6360     ),
6361     "westwind" => array(
6362     "icon" => "robot",
6363     "title" => "West Wind Internet Protocols",
6364     "rule" => array(
6365     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6366     ),
6367     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6368     ),
6369     "wget" => array(
6370     "icon" => "wget",
6371     "title" => "Wget",
6372     "rule" => array(
6373 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6374     "Wget" => ""
6375 joku 63 ),
6376     "uri" => ""
6377     ),
6378     "whizbang" => array(
6379     "icon" => "whizbang",
6380     "title" => "WhizBang",
6381     "rule" => array(
6382     "WhizBang" => ""
6383     ),
6384     "uri" => "http://www.whizbang.com/crawler/"
6385     ),
6386     "whois" => array(
6387     "icon" => "whois",
6388     "title" => "Who.is",
6389     "rule" => array(
6390     "Who.is Bot" => ""
6391     ),
6392     "uri" => "http://www.who.is/"
6393     ),
6394     "wikiwix" => array(
6395     "icon" => "wikiwix",
6396     "title" => "Wikiwix",
6397     "rule" => array(
6398     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6399     ),
6400     "uri" => "http://www.wikiwix.com/"
6401     ),
6402     "wingflyer" => array(
6403     "icon" => "robot",
6404     "title" => "WingFlyer",
6405     "rule" => array(
6406     "^WebFetch" => ""
6407     ),
6408     "uri" => "http://www.wingflyer.com/"
6409     ),
6410     "wininet" => array(
6411     "icon" => "robot",
6412     "title" => "WinInet",
6413     "rule" => array(
6414     "TeamSoft WinInet Component" => ""
6415     ),
6416     "uri" => "http://www.winsoft.sk/wininet.htm"
6417     ),
6418     "winhttp" => array(
6419     "icon" => "robot",
6420     "title" => "WinHTTP",
6421     "rule" => array(
6422     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6423     ),
6424     "uri" => ""
6425     ),
6426     "wire" => array(
6427     "icon" => "robot",
6428     "title" => "WIRE",
6429     "rule" => array(
6430     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6431     ),
6432     "uri" => ""
6433     ),
6434     "wmp" => array(
6435     "icon" => "robot",
6436     "title" => "WMP",
6437     "rule" => array(
6438     "^WMP" => ""
6439     ),
6440     "uri" => ""
6441     ),
6442     "woozweb" => array(
6443     "icon" => "woozweb",
6444     "title" => "Woozweb",
6445     "rule" => array(
6446     "woozweb" => ""
6447     ),
6448     "uri" => "http://www.woozweb.com/"
6449     ),
6450     "wordchamp" => array(
6451     "icon" => "robot",
6452     "title" => "WordChamp",
6453     "rule" => array(
6454     "^WordChampBot" => ""
6455     ),
6456     "uri" => "http://www.wordchamp.com/"
6457     ),
6458     "wordpress" => array(
6459     "icon" => "wordpress",
6460     "title" => "WordPress",
6461     "rule" => array(
6462     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6463     ),
6464     "uri" => ""
6465     ),
6466     "worio" => array(
6467     "icon" => "worio",
6468     "title" => "Worio",
6469     "rule" => array(
6470     "woriobot" => ""
6471     ),
6472     "uri" => "http://worio.com/"
6473     ),
6474     "worldlight" => array(
6475     "icon" => "worldlight",
6476     "title" => "WorldLight",
6477     "rule" => array(
6478     "^WorldLight" => ""
6479     ),
6480     "uri" => ""
6481     ),
6482     "worqmada" => array(
6483     "icon" => "robot",
6484     "title" => "WorQmada",
6485     "rule" => array(
6486     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6487     ),
6488     "uri" => ""
6489     ),
6490     "wotbox" => array(
6491     "icon" => "wotbox",
6492     "title" => "Wotbox",
6493     "rule" => array(
6494     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6495     ),
6496     "uri" => ""
6497     ),
6498     "wp" => array(
6499     "icon" => "wp",
6500     "title" => "Wirtualna Polska",
6501     "rule" => array(
6502     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6503     ),
6504     "uri" => "http://wp.pl"
6505     ),
6506     "wsb" => array(
6507     "icon" => "robot",
6508     "title" => "WebSearchBench",
6509     "rule" => array(
6510     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6511     "WSB " => ""
6512     ),
6513     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6514     ),
6515     "wume" => array(
6516     "icon" => "robot",
6517     "title" => "WUME Lab's",
6518     "rule" => array(
6519     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6520     ),
6521     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6522     ),
6523     "wusage" => array(
6524     "icon" => "wusage",
6525     "title" => "Wusage",
6526     "rule" => array(
6527     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6528     ),
6529     "uri" => "http://www.boutell.com/wusage/"
6530     ),
6531     "wwgrapevine" => array(
6532     "icon" => "wwgrapevine",
6533     "title" => "WWgrapevine",
6534     "rule" => array(
6535     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6536     ),
6537     "uri" => ""
6538     ),
6539     "wws" => array(
6540     "icon" => "robot",
6541     "title" => "WWSBOT",
6542     "rule" => array(
6543     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6544     ),
6545     "uri" => "http://www.analyzer.nu"
6546     ),
6547     "www4mail" => array(
6548     "icon" => "robot",
6549 matthys 209 "title" => "WWW4mail",
6550 joku 63 "rule" => array(
6551     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6552     ),
6553     "uri" => "http://www.www4mail.org/"
6554     ),
6555     "wwwc" => array(
6556     "icon" => "wwwc",
6557     "title" => "WWWC",
6558     "rule" => array(
6559     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6560     ),
6561     "uri" => ""
6562     ),
6563     "wwwd" => array(
6564     "icon" => "robot",
6565     "title" => "WWWD",
6566     "rule" => array(
6567     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6568     ),
6569     "uri" => ""
6570     ),
6571     "wwweasel" => array(
6572     "icon" => "wwweasel",
6573     "title" => "WWWeasel",
6574     "rule" => array(
6575     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6576     ),
6577     "uri" => ""
6578     ),
6579     "wwwfi" => array(
6580     "icon" => "wwwfi",
6581     "title" => "www.fi",
6582     "rule" => array(
6583     "www\.fi crawler" => ""
6584     ),
6585     "uri" => "http://www.fi/"
6586     ),
6587     "wwwmechanize" => array(
6588     "icon" => "robot",
6589     "title" => "WWW-Mechanize",
6590     "rule" => array(
6591     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6592     ),
6593     "uri" => ""
6594     ),
6595     "wwwoffle" => array(
6596     "icon" => "robot",
6597     "title" => "WWWoffle",
6598     "rule" => array(
6599     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6600     ),
6601     "uri" => ""
6602     ),
6603     "wwwster" => array(
6604     "icon" => "robot",
6605     "title" => "WWWster",
6606     "rule" => array(
6607     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6608     ),
6609     "uri" => ""
6610     ),
6611     "wysigot" => array(
6612     "icon" => "wysigot",
6613     "title" => "Wysigot",
6614     "rule" => array(
6615     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6616     ),
6617     "uri" => ""
6618     ),
6619     "xaldon" => array(
6620     "icon" => "xaldon",
6621     "title" => "Xaldon",
6622     "rule" => array(
6623     "Xaldon WebSpider" => ""
6624     ),
6625     "uri" => "http://www.xaldon.de/"
6626     ),
6627     "xenu" => array(
6628     "icon" => "xenu",
6629     "title" => "Xenu Link Sleuth",
6630     "rule" => array(
6631     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6632     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2",
6633     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6634     ),
6635     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6636     ),
6637     "xerka" => array(
6638     "icon" => "xerka",
6639     "title" => "Xerka",
6640     "rule" => array(
6641     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6642     ),
6643     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6644     ),
6645     "xirq" => array(
6646     "icon" => "robot",
6647     "title" => "XIRQ",
6648     "rule" => array(
6649     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6650     ),
6651     "uri" => "http://www.xirq.com"
6652     ),
6653     "xmlslurp" => array(
6654     "icon" => "robot",
6655     "title" => "XMLSlurp",
6656     "rule" => array(
6657     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6658     ),
6659     "uri" => ""
6660     ),
6661     "xml-sitemaps" => array(
6662     "icon" => "xml-sitemaps",
6663     "title" => "XML-Sitemaps",
6664     "rule" => array(
6665     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6666     ),
6667     "uri" => ""
6668     ),
6669     "xmlrpc" => array(
6670     "icon" => "robot",
6671     "title" => "Trackback",
6672     "rule" => array(
6673     "XMLRPC" => ""
6674     ),
6675     "uri" => ""
6676     ),
6677 matthys 294 "xovi" => array(
6678     "icon" => "xovi",
6679     "title" => "Xovi",
6680     "rule" => array(
6681     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6682     ),
6683     "uri" => "http://www.xovibot.net"
6684     ),
6685 joku 63 "yacy" => array(
6686     "icon" => "yacy",
6687     "title" => "Yacy",
6688     "rule" => array(
6689     "yacy\.net" => ""
6690     ),
6691     "uri" => ""
6692     ),
6693     "yahoo" => array(
6694     "icon" => "yahoo",
6695     "title" => "Yahoo",
6696     "rule" => array(
6697     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6698     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6699     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6700     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6701     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6702     "Y!OASIS/TEST" => "",
6703     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6704     "Y!J; for robot study" => "",
6705     "Yahoo Japan; for robot study" => ""
6706     ),
6707     "uri" => "http://www.yahoo.com"
6708     ),
6709     "yahoo-feed" => array(
6710     "icon" => "yahoo",
6711     "title" => "Yahoo Feedseeker",
6712     "rule" => array(
6713     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6714     ),
6715     "uri" => "http://www.yahoo.com"
6716     ),
6717     "yandex" => array(
6718     "icon" => "yandex",
6719     "title" => "Yandex",
6720     "rule" => array(
6721     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6722     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6723     ),
6724     "uri" => "http://yandex.com/bots"
6725     ),
6726     "yanga" => array(
6727     "icon" => "yanga",
6728     "title" => "Yanga",
6729     "rule" => array (
6730     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6731     ),
6732     "uri" => "http://www.yanga.co.uk/"
6733     ),
6734     "yap" => array(
6735     "icon" => "yap",
6736     "title" => "Yap",
6737     "rule" => array(
6738     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6739     ),
6740     "uri" => "http://www.yapinc.com/"
6741     ),
6742     "yarienavoir" => array(
6743     "icon" => "robot",
6744     "title" => "Yarienavoir",
6745     "rule" => array(
6746     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6747     ),
6748     "uri" => "http://www.yarienavoir.net/"
6749     ),
6750     "yell" => array(
6751     "icon" => "yell",
6752     "title" => "Yell",
6753     "rule" => array(
6754     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6755     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6756     ),
6757     "uri" => ""
6758     ),
6759     "youdao" => array(
6760     "icon" => "youdao",
6761     "title" => "Youdao",
6762     "rule" => array(
6763     "YodaoBot(-Image|-Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6764     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6765     ),
6766     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6767     ),
6768     "yoogli" => array(
6769     "icon" => "yoogli",
6770     "title" => "Yoogli",
6771     "rule" => array(
6772     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6773     ),
6774     "uri" => "http://www.yoogli.com"
6775     ),
6776     "yotta" => array(
6777     "icon" => "robot",
6778     "title" => "Yotta",
6779     "rule" => array(
6780     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6781     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6782     ),
6783     "uri" => "http://www.yottacars.com"
6784     ),
6785     "yoono" => array(
6786     "icon" => "yoono",
6787     "title" => "Yoono",
6788     "rule" => array(
6789     "Yoono" => ""
6790     ),
6791     "uri" => "http://www.yoono.com/"
6792     ),
6793     "yowedo" => array(
6794     "icon" => "robot",
6795     "title" => "Yowedo",
6796     "rule" => array(
6797     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6798     ),
6799     "uri" => "http://yowedo.com/en/partners.html"
6800     ),
6801     "yuntis" => array(
6802     "icon" => "robot",
6803 matthys 209 "title" => "Yuntis",
6804 joku 63 "rule" => array(
6805     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6806     ),
6807     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6808     ),
6809     "zao" => array(
6810     "icon" => "robot",
6811     "title" => "Zao",
6812     "rule" => array(
6813     "Zao[ /]([0-9.]{1,10})" => "\\1",
6814     "Zao-crawler" => ""
6815     ),
6816     "uri" => ""
6817     ),
6818     "zealbot" => array(
6819     "icon" => "zeal",
6820     "title" => "ZealBot",
6821     "rule" => array(
6822     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6823     ),
6824     "uri" => ""
6825     ),
6826     "zearchit" => array(
6827     "icon" => "zearchit",
6828     "title" => "Zearchit",
6829     "rule" => array(
6830     "Zearchit" => ""
6831     ),
6832     "uri" => "http://www.zearchit.de/"
6833     ),
6834     "zebz" => array(
6835     "icon" => "robot",
6836     "title" => "ze.bz",
6837     "rule" => array(
6838     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6839     ),
6840     "uri" => "http://www.ze.bz/"
6841     ),
6842     "zedzo" => array(
6843     "icon" => "robot",
6844     "title" => "Zedzo",
6845     "rule" => array(
6846     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6847     ),
6848     "uri" => "http://www.zedzo.com/"
6849     ),
6850     "zerx" => array(
6851     "icon" => "zerx",
6852     "title" => "Zerx",
6853     "rule" => array(
6854     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6855     ),
6856     "uri" => "http://www.zerx.com/"
6857     ),
6858     "zeus" => array(
6859     "icon" => "zeus",
6860     "title" => "Zeus",
6861     "rule" => array(
6862     "Zeus" => ""
6863     ),
6864     "uri" => "http://www.zeus.com"
6865     ),
6866     "zippp" => array(
6867     "icon" => "robot",
6868     "title" => "Zippp",
6869     "rule" => array(
6870     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6871     ),
6872     "uri" => ""
6873     ),
6874     "zippy" => array(
6875     "icon" => "robot",
6876     "title" => "Zippy",
6877     "rule" => array(
6878     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6879     ),
6880     "uri" => "http://www.zippyfinder.com"
6881     ),
6882     "zoeky" => array(
6883     "icon" => "robot",
6884     "title" => "Zoeky",
6885     "rule" => array(
6886     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6887     ),
6888     "uri" => ""
6889     ),
6890     "zoom" => array(
6891     "icon" => "zoom",
6892 matthys 209 "title" => "ZoomSpider",
6893 joku 63 "rule" => array(
6894     "^ZoomSpider" => ""
6895     ),
6896     "uri" => "http://www.wrensoft.com/"
6897     ),
6898     "zspider" => array(
6899     "icon" => "robot",
6900 matthys 209 "title" => "Zspider",
6901 joku 63 "rule" => array(
6902     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6903     ),
6904     "uri" => "http://feedback.redkolibri.com/"
6905     ),
6906 matthys 281 "zumbot" => array(
6907     "icon" => "robot",
6908     "title" => "ZUM Search",
6909     "rule" => array(
6910     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6911     ),
6912     "uri" => "http://help.zum.com/inquiry"
6913     ),
6914 joku 63 "zyborg" => array(
6915     "icon" => "zyborg",
6916     "title" => "WiseNutBot",
6917     "rule" => array(
6918     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6919     ),
6920     "uri" => ""
6921     ),
6922     // Catch-up rules for the originals; they have to stay in this order.
6923     "blogbot" => array(
6924     "icon" => "blogbot",
6925     "title" => "BlogBot",
6926     "rule" => array(
6927     "Blog[ \-]?Bot" => ""
6928     ),
6929     "uri" => "http://www.blogbot.com/"
6930     ),
6931     "centrum" => array(
6932     "icon" => "centrum",
6933     "title" => "Centrum",
6934     "rule" => array(
6935     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6936     "^Centrum-checker" => ""
6937     ),
6938     "uri" => ""
6939     ),
6940     "httpclient" => array(
6941     "icon" => "robot",
6942     "title" => "HTTPClient",
6943     "rule" => array(
6944     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6945     "HTTP[ \-]?Client" => ""
6946     ),
6947     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6948     ),
6949     "incywincy" => array(
6950     "icon" => "robot",
6951     "title" => "IncyWincy",
6952     "rule" => array(
6953     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6954     "^IncyWincy" => ""
6955     ),
6956     "uri" => ""
6957     ),
6958     "java" => array(
6959     "icon" => "java",
6960     "title" => "Java",
6961     "rule" => array(
6962     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6963     ),
6964     "uri" => ""
6965     ),
6966     "libfetch" => array(
6967     "icon" => "robot",
6968     "title" => "Libfetch",
6969     "rule" => array(
6970     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6971     ),
6972     "uri" => "http://www.freebsd.org/"
6973     ),
6974     "libwww" => array(
6975     "icon" => "libwww",
6976 matthys 209 "title" => "LibWWW",
6977 joku 63 "rule" => array(
6978     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6979     "^libww(w|w-perl|w-FM)" => "",
6980     "MyApp.*libww(w|w-perl|w-FM)" => ""
6981     ),
6982     "uri" => ""
6983     ),
6984     "litefinder" => array(
6985     "icon" => "litefinder",
6986     "title" => "LiteFinder",
6987     "rule" => array(
6988     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6989     ),
6990     "uri" => "http://www.litefinder.net/about.html"
6991     ),
6992     "nutchorg" => array(
6993     "icon" => "nutchorg",
6994     "title" => "Nutch",
6995     "rule" => array(
6996     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6997     "Nutch" => ""
6998     ),
6999     "uri" => "http://lucene.apache.org/nutch/"
7000     ),
7001     "pythonurl" => array(
7002     "icon" => "pythonurl",
7003     "title" => "Python-url",
7004     "rule" => array(
7005     "Python[ \-]?urllib" => ""
7006     ),
7007     "uri" => ""
7008     ),
7009     // Robots known to be spam bots
7010     "SPAM" => array(
7011     "icon" => "robot",
7012     "title" => "SPAM",
7013     "rule" => array(
7014     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
7015     "^PHOTO CHECK" => "",
7016     "^FOTOCHECKER" => "",
7017     "^IPTC CHECK" => "",
7018     "^DataCha0s" => "",
7019     "^Mac Finder" => "",
7020     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
7021     "^Missouri College Browse" => "",
7022     "Email[ \-]?Siphon" => "",
7023     "atSpider" => "",
7024     "autoemailspider" => "",
7025     "^Demo Bot" => "",
7026     "^Program Shareware" => "",
7027     "^Snapbot" => "",
7028     "^snap.com" => "",
7029     "^Guestbook Auto Submitter" => "",
7030     "panscient.com" => "",
7031     ),
7032     "uri" => ""
7033     ),
7034     // Things we don't know yet
7035     "robot" => array(
7036     "icon" => "robot",
7037     "title" => "Robot",
7038     "rule" => array(
7039     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7040     )
7041     )
7042     );
7043 joku 261 ?>

Properties

Name Value
svn:keywords Id