ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 379
Committed: Thu May 11 17:42:56 2017 UTC (7 years, 6 months ago) by joku
File size: 158844 byte(s)
Log Message:
update DAUM Robot

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 joku 370 * Copyright (C) 2001-2017, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array( // signature record for the 192.com agent
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192\.comAgent" => "" // dot escaped so it only matches a literal "."; no version is extracted
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array( // signature record for agents advertising www.ackerm.com
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www\.ackerm\.com" => "" // dots escaped: an unescaped "." is a regex wildcard
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293     "^NutchEC2Test" => ""
294     ),
295     "uri" => "http://www.amazon.com/"
296     ),
297     "amidalla" => array(
298     "icon" => "amidalla",
299     "title" => "Amidalla",
300     "rule" => array(
301     "^amibot" => ""
302     ),
303     "uri" => ""
304     ),
305     "amfibi" => array(
306     "icon" => "amfibi",
307     "title" => "Amfibi",
308     "rule" => array(
309     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310     "Amfibibot" => ""
311     ),
312     "uri" => ""
313     ),
314     "amphetadesk" => array(
315     "icon" => "robot",
316     "title" => "AmphetaDesk",
317     "rule" => array(
318     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319     ),
320     "uri" => ""
321     ),
322     "amphetameme" => array(
323     "icon" => "robot",
324     "title" => "Amphetameme",
325     "rule" => array(
326     "amphetameme[ \-]?crawler" => ""
327     ),
328     "uri" => ""
329     ),
330     "annomille" => array(
331     "icon" => "robot",
332     "title" => "AnnoMille",
333     "rule" => array(
334     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335     ),
336     "uri" => "http://www.annomille.it"
337     ),
338     "anonymouse" => array( // signature record for the Anonymouse.org proxy
339     "icon" => "anonymouse",
340     "title" => "Anonymouse.org",
341     "rule" => array(
342     "http://Anonymouse\.org" => "" // dot escaped so only the literal host name matches
343     ),
344     "uri" => "http://anonymouse.org"
345     ),
346     "ansearch" => array(
347     "icon" => "robot",
348     "title" => "Ansearch",
349     "rule" => array(
350     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351     ),
352     "uri" => ""
353     ),
354     "answerchase" => array(
355     "icon" => "answerchase",
356     "title" => "AnswerChase",
357     "rule" => array(
358     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359     ),
360     "uri" => "http://www.answerchase.com/"
361     ),
362     "antibot" => array(
363     "icon" => "robot",
364 matthys 205 "title" => "Antibot",
365 joku 63 "rule" => array(
366     "antibot-V([0-9.]{1,10})" => "\\1"
367     ),
368     "uri" => ""
369     ),
370     "aonde" => array(
371     "icon" => "aonde",
372     "title" => "Aonde",
373     "rule" => array(
374     "^AONDE-Spider" => ""
375     ),
376     "uri" => ""
377     ),
378     "aonline" => array(
379     "icon" => "robot",
380     "title" => "A-Online.at",
381     "rule" => array(
382     "^A-Online Search" => ""
383     ),
384     "uri" => "http://www.a-online.at/"
385     ),
386     "aol" => array(
387     "icon" => "aol",
388     "title" => "AOLserver",
389     "rule" => array(
390     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391     "^AOLserver" => ""
392     ),
393     "uri" => ""
394     ),
395     "apachebench" => array(
396     "icon" => "robot",
397     "title" => "ApacheBench",
398     "rule" => array(
399     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => ""
402     ),
403     "apassion4jazz" => array(
404     "icon" => "robot",
405     "title" => "Passion 4 Jazz",
406     "rule" => array(
407     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410     ),
411     "apexoo" => array(
412     "icon" => "robot",
413     "title" => "Apexoo",
414     "rule" => array(
415     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apexoo.com/"
418     ),
419     "apnoti" => array(
420     "icon" => "apnoti",
421 matthys 205 "title" => "Apnoti",
422 joku 63 "rule" => array(
423     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424     ),
425     "uri" => "http://www.apnoti.com/"
426     ),
427     "aport" => array(
428     "icon" => "aport",
429     "title" => "Aport",
430     "rule" => array(
431     "^Aport" => ""
432     ),
433     "uri" => ""
434     ),
435     "appie" => array(
436     "icon" => "walhello",
437     "title" => "Walhello",
438     "rule" => array(
439     "appie[ /]([0-9.]{1,10})" => "\\1"
440     ),
441     "uri" => ""
442     ),
443     "arachmo" => array(
444     "icon" => "arachmo",
445     "title" => "Arachmo",
446     "rule" => array(
447     "compatible; Arachmo" => ""
448     ),
449     "uri" => ""
450     ),
451     "arexera" => array(
452     "icon" => "arexera",
453     "title" => "Arexera",
454     "rule" => array(
455     "^X-Crawler" => "",
456     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
457     ),
458     "uri" => "http://www.arexera.de/"
459     ),
460     "arianna" => array( // signature record for agents starting with www.arianna.it
461     "icon" => "arianna",
462     "title" => "Arianna",
463     "rule" => array(
464     "^www\.arianna\.it" => "" // dots escaped: an unescaped "." is a regex wildcard
465     ),
466     "uri" => "http://www.arianna.it/"
467     ),
468     "artface" => array(
469     "icon" => "robot",
470     "title" => "Artface",
471     "rule" => array(
472     "^ArtfaceBot" => ""
473     ),
474     "uri" => ""
475     ),
476     "artviper" => array(
477     "icon" => "artviper",
478     "title" => "artViper",
479     "rule" => array(
480     "artViper" => ""
481     ),
482     "uri" => "http://www.artviper.net/"
483     ),
484     "asinfo" => array(
485     "icon" => "robot",
486     "title" => "Any Search Info",
487     "rule" => array(
488     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
489     ),
490     "uri" => "http://search-info.com/"
491     ),
492     "ask" => array(
493     "icon" => "askjeeves",
494     "title" => "Ask Jeeves",
495     "rule" => array(
496     "Ask[ \-]?Jeeves" => "",
497     "teomaagent" => ""
498     ),
499     "uri" => ""
500     ),
501     "askaboutoil" => array( // signature record for the AskAboutOil crawler
502     "icon" => "robot",
503     "title" => "AskAboutOil", // was "ASPseek", duplicated from the separate "aspseek" record
504     "rule" => array(
505     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1" // group 1 = version digits
506     ),
507     "uri" => "http://askaboutoil.com/"
508     ),
509     "asked" => array(
510     "icon" => "robot",
511 matthys 205 "title" => "AskEd!",
512 joku 63 "rule" => array(
513     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
514     ),
515     "uri" => "http://asked.jp"
516     ),
517     "aspseek" => array(
518     "icon" => "robot",
519     "title" => "ASPseek",
520     "rule" => array(
521     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
522     ),
523     "uri" => ""
524     ),
525     "atlocal" => array(
526     "icon" => "robot",
527     "title" => "At Local",
528     "rule" => array(
529     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
530     ),
531     "uri" => "http://www.atlocal.com/"
532     ),
533     "atomz" => array(
534     "icon" => "atomz",
535     "title" => "Atomz",
536     "rule" => array(
537     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
538     ),
539     "uri" => ""
540     ),
541 matthys 345 "avira" => array(
542     "icon" => "avira",
543     "title" => "Avira SafeSearch",
544     "rule" => array(
545     "^SafeSearch microdata crawler" => ""
546     ),
547     "uri" => "https://safesearch.avira.com"
548     ),
549 joku 63 "axel" => array(
550     "icon" => "robot",
551     "title" => "Axel",
552     "rule" => array(
553     "^axel" => ""
554     ),
555     "uri" => ""
556     ),
557     "axmo" => array(
558     "icon" => "axmo",
559     "title" => "Axmo",
560     "rule" => array(
561     "AxmoRobot" => ""
562     ),
563     "uri" => ""
564     ),
565     "answerbus" => array(
566     "icon" => "answerbus",
567     "title" => "AnswerBus",
568     "rule" => array(
569     "answerbus" => ""
570     ),
571     "uri" => ""
572     ),
573     "automapit" => array(
574     "icon" => "robot",
575     "title" => "AutoMapIt",
576     "rule" => array(
577     "AutoMapIt[ /](Bot)?" => ""
578     ),
579     "uri" => "http://www.automapit.com/bot.html"
580     ),
581     "augurnfind" => array(
582     "icon" => "robot",
583     "title" => "Augurnfind",
584     "rule" => array(
585     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
586     ),
587     "uri" => ""
588     ),
589     "awasu" => array(
590     "icon" => "awasu",
591     "title" => "Awasu",
592     "rule" => array(
593     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
594     ),
595     "uri" => ""
596     ),
597     "axxus" => array(
598     "icon" => "axxus",
599     "title" => "axxus.de",
600     "rule" => array(
601     "whoiam" => ""
602     ),
603     "uri" => "http://www.axxus.de/"
604     ),
605     "ayell" => array(
606     "icon" => "ayell",
607     "title" => "Ayell",
608     "rule" => array(
609     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
610     ),
611     "uri" => "http://eurobot.ayell.eu"
612     ),
613     "babaloo" => array(
614     "icon" => "babaloo",
615     "title" => "Babaloo",
616     "rule" => array(
617     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
618     ),
619     "uri" => "http://www.babaloo.si"
620     ),
621     "babe" => array( // signature record for the ba.be agent
622     "icon" => "robot",
623     "title" => "ba.be",
624     "rule" => array(
625     "BACS http://www\.ba\.be" => "" // dots escaped so only the literal host name matches
626     ),
627     "uri" => "http://www.ba.be/"
628     ),
629     "baidu" => array(
630     "icon" => "baidu",
631     "title" => "Baidu",
632     "rule" => array(
633     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
634     "Baiduspider" => ""
635     ),
636     "uri" => "http://www.baidu.com/search/spider.html"
637     ),
638     "bananatree" => array(
639     "icon" => "robot",
640     "title" => "BananaTree",
641     "rule" => array(
642     "www\.thebananatree\.org" => ""
643     ),
644     "uri" => "http://www.thebananatree.org/"
645     ),
646     "bdcindexer" => array(
647     "icon" => "robot",
648     "title" => "bdcindexer",
649     "rule" => array(
650     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
651     ),
652     "uri" => "http://www.business.com/"
653     ),
654     "bdfetch" => array(
655     "icon" => "robot",
656     "title" => "BDFetch",
657     "rule" => array(
658     "^BDFetch" => ""
659     ),
660     "uri" => ""
661     ),
662     "bdncentral" => array(
663     "icon" => "robot",
664     "title" => "Bdncentral",
665     "rule" => array(
666     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
667     ),
668     "uri" => "http://www.bdncentral.com/robot.html"
669     ),
670     "beammachine" => array(
671     "icon" => "robot",
672     "title" => "BeamMachine",
673     "rule" => array(
674     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
675     ),
676     "uri" => "http://www.beammachine.net/"
677     ),
678     "become" => array(
679     "icon" => "become",
680     "title" => "Become",
681     "rule" => array(
682     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
683     "(BecomeBot|Exabot)@exava\.com\)$" => ""
684     ),
685     "uri" => "http://www.become.com/"
686     ),
687     "beebware" => array( // signature record for the BeebwareDirectory agent
688     "icon" => "robot",
689     "title" => "Beebware",
690     "rule" => array(
691     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // pattern has a single capture group (the version); "\\2" referenced a group that does not exist
692     ),
693     "uri" => ""
694     ),
695     "bigbrother" => array(
696     "icon" => "robot",
697     "title" => "Big Brother",
698     "rule" => array(
699     "^Big Brother" => ""
700     ),
701     "uri" => "http://pauillac.inria.fr/~fpottier/"
702     ),
703     "bigclique" => array(
704     "icon" => "robot",
705     "title" => "BigClique",
706     "rule" => array(
707     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
708     ),
709     "uri" => "http://www.bigclique.com"
710     ),
711     "biglotron" => array(
712     "icon" => "robot",
713     "title" => "Biglotron",
714     "rule" => array(
715     "^BIGLOTRON" => ""
716     ),
717     "uri" => "http://www.bigclique.com"
718     ),
719     "bigsearch" => array( // signature record for the Bigsearch.ca Nutch-based crawler
720     "icon" => "bigsearch",
721     "title" => "Bigsearch",
722     "rule" => array(
723     "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped; group 1 = version digits
724     ),
725     "uri" => ""
726     ),
727     "bilbo" => array(
728     "icon" => "robot",
729     "title" => "Bilbo",
730     "rule" => array(
731     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
732     ),
733     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
734     ),
735     "bilgi" => array( // signature record for BilgiBot / BilgiBetaBot
736     "icon" => "bilgi",
737     "title" => "Bilgi",
738     "rule" => array(
739     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version digits are group 2
740     ),
741     "uri" => "http://www.bilgi.com/"
742     ),
743     "bitacle" => array(
744     "icon" => "bitacle",
745     "title" => "Bitacle",
746     "rule" => array(
747     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
748     ),
749     "uri" => "http://bitacle.org/"
750     ),
751     "bitbeamer" => array(
752     "icon" => "bitbeamer",
753     "title" => "BitBeamer",
754     "rule" => array(
755     "BitBeamer/([0-9.]{1,10})" => "\\1"
756     ),
757     "uri" => ""
758     ),
759     "biz360" => array(
760     "icon" => "biz360",
761     "title" => "Biz360",
762     "rule" => array(
763     "^Biz360 spider" => ""
764     ),
765     "uri" => ""
766     ),
767     "backlinktest" => array(
768     "icon" => "backlinktest",
769     "title" => "BacklinkCrawler",
770     "rule" => array(
771     "BacklinkCrawler" => ""
772     ),
773     "uri" => "http://www.backlinktest.com/crawler.html"
774     ),
775     "blaizbee" => array( // signature record for the Blaiz-Bee agent
776     "icon" => "blaiz-bee",
777     "title" => "Blaiz-Bee",
778     "rule" => array(
779     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // use the captured version; the replacement was empty, discarding group 1
780     ),
781     "uri" => ""
782     ),
783     "blogbeat" => array(
784     "icon" => "robot",
785     "title" => "BlogBeat",
786     "rule" => array(
787     "BlogBeat/?([0-9.]{1,10})" => "\\1",
788     ),
789     "uri" => "http://www.blogbeat.nl"
790     ),
791     "blogbotde" => array(
792     "icon" => "robot",
793     "title" => "blogbot.de",
794     "rule" => array(
795     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
796     ),
797     "uri" => "http://blogbot.de/"
798     ),
799     "blogcensus" => array(
800     "icon" => "blogcensus",
801     "title" => "Blogcensus",
802     "rule" => array(
803     "^Blogcensus" => "",
804     ),
805     "uri" => "http://blogcensus.de/bot/"
806     ),
807     "blogdex" => array(
808     "icon" => "robot",
809     "title" => "Blogdex",
810     "rule" => array(
811     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
812     ),
813     "uri" => ""
814     ),
815     "blogg" => array(
816     "icon" => "blogg",
817     "title" => "Blogg",
818     "rule" => array(
819     "^blogg\.de" => ""
820     ),
821     "uri" => ""
822     ),
823     "blogland" => array(
824     "icon" => "robot",
825     "title" => "BlogLand",
826     "rule" => array(
827     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
828     ),
829     "uri" => ""
830     ),
831     "bloglines" => array(
832     "icon" => "bloglines",
833     "title" => "Bloglines",
834     "rule" => array(
835     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
836     "Bloglines" => ""
837     ),
838     "uri" => ""
839     ),
840     "blogmap" => array(
841     "icon" => "robot",
842     "title" => "Blogmap",
843     "rule" => array(
844     "blogmap" => ""
845     ),
846     "uri" => ""
847     ),
848     "blogosphere" => array(
849     "icon" => "robot",
850     "title" => "Blogosphere",
851     "rule" => array(
852     "Blogosphere" => ""
853     ),
854     "uri" => ""
855     ),
856     "blogpeople" => array(
857     "icon" => "robot",
858     "title" => "BlogPeople",
859     "rule" => array(
860     "BlogPeople" => ""
861     ),
862     "uri" => ""
863     ),
864     "blogpulse" => array(
865     "icon" => "blogpulse",
866     "title" => "Blogpulse",
867     "rule" => array(
868     "Blogpulse" => ""
869     ),
870     "uri" => ""
871     ),
872     "blogranking" => array(
873     "icon" => "blogranking",
874     "title" => "BlogRanking",
875     "rule" => array(
876     "^BlogRanking(/RSS checker)?" => ""
877     ),
878     "uri" => ""
879     ),
880     "blogs" => array(
881     "icon" => "blogs",
882     "title" => "Blo.gs",
883     "rule" => array(
884     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
885     "blo\.gs" => ""
886     ),
887     "uri" => ""
888     ),
889     "blogshares" => array(
890     "icon" => "blogshares",
891     "title" => "BlogShares",
892     "rule" => array(
893     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
894     "(^| |\()Blogshares(\.com| |\))" => ""
895     ),
896     "uri" => ""
897     ),
898     "blogslife" => array( // key kept unchanged so existing lookups by key still resolve
899     "icon" => "robot",
900     "title" => "Blogslive", // NOTE(review): aligned with the rule string below; was "BlogsLife" - confirm the service name
901     "rule" => array(
902     "Blogslive" => ""
903     ),
904     "uri" => ""
905     ),
906     "blogsnow" => array(
907     "icon" => "blogsnow",
908     "title" => "BlogsNow",
909     "rule" => array(
910     "blogsnowbot" => "",
911     "BlogsNow" => ""
912     ),
913     "uri" => ""
914     ),
915     "blogstreet" => array(
916     "icon" => "blogstreet",
917     "title" => "BlogStreet",
918     "rule" => array(
919     "^BlogStreetBot" => ""
920     ),
921     "uri" => ""
922     ),
923     "blogsurf" => array(
924     "icon" => "robot",
925     "title" => "BlogSurf",
926     "rule" => array(
927     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
928     ),
929     "uri" => ""
930     ),
931     "blogtick" => array(
932     "icon" => "robot",
933     "title" => "BlogTick",
934     "rule" => array(
935     "BlogTickServer" => ""
936     ),
937     "uri" => ""
938     ),
939     "blogwatcher" => array(
940     "icon" => "blogwatcher",
941     "title" => "Blogwatcher",
942     "rule" => array(
943     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
944     ),
945     "uri" => ""
946     ),
947     "blogwise" => array(
948     "icon" => "blogwise",
949     "title" => "Blogwise",
950     "rule" => array(
951     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
952     ),
953     "uri" => ""
954     ),
955     "boardreader" => array(
956     "icon" => "boardreader",
957     "title" => "BoardReader",
958     "rule" => array(
959     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
960     ),
961     "uri" => "http://www.boardreader.com"
962     ),
963     "bobby" => array(
964     "icon" => "bobby",
965     "title" => "Bobby",
966     "rule" => array(
967     "bobby[ /]([0-9.]{1,10})" => "\\1"
968     ),
969     "uri" => ""
970     ),
971     "boitho" => array(
972     "icon" => "robot",
973     "title" => "Boitho",
974     "rule" => array(
975     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
976     ),
977     "uri" => ""
978     ),
979     "booch" => array(
980     "icon" => "robot",
981     "title" => "Booch",
982     "rule" => array(
983     "^booch[_ /]([0-9.]{1,10})" => "\\1"
984     ),
985     "uri" => ""
986     ),
987     "book" => array(
988     "icon" => "book",
989     "title" => "Bookmark",
990     "rule" => array(
991     "http://www\.bookmark\.ne\.jp" => ""
992     ),
993     "uri" => ""
994     ),
995     "bookdog" => array(
996     "icon" => "bookdog",
997     "title" => "Bookdog",
998     "rule" => array(
999     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1000     ),
1001     "uri" => ""
1002     ),
1003     "bordermanager" => array(
1004     "icon" => "bordermanager",
1005     "title" => "Border Manager",
1006     "rule" => array(
1007     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1008     ),
1009     "uri" => ""
1010     ),
1011     "botonparade" => array(
1012     "icon" => "botonparade",
1013     "title" => "Bot on Parade",
1014     "rule" => array(
1015     "BotOnParade" => ""
1016     ),
1017     "uri" => "http://www.bots-on-para.de/bot.html"
1018     ),
1019     "botje" => array(
1020     "icon" => "botje",
1021     "title" => "Botje",
1022     "rule" => array(
1023     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1024     ),
1025     "uri" => "http://www.botje.com/"
1026     ),
1027     "bottomfeeder" => array(
1028     "icon" => "bottomfeeder",
1029     "title" => "BottomFeeder",
1030     "rule" => array(
1031     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1032     ),
1033     "uri" => ""
1034     ),
1035     "browseremulator" => array(
1036     "icon" => "browseremulator",
1037     "title" => "BrowserEmulator",
1038     "rule" => array(
1039     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1040     ),
1041     "uri" => "http://www.dejavu.org/emulator.htm"
1042     ),
1043     "browsershots" => array(
1044     "icon" => "browsershots",
1045     "title" => "Browsershots",
1046     "rule" => array(
1047     "Browsershots URL Check" => ""
1048     ),
1049     "uri" => "http://browsershots.org"
1050     ),
1051     "browserspy" => array(
1052     "icon" => "robot",
1053     "title" => "BrowserSpy",
1054     "rule" => array(
1055     "BrowserSpy" => ""
1056     ),
1057     "uri" => ""
1058     ),
1059     "bruinbot" => array(
1060     "icon" => "robot",
1061     "title" => "BruinBot",
1062     "rule" => array(
1063     "BruinBot" => ""
1064     ),
1065     "uri" => ""
1066     ),
1067     "bruno" => array(
1068     "icon" => "robot",
1069     "title" => "Bruno",
1070     "rule" => array(
1071     "^Bruno" => ""
1072     ),
1073     "uri" => ""
1074     ),
1075     "btbot" => array(
1076     "icon" => "btbot",
1077     "title" => "BitTorrent",
1078     "rule" => array(
1079     "BTbot/([0-9.]{1,10})" => "\\1"
1080     ),
1081     "uri" => ""
1082     ),
1083     "builtwith" => array(
1084     "icon" => "builtwith",
1085     "title" => "BuiltWith",
1086     "rule" => array(
1087     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1088     ),
1089     "uri" => "http://builtwith.com/bot.html"
1090     ),
1091     "bulkfeeds" => array(
1092     "icon" => "robot",
1093     "title" => "Bulkfeeds",
1094     "rule" => array(
1095     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1096     ),
1097     "uri" => ""
1098     ),
1099     "burf" => array(
1100     "icon" => "burf",
1101     "title" => "Burf.com",
1102     "rule" => array(
1103     "^Norbert the Spider" => ""
1104     ),
1105     "uri" => "http://www.burf.com/"
1106     ),
1107     "butch" => array(
1108     "icon" => "robot",
1109     "title" => "Butch",
1110     "rule" => array(
1111     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1112     ),
1113     "uri" => ""
1114     ),
1115     "buzzlogic" => array(
1116     "icon" => "buzzlogic",
1117     "title" => "Buzzlogic",
1118     "rule" => array(
1119     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1120     ),
1121     "uri" => "http://www.buzzlogic.com"
1122     ),
1123     "catchbot" => array(
1124     "icon" => "catchbot",
1125     "title" => "CatchBot",
1126     "rule" => array(
1127     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1128     ),
1129     "uri" => "http://www.catchbot.com"
1130     ),
1131     "camdiscover" => array(
1132     "icon" => "robot",
1133     "title" => "Camdiscover",
1134     "rule" => array(
1135     "^Camcrawler" => ""
1136     ),
1137     "uri" => ""
1138     ),
1139     "cazoodle" => array(
1140     "icon" => "cazoodle",
1141     "title" => "Cazoodle",
1142     "rule" => array(
1143     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1144     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.cazoodle.com/cazoodlebot"
1147     ),
1148     "ccbot" => array(
1149     "icon" => "robot",
1150     "title" => "ccBot",
1151     "rule" => array(
1152     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1153     ),
1154     "uri" => "http://www.commoncrawl.org/bot.html"
1155     ),
1156     "ccgcrawl" => array(
1157     "icon" => "robot",
1158     "title" => "CCGCrawl",
1159     "rule" => array(
1160     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1161     ),
1162     "uri" => "http://www.myworkbase.com/bot.html"
1163     ),
1164     "cerberian" => array(
1165     "icon" => "robot",
1166     "title" => "Cerberian Drtrs",
1167     "rule" => array(
1168     "^Cerberian Drtrs" => ""
1169     ),
1170     "uri" => ""
1171     ),
1172     "cfnetwork" => array( // signature record for agents starting with CFNetwork
1173     "icon" => "robot",
1174     "title" => "CFNetwork", // was "Cerberian Drtrs", duplicated from the preceding "cerberian" record
1175     "rule" => array(
1176     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1" // group 1 = version digits
1177     ),
1178     "uri" => "http://www.cfnetwork.be/"
1179     ),
1180     "charlotte" => array(
1181     "icon" => "charlotte",
1182     "title" => "Charlotte",
1183     "rule" => array(
1184     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1185     ),
1186     "uri" => ""
1187     ),
1188     "cirilizator" => array(
1189     "icon" => "cirilizator",
1190     "title" => "Cirilizator",
1191     "rule" => array(
1192     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1193     ),
1194     "uri" => ""
1195     ),
1196     "claria" => array(
1197     "icon" => "robot",
1198     "title" => "Claria",
1199     "rule" => array(
1200     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1201     "(Claria|Diamond)(Bot)" => ""
1202     ),
1203     "uri" => ""
1204     ),
1205     "claymont" => array(
1206     "icon" => "claymont",
1207     "title" => "Claymont",
1208     "rule" => array(
1209     "claymont\.com" => "",
1210     "OliverPerry" => ""
1211     ),
1212     "uri" => "http://www.claymont.com"
1213     ),
1214 joku 377 "clipinc" => array(
1215     "icon" => "clipinc",
1216     "title" => "ClipInc",
1217     "rule" => array(
1218     "ClipInc" => ""
1219     ),
1220     "uri" => "http://tobit.software"
1221     ),
1222 joku 63 "clush" => array(
1223     "icon" => "clush",
1224     "title" => "Clush",
1225     "rule" => array(
1226     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1227     ),
1228     "uri" => ""
1229     ),
1230     "cmsworldmap" => array(
1231     "icon" => "cmsworldmap",
1232     "title" => "CMS World Map",
1233     "rule" => array(
1234     "cmsworldmap" => ""
1235     ),
1236     "uri" => "http://www.cmsworldmap.com/"
1237     ),
1238     "cobion" => array(
1239     "icon" => "robot",
1240     "title" => "Cobion",
1241     "rule" => array(
1242     " (QXW03018|obot)\)" => ""
1243     ),
1244     "uri" => ""
1245     ),
1246     "coccoc" => array(
1247 matthys 287 "icon" => "coccoc",
1248 matthys 209 "title" => "Coccoc",
1249 joku 63 "rule" => array(
1250     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1251     ),
1252 matthys 287 "uri" => "http://help.coccoc.com"
1253 joku 63 ),
1254     "coldfusion" => array(
1255     "icon" => "coldfusion",
1256     "title" => "ColdFusion",
1257     "rule" => array(
1258     "^coldfusion" => ""
1259     ),
1260     "uri" => ""
1261     ),
1262     "combine" => array(
1263     "icon" => "robot",
1264     "title" => "Combine",
1265     "rule" => array(
1266     "Combine[ /]([0-9.]{1,10})" => "\\1"
1267     ),
1268     "uri" => ""
1269     ),
1270     "combot" => array(
1271     "icon" => "robot",
1272     "title" => "comBot",
1273     "rule" => array(
1274     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1275     ),
1276     "uri" => ""
1277     ),
1278     "comet" => array(
1279     "icon" => "comet",
1280     "title" => "Comet",
1281     "rule" => array(
1282     "cometsearch@cometsystems" => ""
1283     ),
1284     "uri" => ""
1285     ),
1286     "commerobo" => array(
1287     "icon" => "robot",
1288     "title" => "Commerobo",
1289     "rule" => array(
1290     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1291     ),
1292     "uri" => ""
1293     ),
1294     "comrite" => array(
1295     "icon" => "robot",
1296     "title" => "ComRite",
1297     "rule" => array(
1298     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1299     ),
1300     "uri" => "http://www.comrite.com/"
1301     ),
1302     "convera" => array(
1303     "icon" => "convera",
1304     "title" => "Convera",
1305     "rule" => array(
1306     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1307     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1308     ),
1309     "uri" => ""
1310     ),
1311     "coolbot" => array(
1312     "icon" => "robot",
1313     "title" => "CoolBot",
1314     "rule" => array(
1315     "^CoolBot" => ""
1316     ),
1317     "uri" => ""
1318     ),
1319     "cosmix" => array(
1320     "icon" => "robot",
1321     "title" => "Cosmix",
1322     "rule" => array(
1323     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1324     ),
1325     "uri" => ""
1326     ),
1327     "cosmos" => array(
1328     "icon" => "robot",
1329     "title" => "Cosmos",
1330     "rule" => array(
1331     "^cosmos" => ""
1332     ),
1333     "uri" => ""
1334     ),
1335     "cosmoty" => array(
1336     "icon" => "robot",
1337     "title" => "Cosmoty",
1338     "rule" => array(
1339     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1340     ),
1341     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1342     ),
1343     "covario" => array(
1344     "icon" => "covario",
1345     "title" => "Covario",
1346     "rule" => array(
1347     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1348     ),
1349     "uri" => "http://www.covario.com/ids/"
1350     ),
1351     "creativecommons" => array(
1352     "icon" => "creativecommons",
1353     "title" => "Creative Commons",
1354     "rule" => array(
1355     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1356     ),
1357     "uri" => ""
1358     ),
1359     "cscrawler" => array(
1360     "icon" => "robot",
1361     "title" => "CsCrawler",
1362     "rule" => array(
1363     "CsCrawler" => ""
1364     ),
1365     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1366     ),
1367 joku 111 "jigsaw" => array(
1368     "icon" => "jigsaw",
1369     "title" => "Jigsaw",
1370     "rule" => array(
1371     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1372     ),
1373     "uri" => "http://jigsaw.w3.org/css-validator/"
1374     ),
1375 joku 63 "csscheck" => array(
1376     "icon" => "w3c",
1377     "title" => "W3C CSS Validator",
1378     "rule" => array(
1379     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1380     ),
1381     "uri" => "http://jigsaw.w3.org/css-validator/"
1382     ),
1383     "custo" => array(
1384     "icon" => "robot",
1385     "title" => "Custo",
1386     "rule" => array(
1387     "Custo[ /]([0-9.]{1,10})" => "\\1"
1388     ),
1389     "uri" => ""
1390     ),
1391     "cybernavi" => array(
1392     "icon" => "robot",
1393     "title" => "CyberNavi",
1394     "rule" => array(
1395     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1396     ),
1397     "uri" => ""
1398     ),
1399     "cyberpatrol" => array(
1400     "icon" => "cyberpatrol",
1401     "title" => "CyberPatrol",
1402     "rule" => array(
1403     "^CyberPatrol" => ""
1404     ),
1405     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1406     ),
1407     "cyberz" => array(
1408     "icon" => "cyberz",
1409     "title" => "Cyberz",
1410     "rule" => array(
1411     "Cyberz Communication Agent" => ""
1412     ),
1413     "uri" => ""
1414     ),
1415     "cydral" => array(
1416     "icon" => "robot",
1417     "title" => "Cydral",
1418     "rule" => array(
1419     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1420     ),
1421     "uri" => ""
1422     ),
1423     "cynthia" => array(
1424     "icon" => "cynthia",
1425     "title" => "Cynthia Says",
1426     "rule" => array(
1427     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1428     ),
1429     "uri" => ""
1430     ),
1431     "d4x" => array(
1432     "icon" => "d4x",
1433     "title" => "Downloader for X",
1434     "rule" => array(
1435     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1436     ),
1437     "uri" => ""
1438     ),
1439     "da" => array(
1440     "icon" => "da",
1441     "title" => "DA",
1442     "rule" => array(
1443     "^DA[ /]([0-9.]{1,10})" => "\\1"
1444     ),
1445     "uri" => ""
1446     ),
1447     "daum" => array(
1448     "icon" => "daum",
1449     "title" => "DAUM",
1450     "rule" => array(
1451     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1452 joku 379 "Daum[ /]([0-9.]{1,10})" => "\\1",
1453 joku 63 "DAUM Web Robot" => "",
1454 joku 339 "daum\.net" => "", // dot escaped so only a literal "daum.net" matches
1455 joku 63 "Daum Communications Corp" => "",
1456     "EDI[ /]([0-9.]{1,10})" => "\\1",
1457     "Edacious.*Intelligent Web Robot" => "",
1458     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1459     ),
1460     "uri" => "http://ws.daum.net/"
1461     ),
1462     "daypop" => array(
1463     "icon" => "robot",
1464     "title" => "Daypop",
1465     "rule" => array(
1466     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1467     ),
1468     "uri" => ""
1469     ),
1470     "delfi" => array(
1471     "icon" => "delfi",
1472     "title" => "Delfi",
1473     "rule" => array(
1474     "crawl at delfi dot lt" => ""
1475     ),
1476     "uri" => ""
1477     ),
1478     "depspid" => array(
1479     "icon" => "depspid",
1480     "title" => "DepSpid",
1481     "rule" => array(
1482     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1483     ),
1484     "uri" => ""
1485     ),
1486     "devonagent" => array(
1487     "icon" => "devonagent",
1488     "title" => "DEVONagent",
1489     "rule" => array(
1490     "DEVONtech" => ""
1491     ),
1492     "uri" => ""
1493     ),
1494     "diffbot" => array(
1495     "icon" => "diffbot",
1496     "title" => "Diffbot",
1497     "rule" => array(
1498     " Diffbot" => ""
1499     ),
1500     "uri" => "http://www.diffbot.com"
1501     ),
1502     "diribot" => array(
1503     "icon" => "diribot",
1504     "title" => "Diri",
1505     "rule" => array(
1506     "diribot" => ""
1507     ),
1508     "uri" => "http://www.diri.bg"
1509     ),
1510     "directhit" => array(
1511     "icon" => "robot",
1512     "title" => "Direct Hit",
1513     "rule" => array(
1514     "EZResult -- Internet Search Engine" => ""
1515     ),
1516     "uri" => "http://www.directhit.com"
1517     ),
1518     "disco" => array(
1519     "icon" => "disco",
1520 matthys 209 "title" => "Disco",
1521 joku 63 "rule" => array(
1522     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1523     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1524     "disco-crawl@discoveryengine\.com" => "" // contact address; dot escaped to match it literally
1525     ),
1526     "uri" => "http://www.discoveryengine.com/"
1527     ),
1528     "discopump" => array(
1529     "icon" => "robot",
1530     "title" => "DISCo Pump",
1531     "rule" => array(
1532     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1533     ),
1534     "uri" => ""
1535     ),
1536     "dkimreputation" => array(
1537     "icon" => "dkimreputation",
1538     "title" => "DKIM Reputation",
1539     "rule" => array(
1540     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1541     ),
1542     "uri" => "http://www.dkim-reputation.org"
1543     ),
1544     "dnsdigger" => array(
1545     "icon" => "dnsdigger",
1546     "title" => "DNS-Digger",
1547     "rule" => array(
1548     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1549     ),
1550     "uri" => "http://www.dnsdigger.com"
1551     ),
1552     "dnsvalidation" => array(
1553     "icon" => "dnsvalidation",
1554     "title" => "DNS Validation",
1555     "rule" => array(
1556     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1557     ),
1558     "uri" => "http://www.dnsvalidation.com/"
1559     ),
1560     "doctorhtml" => array(
1561     "icon" => "robot",
1562     "title" => "DoctorHTML",
1563     "rule" => array(
1564     "Doctor[ \-]?HTML" => ""
1565     ),
1566     "uri" => ""
1567     ),
1568     "dolphin" => array(
1569     "icon" => "dolphin",
1570     "title" => "Dolphin",
1571     "rule" => array(
1572     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1573     ),
1574     "uri" => "http://telehouse.ru/crawler.html"
1575     ),
1576     "domaindatei" => array(
1577     "icon" => "robot",
1578     "title" => "Domaindatei",
1579     "rule" => array(
1580     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1581     ),
1582     "uri" => ""
1583     ),
1584     "dontbuylists" => array(
1585     "icon" => "dontbuylists",
1586     "title" => "Dontbuylists",
1587     "rule" => array(
1588     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1589     ),
1590     "uri" => "http://www.dontbuylists.com"
1591     ),
1592     "dotbot" => array(
1593     "icon" => "robot",
1594     "title" => "DotBot",
1595     "rule" => array(
1596     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1597     ),
1598     "uri" => "http://www.dotnetdotcom.org"
1599     ),
1600     "doweb" => array(
1601     "icon" => "doweb",
1602     "title" => "DoWeb",
1603     "rule" => array(
1604     "^www\.doweb\.co\.uk" => "" // dots escaped so only the literal host name at the start matches
1605     ),
1606     "uri" => "http://www.doweb.co.uk/"
1607     ),
1608     "downforeveryoneorjustme" => array(
1609     "icon" => "downforeveryoneorjustme",
1610     "title" => "Down for everyone or just me",
1611     "rule" => array(
1612     "downforeveryoneorjustme" => ""
1613     ),
1614     "uri" => "http://www.downforeveryoneorjustme.com"
1615     ),
1616     "downloadninja" => array(
1617     "icon" => "robot",
1618     "title" => "Download Ninja",
1619     "rule" => array(
1620     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1621     ),
1622     "uri" => ""
1623     ),
1624     "drupal" => array(
1625     "icon" => "drupal",
1626     "title" => "Drupal",
1627     "rule" => array(
1628     "^Drupal" => ""
1629     ),
1630     "uri" => ""
1631     ),
1632     "dsns" => array(
1633     "icon" => "robot",
1634     "title" => "DSNS Scanner",
1635     "rule" => array(
1636     "^DSNS" => ""
1637     ),
1638     "uri" => ""
1639     ),
1640     "dtsagent" => array(
1641     "icon" => "robot",
1642     "title" => "DTS Agent",
1643     "rule" => array(
1644     "DTS Agent" => ""
1645     ),
1646     "uri" => ""
1647     ),
1648 matthys 342 "duckduckgo" => array(
1649     "icon" => "duckduckgo",
1650     "title" => "DuckDuckGo",
1651     "rule" => array(
1652     "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1"
1653     ),
1654     "uri" => "http://duckduckgo.com"
1655     ),
1656 joku 63 "earthcom" => array(
1657     "icon" => "earthcom",
1658     "title" => "Earthcom",
1659     "rule" => array(
1660     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1661     ),
1662     "uri" => ""
1663     ),
1664     "ebay" => array(
1665     "icon" => "ebay",
1666     "title" => "eBay",
1667     "rule" => array(
1668     "eBay Relevance Ad Crawler" => ""
1669     ),
1670     "uri" => ""
1671     ),
1672     "echo" => array(
1673     "icon" => "robot",
1674     "title" => "Echo.com",
1675     "rule" => array(
1676     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1677     ),
1678     "uri" => "http://www.echo.com/"
1679     ),
1680     "eert" => array(
1681     "icon" => "robot",
1682 matthys 209 "title" => "Eert",
1683 joku 63 "rule" => array(
1684     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1685     ),
1686     "uri" => "http://bot.eert.net"
1687     ),
1688     "eknip" => array(
1689     "icon" => "eknip",
1690     "title" => "E-Knip",
1691     "rule" => array(
1692     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1693     ),
1694     "uri" => ""
1695     ),
1696     "zoominfo" => array(
1697     "icon" => "zoominfo",
1698 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1699 joku 63 "rule" => array(
1700     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1701     ),
1702     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1703     ),
1704     "emeraldshield" => array(
1705     "icon" => "emeraldshield",
1706     "title" => "EmeraldShield",
1707     "rule" => array(
1708     "^EmeraldShield" => ""
1709     ),
1710     "uri" => ""
1711     ),
1712     "empas" => array(
1713     "icon" => "empas",
1714     "title" => "Empas",
1715     "rule" => array(
1716     "DigExt; empas\)$" => "",
1717     "^EMPAS[_\-]ROBOT" => ""
1718     ),
1719     "uri" => ""
1720     ),
1721     "entireweb" => array(
1722     "icon" => "entireweb",
1723     "title" => "Entireweb",
1724     "rule" => array(
1725     "Speedy[ ]?Spider" => ""
1726     ),
1727     "uri" => ""
1728     ),
1729     "envolk" => array(
1730     "icon" => "envolk",
1731     "title" => "Envolk",
1732     "rule" => array(
1733     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1734     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1735     ),
1736     "uri" => ""
1737     ),
1738     "esnet" => array(
1739     "icon" => "robot",
1740     "title" => "ES.NET",
1741     "rule" => array(
1742     "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped so only a literal "ES.NET" matches
1743     ),
1744     "uri" => ""
1745     ),
1746     "estyle" => array(
1747     "icon" => "estyle",
1748     "title" => "eStyle Search",
1749     "rule" => array(
1750     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1751     ),
1752     "uri" => ""
1753     ),
1754     "eurip" => array(
1755     "icon" => "robot",
1756     "title" => "Eurip",
1757     "rule" => array(
1758     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1759     ),
1760     "uri" => "http://www.eurip.com"
1761     ),
1762     "eurodirectory" => array(
1763     "icon" => "robot",
1764     "title" => "Euro Directory",
1765     "rule" => array(
1766     "www\.euro-directory\.com" => ""
1767     ),
1768     "uri" => "http://www.euro-directory.com/"
1769     ),
1770     "euroseek" => array(
1771     "icon" => "euroseek",
1772     "title" => "EuroSeek",
1773     "rule" => array(
1774     "Arachnoidea" => ""
1775     ),
1776     "uri" => ""
1777     ),
1778     "evaal" => array(
1779     "icon" => "evaal",
1780     "title" => "Evaal",
1781     "rule" => array(
1782     "^EvaalSE" => ""
1783     ),
1784     "uri" => "http://www.evaal.com/"
1785     ),
1786     "eventax" => array(
1787     "icon" => "eventax",
1788     "title" => "Eventax",
1789     "rule" => array(
1790     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1791     ),
1792     "uri" => "http://www.eventax.de/"
1793     ),
1794     "everbee" => array(
1795     "icon" => "everbee",
1796     "title" => "Everbee",
1797     "rule" => array(
1798     "EverbeeCrawler" => ""
1799     ),
1800     "uri" => ""
1801     ),
1802     "everest" => array(
1803     "icon" => "everest",
1804     "title" => "Everest",
1805     "rule" => array(
1806     "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // dot after "Inc" escaped to match it literally
1807     ),
1808     "uri" => ""
1809     ),
1810     "exabot" => array(
1811     "icon" => "exabot",
1812     "title" => "ExaBot",
1813     "rule" => array(
1814     "^NG[ /]([0-9.]{1,10})" => "\\1",
1815     "Exabot/([0-9.]{1,10})" => "\\1",
1816     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1817     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1818     "ExaBot-Thumbnails" => ""
1819     ),
1820     "uri" => "http://www.exabot.com/go/robot"
1821     ),
1822     "exactseek" => array(
1823     "icon" => "exactseek",
1824     "title" => "ExactSeek",
1825     "rule" => array(
1826     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1827     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1828     ),
1829     "uri" => "http://www.exactseek.com/"
1830     ),
1831     "excite" => array(
1832     "icon" => "excite",
1833     "title" => "Excite",
1834     "rule" => array(
1835     "Architext[ \-]?Spider" => ""
1836     ),
1837     "uri" => ""
1838     ),
1839     "execrawl" => array(
1840     "icon" => "robot",
1841     "title" => "Execrawl",
1842     "rule" => array(
1843     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1844     "Execrawl" => ""
1845     ),
1846     "uri" => ""
1847     ),
1848     "expertmonitor" => array(
1849     "icon" => "robot",
1850     "title" => "ExpertMonitor",
1851     "rule" => array(
1852     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1853     ),
1854     "uri" => ""
1855     ),
1856     "explorerrss" => array(
1857     "icon" => "robot",
1858     "title" => "Explorer RSS",
1859     "rule" => array(
1860     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1861     ),
1862     "uri" => ""
1863     ),
1864     "ezooms" => array(
1865     "icon" => "robot",
1866     "title" => "Ezooms",
1867     "rule" => array(
1868     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1869     ),
1870     "uri" => ""
1871     ),
1872     "facebook" => array(
1873     "icon" => "facebook",
1874     "title" => "Facebook",
1875     "rule" => array(
1876     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1877     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1878     "^facebook" => ""
1879     ),
1880     "uri" => "http://www.facebook.com/"
1881     ),
1882     "fast" => array(
1883     "icon" => "fast",
1884     "title" => "Fast",
1885     "rule" => array(
1886     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1887     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1888     "^Fast Crawler" => "",
1889     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1890     ),
1891     "uri" => "http://www.alltheweb.com/"
1892     ),
1893     "fastbuzz" => array(
1894     "icon" => "fastbuzz",
1895     "title" => "Fastbuzz",
1896     "rule" => array(
1897     "^fastbuzz\.com" => ""
1898     ),
1899     "uri" => ""
1900     ),
1901     "favorg" => array(
1902     "icon" => "robot",
1903     "title" => "FavOrg",
1904     "rule" => array(
1905     "^FavOrg" => ""
1906     ),
1907     "uri" => ""
1908     ),
1909     "favorstar" => array(
1910     "icon" => "favorstar",
1911 matthys 209 "title" => "Favorstar",
1912 joku 63 "rule" => array(
1913     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1914     ),
1915     "uri" => "http://favorstar.com/bot.html"
1916     ),
1917     "faxo" => array(
1918     "icon" => "robot",
1919     "title" => "Faxo",
1920     "rule" => array(
1921     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1922     ),
1923     "uri" => "http://www.faxo.com/"
1924     ),
1925     "fdse" => array(
1926     "icon" => "robot",
1927     "title" => "FDSE Robot",
1928     "rule" => array(
1929     "FDSE[ \-]?robot" => ""
1930     ),
1931     "uri" => ""
1932     ),
1933     "feedback" => array(
1934     "icon" => "robot",
1935     "title" => "FeedBack",
1936     "rule" => array(
1937     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1938     ),
1939     "uri" => ""
1940     ),
1941     "feedburner" => array(
1942     "icon" => "feedburner",
1943     "title" => "FeedBurner",
1944     "rule" => array(
1945     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1946     ),
1947     "uri" => ""
1948     ),
1949     "feeddemon" => array(
1950     "icon" => "feeddemon",
1951     "title" => "FeedDemon",
1952     "rule" => array(
1953     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1954     ),
1955     "uri" => ""
1956     ),
1957     "feedfind" => array(
1958     "icon" => "feedfind",
1959     "title" => "FeedFind",
1960     "rule" => array(
1961     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1962     ),
1963     "uri" => ""
1964     ),
1965     "feedonfeeds" => array(
1966     "icon" => "robot",
1967     "title" => "Feed On Feeds",
1968     "rule" => array(
1969     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1970     ),
1971     "uri" => ""
1972     ),
1973     "feedparser" => array(
1974     "icon" => "robot",
1975     "title" => "Feedparser",
1976     "rule" => array(
1977     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1978     "FeedParser" => ""
1979     ),
1980     "uri" => ""
1981     ),
1982     "feedreader" => array(
1983     "icon" => "feedreader",
1984     "title" => "Feedreader",
1985     "rule" => array(
1986     "^Feedreader" => ""
1987     ),
1988     "uri" => ""
1989     ),
1990     "feedserver" => array(
1991     "icon" => "robot",
1992     "title" => "FeedServer",
1993     "rule" => array(
1994     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
1995     ),
1996     "uri" => ""
1997     ),
1998     "feedster" => array(
1999     "icon" => "feedster",
2000     "title" => "Feedster",
2001     "rule" => array(
2002     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2003     ),
2004     "uri" => ""
2005     ),
2006     "feedvalidator" => array(
2007     "icon" => "feedvalidator",
2008     "title" => "Feed Validator",
2009     "rule" => array(
2010     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2011     ),
2012     "uri" => ""
2013     ),
2014     "fdm" => array(
2015     "icon" => "robot",
2016     "title" => "Free Download Manager",
2017     "rule" => array(
2018     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2019     ),
2020     "uri" => ""
2021     ),
2022     "filangy" => array(
2023     "icon" => "robot",
2024     "title" => "Filangy",
2025     "rule" => array(
2026     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2027     ),
2028     "uri" => "http://www.filangy.com/"
2029     ),
2030     "findanisp" => array(
2031     "icon" => "robot",
2032     "title" => "FindAnISP",
2033     "rule" => array(
2034     "FindAnISP" => ""
2035     ),
2036     "uri" => "http://www.findanisp.com/"
2037     ),
2038     "findengines" => array(
2039     "icon" => "findengines",
2040     "title" => "FindEngines",
2041     "rule" => array(
2042     "FindEngines! Bot" => ""
2043     ),
2044     "uri" => ""
2045     ),
2046     "findexa" => array(
2047     "icon" => "findexa",
2048     "title" => "Findexa",
2049     "rule" => array(
2050     "Findexa Crawler" => ""
2051     ),
2052     "uri" => ""
2053     ),
2054     "findlinks" => array(
2055     "icon" => "findlinks",
2056     "title" => "FindLinks",
2057     "rule" => array(
2058     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2059     "^FindLinks" => ""
2060     ),
2061     "uri" => ""
2062     ),
2063     "findoor" => array(
2064     "icon" => "findoor",
2065 matthys 209 "title" => "Findoor",
2066 joku 63 "rule" => array(
2067     "^findoor(-Bot)?" => "" // the only group is the optional "-Bot" suffix, not a version, so no back-reference is used
2068     ),
2069     "uri" => ""
2070     ),
2071     "firefly" => array(
2072     "icon" => "firefly",
2073     "title" => "Firefly",
2074     "rule" => array(
2075     "Firefly" => ""
2076     ),
2077     "uri" => ""
2078     ),
2079     "flashget" => array(
2080     "icon" => "flashget",
2081     "title" => "FlashGet",
2082     "rule" => array(
2083     "^FlashGet" => ""
2084     ),
2085     "uri" => ""
2086     ),
2087     "flatland" => array(
2088     "icon" => "flatland",
2089     "title" => "Flatland",
2090     "rule" => array(
2091     "^flatlandbot" => ""
2092     ),
2093     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2094     ),
2095     "flickbot" => array(
2096     "icon" => "flickbot",
2097     "title" => "FlickBot",
2098     "rule" => array(
2099     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2100     ),
2101     "uri" => ""
2102     ),
2103     "flightdeckreports" => array(
2104     "icon" => "flightdeckreports",
2105     "title" => "Flight Deck Reports",
2106     "rule" => array(
2107     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2108     ),
2109     "uri" => "http://www.flightdeckreports.com/"
2110     ),
2111     "forex" => array(
2112     "icon" => "robot",
2113     "title" => "Forex",
2114     "rule" => array(
2115     "^Forex Trading Network Organization" => ""
2116     ),
2117     "uri" => "http://www.netforex.org/"
2118     ),
2119     "freshmeat" => array(
2120     "icon" => "freshmeat",
2121 matthys 209 "title" => "Freshmeat",
2122 joku 63 "rule" => array(
2123     "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2124     "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped so only a literal "freshmeat.net" matches
2125     ),
2126     "uri" => "http://www.freshmeat.net/"
2127     ),
2128     "friend" => array(
2129     "icon" => "friend",
2130     "title" => "Friend",
2131     "rule" => array(
2132     "www\.friend\.fr" => ""
2133     ),
2134     "uri" => "http://www.friend.fr/"
2135     ),
2136     "frontier" => array(
2137     "icon" => "frontier",
2138     "title" => "Frontier",
2139     "rule" => array(
2140     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2141     ),
2142     "uri" => ""
2143     ),
2144     "fyberspider" => array(
2145     "icon" => "robot",
2146     "title" => "FyberSpider",
2147     "rule" => array(
2148     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2149     ),
2150     "uri" => "http://www.fyberspider.com/"
2151     ),
2152     "gaisbot" => array(
2153     "icon" => "gais",
2154     "title" => "Gaisbot",
2155     "rule" => array(
2156     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2157     ),
2158     "uri" => ""
2159     ),
2160     "galaxy" => array(
2161     "icon" => "galaxy",
2162     "title" => "Galaxy",
2163     "rule" => array(
2164     "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2165     "www\.galaxy\.com" => "" // dots escaped so only the literal host name matches
2166     ),
2167     "uri" => "http://www.galaxy.com/"
2168     ),
2169     "gamespy" => array(
2170     "icon" => "gamespy",
2171     "title" => "GameSpy",
2172     "rule" => array(
2173     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2174     ),
2175     "uri" => ""
2176     ),
2177     "garlik" => array(
2178     "icon" => "garlik",
2179     "title" => "Garlik",
2180     "rule" => array(
2181     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2182     ),
2183     "uri" => "http://garlik.com/"
2184     ),
2185     "gdesktop" => array(
2186     "icon" => "gdesktop",
2187     "title" => "Google Desktop",
2188     "rule" => array(
2189     "compatible; Google Desktop" => ""
2190     ),
2191     "uri" => ""
2192     ),
2193     "genome" => array(
2194     "icon" => "robot",
2195     "title" => "Genome Machine",
2196     "rule" => array(
2197     "Genome[ \-]?Machine" => ""
2198     ),
2199     "uri" => ""
2200     ),
2201     "geohash" => array(
2202     "icon" => "geohash",
2203     "title" => "Geohash",
2204     "rule" => array(
2205     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2206     ),
2207     "uri" => "http://geohash.org/"
2208     ),
2209     "geona" => array(
2210     "icon" => "robot",
2211     "title" => "Geona",
2212     "rule" => array(
2213     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2214     ),
2215     "uri" => ""
2216     ),
2217     "geoblog" => array(
2218     "icon" => "robot",
2219     "title" => "The World as a Blog",
2220     "rule" => array(
2221     "The World as a Blog" => ""
2222     ),
2223     "uri" => ""
2224     ),
2225     "geourl" => array(
2226     "icon" => "geourl",
2227     "title" => "GeoUrl",
2228     "rule" => array(
2229     "geourl[ /]([0-9.]{1,10})" => "\\1",
2230     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2231     ),
2232     "uri" => ""
2233     ),
2234     "getnetwise" => array(
2235     "icon" => "robot",
2236     "title" => "GetNetWise",
2237     "rule" => array(
2238     " Crayon Crawler" => ""
2239     ),
2240     "uri" => ""
2241     ),
2242     "getright" => array(
2243     "icon" => "getright",
2244     "title" => "GetRight",
2245     "rule" => array(
2246     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2247     ),
2248     "uri" => ""
2249     ),
2250     "getsmart" => array(
2251     "icon" => "getsmart",
2252     "title" => "GetSmart",
2253     "rule" => array(
2254     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2255     ),
2256     "uri" => ""
2257     ),
2258     "gigabot" => array(
2259     "icon" => "gigablast",
2260     "title" => "Gigablast",
2261     "rule" => array(
2262     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2263     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2264 joku 336 "GigablastOpenSource" => ""
2265 joku 63 ),
2266     "uri" => ""
2267 matthys 328 ),
2268     "gimme" => array(
2269     "icon" => "gimme",
2270     "title" => "gimmeUSA",
2271     "rule" => array(
2272     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2273     ),
2274     "uri" => "http://gimme60.com"
2275 joku 63 ),
2276 matthys 328 "ginger" => array(
2277     "icon" => "ginger",
2278     "title" => "GingerCrawler",
2279     "rule" => array(
2280     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2281     ),
2282     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2283     ),
2284 joku 63 "girafabot" => array(
2285     "icon" => "girafa",
2286     "title" => "Girafa",
2287     "rule" => array(
2288     "Girafabot" => ""
2289     ),
2290     "uri" => ""
2291     ),
2292     "globalspec" => array(
2293     "icon" => "globalspec",
2294     "title" => "GlobalSpec",
2295     "rule" => array(
2296     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2297     ),
2298     "uri" => ""
2299     ),
2300     "glucose" => array(
2301     "icon" => "glucose",
2302     "title" => "Glucose",
2303     "rule" => array(
2304     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2305     ),
2306     "uri" => ""
2307     ),
2308     "gnomit" => array(
2309     "icon" => "gnomit",
2310     "title" => "Gnomit",
2311     "rule" => array(
2312     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2313     ),
2314     "uri" => "http://www.gnomit.com/",
2315     ),
2316     "goforit" => array(
2317     "icon" => "goforit",
2318     "title" => "GoForIt",
2319     "rule" => array(
2320     "^GoForIt\.com" => "",
2321     "^GOFORITBOT" => ""
2322     ),
2323     "uri" => ""
2324     ),
2325     "goguides" => array(
2326     "icon" => "robot",
2327     "title" => "GoGuides",
2328     "rule" => array(
2329     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2330     ),
2331     "uri" => "http://www.goguides.org/"
2332     ),
2333     // Needs to be before google for correct detection
2334     "mediapartners" => array(
2335     "icon" => "google",
2336     "title" => "Mediapartners",
2337     "rule" => array (
2338     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2339     "Mediapartners-Google" => ""
2340     ),
2341     "uri" => ""
2342     ),
2343     "google" => array(
2344     "icon" => "google",
2345     "title" => "Google",
2346     "rule" => array (
2347     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2348     "Googl(e|ebot)(-Image)?/" => "",
2349     "^gsa-crawler" => "",
2350     "Google Web Preview" => ""
2351     ),
2352     "uri" => "http://www.google.com/"
2353     ),
2354     "googlesitemaps" => array(
2355     "icon" => "google",
2356     "title" => "Google-Sitemaps",
2357     "rule" => array (
2358     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2359     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2360     "Googl(e|ebot)(-Sitemaps)?/" => ""
2361     ),
2362     "uri" => ""
2363     ),
2364     "googlemobile" => array(
2365     "icon" => "google",
2366     "title" => "Google-Mobile",
2367     "rule" => array (
2368     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2369     "Googl(e|ebot)(-Mobile)?/" => ""
2370     ),
2371     "uri" => ""
2372     ),
2373     "googleads" => array(
2374     "icon" => "google",
2375     "title" => "Google-AdsBot",
2376     "rule" => array (
2377     "^AdsBot-Google" => "",
2378     ),
2379     "uri" => ""
2380     ),
2381     "googlefeeds" => array(
2382     "icon" => "google",
2383     "title" => "Google-Feedfetcher",
2384     "rule" => array (
2385     "^Feedfetcher-Google" => "",
2386     ),
2387     "uri" => ""
2388     ),
2389     "googlverification" => array(
2390     "icon" => "google",
2391     "title" => "Google-Site-Verification",
2392     "rule" => array (
2393     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2394     ),
2395     "uri" => ""
2396     ),
2397 matthys 207 // Needs to be AFTER Google detection
2398     "goo" => array(
2399     "icon" => "goo",
2400     "title" => "Goo",
2401     "rule" => array (
2402     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2403     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2404     ),
2405     "uri" => ""
2406     ),
2407 joku 63 "goongee" => array(
2408     "icon" => "robot",
2409     "title" => "GoonGee",
2410     "rule" => array (
2411     "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // the pattern has a single capture group (the version digits)
2412     ),
2413     "uri" => "http://www.goongee.com/"
2414     ),
2415     "gpost" => array(
2416     "icon" => "gpost",
2417     "title" => "GPost",
2418     "rule" => array(
2419     "^GPostbot" => ""
2420     ),
2421     "uri" => ""
2422     ),
2423 matthys 309 "grapeshot" => array(
2424     "icon" => "grapeshot",
2425     "title" => "Grapeshot",
2426     "rule" => array(
2427     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2428     ),
2429     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2430     ),
2431 joku 63 "gregarius" => array(
2432     "icon" => "robot",
2433     "title" => "Gregarius",
2434     "rule" => array(
2435     "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // report the captured version digits
2436     ),
2437     "uri" => ""
2438     ),
2439     "grub" => array(
2440     "icon" => "grub",
2441     "title" => "Grub",
2442     "rule" => array(
2443     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2444     "grub crawler" => "",
2445     "grub[/ ]([0-9.]{1,10})" => "\\1",
2446     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2447     ),
2448     "uri" => "http://www.grub.org/"
2449     ),
2450     "gulliver" => array(
2451     "icon" => "robot",
2452     "title" => "Gulliver",
2453     "rule" => array(
2454     "Gulliver" => ""
2455     ),
2456     "uri" => ""
2457     ),
2458     "guruji" => array(
2459     "icon" => "guruji",
2460     "title" => "Guruji",
2461     "rule" => array(
2462     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2463     ),
2464     "uri" => "http://www.guruji.com/"
2465     ),
2466     "gush" => array(
2467     "icon" => "robot",
2468     "title" => "Gush",
2469     "rule" => array(
2470     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2471     ),
2472     "uri" => ""
2473     ),
2474     "gziptester" => array(
2475     "icon" => "robot",
2476     "title" => "Gzip Tester",
2477     "rule" => array(
2478     "g(id)?zip[ \-]?test(er)?" => ""
2479     ),
2480     "uri" => ""
2481     ),
2482     "hanzoweb" => array(
2483     "icon" => "hanzoweb",
2484     "title" => "Hanzoweb",
2485     "rule" => array(
2486     "^Hanzoweb" => ""
2487     ),
2488     "uri" => ""
2489     ),
2490     "harbot" => array(
2491     "icon" => "harbot",
2492     "title" => "Harbot",
2493     "rule" => array(
2494     "^Harbot GateStation" => ""
2495     ),
2496     "uri" => ""
2497     ),
2498     "hatena" => array(
2499     "icon" => "hatena",
2500     "title" => "Hatena",
2501     "rule" => array(
2502     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2503     ),
2504     "uri" => ""
2505     ),
2506     "htmlparser" => array(
2507     "icon" => "htmlparser",
2508     "title" => "HTMLParser",
2509     "rule" => array(
2510     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2511     ),
2512     "uri" => "http://htmlparser.sourceforge.net/"
2513     ),
2514     "helix" => array(
2515     "icon" => "helix",
2516     "title" => "Helix",
2517     "rule" => array(
2518     "^helix[ /]([0-9.]{1,10})" => "\\1"
2519     ),
2520     "uri" => "http://www.sitesearch.ca/helix/"
2521     ),
2522     "heritrix" => array(
2523     "icon" => "heritrix",
2524     "title" => "Heritrix",
2525     "rule" => array(
2526     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2527     "archive.org_bot" => "",
2528     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2529     ),
2530     "uri" => "http://archive.org"
2531     ),
2532     "hiddenmarket" => array(
2533     "icon" => "robot",
2534     "title" => "HiddenMarket",
2535     "rule" => array(
2536     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2537     ),
2538     "uri" => ""
2539     ),
2540     "honda" => array(
2541     "icon" => "robot",
2542     "title" => "Honda",
2543     "rule" => array(
2544     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2545     ),
2546     "uri" => "http://www.honda-search.com"
2547     ),
2548     "hoowwwer" => array(
2549     "icon" => "hoowwwer",
2550     "title" => "HooWWWer",
2551     "rule" => array(
2552     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2553     ),
2554     "uri" => ""
2555     ),
2556     "hotzonu" => array(
2557     "icon" => "hotzonu",
2558     "title" => "Hotzonu",
2559     "rule" => array(
2560     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2561     ),
2562     "uri" => ""
2563     ),
2564     "houxou" => array(
2565     "icon" => "robot",
2566     "title" => "Houxou",
2567     "rule" => array(
2568     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2569     "HouxouCrawler" => ""
2570     ),
2571     "uri" => ""
2572     ),
2573     "htdig" => array(
2574     "icon" => "htdig",
2575     "title" => "ht://Dig",
2576     "rule" => array(
2577     "htdig[ /]([0-9.]{1,10})" => "\\1",
2578     "htdig" => "" // fallback without a version: no capture group, so no note
2579     ),
2580     "uri" => ""
2581     ),
2582     "html2jpg" => array(
2583     "icon" => "html2jpg",
2584     "title" => "HTML2JPG",
2585     "rule" => array(
2586     "^HTML2JPG" => ""
2587     ),
2588     "uri" => ""
2589     ),
2590     "httperf" => array(
2591     "icon" => "robot",
2592     "title" => "HTTPerf",
2593     "rule" => array(
2594     "httperf[ /]([0-9.]{1,10})" => "\\1"
2595     ),
2596     "uri" => ""
2597     ),
2598     "httpunit" => array(
2599     "icon" => "httpunit",
2600     "title" => "HttpUnit",
2601     "rule" => array(
2602     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2603     ),
2604     "uri" => ""
2605     ),
2606     "httrack" => array(
2607     "icon" => "httrack",
2608     "title" => "HTTrack",
2609     "rule" => array(
2610     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2611     ),
2612     "uri" => ""
2613     ),
2614     "huaweisymantec" => array(
2615     "icon" => "huaweisymantec",
2616     "title" => "HuaweiSymantec",
2617     "rule" => array(
2618     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2619     ),
2620     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2621     ),
2622     "hungary" => array(
2623     "icon" => "hungary",
2624     "title" => "Hungary",
2625     "rule" => array(
2626     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2627     ),
2628     "uri" => ""
2629     ),
2630 joku 261 "i18n" => array(
2631     "icon" => "w3c",
2632     "title" => "W3C I18n Checker",
2633     "rule" => array(
2634     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2635 joku 169 ),
2636 joku 261 "uri" => "http://validator.w3.org/services"
2637     ),
2638 joku 63 "iakke" => array(
2639     "icon" => "iakke",
2640 matthys 209 "title" => "Iakké",
2641 joku 63 "rule" => array(
2642     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2643     ),
2644     "uri" => "http://fr.iakke.com/"
2645     ),
2646     "iask" => array(
2647     "icon" => "iask",
2648     "title" => "IAsk",
2649     "rule" => array(
2650     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2651     "^iaskspider" => ""
2652     ),
2653     "uri" => "http://iask.com"
2654     ),
2655     "icc" => array(
2656     "icon" => "icc",
2657     "title" => "ICC-Crawler",
2658     "rule" => array(
2659     "^ICC-Crawler" => ""
2660     ),
2661     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2662     ),
2663     "icerocket" => array(
2664     "icon" => "icerocket",
2665     "title" => "Icerocket",
2666     "rule" => array(
2667     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2668     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2669     ),
2670     "uri" => ""
2671     ),
2672     "icjobs" => array(
2673     "icon" => "icjobs",
2674     "title" => "iCjobs",
2675     "rule" => array(
2676     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2677     ),
2678     "uri" => "http://www.icjobs.de/"
2679     ),
2680     "icra" => array(
2681     "icon" => "icra",
2682     "title" => "ICRA",
2683     "rule" => array(
2684     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2685     ),
2686     "uri" => "http://www.icra.org"
2687     ),
2688     "iknow" => array(
2689     "icon" => "robot",
2690     "title" => "I know",
2691     "rule" => array(
2692     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2693     ),
2694     "uri" => ""
2695     ),
2696     "ilial" => array(
2697     "icon" => "robot",
2698     "title" => "Ilial",
2699     "rule" => array(
2700     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2701     ),
2702     "uri" => ""
2703     ),
2704     "ilocal" => array(
2705     "icon" => "ilocal",
2706     "title" => "ilocal",
2707     "rule" => array(
2708     "^ilocal" => "",
2709     ),
2710     "uri" => "http://www.ilocal.nl"
2711     ),
2712     "ilse" => array(
2713     "icon" => "ilse",
2714     "title" => "Ilse",
2715     "rule" => array(
2716     "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot name, group 2 the version digits
2717     ),
2718     "uri" => "http://ilse.nl/"
2719     ),
2720     "iltrovatore" => array(
2721     "icon" => "iltrovatore",
2722     "title" => "IlTrovatore",
2723     "rule" => array(
2724     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2725     "Iltrovatore-Setaccio" => "",
2726     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2727     ),
2728     "uri" => ""
2729     ),
2730     "indylibrary" => array(
2731     "icon" => "robot",
2732     "title" => "Indy Library",
2733     "rule" => array(
2734     "Indy[ \-]?Library" => ""
2735     ),
2736     "uri" => ""
2737     ),
2738     "inela" => array(
2739     "icon" => "robot",
2740     "title" => "Inela",
2741     "rule" => array(
2742     "InelaBot[ /]([0-9.]{1,10})" => "\\1" // report the captured version digits
2743     ),
2744     "uri" => "http://inelegant.org/bot"
2745     ),
2746     "ineturl" => array(
2747     "icon" => "robot",
2748     "title" => "InetURL",
2749     "rule" => array(
2750     "InetURL.?[ /]([0-9.]{1,10})" => "\\1" // report the captured version digits
2751     ),
2752     "uri" => ""
2753     ),
2754     "infoart" => array(
2755     "icon" => "robot",
2756     "title" => "InfoArt",
2757     "rule" => array(
2758     "InfoArt crawler" => ""
2759     ),
2760     "uri" => ""
2761     ),
2762     "infomine" => array(
2763     "icon" => "infomine",
2764     "title" => "INFOMINE",
2765     "rule" => array(
2766     "^DataFountains/DMOZ" => "",
2767     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2768     ),
2769     "uri" => "http://infomine.ucr.edu/"
2770     ),
2771     "infoseek" => array(
2772     "icon" => "infoseek",
2773     "title" => "Infoseek",
2774     "rule" => array(
2775     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2776     "Infoseek" => ""
2777     ),
2778     "uri" => ""
2779     ),
2780     "inktomi" => array(
2781     "icon" => "inktomi",
2782     "title" => "Inktomi",
2783     "rule" => array(
2784     "slurp@inktomi\.com" => ""
2785     ),
2786     "uri" => ""
2787     ),
2788     "innerprise" => array(
2789     "icon" => "robot",
2790     "title" => "Innerprise",
2791     "rule" => array(
2792     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2793     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2794     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2795     ),
2796     "uri" => "http://www.innerprise.com/"
2797     ),
2798     "inria" => array(
2799     "icon" => "inria",
2800     "title" => "Inria",
2801     "rule" => array(
2802     "^xyro_" => ""
2803     ),
2804     "uri" => ""
2805     ),
2806     "insitor" => array(
2807     "icon" => "insitor",
2808     "title" => "Insitor",
2809     "rule" => array(
2810     "^Insitor(,|\.|naut)" => ""
2811     ),
2812     "uri" => "http://www.insitor.com/"
2813     ),
2814     "internetninja" => array(
2815     "icon" => "robot",
2816     "title" => "Internet Ninja",
2817     "rule" => array(
2818     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2819     ),
2820     "uri" => ""
2821     ),
2822     "internetseer" => array(
2823     "icon" => "internetseer",
2824     "title" => "InternetSeer",
2825     "rule" => array(
2826     "^InternetSeer\.com" => ""
2827     ),
2828     "uri" => ""
2829     ),
2830     "interseek" => array(
2831     "icon" => "interseek",
2832     "title" => "Interseek",
2833     "rule" => array(
2834     "Interseek.com" => ""
2835     ),
2836     "uri" => "http://www.interseek.com"
2837     ),
2838     "intravnews" => array(
2839     "icon" => "intravnews",
2840     "title" => "IntraVnews",
2841     "rule" => array(
2842     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2843     ),
2844     "uri" => "http://www.intravnews.com/"
2845     ),
2846     "ip2location" => array(
2847     "icon" => "ip2location",
2848     "title" => "IP2LocationBot",
2849     "rule" => array(
2850     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2851     ),
2852     "uri" => "http://www.ip2location.com"
2853     ),
2854     "ipworks" => array(
2855     "icon" => "ipworks",
2856     "title" => "IP*Works",
2857     "rule" => array(
2858     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2859     ),
2860     "uri" => "http://www.nsoftware.com/ipworks/"
2861     ),
2862     "irca" => array(
2863     "icon" => "robot",
2864     "title" => "Novell iChain Cool Solutions caching",
2865     "rule" => array(
2866 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2867     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2868 joku 63 ),
2869     "uri" => "http://www.icra.org"
2870     ),
2871     "irvine" => array(
2872     "icon" => "robot",
2873     "title" => "Irvine",
2874     "rule" => array(
2875     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2876     ),
2877     "uri" => ""
2878     ),
2879     "ips-agent" => array(
2880     "icon" => "robot",
2881 matthys 209 "title" => "IPS-agent",
2882 joku 63 "rule" => array(
2883     "ips-agent" => ""
2884     ),
2885     "uri" => ""
2886     ),
2887     "isara" => array(
2888     "icon" => "isara",
2889 matthys 209 "title" => "Isara",
2890 joku 63 "rule" => array(
2891     "Isara[ -]([0-9.]{1,10})" => "\\1"
2892     ),
2893     "uri" => "http://www.isara.org/"
2894     ),
2895     "isspider" => array(
2896     "icon" => "robot",
2897     "title" => "ISSpider",
2898     "rule" => array(
2899     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2900     ),
2901     "uri" => ""
2902     ),
2903     "it2media" => array(
2904     "icon" => "it2media",
2905     "title" => "IT2media",
2906     "rule" => array(
2907     "www.adressendeutschland.de" => ""
2908     ),
2909     "uri" => "http://www.adressendeutschland.de/"
2910     ),
2911     "ivia" => array(
2912     "icon" => "robot",
2913     "title" => "iVia",
2914     "rule" => array(
2915     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2916     ),
2917     "uri" => ""
2918     ),
2919     "jeteye" => array(
2920     "icon" => "jeteye",
2921     "title" => "Jeteye",
2922     "rule" => array(
2923     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2924     ),
2925     "uri" => ""
2926     ),
2927     "jobsde" => array(
2928     "icon" => "jobsde",
2929     "title" => "jobs.de",
2930     "rule" => array(
2931     "www\.jobs\.de" => "",
2932     "jobs.de-Robot" => ""
2933     ),
2934     "uri" => "http://www.jobs.de/"
2935     ),
2936     "jpluck" => array(
2937     "icon" => "robot",
2938     "title" => "Jpluck",
2939     "rule" => array(
2940     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2941     ),
2942     "uri" => ""
2943     ),
2944     "jxta" => array(
2945     "icon" => "robot",
2946     "title" => "Jxta",
2947     "rule" => array(
2948     "falcon[ /]([0-9.]{1,10})" => "\\1"
2949     ),
2950     "uri" => ""
2951     ),
2952     "jyte" => array(
2953     "icon" => "jyte",
2954     "title" => "Jyte",
2955     "rule" => array(
2956     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2957     ),
2958     "uri" => ""
2959     ),
2960     "jyxo" => array(
2961     "icon" => "jyxo",
2962     "title" => "Jyxo",
2963     "rule" => array(
2964     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2965     ),
2966     "uri" => ""
2967     ),
2968     "kalooga" => array(
2969     "icon" => "kalooga",
2970     "title" => "Kalooga",
2971     "rule" => array(
2972     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2973     "^kalooga" => "",
2974     "KaloogaBot" => ""
2975     ),
2976     "uri" => "http://www.kalooga.com"
2977     ),
2978     "keywen" => array(
2979     "icon" => "keywen",
2980     "title" => "Keywen",
2981     "rule" => array(
2982     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
2983     ),
2984     "uri" => ""
2985     ),
2986     "kilomonkey" => array(
2987     "icon" => "robot",
2988     "title" => "Kilomonkey",
2989     "rule" => array(
2990     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
2991     ),
2992     "uri" => "http://www.kilomonkey.com/notabot.txt"
2993     ),
2994     "kinja" => array(
2995     "icon" => "kinja",
2996     "title" => "Kinja",
2997     "rule" => array(
2998     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
2999     "^kinjabot" => ""
3000     ),
3001     "uri" => ""
3002     ),
3003     "kiwi" => array(
3004     "icon" => "robot",
3005     "title" => "KiwiStatus",
3006     "rule" => array(
3007     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3008     "KiwiStatus" => ""
3009     ),
3010     "uri" => "http://www.nzs.com/kiei-status/"
3011     ),
3012     "lachesis" => array(
3013     "icon" => "robot",
3014     "title" => "Lachesis",
3015     "rule" => array(
3016     "lachesis" => ""
3017     ),
3018     "uri" => ""
3019     ),
3020     "lanshan" => array(
3021     "icon" => "robot",
3022     "title" => "Lanshan",
3023     "rule" => array(
3024     "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
3025     ),
3026     "uri" => ""
3027     ),
3028     "lapozz" => array(
3029     "icon" => "lapozz",
3030     "title" => "Lapozz",
3031     "rule" => array(
3032     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3033     ),
3034     "uri" => ""
3035     ),
3036     "larbin" => array(
3037     "icon" => "robot",
3038     "title" => "Larbin",
3039     "rule" => array(
3040     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3041     ),
3042     "uri" => ""
3043     ),
3044     "laurion" => array(
3045     "icon" => "robot",
3046     "title" => "Laurion",
3047     "rule" => array(
3048     "^IPiumBot" => ""
3049     ),
3050     "uri" => "http://www.laurion.com/"
3051     ),
3052     "leechget" => array(
3053     "icon" => "leechget",
3054     "title" => "LeechGet",
3055     "rule" => array(
3056     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3057     ),
3058     "uri" => ""
3059     ),
3060     "linguaseek" => array(
3061     "icon" => "linguaseek",
3062     "title" => "Linguaseek",
3063     "rule" => array(
3064     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3065     ),
3066     "uri" => "http://www.linguaseek.com/"
3067     ),
3068     "linguee" => array(
3069     "icon" => "linguee",
3070     "title" => "Linguee",
3071     "rule" => array(
3072     "^Linguee Bot" => ""
3073     ),
3074     "uri" => "http://www.linguee.com/"
3075     ),
3076 matthys 355 "linkapedia" => array(
3077     "icon" => "linkapedia",
3078     "title" => "Linkapedia",
3079     "rule" => array(
3080     "^linkapedia" => ""
3081     ),
3082     "uri" => "http://www.linkapedia.com"
3083     ),
3084 matthys 346 "linkdex" => array(
3085     "icon" => "linkdex",
3086     "title" => "Linkdex",
3087     "rule" => array(
3088     "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3089     ),
3090     "uri" => "http://www.linkdex.com/bots/"
3091     ),
3092 matthys 366 "linkedin" => array(
3093     "icon" => "linkedin",
3094     "title" => "LinkedIn",
3095     "rule" => array(
3096     "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3097     ),
3098     "uri" => "http://www.linkedin.com"
3099     ),
3100 joku 63 "linkguard" => array(
3101     "icon" => "robot",
3102     "title" => "Linkguard",
3103     "rule" => array(
3104     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3105     ),
3106     "uri" => "http://www.linkguard.com/"
3107     ),
3108     "linklint" => array(
3109     "icon" => "linklint",
3110     "title" => "Linklint",
3111     "rule" => array(
3112     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3113     ),
3114     "uri" => "http://www.linklint.org/"
3115     ),
3116     "linkman" => array(
3117     "icon" => "linkman",
3118     "title" => "Linkman",
3119     "rule" => array(
3120     "\(compatible; Linkman\)" => ""
3121     ),
3122     "uri" => ""
3123     ),
3124     // Needs to be before linkcheck for correct detection
3125     "linkchecker" => array(
3126     "icon" => "w3c",
3127     "title" => "W3C Link Checker",
3128     "rule" => array(
3129     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3130     ),
3131     "uri" => "http://validator.w3.org/checklink"
3132     ),
3133     "linkcheck" => array(
3134     "icon" => "linkcheck",
3135     "title" => "Linkcheck",
3136     "rule" => array(
3137     "checklink[ /]([0-9.]{1,10})" => "\\1",
3138     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3139     "Adaxas Spider" => "",
3140     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3141     "NetMechanic V([0-9.]{1,10})" => "\\1",
3142     "^InfoLink" => "",
3143     "InternetLinkAgent" => "",
3144     "; SPENG\)" => "",
3145     "SharewarePlazaFileCheckBot" => "",
3146     "fileboost.net" => "",
3147     "^billbot" => ""
3148     ),
3149     "uri" => ""
3150     ),
3151     "linkru" => array(
3152     "icon" => "robot",
3153     "title" => "Link.RU",
3154     "rule" => array(
3155     "^Link.RU bot" => ""
3156     ),
3157     "uri" => ""
3158     ),
3159     "linkssql" => array(
3160     "icon" => "robot",
3161     "title" => "Links SQL",
3162     "rule" => array(
3163     "links sql" => ""
3164     ),
3165     "uri" => ""
3166     ),
3167     "linksweeper" => array(
3168     "icon" => "robot",
3169     "title" => "Link Sweeper",
3170     "rule" => array(
3171     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3172     ),
3173     "uri" => ""
3174     ),
3175     "linkwalker" => array(
3176     "icon" => "robot",
3177     "title" => "Link Walker",
3178     "rule" => array(
3179     "^LinkWalker" => ""
3180     ),
3181     "uri" => ""
3182     ),
3183     "lipperhey" => array(
3184     "icon" => "lipperhey",
3185     "title" => "Lipperhey",
3186     "rule" => array(
3187     "Lipperhey Spider" => ""
3188     ),
3189     "uri" => "http://www.lipperhey.com"
3190     ),
3191     "livedoor" => array(
3192     "icon" => "livedoor",
3193     "title" => "Livedoor",
3194     "rule" => array(
3195     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3196     ),
3197     "uri" => ""
3198     ),
3199     "livejournal" => array(
3200     "icon" => "livejournal",
3201     "title" => "Live Journal",
3202     "rule" => array(
3203     "^LiveJournal\.com" => ""
3204     ),
3205     "uri" => "http://www.livejournal.com"
3206     ),
3207     "ljpic" => array(
3208     "icon" => "ljpic",
3209     "title" => "ljpic",
3210     "rule" => array(
3211     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3212     ),
3213     "uri" => "http://www.ljpic.com"
3214     ),
3215     "lmspider" => array(
3216     "icon" => "robot",
3217     "title" => "Lmspider",
3218     "rule" => array(
3219     "^lmspider" => ""
3220     ),
3221     "uri" => ""
3222     ),
3223     "locators" => array(
3224     "icon" => "robot",
3225     "title" => "Locaters",
3226     "rule" => array(
3227     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3228     ),
3229     "uri" => ""
3230     ),
3231     "look" => array(
3232     "icon" => "look",
3233     "title" => "Look",
3234     "rule" => array(
3235     "www\.look\.com" => "",
3236     "Lookbot" => ""
3237     ),
3238     "uri" => ""
3239     ),
3240     "looksmart" => array(
3241     "icon" => "looksmart",
3242     "title" => "LookSmart",
3243     "rule" => array(
3244     "^Martini" => "",
3245     "^MantraAgent" => "",
3246     "FurlBot" => "",
3247     "looksmart-sv-fw" => ""
3248     ),
3249     "uri" => ""
3250     ),
3251     "loop" => array(
3252     "icon" => "loop",
3253     "title" => "LOOP",
3254     "rule" => array(
3255     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3256     ),
3257     "uri" => ""
3258     ),
3259     "lotkyll" => array(
3260     "icon" => "robot",
3261     "title" => "Lotkyll",
3262     "rule" => array(
3263     "Lotkyll" => ""
3264     ),
3265     "uri" => ""
3266     ),
3267 joku 335 "ltx71" => array(
3268     "icon" => "robot",
3269     "title" => "LTX71",
3270     "rule" => array(
3271     "ltx71" => ""
3272     ),
3273     "uri" => "http://ltx71.com/"
3274     ),
3275 joku 63 "lwp" => array(
3276     "icon" => "robot",
3277     "title" => "lwp",
3278     "rule" => array(
3279     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3280     ),
3281     "uri" => ""
3282     ),
3283     "lycos" => array(
3284     "icon" => "lycos",
3285     "title" => "Lycos",
3286     "rule" => array(
3287     "Lycos_Spider_" => ""
3288     ),
3289     "uri" => ""
3290     ),
3291     "magpierss" => array(
3292     "icon" => "rss",
3293     "title" => "MagpieRSS",
3294     "rule" => array(
3295     "MagpieRSS" => ""
3296     ),
3297     "uri" => "http://magpierss.sourceforge.net/"
3298     ),
3299     "mailru" => array(
3300     "icon" => "mailru",
3301 matthys 209 "title" => "Mail.Ru",
3302 joku 63 "rule" => array(
3303 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3304     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3305 joku 63 ),
3306 matthys 209 "uri" => "http://www.mail.ru/"
3307 joku 63 ),
3308     "mailsweeper" => array(
3309     "icon" => "robot",
3310     "title" => "Mail Sweeper",
3311     "rule" => array(
3312     "Mail[ \-]?Sweeper" => ""
3313     ),
3314     "uri" => ""
3315     ),
3316     "marvin" => array(
3317     "icon" => "robot",
3318     "title" => "Marvin",
3319     "rule" => array(
3320     "^Marvin" => ""
3321     ),
3322     "uri" => ""
3323     ),
3324     "matkurja" => array(
3325     "icon" => "matkurja",
3326     "title" => "Mat'Kurja",
3327     "rule" => array(
3328     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3329     ),
3330     "uri" => ""
3331     ),
3332     "mavicanet" => array(
3333     "icon" => "mavicanet",
3334     "title" => "Mavicanet",
3335     "rule" => array(
3336     "Mavicanet robot" => ""
3337     ),
3338     "uri" => ""
3339     ),
3340 matthys 292 "meanpath" => array(
3341     "icon" => "meanpath",
3342 matthys 290 "title" => "Meanpath",
3343 matthys 280 "rule" => array(
3344     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3345     ),
3346     "uri" => "http://www.meanpath.com/meanpathbot.html"
3347 matthys 275 ),
3348 matthys 280 "mediater" => array(
3349 joku 63 "icon" => "robot",
3350     "title" => "Mediater",
3351     "rule" => array (
3352     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3353 matthys 280 ),
3354     "uri" => ""
3355 joku 63 ),
3356 matthys 305 "memory" => array(
3357     "icon" => "memory",
3358     "title" => "internet Memory",
3359     "rule" => array (
3360     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3361     ),
3362     "uri" => "http://internetmemory.org/en/"
3363     ),
3364 joku 63 "mercator" => array(
3365     "icon" => "robot",
3366     "title" => "Mercator",
3367     "rule" => array(
3368     "Mercator" => ""
3369     ),
3370     "uri" => ""
3371     ),
3372     "metacarta" => array(
3373     "icon" => "robot",
3374     "title" => "Metacarta",
3375     "rule" => array(
3376     "^RRC \(crawler_admin@bigfoot\.com\)" => "", // parentheses and dot are matched literally
3377     "^flunky" => "",
3378     "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3379     ),
3380     "uri" => "http://www.metacarta.com"
3381     ),
3382     "metager" => array(
3383     "icon" => "metager",
3384     "title" => "MetaGer",
3385     "rule" => array(
3386     "MetaGer" => ""
3387     ),
3388     "uri" => ""
3389     ),
3390     "metamark" => array(
3391     "icon" => "robot",
3392     "title" => "Metamark",
3393     "rule" => array(
3394     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3395     ),
3396     "uri" => "http://metamark.net"
3397     ),
3398     "metamedic" => array(
3399     "icon" => "metamedic",
3400     "title" => "MetaMedic",
3401     "rule" => array(
3402     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3403     ),
3404     "uri" => ""
3405     ),
3406     "mirago" => array(
3407     "icon" => "mirago",
3408     "title" => "Mirago",
3409     "rule" => array(
3410     "Mirago" => ""
3411     ),
3412     "uri" => ""
3413     ),
3414     "misterwong" => array(
3415     "icon" => "misterwong",
3416     "title" => "Mister Wong",
3417     "rule" => array(
3418     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3419     ),
3420     "uri" => "http://www.mister-wong.de/"
3421     ),
3422     "miva" => array(
3423     "icon" => "miva",
3424     "title" => "Miva",
3425     "rule" => array(
3426     "AlgoFeedback@miva\.com" => ""
3427     ),
3428     "uri" => "http://www.miva.com/"
3429     ),
3430     "mj12" => array(
3431     "icon" => "mj12",
3432     "title" => "Majestic-12",
3433     "rule" => array(
3434     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3435     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3436     ),
3437     "uri" => "http://majestic12.co.uk/bot.php"
3438     ),
3439     "mlbot" => array(
3440     "icon" => "robot",
3441     "title" => "MLBot",
3442     "rule" => array(
3443     "^MLBot" => ""
3444     ),
3445     "uri" => "http://www.metadatalabs.com/mlbot"
3446     ),
3447     "mnogo" => array(
3448     "icon" => "mnogo",
3449     "title" => "mnoGoSearch",
3450     "rule" => array(
3451     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3452     ),
3453     "uri" => "http://www.mnogosearch.org/"
3454     ),
3455     "mobileok" => array(
3456     "icon" => "mobileok",
3457     "title" => "W3C mobileOK",
3458     "rule" => array(
3459     "^W3C-mobileOK" => ""
3460     ),
3461     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3462     ),
3463 matthys 296 "mojeek" => array(
3464     "icon" => "mojeek",
3465     "title" => "Mojeek",
3466 joku 63 "rule" => array(
3467     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3468     ),
3469 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3470 joku 63 ),
3471     "momspider" => array(
3472     "icon" => "robot",
3473     "title" => "MOM Spider",
3474     "rule" => array(
3475     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3476     ),
3477     "uri" => ""
3478     ),
3479     "moreover" => array(
3480     "icon" => "moreover",
3481     "title" => "Moreover",
3482     "rule" => array(
3483     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3484     ),
3485     "uri" => ""
3486     ),
3487     "movabletype" => array(
3488     "icon" => "movabletype",
3489     "title" => "Movable Type",
3490     "rule" => array(
3491     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3492     ),
3493     "uri" => ""
3494     ),
3495     "mozdex" => array(
3496     "icon" => "mozdex",
3497     "title" => "MozDex",
3498     "rule" => array(
3499     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3500     ),
3501     "uri" => ""
3502     ),
3503     "mqbot" => array(
3504     "icon" => "robot",
3505     "title" => "MQbot",
3506     "rule" => array(
3507     "MQbot" => ""
3508     ),
3509     "uri" => ""
3510     ),
3511     "msnbot" => array(
3512     "icon" => "bing",
3513 matthys 205 "title" => "Bing",
3514 joku 63 "rule" => array(
3515     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3516     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3517     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3518     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3519     ),
3520     "uri" => ""
3521     ),
3522     "msnbot-mobile" => array(
3523     "icon" => "msn",
3524     "title" => "MSN Mobile",
3525     "rule" => array(
3526     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3527     "MSNBOT_Mobile" => "",
3528     "MSMOBOT" => ""
3529     ),
3530     "uri" => ""
3531     ),
3532     "mslivebot" => array(
3533     "icon" => "livesearch",
3534     "title" => "MS Live Search",
3535     "rule" => array(
3536     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3537     ),
3538     "uri" => ""
3539     ),
3540     "msproxy" => array(
3541     "icon" => "robot",
3542     "title" => "MSProxy",
3543     "rule" => array(
3544     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3545     ),
3546     "uri" => ""
3547     ),
3548     "msrbot" => array(
3549     "icon" => "robot",
3550     "title" => "MSRBOT",
3551     "rule" => array(
3552     "^MSRBOT" => ""
3553     ),
3554     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3555     ),
3556     "mswebdav" => array(
3557     "icon" => "robot",
3558     "title" => "MS-WebDAV",
3559     "rule" => array(
3560     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3561     ),
3562     "uri" => ""
3563     ),
3564     "mticon" => array(
3565     "icon" => "robot",
3566     "title" => "MTIcon",
3567     "rule" => array(
3568     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3569     ),
3570     "uri" => ""
3571     ),
3572     "multipage-validator" => array(
3573     "icon" => "multipage-validator",
3574     "title" => "Multipage Validator",
3575     "rule" => array(
3576     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3577     ),
3578     "uri" => "http://www.validator.ca/"
3579     ),
3580     "myrss" => array(
3581     "icon" => "rss",
3582     "title" => "MyRSS",
3583     "rule" => array(
3584     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3585     ),
3586     "uri" => ""
3587     ),
3588     "multimap" => array(
3589     "icon" => "robot",
3590     "title" => "Multimap",
3591     "rule" => array(
3592     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3593     ),
3594     "uri" => ""
3595     ),
3596     "najdi" => array(
3597     "icon" => "najdi",
3598     "title" => "Najdi.si",
3599     "rule" => array(
3600     "Najdi.si" => ""
3601     ),
3602     "uri" => "http://www.najdi.si"
3603     ),
3604     "nameprotect" => array(
3605     "icon" => "nameprotect",
3606     "title" => "Name Protect",
3607     "rule" => array(
3608     "NPBot" => ""
3609     ),
3610     "uri" => ""
3611     ),
3612     "nationaldirectory" => array(
3613     "icon" => "robot",
3614     "title" => "National Directory",
3615     "rule" => array(
3616     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3617     ),
3618     "uri" => ""
3619     ),
3620     "natsumican" => array(
3621     "icon" => "robot",
3622     "title" => "Natsu Mican",
3623     "rule" => array(
3624     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3625     ),
3626     "uri" => ""
3627     ),
3628     "naverbot" => array(
3629     "icon" => "naverbot",
3630     "title" => "Naver",
3631     "rule" => array(
3632     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3633     "Naver(Bot)?" => "",
3634     "^nabot" => ""
3635     ),
3636     "uri" => ""
3637     ),
3638     "navisso" => array(
3639     "icon" => "navisso",
3640     "title" => "Navisso",
3641     "rule" => array(
3642     "Navisso(Bot)?" => ""
3643     ),
3644     "uri" => "http://www.navisso.com"
3645     ),
3646     "neofonie" => array(
3647     "icon" => "robot",
3648 matthys 205 "title" => "Neofonie",
3649 joku 63 "rule" => array(
3650     "www.neofonie.de" => ""
3651     ),
3652     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3653     ),
3654     "neomo" => array(
3655     "icon" => "robot",
3656     "title" => "Neomo",
3657     "rule" => array(
3658     "Francis[ /]([0-9.]{1,10})" => "\\1"
3659     ),
3660     "uri" => ""
3661     ),
3662     "nessus" => array(
3663     "icon" => "nessus",
3664     "title" => "Nessus",
3665     "rule" => array(
3666     "Nessus\)$" => ""
3667     ),
3668     "uri" => ""
3669     ),
3670 matthys 279 "nerdybot" => array(
3671 matthys 280 "icon" => "robot",
3672     "title" => "NerdyBot",
3673     "rule" => array(
3674     "NerdyBot" => ""
3675     ),
3676     "uri" => "http://nerdybot.com/"
3677 matthys 279 ),
3678 joku 63 "nerdbynature" => array(
3679     "icon" => "nerdbynature",
3680     "title" => "NerdByNature",
3681     "rule" => array(
3682     "NerdByNature.Bot" => ""
3683     ),
3684     "uri" => "http://www.nerdbynature.net/bot"
3685     ),
3686     "netants" => array(
3687     "icon" => "netants",
3688     "title" => "NetAnts",
3689     "rule" => array(
3690     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3691     ),
3692     "uri" => ""
3693     ),
3694     "netcraft" => array(
3695     "icon" => "netcraft",
3696     "title" => "Netcraft",
3697     "rule" => array(
3698     "netcraft" => ""
3699     ),
3700     "uri" => ""
3701     ),
3702     "netinfo" => array(
3703     "icon" => "netinfo",
3704     "title" => "Netinfo",
3705     "rule" => array(
3706     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3707     ),
3708     "uri" => "http://netinfo.bg/"
3709     ),
3710     "netluchs" => array(
3711     "icon" => "netluchs",
3712     "title" => "Netluchs",
3713     "rule" => array(
3714     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3715     ),
3716     "uri" => "http://www.netluchs.de/"
3717     ),
3718     "netmechanic" => array(
3719     "icon" => "netmechanic",
3720     "title" => "NetMechanic",
3721     "rule" => array(
3722     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3723     ),
3724     "uri" => ""
3725     ),
3726     "netnose" => array(
3727     "icon" => "netnose",
3728     "title" => "NetNose",
3729     "rule" => array(
3730     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3731     ),
3732     "uri" => ""
3733     ),
3734     "netoskop" => array(
3735     "icon" => "robot",
3736     "title" => "Netoskop",
3737     "rule" => array(
3738     "netoskop" => ""
3739     ),
3740     "uri" => ""
3741     ),
3742     "netpromoter" => array(
3743     "icon" => "netpromoter",
3744     "title" => "NetPromoter",
3745     "rule" => array(
3746     "NetPromoter Spider" => ""
3747     ),
3748     "uri" => "http://www.net-promoter.com/"
3749     ),
3750     "netprospector" => array(
3751     "icon" => "robot",
3752     "title" => "Netprospector",
3753     "rule" => array(
3754     "^netprospector" => ""
3755     )
3756     ),
3757     "netpumper" => array(
3758     "icon" => "robot",
3759     "title" => "Netpumper",
3760     "rule" => array(
3761     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3762     ),
3763     "uri" => ""
3764     ),
3765     "netscapeproxy" => array(
3766     "icon" => "netscape",
3767     "title" => "Netscape Proxy",
3768     "rule" => array(
3769     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3770     ),
3771     "uri" => ""
3772     ),
3773     "netspective" => array(
3774     "icon" => "robot",
3775     "title" => "NetSpective",
3776     "rule" => array(
3777     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3778     ),
3779     "uri" => ""
3780     ),
3781     "netvibes" => array( // entry layout: icon, display title, rule map (pattern => version back-reference), uri
3782     "icon" => "netvibes",
3783     "title" => "Netvibes", // stray leading space removed from the display title
3784     "rule" => array(
3785     "^Netvibes" => "" // pattern has no capture group, so there is no version to back-reference (was "\\1")
3786     ),
3787     "uri" => ""
3788     ),
3789     "newsfire" => array(
3790     "icon" => "newsfire",
3791     "title" => "NewsFire",
3792     "rule" => array(
3793     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3794     ),
3795     "uri" => ""
3796     ),
3797     "newsgator" => array(
3798     "icon" => "newsgator",
3799     "title" => "NewsGator",
3800     "rule" => array(
3801     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3802     ),
3803     "uri" => ""
3804     ),
3805     "newzcrawler" => array(
3806     "icon" => "newzcrawler",
3807     "title" => "NewzCrawler",
3808     "rule" => array(
3809     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3810     ),
3811     "uri" => ""
3812     ),
3813     "nextopia" => array( // entry for user agents starting with "NextopiaBOT"
3814     "icon" => "robot", // generic "robot" icon used by many entries; was copy-pasted from the newzcrawler entry
3815     "title" => "Nextopia", // was "NewzCrawler" (copy-paste from the preceding entry), which mislabelled this bot
3816     "rule" => array(
3817     "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1" // group 1 captures the version digits
3818     ),
3819     "uri" => ""
3820     ),
3821     "ngsearch" => array(
3822     "icon" => "ngsearch",
3823     "title" => "NG Search",
3824     "rule" => array(
3825     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3826     ),
3827     "uri" => ""
3828     ),
3829     "nimble" => array(
3830     "icon" => "robot",
3831     "title" => "Nimble",
3832     "rule" => array(
3833     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3834     ),
3835     "uri" => ""
3836     ),
3837     "nmap" => array(
3838     "icon" => "nmap",
3839     "title" => "Nmap",
3840     "rule" => array(
3841     "Nmap Scripting Engine" => ""
3842     ),
3843     "uri" => "http://nmap.org/book/nse.html"
3844     ),
3845     "nusearch" => array(
3846     "icon" => "robot",
3847     "title" => "NuSearch",
3848     "rule" => array(
3849     "^nuSearch" => ""
3850     ),
3851     "uri" => "http://www.nusearch.com/"
3852     ),
3853     "noago" => array(
3854     "icon" => "noago",
3855     "title" => "Noago",
3856     "rule" => array(
3857     "Noago Spider" => ""
3858     ),
3859     "uri" => "http://www.noago.com/"
3860     ),
3861     "noviforum" => array(
3862     "icon" => "noviforum",
3863     "title" => "Noviforum",
3864     "rule" => array(
3865     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3866     ),
3867     "uri" => ""
3868     ),
3869     "noxtrum" => array(
3870     "icon" => "noxtrum",
3871     "title" => "noXtrum",
3872     "rule" => array(
3873     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3874     ),
3875     "uri" => ""
3876     ),
3877     "noyona" => array(
3878     "icon" => "robot",
3879     "title" => "Noyona",
3880     "rule" => array(
3881     "noyona.([0-9._]{1,10})" => "\\1"
3882     ),
3883     "uri" => "http://noyona.com/"
3884     ),
3885     "nsauditor" => array(
3886     "icon" => "nsauditor",
3887     "title" => "Nsauditor",
3888     "rule" => array(
3889     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3890     ),
3891     "uri" => "http://www.nsauditor.com/"
3892     ),
3893     "obidosbot" => array(
3894     "icon" => "robot",
3895     "title" => "Bookwatch",
3896     "rule" => array(
3897     "obidos[ \-]?bot" => ""
3898     ),
3899     "uri" => ""
3900     ),
3901     "objectssearch" => array(
3902     "icon" => "robot",
3903     "title" => "Objects Search",
3904     "rule" => array(
3905     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3906     ),
3907     "uri" => ""
3908     ),
3909     "obot" => array(
3910 matthys 297 "icon" => "ibm",
3911     "title" => "IBM (ONLY) Crawler",
3912 joku 63 "rule" => array(
3913 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3914 joku 63 ),
3915 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3916     // Formerly from "ONLY Solutions GmbH" – that is what the "O" stands for
3917 joku 63 ),
3918     "ocawa" => array(
3919     "icon" => "ocawa",
3920     "title" => "Ocawa",
3921     "rule" => array(
3922     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3923     "Ocawa" => ""
3924     ),
3925     "uri" => "http://www.ocawa.com/"
3926     ),
3927     "octora" => array(
3928     "icon" => "octora",
3929     "title" => "Octora",
3930     "rule" => array(
3931     "^Octora (Beta)?" => ""
3932     ),
3933     "uri" => "http://www.octora.com/"
3934     ),
3935     "offlineexplorer" => array(
3936     "icon" => "robot",
3937     "title" => "OfflineExplorer",
3938     "rule" => array(
3939     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3940     ),
3941     "uri" => ""
3942     ),
3943     "omea" => array(
3944     "icon" => "omea",
3945     "title" => "Omea Reader",
3946     "rule" => array(
3947     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3948     ),
3949     "uri" => ""
3950     ),
3951     "onet" => array(
3952     "icon" => "onet",
3953     "title" => "Onet",
3954     "rule" => array(
3955     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3956     "Onet\.pl" => "",
3957     "inktomi.search.onet" => ""
3958     ),
3959     "uri" => "http://www.onet.pl"
3960     ),
3961     "online24" => array(
3962     "icon" => "robot",
3963 matthys 209 "title" => "Online24",
3964 joku 63 "rule" => array(
3965     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3966     ),
3967     "uri" => "http://www.online24.de"
3968     ),
3969     "onlinewebcheck" => array(
3970     "icon" => "csehtmlvalidator",
3971     "title" => "CSE HTML Validator",
3972     "rule" => array(
3973     "onlinewebcheck" => ""
3974     ),
3975     "uri" => "http://www.onlinewebcheck.com"
3976     ),
3977     "onsearch" => array(
3978     "icon" => "onsearch",
3979 matthys 209 "title" => "OnSearch",
3980 joku 63 "rule" => array(
3981     "^onCHECK-Robot" => ""
3982     ),
3983     "uri" => "http://www.onsearch.de"
3984     ),
3985     "onto" => array(
3986     "icon" => "robot",
3987     "title" => "OntoSpider",
3988     "rule" => array(
3989     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
3990     ),
3991     "uri" => "http://ontospider.i-n.info/"
3992     ),
3993     "openacoon" => array(
3994     "icon" => "robot",
3995     "title" => "OpenAcoon",
3996     "rule" => array(
3997     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
3998     ),
3999     "uri" => "http://www.openacoon.de/"
4000     ),
4001     "openfind" => array(
4002     "icon" => "openfind",
4003     "title" => "Openfind",
4004     "rule" => array(
4005     "openbot[ /]([0-9.]{1,10})" => "\\1",
4006     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4007     ),
4008     "uri" => ""
4009     ),
4010     "opentagger" => array(
4011     "icon" => "robot",
4012     "title" => "OpenTagger",
4013     "rule" => array(
4014     "^OpenTaggerBot" => ""
4015     ),
4016     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4017     ),
4018     "opentext" => array(
4019     "icon" => "opentext",
4020     "title" => "OpenText",
4021     "rule" => array(
4022     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4023     ),
4024     "uri" => "http://www.opentext.net/"
4025     ),
4026     "openweb" => array(
4027     "icon" => "robot",
4028     "title" => "OpenWebSpider",
4029     "rule" => array(
4030     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4031     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4032     ),
4033     "uri" => "http://www.openwebspider.org"
4034     ),
4035     "openx" => array(
4036     "icon" => "openx",
4037     "title" => "OpenX Spider",
4038     "rule" => array(
4039     "OpenX" => ""
4040     ),
4041     "uri" => "http://www.openx.org"
4042     ),
4043     "orange" => array(
4044     "icon" => "orange",
4045     "title" => "Orange",
4046     "rule" => array(
4047 joku 338 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4048     "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4049 joku 63 ),
4050     "uri" => "http://orange.com/"
4051     ),
4052     "organica" => array(
4053     "icon" => "robot",
4054     "title" => "Organica",
4055     "rule" => array(
4056     "crawler@organica\.us" => ""
4057     ),
4058     "uri" => ""
4059     ),
4060     "outfox" => array(
4061     "icon" => "robot",
4062     "title" => "Outfox Melon",
4063     "rule" => array(
4064     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4065     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4066     ),
4067     "uri" => ""
4068     ),
4069     "overture" => array(
4070     "icon" => "overture",
4071     "title" => "Overture",
4072     "rule" => array(
4073     "Overture[ \-]?WebCrawler" => ""
4074     ),
4075     "uri" => ""
4076     ),
4077 joku 337 "owler" => array(
4078     "icon" => "robot",
4079     "title" => "Owler",
4080     "rule" => array(
4081     "Owler[ /]([0-9.]{1,10})" => "\\1",
4082     "Owler" => ""
4083     ),
4084     "uri" => ""
4085     ),
4086 joku 63 "page2rss" => array(
4087     "icon" => "page2rss",
4088     "title" => "Page2RSS",
4089     "rule" => array(
4090     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4091     ),
4092     "uri" => "http://page2rss.com"
4093     ),
4094     "pagebytes" => array(
4095     "icon" => "robot",
4096     "title" => "PageBites",
4097     "rule" => array(
4098     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4099     ),
4100     "uri" => ""
4101     ),
4102 matthys 282 "pagesinventory" => array(
4103     "icon" => "pagesinventory",
4104     "title" => "PagesInventory",
4105     "rule" => array(
4106     "^PagesInventory" => ""
4107     ),
4108     "uri" => "http://www.pagesinventory.com"
4109     ),
4110 joku 63 "pagesjaunes" => array(
4111     "icon" => "pagesjaunes",
4112     "title" => "Pages Jaunes",
4113     "rule" => array(
4114     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4115     ),
4116     "uri" => "http://www.pagesjaunes.fr/"
4117     ),
4118     "pagevalet" => array(
4119     "icon" => "wdg",
4120     "title" => "WDG Page Valet",
4121     "rule" => array(
4122     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4123     ),
4124     "uri" => "http://www.htmlhelp.com/tools/validator/"
4125     ),
4126     "panopeabot" => array(
4127     "icon" => "robot",
4128     "title" => "PanopeaBot",
4129     "rule" => array(
4130     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4131     ),
4132     "uri" => ""
4133     ),
4134     "parchmenthill" => array(
4135     "icon" => "robot",
4136     "title" => "Parchment Hill",
4137     "rule" => array(
4138     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4139     ),
4140     "uri" => "http://www.parchmenthill.com/search.htm"
4141     ),
4142     "pascient" => array( // array key and icon name keep their historical spelling so existing references still resolve
4143     "icon" => "pascient",
4144     "title" => "Panscient", // display title corrected to match the rule and uri below (was "Pascient")
4145     "rule" => array(
4146     "panscient.com" => "" // no version capture
4147     ),
4148     "uri" => "http://www.panscient.com/"
4149     ),
4150     "peerbot" => array(
4151     "icon" => "peerbot",
4152     "title" => "Peerbot",
4153     "rule" => array(
4154     "^PEERbot" => ""
4155     ),
4156     "uri" => ""
4157     ),
4158     "php" => array(
4159     "icon" => "php",
4160     "title" => "PHP",
4161     "rule" => array(
4162     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4163     ),
4164     "uri" => ""
4165     ),
4166     "phpcrawl" => array(
4167     "icon" => "robot",
4168     "title" => "PHPCrawl",
4169     "rule" => array(
4170     "^PHPCrawl" => ""
4171     ),
4172     "uri" => "http://phpcrawl.cuab.de/"
4173     ),
4174     "phpdig" => array(
4175     "icon" => "robot",
4176     "title" => "PhpDig",
4177     "rule" => array(
4178     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4179     ),
4180     "uri" => "http://www.finbot.com/"
4181     ),
4182     "phpversiontracker" => array(
4183     "icon" => "phpversiontracker",
4184     "title" => "PHP version tracker",
4185     "rule" => array(
4186     "^PHP version tracker" => ""
4187     ),
4188     "uri" => "http://www.nexen.net/phpversion/bot.php"
4189     ),
4190     "pictureofinternet" => array( // entry for user agents starting with "PictureOfInternet"
4191     "icon" => "robot",
4192     "title" => "PictureOfInternet",
4193     "rule" => array(
4194     "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // reference the captured version, as the other versioned rules do (was "", which discarded it)
4195     ),
4196     "uri" => ""
4197     ),
4198     "pingdom" => array(
4199     "icon" => "pingdom",
4200     "title" => "Pingdom",
4201     "rule" => array(
4202     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4203     "^Pingdom" => ""
4204     ),
4205     "uri" => "http://www.pingdom.com/"
4206     ),
4207     "pinseri" => array(
4208     "icon" => "pinseri",
4209     "title" => "Pinseri",
4210     "rule" => array(
4211     "www\.pinseri\.com/bloglist" => ""
4212     ),
4213     "uri" => ""
4214     ),
4215     "plagger" => array(
4216     "icon" => "plagger",
4217     "title" => "Plagger",
4218     "rule" => array(
4219     "Plagger[ /]([0-9.]{1,10})" => "\\1"
4220     ),
4221     "uri" => "http://www.plugger.org"
4222     ),
4223     "planet" => array(
4224     "icon" => "planet",
4225     "title" => "Planet",
4226     "rule" => array(
4227     "Planet[ /]([0-9.]{1,10})" => "\\1"
4228     ),
4229     "uri" => ""
4230     ),
4231     "plantynet" => array(
4232     "icon" => "robot",
4233     "title" => "PlantyNet",
4234     "rule" => array(
4235     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4236     ),
4237     "uri" => ""
4238     ),
4239     "pluck" => array(
4240     "icon" => "pluck",
4241     "title" => "Pluck",
4242     "rule" => array(
4243     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4244     ),
4245     "uri" => ""
4246     ),
4247     "plsearch" => array(
4248     "icon" => "plsearch",
4249     "title" => "PlanetSearch",
4250     "rule" => array(
4251     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4252     ),
4253     "uri" => ""
4254     ),
4255     "poe" => array(
4256     "icon" => "robot",
4257     "title" => "POE-Component",
4258     "rule" => array(
4259     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4260     ),
4261     "uri" => ""
4262     ),
4263     "pogodak" => array(
4264     "icon" => "pogodak",
4265     "title" => "Pogodak",
4266     "rule" => array(
4267     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4268     ),
4269     "uri" => ""
4270     ),
4271     "poodle" => array( // entry for "Poodle predictor" / "Pooodle predictor" user agents
4272     "icon" => "robot",
4273     "title" => "Poodle predictor",
4274     "rule" => array(
4275     "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is the (oo|ooo) spelling alternation; the version digits are group 2 (was "\\1")
4276     "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no version follows the name
4277     ),
4278     "uri" => "http://www.gritechnologies.com/tools/spider.go"
4279     ),
4280     "pompos" => array(
4281     "icon" => "pompos",
4282     "title" => "Pompos",
4283     "rule" => array(
4284     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4285     ),
4286     "uri" => ""
4287     ),
4288     "popdex" => array(
4289     "icon" => "robot",
4290     "title" => "Popdexter",
4291     "rule" => array(
4292     "Popdexter" => ""
4293     ),
4294     "uri" => ""
4295     ),
4296     "postrank" => array(
4297     "icon" => "postrank",
4298     "title" => "PostRank",
4299     "rule" => array(
4300     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4301     ),
4302     "uri" => "http://www.postrank.com/"
4303     ),
4304     "powermarks" => array(
4305     "icon" => "robot",
4306     "title" => "Powermarks",
4307     "rule" => array(
4308     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4309     ),
4310     "uri" => ""
4311     ),
4312 matthys 366 "pinterest" => array( // entry for user agents containing "Pinterest/<version>"
4313     "icon" => "pinterest",
4314 joku 63 "title" => "Pinterest", // was "PROBE!", left over from the "probe" entry this one was derived from
4315     "rule" => array(
4316 matthys 366 "Pinterest[ /]([0-9.]{1,10})" => "\\1" // group 1 captures the version digits
4317 joku 63 ),
4318 matthys 366 "uri" => "http://www.pinterest.com/"
4319 joku 63 ),
4320 matthys 366 "probe" => array(
4321     "icon" => "robot",
4322     "title" => "PROBE!",
4323     "rule" => array(
4324     "^PROBE!" => ""
4325     ),
4326     "uri" => ""
4327     ),
4328 joku 63 "projecthoneypot" => array(
4329     "icon" => "projecthoneypot",
4330     "title" => "Project Honeypot",
4331     "rule" => array(
4332     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4333     "projecthoneypot" => ""
4334     ),
4335     "uri" => "http://www.projecthoneypot.org"
4336     ),
4337     "proxycache" => array(
4338     "icon" => "robot",
4339     "title" => "Proxy Cache",
4340     "rule" => array(
4341     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4342     ),
4343     "uri" => ""
4344     ),
4345     "proxyhunter" => array(
4346     "icon" => "robot",
4347     "title" => "ProxyHunter",
4348     "rule" => array(
4349     "ProxyHunter" => ""
4350     ),
4351     "uri" => ""
4352     ),
4353     "psbot" => array(
4354     "icon" => "picsearch",
4355     "title" => "PicSearch",
4356     "rule" => array(
4357     "^psbot" => ""
4358     ),
4359     "uri" => ""
4360     ),
4361     "pubsub" => array(
4362     "icon" => "pubsub",
4363     "title" => "PubSub",
4364     "rule" => array(
4365     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4366     "^PubSub\.com" => ""
4367     ),
4368     "uri" => ""
4369     ),
4370 joku 330 "pubarch" => array(
4371 joku 334 "icon" => "robot",
4372 joku 330 "title" => "PubArchive",
4373     "rule" => array(
4374     "publiclibraryarchive.org" => ""
4375     ),
4376     "uri" => ""
4377     ),
4378 joku 63 "pukiwiki" => array(
4379     "icon" => "pukiwiki",
4380     "title" => "PukiWiki",
4381     "rule" => array(
4382     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4383     ),
4384     "uri" => ""
4385     ),
4386     "pwebotxy" => array(
4387     "icon" => "pwebotxy",
4388     "title" => "PWeBot/X.Y",
4389     "rule" => array(
4390     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4391     ),
4392     "uri" => "http://www.programacionweb.net/robot.php"
4393     ),
4394     "pxys" => array(
4395     "icon" => "robot",
4396     "title" => "PXYS",
4397     "rule" => array(
4398     "^pxys" => ""
4399     ),
4400     "uri" => ""
4401     ),
4402     "qango" => array(
4403     "icon" => "qango",
4404     "title" => "Qango",
4405     "rule" => array(
4406     "^Qango.com" => ""
4407     ),
4408     "uri" => "http://www.quango.com/"
4409     ),
4410     "qihoo" => array(
4411     "icon" => "qihoo",
4412     "title" => "Qihoo",
4413     "rule" => array(
4414     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4415     ),
4416     "uri" => "http://www.qihoo.com/"
4417     ),
4418     "qseero" => array(
4419     "icon" => "robot",
4420     "title" => "Qseero",
4421     "rule" => array(
4422     "Qseero v([0-9.]{1,10})" => "\\1"
4423     ),
4424     "uri" => "http://www.q0.com/"
4425     ),
4426     "quantcast" => array(
4427     "icon" => "robot",
4428     "title" => "Quantcast",
4429     "rule" => array(
4430     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4431     ),
4432     "uri" => "http://www.quantcast.com/"
4433     ),
4434     "quepasa" => array(
4435     "icon" => "quepasa",
4436     "title" => "Quepasa",
4437     "rule" => array(
4438     "Quepasa[ \-]?Creep" => ""
4439     ),
4440     "uri" => ""
4441     ),
4442     "questfinder" => array(
4443     "icon" => "robot",
4444     "title" => "QuestFinder",
4445     "rule" => array(
4446     "www\.questfinder\.com" => ""
4447     ),
4448     "uri" => ""
4449     ),
4450 matthys 351 "qwantify" => array(
4451     "icon" => "qwantify",
4452     "title" => "Qwantify",
4453     "rule" => array(
4454     "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4455     ),
4456     "uri" => "https://www.qwant.com/"
4457     ),
4458 joku 63 "qweery" => array(
4459     "icon" => "robot",
4460     "title" => "Qweery",
4461     "rule" => array(
4462     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4463     ),
4464     "uri" => "http://qweerybot.qweery.nl"
4465     ),
4466     "racaicrawler" => array(
4467     "icon" => "robot",
4468     "title" => "RacaiCrawler",
4469     "rule" => array(
4470     "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
4471     )
4472     ),
4473     "radian6" => array(
4474     "icon" => "robot",
4475     "title" => "Radian6",
4476     "rule" => array(
4477     "www\.radian6\.com" => ""
4478     ),
4479     "uri" => "http://www.radian6.com"
4480     ),
4481 joku 375 "radiofx" => array( // entry for user agents containing "Radio.fx"
4482     "icon" => "radiofx",
4483     "title" => "Radio.fx",
4484     "rule" => array(
4485     "Radio.fx" => "" // no version capture
4486     ),
4487     "uri" => "https://de.tobit.software" // TLD typo fixed (was ".softwarw")
4488     ),
4489 joku 63 "rambler" => array(
4490     "icon" => "rambler",
4491     "title" => "Rambler",
4492     "rule" => array(
4493     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4494     ),
4495     "uri" => ""
4496     ),
4497     "ramiba" => array( // entry for user agents starting with "ramiba" or "ramiba-bot"
4498     "icon" => "robot",
4499 matthys 209 "title" => "Ramiba",
4500 joku 63 "rule" => array(
4501     "^ramiba(-bot)?" => "" // group 1 is only the optional "-bot" name suffix, not a version, so nothing is back-referenced (was "\\1")
4502     ),
4503     "uri" => ""
4504     ),
4505     "rankur" => array(
4506     "icon" => "rankur",
4507     "title" => "Rankur",
4508     "rule" => array(
4509     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4510     ),
4511     "uri" => "http://rankur.com/",
4512     ),
4513 joku 261 "red" => array(
4514     "icon" => "red",
4515     "title" => "RED",
4516     "rule" => array(
4517     "RED[ /]([0-9.]{1,10})" => "\\1"
4518     ),
4519     "uri" => "http://redbot.org/"
4520 joku 181 ),
4521 joku 63 "rediff" => array(
4522     "icon" => "rediff",
4523 matthys 209 "title" => "Rediff",
4524 joku 63 "rule" => array(
4525     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4526     ),
4527     "uri" => "http://www.rediff.com",
4528     ),
4529     "repia" => array(
4530     "icon" => "robot",
4531     "title" => "Repia",
4532     "rule" => array(
4533     "webmaster@repia\.com" => ""
4534     ),
4535     "uri" => ""
4536     ),
4537     "robotgenius" => array(
4538     "icon" => "robot",
4539     "title" => "Robot Genius",
4540     "rule" => array(
4541     "^robotgenius" => ""
4542     ),
4543     "uri" => "http://robotgenius.net",
4544     ),
4545     "robozilla" => array(
4546     "icon" => "robot",
4547     "title" => "Robozilla",
4548     "rule" => array(
4549     "Robozilla" => ""
4550     ),
4551     "uri" => ""
4552     ),
4553 matthys 302 "rogerbot" => array(
4554 matthys 306 "icon" => "moz",
4555     "title" => "Moz Rogerbot",
4556 matthys 302 "rule" => array(
4557     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4558     ),
4559     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4560     ),
4561 joku 63 "rojo" => array(
4562     "icon" => "rojo",
4563     "title" => "Rojo",
4564     "rule" => array(
4565     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4566     ),
4567     "uri" => ""
4568     ),
4569     "rss-atom" => array(
4570     "icon" => "rss",
4571     "title" => "RSS / Atom",
4572     "rule" => array(
4573     "^Apple-PubSub" => "",
4574     "^AppleSyndication" => ""
4575     ),
4576     "uri" => ""
4577     ),
4578     "rssbot" => array(
4579     "icon" => "rss",
4580 matthys 209 "title" => "RSS-bot",
4581 joku 63 "rule" => array(
4582     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4583     ),
4584     "uri" => ""
4585     ),
4586     "rssbandit" => array(
4587     "icon" => "rssbandit",
4588     "title" => "RssBandit",
4589     "rule" => array(
4590     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4591     ),
4592     "uri" => ""
4593     ),
4594     "rssimages" => array(
4595     "icon" => "rss",
4596 matthys 209 "title" => "RssImages",
4597 joku 63 "rule" => array(
4598     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4599     ),
4600     "uri" => ""
4601     ),
4602     "rssmicro" => array(
4603     "icon" => "rssmicro",
4604     "title" => "RSSMicro",
4605     "rule" => array(
4606     "RSSMicro\.com" => ""
4607     ),
4608     "uri" => "http://www.rssmicro.com"
4609     ),
4610     "rssowl" => array(
4611     "icon" => "rssowl",
4612     "title" => "RSSOwl",
4613     "rule" => array(
4614     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4615     ),
4616     "uri" => ""
4617     ),
// RssReader: the rule captures the dotted version number that follows the
// "RssReader" token (separated by a space or a slash), so the note template
// has to reference that capture group instead of being empty.
// NOTE(review): assumes the consumer expands the rule's value as a
// back-reference template for the matched pattern - confirm against the caller.
"rssreader" => array(
  "icon" => "rss",
  "title" => "RssReader",
  "rule" => array(
    "RssReader[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4626     "rtgi" => array(
4627     "icon" => "rtgi",
4628 matthys 209 "title" => "Rtgi",
4629 joku 63 "rule" => array(
4630     "RTGI" => ""
4631     ),
4632     "uri" => "http://rtgi.fr/"
4633     ),
4634     "rufusbot" => array(
4635     "icon" => "robot",
4636     "title" => "RufusBot",
4637     "rule" => array(
4638     "RufusBot" => ""
4639     ),
4640     "uri" => ""
4641     ),
4642 matthys 304 "runet" => array(
4643     "icon" => "runet",
4644     "title" => "iTrack RuNet Crawler",
4645     "rule" => array(
4646     "Runet-Research-Crawler" => ""
4647     ),
4648     "uri" => "http://www.itrack.ru/research/cmsrate/"
4649     ),
4650 joku 63 "runnk" => array(
4651     "icon" => "robot",
4652     "title" => "Runnk",
4653     "rule" => array(
4654     "Runnk RSS finder" => ""
4655     ),
4656     "uri" => "http://www.runnk.com/il/law"
4657     ),
4658     "sagool" => array(
4659     "icon" => "robot",
4660     "title" => "Sagool",
4661     "rule" => array(
4662     "MaSagool" => ""
4663     ),
4664     "uri" => "http://sagool.jp/"
4665     ),
4666     "sanszbot" => array(
4667     "icon" => "robot",
4668     "title" => "Sansz",
4669     "rule" => array(
4670     "SanszBot" => ""
4671     ),
4672     "uri" => ""
4673     ),
4674     "saucereader" => array(
4675     "icon" => "saucereader",
4676     "title" => "Sauce Reader",
4677     "rule" => array(
4678     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4679     ),
4680     "uri" => ""
4681     ),
4682     "sbider" => array(
4683     "icon" => "sbider",
4684     "title" => "SBIder",
4685     "rule" => array(
4686     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4687     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4688     ),
4689     "uri" => ""
4690     ),
4691     "scirus" => array(
4692     "icon" => "robot",
4693     "title" => "Scirus",
4694     "rule" => array(
4695     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4696     ),
4697     "uri" => ""
4698     ),
4699     "scoutjet" => array(
4700     "icon" => "scoutjet",
4701     "title" => "ScoutJet",
4702     "rule" => array(
4703     "ScoutJet" => ""
4704     ),
4705     "uri" => "http://www.scoutjet.com/"
4706     ),
4707 joku 261 "scrapy" => array(
4708     "icon" => "scrapy",
4709     "title" => "Scrapy",
4710     "rule" => array(
4711     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4712     ),
4713     "uri" => "http://scrapy.org"
4714     ),
4715 joku 63 "scrubby" => array(
4716     "icon" => "scrubby",
4717     "title" => "Scrubby",
4718     "rule" => array(
4719     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4720     ),
4721     "uri" => ""
4722     ),
4723     "sdm" => array(
4724     "icon" => "sdm",
4725     "title" => "SUN Download Manager",
4726     "rule" => array(
4727     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4728     ),
4729     "uri" => ""
4730     ),
4731     "sealinks" => array(
4732     "icon" => "robot",
4733     "title" => "Sea Links",
4734     "rule" => array(
4735     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4736     ),
4737     "uri" => ""
4738     ),
4739     "search17" => array(
4740     "icon" => "robot",
4741     "title" => "Search 17",
4742     "rule" => array(
4743     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4744     ),
4745     "uri" => "http://www.search17.com/bot.php"
4746     ),
4747     "search2" => array(
4748     "icon" => "search2",
4749     "title" => "Search2.net",
4750     "rule" => array(
4751     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4752     ),
4753     "uri" => "http://search2.net/"
4754     ),
4755     "searchbot" => array(
4756     "icon" => "robot",
4757     "title" => "Searchbot",
4758     "rule" => array(
4759     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4760     ),
4761     "uri" => ""
4762     ),
4763     "searchch" => array(
4764     "icon" => "robot",
4765     "title" => "Search.ch",
4766     "rule" => array(
4767     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4768     ),
4769     "uri" => ""
4770     ),
4771     "searchengineworld" => array(
4772     "icon" => "robot",
4773     "title" => "SearchEngineWorld",
4774     "rule" => array(
4775     "searchengineworld" => ""
4776     ),
4777     "uri" => "http://www.searchengineworld.com/"
4778     ),
4779     "searchhippo" => array(
4780     "icon" => "searchhippo",
4781     "title" => "Searchhippo",
4782     "rule" => array(
4783     "searchhippo" => ""
4784     ),
4785     "uri" => "http://www.searchhippo.com/"
4786     ),
4787     "searchthruus" => array(
4788     "icon" => "robot",
4789     "title" => "SearchThruUs",
4790     "rule" => array(
4791     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4792     ),
4793     "uri" => ""
4794     ),
4795     "securecomputing" => array(
4796     "icon" => "robot",
4797     "title" => "Secure Computing",
4798     "rule" => array(
4799     "securecomputing" => ""
4800     ),
4801     "uri" => ""
4802     ),
4803     "seekport" => array(
4804     "icon" => "seekport",
4805     "title" => "Seekport",
4806     "rule" => array(
4807     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4808     ),
4809     "uri" => ""
4810     ),
4811     "semanticdiscovery" => array(
4812     "icon" => "robot",
4813     "title" => "Semantic Discovery",
4814     "rule" => array(
4815     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4816     ),
4817     "uri" => ""
4818     ),
4819 matthys 319 "semrush" => array(
4820     "icon" => "semrush",
4821     "title" => "SEMrush",
4822     "rule" => array(
4823     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4824     ),
4825     "uri" => "http://www.semrush.com/bot.html"
4826     ),
4827 joku 63 "sengine" => array(
4828     "icon" => "sengine",
4829     "title" => "Sengine",
4830     "rule" => array(
4831     "netEstate NE Crawler" => ""
4832     ),
4833     "uri" => "http://www.sengine.info/"
4834     ),
4835     "sensis" => array(
4836     "icon" => "sensis",
4837     "title" => "Sensis",
4838     "rule" => array(
4839     "^Sensis(.com.au)? Web Crawler" => ""
4840     ),
4841     "uri" => "http://sensis.com.au"
4842     ),
4843     "seokicks" => array(
4844     "icon" => "seokicks",
4845     "title" => "SEOkicks",
4846     "rule" => array(
4847     "SEOkicks-Robot" => ""
4848     ),
4849     "uri" => "http://www.seokicks.de/"
4850     ),
4851     "seoprofiler" => array(
4852     "icon" => "seoprofiler",
4853     "title" => "SEOprofiler",
4854     "rule" => array(
4855     "spbot[ /]([0-9.]{1,10})" => "\\1"
4856     ),
4857     "uri" => "http://www.seoprofiler.com/"
4858     ),
4859     "setooz" => array(
4860     "icon" => "setooz",
4861     "title" => "Setooz",
4862     "rule" => array(
4863     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4864     ),
4865     "uri" => "http://www.setooz.com/oozbot.html"
4866     ),
4867     "seznam" => array(
4868     "icon" => "seznam",
4869     "title" => "Seznam",
4870     "rule" => array(
4871     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4872     "Seznam" => ""
4873     ),
4874     "uri" => "http://www.seznam.cz"
4875     ),
4876     "sharpreader" => array(
4877     "icon" => "sharpreader",
4878     "title" => "SharpReader",
4879     "rule" => array(
4880     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4881     ),
4882     "uri" => ""
4883     ),
// Shelob: matched when the user agent starts with "Shelob"; no version is
// extracted. The title is kept distinct from the separate "sherlockspider"
// entry so the two robots are not reported under the same display name.
// NOTE(review): display name chosen to match the key/icon - confirm.
"shelob" => array(
  "icon" => "shelob",
  "title" => "Shelob",
  "rule" => array(
    "^Shelob" => ""
  ),
  "uri" => "http://www.gmx.net"
),
4892     "sherlockspider" => array(
4893     "icon" => "robot",
4894     "title" => "Sherlock Spider",
4895     "rule" => array(
4896     "sherlock_spider" => ""
4897     ),
4898     "uri" => ""
4899     ),
4900     "shim" => array(
4901     "icon" => "robot",
4902     "title" => "Shim Crawler",
4903     "rule" => array(
4904     "shim[ \-]crawler" => ""
4905     ),
4906     "uri" => ""
4907     ),
4908     "shopwiki" => array(
4909     "icon" => "shopwiki",
4910     "title" => "ShopWiki",
4911     "rule" => array(
4912     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4913     ),
4914     "uri" => ""
4915     ),
4916     "shoula" => array(
4917     "icon" => "robot",
4918     "title" => "Shoula",
4919     "rule" => array(
4920     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4921     ),
4922     "uri" => "http://www.shoula.com"
4923     ),
4924     "siege" => array(
4925     "icon" => "robot",
4926     "title" => "Siege",
4927     "rule" => array(
4928     "Siege[ /]([0-9.]{1,10})" => "\\1"
4929     ),
4930     "uri" => ""
4931     ),
4932     "siets" => array(
4933     "icon" => "robot",
4934     "title" => "Siets",
4935     "rule" => array(
4936     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4937     ),
4938     "uri" => ""
4939     ),
4940     "simpy" => array(
4941     "icon" => "simpy",
4942     "title" => "Simpy",
4943     "rule" => array(
4944     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4945     ),
4946     "uri" => ""
4947     ),
4948     "singingfish" => array(
4949     "icon" => "singingfish",
4950     "title" => "SingingFish",
4951     "rule" => array(
4952     "asterias[ /]([0-9.]{1,10})" => "\\1",
4953     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4954     "asterias" => ""
4955     ),
4956     "uri" => ""
4957     ),
4958     "sirketce" => array(
4959     "icon" => "robot",
4960     "title" => "Sirketce",
4961     "rule" => array(
4962     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4963     ),
4964     "uri" => "http://www.sirketce.com/bot.html"
4965     ),
4966     "sirobot" => array(
4967     "icon" => "robot",
4968     "title" => "SiroBot",
4969     "rule" => array(
4970     "sirobot" => ""
4971     ),
4972     "uri" => ""
4973     ),
4974     "sistrix" => array(
4975     "icon" => "sistrix",
4976     "title" => "SISTRIX",
4977     "rule" => array(
4978     "SISTRIX Crawler" => ""
4979     ),
4980     "uri" => "http://crawler.sistrix.net/"
4981     ),
4982     "sitebar" => array(
4983     "icon" => "sitebar",
4984     "title" => "SiteBar",
4985     "rule" => array(
4986     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
4987     ),
4988     "uri" => ""
4989     ),
4990     "sitebot" => array(
4991     "icon" => "sitebot",
4992     "title" => "SiteBot",
4993     "rule" => array(
4994     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
4995     ),
4996     "uri" => "http://www.sitebot.org/robot/"
4997     ),
4998 matthys 273 "siteexplorer" => array(
4999     "icon" => "siteexplorer",
5000     "title" => "SiteExplorer",
5001     "rule" => array(
5002     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5003     ),
5004     "uri" => "http://siteexplorer.info/"
5005     ),
5006 joku 63 "sitesell" => array(
5007     "icon" => "sitesell",
5008     "title" => "SiteSell",
5009     "rule" => array(
5010     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
5011     ),
5012     "uri" => ""
5013     ),
5014     "sitespider" => array(
5015     "icon" => "robot",
5016     "title" => "SiteSpider",
5017     "rule" => array(
5018     "^SiteSpider" => ""
5019     ),
5020     "uri" => ""
5021     ),
5022     "sitesucker" => array(
5023     "icon" => "sitesucker",
5024     "title" => "SiteSucker",
5025     "rule" => array(
5026     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5027     ),
5028     "uri" => "http://www.sitesucker.us/"
5029     ),
5030     "sitidi" => array(
5031     "icon" => "robot",
5032     "title" => "SitiDi",
5033     "rule" => array(
5034     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5035     ),
5036     "uri" => ""
5037     ),
5038 joku 329 "sixy" => array(
5039     "icon" => "robot",
5040     "title" => "Sixy.ch",
5041     "rule" => array(
5042     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5043     ),
5044     "uri" => "http://sixy.ch"
5045     ),
5046 joku 63 "skaffe" => array(
5047     "icon" => "robot",
5048     "title" => "Skaffe",
5049     "rule" => array(
5050     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5051     ),
5052     "uri" => "http://www.skaffe.com"
5053     ),
5054     "skizzle" => array(
5055     "icon" => "skizzle",
5056     "title" => "Skizzle",
5057     "rule" => array(
5058     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5059     ),
5060     "uri" => "http://www.skizzle.com"
5061     ),
5062     "slider" => array(
5063     "icon" => "robot",
5064     "title" => "Slider",
5065     "rule" => array(
5066     "^Slider[ /]([0-9.]{1,10})" => "\\1"
5067     ),
5068     "uri" => ""
5069     ),
5070     "slugch" => array(
5071     "icon" => "robot",
5072 matthys 209 "title" => "Slugch",
5073 joku 63 "rule" => array(
5074     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5075     ),
5076     "uri" => ""
5077     ),
5078     "smartware" => array(
5079     "icon" => "robot",
5080     "title" => "SmartWareSoft",
5081     "rule" => array(
5082     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5083     ),
5084     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5085     ),
5086     "snookit" => array(
5087     "icon" => "snookit",
5088     "title" => "Snookit",
5089     "rule" => array(
5090     "^snookit" => ""
5091     ),
5092     "uri" => "http://www.snookit.com/"
5093     ),
// Snoopy: two rules, each capturing a dotted version number in group 1.
// The first rule skips any non-digit characters after the leading "Snoopy"
// token; a greedy ".+" in that position would swallow the version and leave
// only its last character for the capture group.
"snoopy" => array(
  "icon" => "robot",
  "title" => "Snoopy",
  "rule" => array(
    "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1",
    "sna-([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://snoopy.sourceforge.net/"
),
5103     "snyke" => array(
5104     "icon" => "robot",
5105     "title" => "Snyke",
5106     "rule" => array(
5107     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5108     ),
5109     "uri" => "http://www.snyke.com"
5110     ),
5111     "socialradar" => array(
5112     "icon" => "socialradar",
5113     "title" => "Social Radar",
5114     "rule" => array(
5115     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5116     ),
5117     "uri" => "http://infegy.com/"
5118     ),
5119     "soegning" => array(
5120     "icon" => "soegning",
5121 matthys 209 "title" => "Søgning",
5122 joku 63 "rule" => array(
5123     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5124     ),
5125     "uri" => ""
5126     ),
5127     "soft411" => array(
5128     "icon" => "soft411",
5129     "title" => "Soft411",
5130     "rule" => array(
5131     "SOFT411 Directory" => ""
5132     ),
5133     "uri" => ""
5134     ),
5135     "sogou" => array(
5136     "icon" => "sogou",
5137     "title" => "Sogou",
5138     "rule" => array(
5139     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5140     ),
5141     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5142     ),
5143     "sohu" => array(
5144     "icon" => "robot",
5145     "title" => "Sohu",
5146     "rule" => array(
5147     "sohu[ \-](agent|search)" => ""
5148     ),
5149     "uri" => ""
5150     ),
// Somewhere.com: matched on the literal "Mozilla@somewhere.com" token.
// The pattern has no capture group, so the note template is empty rather
// than a back-reference to a group that does not exist.
"somewhere" => array(
  "icon" => "robot",
  "title" => "Somewhere.com",
  "rule" => array(
    "Mozilla\@somewhere\.com" => ""
  ),
  "uri" => "http://www.somewhere.com/"
),
5159     "sopheus" => array(
5160     "icon" => "robot",
5161     "title" => "Sopheus",
5162     "rule" => array(
5163     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5164     ),
5165     "uri" => "http://www.thenetplanet.com"
5166     ),
5167     "soso" => array(
5168     "icon" => "soso",
5169     "title" => "Soso",
5170     "rule" => array(
5171     "^Soso(image)?spider" => ""
5172     ),
5173     "uri" => "http://help.soso.com/soso-image-spider.htm"
5174     ),
5175     "souppot" => array(
5176     "icon" => "robot",
5177     "title" => "SoupPot",
5178     "rule" => array(
5179     "SoupPotBot" => ""
5180     ),
5181     "uri" => ""
5182     ),
5183     "specificmedia" => array(
5184     "icon" => "specificmedia",
5185     "title" => "Specific Media",
5186     "rule" => array(
5187     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5188     ),
5189     "uri" => ""
5190     ),
5191     "sphider" => array(
5192     "icon" => "sphider",
5193     "title" => "Sphider",
5194     "rule" => array(
5195     "Sphider" => ""
5196     ),
5197     "uri" => "http://www.sphider.eu"
5198     ),
5199     "spinn3r" => array(
5200     "icon" => "robot",
5201     "title" => "Spinn3r",
5202     "rule" => array(
5203     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5204     ),
5205     "uri" => "http://spinn3r.com/robot"
5206     ),
5207     "sproose" => array(
5208     "icon" => "robot",
5209 matthys 209 "title" => "Sproose",
5210 joku 63 "rule" => array(
5211     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5212     ),
5213     "uri" => "http://www.sproose.com/bot.html"
5214     ),
5215     "spurlbot" => array(
5216     "icon" => "robot",
5217     "title" => "SpurlBot",
5218     "rule" => array(
5219     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5220     ),
5221     "uri" => ""
5222     ),
5223     "stardownloader" => array(
5224     "icon" => "stardownloader",
5225     "title" => "Star Downloader",
5226     "rule" => array(
5227     "^Star Downloader( Pro)?" => ""
5228     ),
5229     "uri" => ""
5230     ),
5231     "steeler" => array(
5232     "icon" => "robot",
5233     "title" => "Steeler",
5234     "rule" => array(
5235     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5236     ),
5237     "uri" => ""
5238     ),
5239     "strategicboard" => array(
5240     "icon" => "strategicboard",
5241     "title" => "Strategic Board",
5242     "rule" => array(
5243     "Strategic Board Bot" => ""
5244     ),
5245     "uri" => "http://www.strategicboard.com"
5246     ),
5247     "suchbaer" => array(
5248     "icon" => "robot",
5249 matthys 209 "title" => "Suchbaer.de",
5250 joku 63 "rule" => array(
5251     "^suchbaer\.de" => ""
5252     ),
5253     "uri" => "http://www.suchbaer.de/"
5254     ),
5255     "suchbot" => array(
5256     "icon" => "robot",
5257 matthys 209 "title" => "Suchbot",
5258 joku 63 "rule" => array(
5259     "^suchbot" => ""
5260     ),
5261     "uri" => ""
5262     ),
5263     "suchende" => array(
5264     "icon" => "suchende",
5265 matthys 209 "title" => "Suchen.de",
5266 joku 63 "rule" => array(
5267     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5268     "^gonzo/([0-9.]{1,10})" => "\\1"
5269     ),
5270     "uri" => "http://www.suchen.de/"
5271     ),
5272     "suchknecht" => array(
5273     "icon" => "robot",
5274     "title" => "Suchknecht",
5275     "rule" => array(
5276     "^Suchknecht.at-Robot" => ""
5277     ),
5278     "uri" => "http://www.suchknecht.at/"
5279     ),
5280     "suchpad" => array(
5281     "icon" => "robot",
5282 matthys 209 "title" => "Suchpad",
5283 joku 63 "rule" => array(
5284     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5285     ),
5286     "uri" => "http://www.suchpad.de"
5287     ),
5288     "sunrise" => array(
5289     "icon" => "sunrise",
5290     "title" => "Sunrise",
5291     "rule" => array(
5292     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5293     ),
5294     "uri" => ""
5295     ),
5296     "superbot" => array(
5297     "icon" => "superbot",
5298     "title" => "SuperBot",
5299     "rule" => array(
5300     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5301     ),
5302     "uri" => ""
5303     ),
5304     "surfcontrol" => array(
5305     "icon" => "robot",
5306     "title" => "SurfControl",
5307     "rule" => array(
5308     "SurfControl" => "",
5309     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5310     ),
5311     "uri" => ""
5312     ),
5313     "surfnet" => array(
5314     "icon" => "robot",
5315     "title" => "SURFnet",
5316     "rule" => array(
5317     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5318     ),
5319     "uri" => ""
5320     ),
5321     "surfsafely" => array(
5322     "icon" => "robot",
5323     "title" => "Surfsafely",
5324     "rule" => array(
5325     "Submission Spider at surfsafely.com" => ""
5326     ),
5327     "uri" => "http://www.surfsafely.com"
5328     ),
// Surphace (previously called Sphere Scout): both rules capture a dotted
// version number in group 1.
"surphace" => array(
  "icon" => "spherescout",
  "title" => "Surphace",
  "rule" => array(
    // Previously called Sphere Scout. Only non-digit characters are skipped
    // before the version; a greedy ".+" here would leave just the last
    // digit/dot of the string for the capture group.
    "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1",
    "Surphace.+v([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.surphace.com"
),
5338     "surveybot" => array(
5339     "icon" => "surveybot",
5340     "title" => "Whois Survey",
5341     "rule" => array(
5342     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5343     ),
5344     "uri" => ""
5345     ),
5346     "swoogle" => array(
5347     "icon" => "robot",
5348     "title" => "Swoogle",
5349     "rule" => array(
5350     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5351     ),
5352     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5353     ),
5354     "swse" => array(
5355     "icon" => "robot",
5356     "title" => "SWSE",
5357     "rule" => array(
5358     "sw\.deri\.org" => ""
5359     ),
5360     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5361     ),
5362     "swish-e" => array(
5363     "icon" => "swish-e",
5364     "title" => "Swish-e",
5365     "rule" => array(
5366     "^swish-e" => ""
5367     ),
5368     "uri" => "http://swish-e.org/"
5369     ),
5370     "sygol" => array(
5371     "icon" => "sygol",
5372     "title" => "Sygol",
5373     "rule" => array(
5374     "www.sygol.(com|net)" => ""
5375     ),
5376     "uri" => "http://www.sygol.com"
5377     ),
5378     "syllabs" => array(
5379     "icon" => "syllabs",
5380     "title" => "Syllabs",
5381     "rule" => array(
5382     "Focal[-]([0-9.]{1,10})" => "\\1"
5383     ),
5384     "uri" => "http://www.syllabs.com/crawler.html"
5385     ),
5386     "synapse" => array(
5387     "icon" => "robot",
5388     "title" => "Synapse",
5389     "rule" => array(
5390     " Synapse\)" => ""
5391     ),
5392     "uri" => "http://ws.apache.org/synapse/"
5393     ),
5394     "sync2it" => array(
5395     "icon" => "robot",
5396 matthys 209 "title" => "Sync2it",
5397 joku 63 "rule" => array(
5398     "^\!Susie" => ""
5399     ),
5400     "uri" => "http://www.sync2it.com/bms/susie.php"
5401     ),
5402     "syncit" => array(
5403     "icon" => "robot",
5404 matthys 209 "title" => "Syncit",
5405 joku 63 "rule" => array(
5406     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5407     ),
5408     "uri" => "http://www.syncit.com/"
5409     ),
5410     "syndic8" => array(
5411     "icon" => "syndic8",
5412     "title" => "Syndic8",
5413     "rule" => array(
5414     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5415     ),
5416     "uri" => "http://www.syndic8.com/"
5417     ),
5418     "syndicatie" => array(
5419     "icon" => "robot",
5420     "title" => "Syndicatie.nl",
5421     "rule" => array(
5422     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5423     "Syndicatie\.nl robot;" => ""
5424     ),
5425     "uri" => ""
5426     ),
5427     "synomia" => array(
5428     "icon" => "robot",
5429     "title" => "Synomia",
5430     "rule" => array(
5431     "^SynoBot" => ""
5432     ),
5433     "uri" => ""
5434     ),
5435     "synoo" => array(
5436     "icon" => "robot",
5437     "title" => "SynooBot",
5438     "rule" => array(
5439     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5440     ),
5441     "uri" => ""
5442     ),
5443     "szukacz" => array(
5444     "icon" => "szukacz",
5445     "title" => "Szukacz",
5446     "rule" => array(
5447     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5448     ),
5449     "uri" => ""
5450     ),
5451     "tagoo" => array(
5452     "icon" => "tagoobot",
5453     "title" => "Tagoo",
5454     "rule" => array(
5455     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5456     ),
5457     "uri" => "http://www.tagoo.ru"
5458     ),
5459     "tagword" => array(
5460     "icon" => "tagword",
5461     "title" => "Tagword",
5462     "rule" => array(
5463     "^Tagword" => ""
5464     ),
5465     "uri" => "http://tagword.com/dmoz_survey.php"
5466     ),
5467     "trailfire" => array(
5468     "icon" => "trailfire",
5469     "title" => "Trailfire",
5470     "rule" => array(
5471     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5472     ),
5473     "uri" => "http://trailfire.com"
5474     ),
5475     "tamu" => array(
5476     "icon" => "tamu",
5477     "title" => "Tamu Crawler",
5478     "rule" => array(
5479     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5480     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5481     ),
5482     "uri" => "http://irl.cs.tamu.edu/crawler/"
5483     ),
5484     "taptubot" => array(
5485     "icon" => "taptubot",
5486     "title" => "Taptu",
5487     "rule" => array(
5488     "taptubot" => ""
5489     ),
5490     "uri" => "http://www.taptu.com/corp/taptubot"
5491     ),
5492     "targetseek" => array(
5493     "icon" => "robot",
5494     "title" => "TargetSeek",
5495     "rule" => array(
5496     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5497     ),
5498     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5499     ),
5500     "taw" => array(
5501     "icon" => "taw",
5502     "title" => "TAW",
5503     "rule" => array(
5504     "TAW[ /]([0-9.]{1,10})" => "\\1"
5505     ),
5506     "uri" => "http://www.tawdis.net"
5507     ),
5508     "tcd" => array(
5509     "icon" => "tcd",
5510     "title" => "Trinity College Dublin",
5511     "rule" => array(
5512     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5513     ),
5514     "uri" => "http://www.tcd.ie"
5515     ),
5516     "technorati" => array(
5517     "icon" => "technorati",
5518     "title" => "Technorati",
5519     "rule" => array(
5520     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5521     ),
5522     "uri" => ""
5523     ),
5524     "teleport" => array(
5525     "icon" => "teleport",
5526     "title" => "Teleport",
5527     "rule" => array(
5528     "Teleport[ \-]?Pro" => ""
5529     ),
5530     "uri" => ""
5531     ),
5532     "terrar" => array(
5533     "icon" => "robot",
5534     "title" => "Terrar",
5535     "rule" => array(
5536     "^Fresh Search :: Terrar" => ""
5537     ),
5538     "uri" => ""
5539     ),
5540     "theophrastus" => array(
5541     "icon" => "robot",
5542     "title" => "Theophrastus",
5543     "rule" => array(
5544     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5545     ),
5546     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5547     ),
5548     "thumbnailscz" => array(
5549     "icon" => "robot",
5550 matthys 209 "title" => "Thumbnails.cz",
5551 joku 63 "rule" => array(
5552     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5553     ),
5554     "uri" => ""
5555     ),
// Thumbshots: the first rule has two capture groups - group 1 is the
// "Version: " / "v" prefix and group 2 is the dotted version number - so the
// note template must reference group 2. The second rule is a version-less
// fallback for agents starting with "thumbshots-de".
"thumbshot" => array(
  "icon" => "robot",
  "title" => "Thumbshots",
  "rule" => array(
    "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2",
    "^thumbshots-de" => ""
  ),
  "uri" => "http://www.thumbshots.de"
),
5565     "thunderstone" => array(
5566     "icon" => "thunderstone",
5567     "title" => "Thunderstone",
5568     "rule" => array(
5569     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5570     "search.thunderstone.com" => ""
5571     ),
5572     "uri" => "http://search.thunderstone.com/"
5573     ),
5574     "timbobot" => array(
5575     "icon" => "robot",
5576 matthys 209 "title" => "TimboBot",
5577 joku 63 "rule" => array(
5578     "timboBot" => ""
5579     ),
5580     "uri" => ""
5581     ),
5582     "topsy" => array(
5583     "icon" => "topsy",
5584     "title" => "Topsy",
5585     "rule" => array(
5586     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5587     ),
5588     "uri" => "http://labs.topsy.com/butterfly.html"
5589     ),
5590     "trayce" => array(
5591     "icon" => "robot",
5592 matthys 209 "title" => "Trayce",
5593 joku 63 "rule" => array(
5594     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5595     ),
5596     "uri" => ""
5597     ),
5598     "tricus" => array(
5599     "icon" => "robot",
5600     "title" => "Tricus",
5601     "rule" => array(
5602     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5603     ),
5604     "uri" => ""
5605     ),
5606     "topicblogs" => array(
5607     "icon" => "robot",
5608     "title" => "Topicblogs",
5609     "rule" => array(
5610     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5611     ),
5612     "uri" => ""
5613     ),
5614     "touche" => array(
5615     "icon" => "touche",
5616 matthys 209 "title" => "Touché",
5617 joku 63 "rule" => array(
5618     "^Touche" => ""
5619     ),
5620     "uri" => "http://touche.com.ve"
5621     ),
// Tuezilla: matched on the "tuezilla.de" host name in the user agent; no
// version is extracted. The title uses the real "Ü" character; it had been
// stored double-encoded (UTF-8 bytes re-read as Windows-1252).
"tuezilla" => array(
  "icon" => "robot",
  "title" => "TÜzilla",
  "rule" => array(
    "tuezilla.de" => ""
  ),
  "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
),
5630     "turnitin" => array(
5631     "icon" => "turnitin",
5632     "title" => "Turnitin",
5633     "rule" => array(
5634     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5635     ),
5636     "uri" => ""
5637     ),
5638     "tutorgig" => array(
5639     "icon" => "robot",
5640     "title" => "TutorGig",
5641     "rule" => array(
5642     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5643     ),
5644     "uri" => ""
5645     ),
5646     "twiceler" => array(
5647     "icon" => "cuill",
5648 matthys 209 "title" => "Cuill",
5649 joku 63 "rule" => array(
5650     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5651     "Twiceler" => ""
5652     ),
5653     "uri" => "http://www.cuill.com/twiceler/robot.html"
5654     ),
5655     "twingly" => array(
5656     "icon" => "twingly",
5657     "title" => "Twingly",
5658     "rule" => array(
5659     "Twingly Recon" => ""
5660     ),
5661     "uri" => "http://www.twingly.com/"
5662     ),
5663 matthys 320 "twitter" => array(
5664     "icon" => "twitter",
5665     "title" => "Twitter",
5666     "rule" => array(
5667     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5668     ),
5669     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5670     ),
5671 joku 63 "typepad" => array(
5672     "icon" => "typepad",
5673     "title" => "TypePad",
5674     "rule" => array(
5675     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5676     ),
5677     "uri" => ""
5678     ),
5679     "udmsearch" => array(
5680     "icon" => "robot",
5681     "title" => "UdmSearch",
5682     "rule" => array(
5683     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5684     ),
5685     "uri" => ""
5686     ),
5687     "ukwizz" => array(
5688     "icon" => "ukwizz",
5689     "title" => "UKWizz",
5690     "rule" => array(
5691     "^Mackster.*ukwizz" => ""
5692     ),
5693     "uri" => "http://www.ukwizz.com"
5694     ),
5695     "ultraseek" => array(
5696     "icon" => "robot",
5697     "title" => "Ultraseek",
5698     "rule" => array(
5699     "Ultraseek" => ""
5700     ),
5701     "uri" => ""
5702     ),
5703     "ultraspider" => array(
5704     "icon" => "robot",
5705     "title" => "UltraSpider",
5706     "rule" => array(
5707     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5708     ),
5709     "uri" => "http://www.search.ch"
5710     ),
5711     "umai" => array(
5712     "icon" => "robot",
5713 matthys 209 "title" => "Umai",
5714 joku 63 "rule" => array(
5715     "umai[/ ]([0-9.]{1,10})" => "\\1"
5716     ),
5717     "uri" => ""
5718     ),
5719     "unchaos" => array(
5720     "icon" => "robot",
5721     "title" => "Unchaos",
5722     "rule" => array(
5723     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5724     "unchaos" => ""
5725     ),
5726     "uri" => ""
5727     ),
// UNIdo: matched when the user agent starts with "unido-bot".
// The pattern has no capture group, so the note template is empty rather
// than a back-reference to a group that does not exist.
"unido" => array(
  "icon" => "robot",
  "title" => "UNIdo",
  "rule" => array(
    "^unido-bot" => ""
  ),
  "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
),
5736     "updated" => array(
5737     "icon" => "robot",
5738     "title" => "Updated",
5739     "rule" => array(
5740     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5741     ),
5742     "uri" => ""
5743     ),
5744     "uptimebot" => array(
5745     "icon" => "robot",
5746     "title" => "UptimeBot",
5747     "rule" => array(
5748     "^UptimeBot" => ""
5749     ),
5750     "uri" => "http://www.uptimebot.com/"
5751     ),
5752     "urifetch" => array(
5753     "icon" => "robot",
5754     "title" => "URI::Fetch",
5755     "rule" => array(
5756     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5757     ),
5758     "uri" => ""
5759     ),
5760     "urlbase" => array(
5761     "icon" => "robot",
5762     "title" => "URLBase",
5763     "rule" => array(
5764     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5765     ),
5766     "uri" => ""
5767     ),
5768     "urlblaze" => array(
5769     "icon" => "robot",
5770     "title" => "URLBlaze",
5771     "rule" => array(
5772     "^URLBlaze" => ""
5773     ),
5774     "uri" => ""
5775     ),
5776     "urlcontr" => array(
5777     "icon" => "robot",
5778     "title" => "MS URL Control",
5779     "rule" => array(
5780     "Microsoft URL[ \-]?Control" => ""
5781     ),
5782     "uri" => ""
5783     ),
5784     "urlgetfile" => array(
5785     "icon" => "robot",
5786     "title" => "URLGetFile",
5787     "rule" => array(
5788     "^URLGetFile" => ""
5789     ),
5790     "uri" => ""
5791     ),
5792     "urlscope" => array(
5793     "icon" => "robot",
5794     "title" => "UrlScope",
5795     "rule" => array(
5796     "UrlScope" => ""
5797     ),
5798     "uri" => ""
5799     ),
5800     "urltrends" => array(
5801     "icon" => "urltrends",
5802 matthys 209 "title" => "UrlTrends",
5803 joku 63 "rule" => array(
5804     "Snappy/([0-9.]{1,10})" => "\\1",
5805     ),
5806     "uri" => ""
5807     ),
5808     "usww" => array(
5809     "icon" => "usww",
5810 matthys 209 "title" => "USWW",
5811 joku 63 "rule" => array(
5812     "usww\.com" => "",
5813     "Mozilla/5\.0 URL-Spider" => ""
5814     ),
5815     "uri" => "http://www.usww.com/"
5816     ),
5817     "usyd" => array(
5818     "icon" => "robot",
5819     "title" => "USyd-NLP-Spider",
5820     "rule" => array(
5821     "^USyd-NLP-Spider" => ""
5822     ),
5823     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5824     ),
5825     "vagabondo" => array(
5826     "icon" => "wiseguys",
5827     "title" => "WiseGuys",
5828     "rule" => array(
5829     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5830     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5831     ),
5832     "uri" => ""
5833     ),
5834     "unicorn" => array(
5835     "icon" => "w3c",
5836     "title" => "W3C Unicorn",
5837     "rule" => array(
5838     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5839     ),
5840     "uri" => "http://validator.w3.org/unicorn/"
5841     ),
5842     "validator" => array(
5843     "icon" => "w3c",
5844     "title" => "W3C Validator",
5845     "rule" => array(
5846     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5847     ),
5848     "uri" => "http://validator.w3.org/"
5849     ),
5850     "validator.nu" => array( // Validator.nu checker; rule order is specific (versioned) first, fallback second
5851     "icon" => "validatornu",
5852     "title" => "Validator.nu",
5853     "rule" => array(
5854     "^Validator\.nu[ /]([0-9.]{1,10})" => "\\1", // dot escaped so only a literal "." matches; group 1 is the version
5855     "^Validator\.nu/LV" => "" // no capture group here, so no version can be reported (was "\\1")
5856     ),
5857     "uri" => "http://validator.nu/"
5858     ),
5859     "verity" => array(
5860     "icon" => "robot",
5861     "title" => "Verity",
5862     "rule" => array(
5863     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5864     "^vspider" => ""
5865     ),
5866     "uri" => "http://www.verity.com/"
5867     ),
5868     "versionsproject" => array(
5869     "icon" => "robot",
5870     "title" => "Versions-project",
5871     "rule" => array(
5872     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5873     ),
5874     "uri" => "http://www.versions-project.org/"
5875     ),
5876     "verticalmatch" => array(
5877     "icon" => "robot",
5878     "title" => "VerticalMatch",
5879     "rule" => array(
5880     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5881     ),
5882     "uri" => "http://www.VerticalMatch.com/"
5883     ),
5884     "verzamelgids" => array(
5885     "icon" => "robot",
5886     "title" => "Verzamelgids",
5887     "rule" => array(
5888     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5889     ),
5890     "uri" => "http://www.verzamelgids.nl/"
5891     ),
5892     "vestris" => array(
5893     "icon" => "vestris",
5894     "title" => "Vestris",
5895     "rule" => array(
5896     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5897     ),
5898     "uri" => "http://alkaline.vestris.com/"
5899     ),
5900     "vindex" => array(
5901     "icon" => "vindex",
5902     "title" => "Vindex",
5903     "rule" => array(
5904     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5905     ),
5906     "uri" => ""
5907     ),
5908     "visvo" => array(
5909     "icon" => "robot",
5910     "title" => "Visvo",
5911     "rule" => array(
5912     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5913     ),
5914     "uri" => "http://www.visvo.com"
5915     ),
5916     "voila" => array(
5917     "icon" => "voila",
5918     "title" => "Voila",
5919     "rule" => array(
5920     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5921     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5922     ),
5923     "uri" => ""
5924     ),
5925     "vonna" => array(
5926     "icon" => "robot",
5927     "title" => "Vonna",
5928     "rule" => array(
5929     "Vonna.com b o t" => ""
5930     ),
5931     "uri" => ""
5932     ),
5933     "vortex" => array(
5934     "icon" => "robot",
5935     "title" => "Vortex",
5936     "rule" => array(
5937     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5938     ),
5939     "uri" => "http://marty.anstey.ca/robots/vortex/"
5940     ),
5941     "w3sitesearch" => array(
5942     "icon" => "w3sitesearch",
5943     "title" => "W3SiteSearch",
5944     "rule" => array(
5945     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5946     ),
5947     "uri" => "http://www.w3sitesearch.de"
5948     ),
5949     "wagger" => array(
5950     "icon" => "robot",
5951     "title" => "Wagger",
5952     "rule" => array(
5953     "^Waggr" => ""
5954     ),
5955     "uri" => "http://www.waggr.com/"
5956     ),
5957     "wanadoo" => array(
5958     "icon" => "robot",
5959     "title" => "Wanadoo",
5960     "rule" => array(
5961     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5962     ),
5963     "uri" => "http://www.wanadoo.fr/"
5964     ),
5965     "wapalizer" => array(
5966     "icon" => "robot",
5967     "title" => "Wapalizer",
5968     "rule" => array(
5969     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5970     ),
5971     "uri" => "http://www.wapdrive.com/"
5972     ),
5973     "watson" => array(
5974     "icon" => "addy",
5975     "title" => "Dr.Watson",
5976     "rule" => array(
5977     "Watson[ /]([0-9.]{1,10})" => "\\1",
5978     "watson\.addy\.com" => ""
5979     ),
5980     "uri" => ""
5981     ),
5982     "wavefire" => array(
5983     "icon" => "robot",
5984     "title" => "Wavefire",
5985     "rule" => array(
5986     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
5987     ),
5988     "uri" => ""
5989     ),
5990     "waypath" => array(
5991     "icon" => "waypath",
5992     "title" => "Waypath",
5993     "rule" => array(
5994     "Waypath[ \-]?Scout" => "",
5995     "Waypath (development )?crawler" => ""
5996     ),
5997     "uri" => ""
5998     ),
5999     "wauuu" => array( // Wauuu crawler
6000     "icon" => "wauuu",
6001     "title" => "Wauuu",
6002     "rule" => array(
6003     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the only capture group is the version; "\\2" referenced a group that does not exist
6004     ),
6005     "uri" => "http://www.wauuu.com"
6006     ),
6007     "wdg" => array(
6008     "icon" => "wdg",
6009     "title" => "WDG Validator",
6010     "rule" => array(
6011     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6012     ),
6013     "uri" => "http://www.htmlhelp.com/tools/validator/"
6014     ),
6015     "webagogo" => array(
6016     "icon" => "webagogo",
6017     "title" => "Webagogo",
6018     "rule" => array(
6019     "^Webagogo" => ""
6020     ),
6021     "uri" => "http://www.webagogo.be/"
6022     ),
6023     "webalta" => array(
6024     "icon" => "webalta",
6025     "title" => "WebAlta",
6026     "rule" => array(
6027     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6028     ),
6029     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6030     ),
6031     "webdigity" => array(
6032     "icon" => "robot",
6033     "title" => "Webdigity Whois Service",
6034     "rule" => array(
6035     "^webdigity whois service" => ""
6036     ),
6037     "uri" => "http://www.webdigity.com/ws"
6038     ),
6039     "webelixir" => array(
6040     "icon" => "webelixir",
6041     "title" => "Webelixir",
6042     "rule" => array(
6043     "^webelixir" => ""
6044     ),
6045     "uri" => "http://www.webelixir.net/"
6046     ),
6047     "webbotru" => array(
6048     "icon" => "robot",
6049     "title" => "Webbot.ru",
6050     "rule" => array(
6051     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6052     ),
6053     "uri" => "http://www.webbot.ru/bot.html"
6054     ),
6055     "webcapture" => array(
6056     "icon" => "robot",
6057     "title" => "WebCapture",
6058     "rule" => array(
6059     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6060     ),
6061     "uri" => ""
6062     ),
6063     "webcollage" => array(
6064     "icon" => "robot",
6065     "title" => "Webcollage",
6066     "rule" => array(
6067     "webcollage" => ""
6068     ),
6069     "uri" => ""
6070     ),
6071     "webcopier" => array(
6072     "icon" => "webcopier",
6073     "title" => "WebCopier",
6074     "rule" => array(
6075     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6076     ),
6077     "uri" => ""
6078     ),
6079     "webcorp" => array(
6080     "icon" => "webcorp",
6081     "title" => "WebCorp",
6082     "rule" => array(
6083     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6084     ),
6085     "uri" => "http://www.webcorp.org.uk/"
6086     ),
6087     "webcrawl" => array(
6088     "icon" => "robot",
6089     "title" => "WebCrawl",
6090     "rule" => array(
6091     "webcrawl\.net" => ""
6092     ),
6093     "uri" => ""
6094     ),
6095     "webdownloader" => array(
6096     "icon" => "robot",
6097     "title" => "Web Downloader",
6098     "rule" => array(
6099     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6100     ),
6101     "uri" => ""
6102     ),
6103     "webfetch" => array(
6104     "icon" => "robot",
6105 matthys 209 "title" => "WebFetch",
6106 joku 63 "rule" => array(
6107     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6108     ),
6109     "uri" => ""
6110     ),
6111     "webfind" => array(
6112     "icon" => "robot",
6113 matthys 209 "title" => "WebFind",
6114 joku 63 "rule" => array(
6115     "^WebFindBot" => ""
6116     ),
6117     "uri" => "http://www.web-find.com"
6118     ),
6119     "webglimpse" => array(
6120     "icon" => "robot",
6121     "title" => "Webglimpse",
6122     "rule" => array(
6123     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6124     ),
6125     "uri" => "http://webglimpse.net"
6126     ),
6127     "webgobbler" => array(
6128     "icon" => "robot",
6129     "title" => "webGobbler",
6130     "rule" => array(
6131     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6132     ),
6133     "uri" => ""
6134     ),
6135     "webimages" => array(
6136     "icon" => "webimages",
6137     "title" => "WebImages",
6138     "rule" => array(
6139     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6140     ),
6141     "uri" => "http://herbert.groot.jebbink.nl/"
6142     ),
6143     "weblight" => array(
6144     "icon" => "robot",
6145     "title" => "WebLight",
6146     "rule" => array(
6147     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6148     ),
6149     "uri" => "http://www.illumit.com/Products/weblight/"
6150     ),
6151     "weblinks" => array(
6152     "icon" => "robot",
6153     "title" => "WebLink's",
6154     "rule" => array(
6155     "^Weblink.s checker" => ""
6156     ),
6157     "uri" => ""
6158     ),
6159     "webmeasurement" => array(
6160     "icon" => "robot",
6161     "title" => "Webmeasurement",
6162     "rule" => array(
6163     "^webmeasurement-bot" => ""
6164     ),
6165     "uri" => "http://rvs.informatik.uni-leipzig.de"
6166     ),
6167     "webminer" => array(
6168     "icon" => "robot",
6169     "title" => "WebMiner",
6170     "rule" => array(
6171     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6172     ),
6173     "uri" => ""
6174     ),
6175     "webmin" => array(
6176     "icon" => "webmin",
6177     "title" => "Webmin",
6178     "rule" => array(
6179     "^webmin" => ""
6180     ),
6181     "uri" => ""
6182     ),
6183     "webmon" => array(
6184     "icon" => "webmon",
6185     "title" => "Webmon",
6186     "rule" => array(
6187     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6188     ),
6189     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6190     ),
6191     "webox" => array( // WeBoX client
6192     "icon" => "robot",
6193     "title" => "WeBoX", // stray leading space removed from the title
6194     "rule" => array(
6195     "WeBoX[/ ]([0-9.]{1,10})" => "\\1" // group 1 is the version
6196     ),
6197     "uri" => ""
6198     ),
6199     "webpatrol" => array(
6200     "icon" => "webpatrol",
6201     "title" => "WebPatrol",
6202     "rule" => array(
6203     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6204     ),
6205     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6206     ),
6207     "webpix" => array(
6208     "icon" => "webpix",
6209     "title" => "WebPix",
6210     "rule" => array(
6211     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6212     ),
6213     "uri" => ""
6214     ),
6215     "webrace" => array(
6216     "icon" => "robot",
6217     "title" => "WebRACE",
6218     "rule" => array(
6219     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6220     ),
6221     "uri" => ""
6222     ),
6223     "webreaper" => array(
6224     "icon" => "webreaper",
6225     "title" => "WebReaper",
6226     "rule" => array(
6227     "^WebReaper " => ""
6228     ),
6229     "uri" => "http://www.webreaper.net/"
6230     ),
6231     "webresult" => array(
6232     "icon" => "robot",
6233     "title" => "Webresult",
6234     "rule" => array(
6235     "Der webresult\.de Robot" => ""
6236     ),
6237     "uri" => ""
6238     ),
6239     "webring" => array(
6240     "icon" => "robot",
6241     "title" => "Webring Checker",
6242     "rule" => array(
6243     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6244     ),
6245     "uri" => ""
6246     ),
6247     "webripper" => array(
6248     "icon" => "webripper",
6249     "title" => "WebRipper",
6250     "rule" => array(
6251     "^WebRipper" => ""
6252     ),
6253     "uri" => "http://calluna-software.com"
6254     ),
6255     "webscaled" => array(
6256     "icon" => "webscaled",
6257     "title" => "Webscaled",
6258     "rule" => array(
6259     "Swarm" => ""
6260     ),
6261     "uri" => "http://webscaled.com/"
6262     ),
6263     "websearchau" => array(
6264     "icon" => "websearchau",
6265     "title" => "WebSearch.COM.AU",
6266     "rule" => array(
6267     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6268     ),
6269     "uri" => "http://WebSearch.com.au/"
6270     ),
6271     "websearchbench" => array(
6272     "icon" => "robot",
6273     "title" => "WebSearchBench",
6274     "rule" => array(
6275     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6276     ),
6277     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6278     ),
6279     "websense" => array(
6280     "icon" => "websense",
6281     "title" => "Websense",
6282     "rule" => array(
6283     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6284     ),
6285     "uri" => ""
6286     ),
6287     "websiteshadow" => array(
6288     "icon" => "websiteshadow",
6289     "title" => "Websiteshadow",
6290     "rule" => array(
6291     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6292     ),
6293     "uri" => "http://websiteshadow.com"
6294     ),
6295     "websiteworth" => array(
6296     "icon" => "robot",
6297     "title" => "WebsiteWorth",
6298     "rule" => array(
6299     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6300     ),
6301     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6302     ),
6303     "websquash" => array(
6304     "icon" => "websquash",
6305     "title" => "Websquash",
6306     "rule" => array(
6307     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6308     ),
6309     "uri" => ""
6310     ),
6311     "webstripper" => array(
6312     "icon" => "robot",
6313     "title" => "WebStripper",
6314     "rule" => array(
6315     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6316     ),
6317     "uri" => ""
6318     ),
6319     "webzip" => array(
6320     "icon" => "webzip",
6321     "title" => "WebZIP",
6322     "rule" => array(
6323     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6324     ),
6325     "uri" => ""
6326     ),
6327     "wep" => array(
6328     "icon" => "robot",
6329     "title" => "WEP Search",
6330     "rule" => array(
6331     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6332     ),
6333     "uri" => ""
6334     ),
6335     "westwind" => array(
6336     "icon" => "robot",
6337     "title" => "West Wind Internet Protocols",
6338     "rule" => array(
6339     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6340     ),
6341     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6342     ),
6343     "wget" => array(
6344     "icon" => "wget",
6345     "title" => "Wget",
6346     "rule" => array(
6347 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6348     "Wget" => ""
6349 joku 63 ),
6350     "uri" => ""
6351     ),
6352     "whizbang" => array(
6353     "icon" => "whizbang",
6354     "title" => "WhizBang",
6355     "rule" => array(
6356     "WhizBang" => ""
6357     ),
6358     "uri" => "http://www.whizbang.com/crawler/"
6359     ),
6360     "whois" => array(
6361     "icon" => "whois",
6362     "title" => "Who.is",
6363     "rule" => array(
6364     "Who.is Bot" => ""
6365     ),
6366     "uri" => "http://www.who.is/"
6367     ),
6368     "wikiwix" => array(
6369     "icon" => "wikiwix",
6370     "title" => "Wikiwix",
6371     "rule" => array(
6372     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6373     ),
6374     "uri" => "http://www.wikiwix.com/"
6375     ),
6376     "wingflyer" => array(
6377     "icon" => "robot",
6378     "title" => "WingFlyer",
6379     "rule" => array(
6380     "^WebFetch" => ""
6381     ),
6382     "uri" => "http://www.wingflyer.com/"
6383     ),
6384     "wininet" => array(
6385     "icon" => "robot",
6386     "title" => "WinInet",
6387     "rule" => array(
6388     "TeamSoft WinInet Component" => ""
6389     ),
6390     "uri" => "http://www.winsoft.sk/wininet.htm"
6391     ),
6392     "winhttp" => array(
6393     "icon" => "robot",
6394     "title" => "WinHTTP",
6395     "rule" => array(
6396     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6397     ),
6398     "uri" => ""
6399     ),
6400     "wire" => array(
6401     "icon" => "robot",
6402     "title" => "WIRE",
6403     "rule" => array(
6404     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6405     ),
6406     "uri" => ""
6407     ),
6408     "wmp" => array(
6409     "icon" => "robot",
6410     "title" => "WMP",
6411     "rule" => array(
6412     "^WMP" => ""
6413     ),
6414     "uri" => ""
6415     ),
6416     "woozweb" => array(
6417     "icon" => "woozweb",
6418     "title" => "Woozweb",
6419     "rule" => array(
6420     "woozweb" => ""
6421     ),
6422     "uri" => "http://www.woozweb.com/"
6423     ),
6424     "wordchamp" => array(
6425     "icon" => "robot",
6426     "title" => "WordChamp",
6427     "rule" => array(
6428     "^WordChampBot" => ""
6429     ),
6430     "uri" => "http://www.wordchamp.com/"
6431     ),
6432     "wordpress" => array(
6433     "icon" => "wordpress",
6434     "title" => "WordPress",
6435     "rule" => array(
6436     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6437     ),
6438     "uri" => ""
6439     ),
6440     "worio" => array(
6441     "icon" => "worio",
6442     "title" => "Worio",
6443     "rule" => array(
6444     "woriobot" => ""
6445     ),
6446     "uri" => "http://worio.com/"
6447     ),
6448     "worldlight" => array(
6449     "icon" => "worldlight",
6450     "title" => "WorldLight",
6451     "rule" => array(
6452     "^WorldLight" => ""
6453     ),
6454     "uri" => ""
6455     ),
6456     "worqmada" => array(
6457     "icon" => "robot",
6458     "title" => "WorQmada",
6459     "rule" => array(
6460     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6461     ),
6462     "uri" => ""
6463     ),
6464     "wotbox" => array(
6465     "icon" => "wotbox",
6466     "title" => "Wotbox",
6467     "rule" => array(
6468     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6469     ),
6470     "uri" => ""
6471     ),
6472     "wp" => array(
6473     "icon" => "wp",
6474     "title" => "Wirtualna Polska",
6475     "rule" => array(
6476     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6477     ),
6478     "uri" => "http://wp.pl"
6479     ),
6480     "wsb" => array(
6481     "icon" => "robot",
6482     "title" => "WebSearchBench",
6483     "rule" => array(
6484     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6485     "WSB " => ""
6486     ),
6487     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6488     ),
6489     "wume" => array(
6490     "icon" => "robot",
6491     "title" => "WUME Lab's",
6492     "rule" => array(
6493     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6494     ),
6495     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6496     ),
6497     "wusage" => array(
6498     "icon" => "wusage",
6499     "title" => "Wusage",
6500     "rule" => array(
6501     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6502     ),
6503     "uri" => "http://www.boutell.com/wusage/"
6504     ),
6505     "wwgrapevine" => array(
6506     "icon" => "wwgrapevine",
6507     "title" => "WWgrapevine",
6508     "rule" => array(
6509     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6510     ),
6511     "uri" => ""
6512     ),
6513     "wws" => array(
6514     "icon" => "robot",
6515     "title" => "WWSBOT",
6516     "rule" => array(
6517     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6518     ),
6519     "uri" => "http://www.analyzer.nu"
6520     ),
6521     "www4mail" => array(
6522     "icon" => "robot",
6523 matthys 209 "title" => "WWW4mail",
6524 joku 63 "rule" => array(
6525     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6526     ),
6527     "uri" => "http://www.www4mail.org/"
6528     ),
6529     "wwwc" => array(
6530     "icon" => "wwwc",
6531     "title" => "WWWC",
6532     "rule" => array(
6533     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6534     ),
6535     "uri" => ""
6536     ),
6537     "wwwd" => array(
6538     "icon" => "robot",
6539     "title" => "WWWD",
6540     "rule" => array(
6541     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6542     ),
6543     "uri" => ""
6544     ),
6545     "wwweasel" => array(
6546     "icon" => "wwweasel",
6547     "title" => "WWWeasel",
6548     "rule" => array(
6549     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6550     ),
6551     "uri" => ""
6552     ),
6553     "wwwfi" => array(
6554     "icon" => "wwwfi",
6555     "title" => "www.fi",
6556     "rule" => array(
6557     "www\.fi crawler" => ""
6558     ),
6559     "uri" => "http://www.fi/"
6560     ),
6561     "wwwmechanize" => array(
6562     "icon" => "robot",
6563     "title" => "WWW-Mechanize",
6564     "rule" => array(
6565     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6566     ),
6567     "uri" => ""
6568     ),
6569     "wwwoffle" => array(
6570     "icon" => "robot",
6571     "title" => "WWWoffle",
6572     "rule" => array(
6573     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6574     ),
6575     "uri" => ""
6576     ),
6577     "wwwster" => array(
6578     "icon" => "robot",
6579     "title" => "WWWster",
6580     "rule" => array(
6581     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6582     ),
6583     "uri" => ""
6584     ),
6585     "wysigot" => array(
6586     "icon" => "wysigot",
6587     "title" => "Wysigot",
6588     "rule" => array(
6589     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6590     ),
6591     "uri" => ""
6592     ),
6593     "xaldon" => array(
6594     "icon" => "xaldon",
6595     "title" => "Xaldon",
6596     "rule" => array(
6597     "Xaldon WebSpider" => ""
6598     ),
6599     "uri" => "http://www.xaldon.de/"
6600     ),
6601     "xenu" => array( // Xenu Link Sleuth link checker; three user-agent spellings are recognised
6602     "icon" => "xenu",
6603     "title" => "Xenu Link Sleuth",
6604     "rule" => array(
6605     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1", // plain spelling; group 1 is the version
6606     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional "&#039;s" suffix, the version is group 2 (was "\\1")
6607     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1" // underscore spelling; group 1 is the version
6608     ),
6609     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6610     ),
6611     "xerka" => array(
6612     "icon" => "xerka",
6613     "title" => "Xerka",
6614     "rule" => array(
6615     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6616     ),
6617     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6618     ),
6619     "xirq" => array(
6620     "icon" => "robot",
6621     "title" => "XIRQ",
6622     "rule" => array(
6623     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6624     ),
6625     "uri" => "http://www.xirq.com"
6626     ),
6627     "xmlslurp" => array(
6628     "icon" => "robot",
6629     "title" => "XMLSlurp",
6630     "rule" => array(
6631     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6632     ),
6633     "uri" => ""
6634     ),
6635     "xml-sitemaps" => array(
6636     "icon" => "xml-sitemaps",
6637     "title" => "XML-Sitemaps",
6638     "rule" => array(
6639     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6640     ),
6641     "uri" => ""
6642     ),
6643     "xmlrpc" => array(
6644     "icon" => "robot",
6645     "title" => "Trackback",
6646     "rule" => array(
6647     "XMLRPC" => ""
6648     ),
6649     "uri" => ""
6650     ),
6651 matthys 294 "xovi" => array(
6652     "icon" => "xovi",
6653     "title" => "Xovi",
6654     "rule" => array(
6655     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6656     ),
6657     "uri" => "http://www.xovibot.net"
6658     ),
6659 joku 63 "yacy" => array(
6660     "icon" => "yacy",
6661     "title" => "Yacy",
6662     "rule" => array(
6663     "yacy\.net" => ""
6664     ),
6665     "uri" => ""
6666     ),
6667     "yahoo" => array( // Yahoo crawlers; version-capturing rules are listed before the generic fallback
6668     "icon" => "yahoo",
6669     "title" => "Yahoo",
6670     "rule" => array(
6671     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1", // group 1 is the version
6672     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1", // group 1 is the version
6673     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "", // generic fallback; its "Yahoo-" branch also matches the two rules above, so it must follow them (NOTE(review): assumes the first matching rule wins - confirm against the matcher)
6674     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6675     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional suffix, group 2 the version
6676     "Y!OASIS/TEST" => "",
6677     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6678     "Y!J; for robot study" => "",
6679     "Yahoo Japan; for robot study" => ""
6680     ),
6681     "uri" => "http://www.yahoo.com"
6682     ),
6683     "yahoo-feed" => array(
6684     "icon" => "yahoo",
6685     "title" => "Yahoo Feedseeker",
6686     "rule" => array(
6687     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6688     ),
6689     "uri" => "http://www.yahoo.com"
6690     ),
6691     "yandex" => array(
6692     "icon" => "yandex",
6693     "title" => "Yandex",
6694     "rule" => array(
6695     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6696     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6697     ),
6698     "uri" => "http://yandex.com/bots"
6699     ),
6700     "yanga" => array(
6701     "icon" => "yanga",
6702     "title" => "Yanga",
6703     "rule" => array (
6704     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6705     ),
6706     "uri" => "http://www.yanga.co.uk/"
6707     ),
6708     "yap" => array(
6709     "icon" => "yap",
6710     "title" => "Yap",
6711     "rule" => array(
6712     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6713     ),
6714     "uri" => "http://www.yapinc.com/"
6715     ),
6716     "yarienavoir" => array(
6717     "icon" => "robot",
6718     "title" => "Yarienavoir",
6719     "rule" => array(
6720     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6721     ),
6722     "uri" => "http://www.yarienavoir.net/"
6723     ),
6724     "yell" => array(
6725     "icon" => "yell",
6726     "title" => "Yell",
6727     "rule" => array(
6728     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6729     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6730     ),
6731     "uri" => ""
6732     ),
6733     "youdao" => array(
6734     "icon" => "youdao",
6735     "title" => "Youdao",
6736     "rule" => array(
6737     "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6738     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6739     ),
6740     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6741     ),
6742     "yoogli" => array(
6743     "icon" => "yoogli",
6744     "title" => "Yoogli",
6745     "rule" => array(
6746     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6747     ),
6748     "uri" => "http://www.yoogli.com"
6749     ),
6750     "yotta" => array(
6751     "icon" => "robot",
6752     "title" => "Yotta",
6753     "rule" => array(
6754     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6755     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6756     ),
6757     "uri" => "http://www.yottacars.com"
6758     ),
6759     "yoono" => array(
6760     "icon" => "yoono",
6761     "title" => "Yoono",
6762     "rule" => array(
6763     "Yoono" => ""
6764     ),
6765     "uri" => "http://www.yoono.com/"
6766     ),
6767     "yowedo" => array(
6768     "icon" => "robot",
6769     "title" => "Yowedo",
6770     "rule" => array(
6771     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6772     ),
6773     "uri" => "http://yowedo.com/en/partners.html"
6774     ),
6775     "yuntis" => array(
6776     "icon" => "robot",
6777 matthys 209 "title" => "Yuntis",
6778 joku 63 "rule" => array(
6779     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6780     ),
6781     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6782     ),
6783     "zao" => array(
6784     "icon" => "robot",
6785     "title" => "Zao",
6786     "rule" => array(
6787     "Zao[ /]([0-9.]{1,10})" => "\\1",
6788     "Zao-crawler" => ""
6789     ),
6790     "uri" => ""
6791     ),
6792     "zealbot" => array(
6793     "icon" => "zeal",
6794     "title" => "ZealBot",
6795     "rule" => array(
6796     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6797     ),
6798     "uri" => ""
6799     ),
6800     "zearchit" => array(
6801     "icon" => "zearchit",
6802     "title" => "Zearchit",
6803     "rule" => array(
6804     "Zearchit" => ""
6805     ),
6806     "uri" => "http://www.zearchit.de/"
6807     ),
6808     "zebz" => array(
6809     "icon" => "robot",
6810     "title" => "ze.bz",
6811     "rule" => array(
6812     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6813     ),
6814     "uri" => "http://www.ze.bz/"
6815     ),
6816     "zedzo" => array(
6817     "icon" => "robot",
6818     "title" => "Zedzo",
6819     "rule" => array(
6820     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6821     ),
6822     "uri" => "http://www.zedzo.com/"
6823     ),
6824     "zerx" => array(
6825     "icon" => "zerx",
6826     "title" => "Zerx",
6827     "rule" => array(
6828     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6829     ),
6830     "uri" => "http://www.zerx.com/"
6831     ),
6832     "zeus" => array(
6833     "icon" => "zeus",
6834     "title" => "Zeus",
6835     "rule" => array(
6836     "Zeus" => ""
6837     ),
6838     "uri" => "http://www.zeus.com"
6839     ),
6840     "zippp" => array(
6841     "icon" => "robot",
6842     "title" => "Zippp",
6843     "rule" => array(
6844     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6845     ),
6846     "uri" => ""
6847     ),
6848     "zippy" => array(
6849     "icon" => "robot",
6850     "title" => "Zippy",
6851     "rule" => array(
6852     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6853     ),
6854     "uri" => "http://www.zippyfinder.com"
6855     ),
6856     "zoeky" => array(
6857     "icon" => "robot",
6858     "title" => "Zoeky",
6859     "rule" => array(
6860     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6861     ),
6862     "uri" => ""
6863     ),
6864     "zoom" => array(
6865     "icon" => "zoom",
6866 matthys 209 "title" => "ZoomSpider",
6867 joku 63 "rule" => array(
6868     "^ZoomSpider" => ""
6869     ),
6870     "uri" => "http://www.wrensoft.com/"
6871     ),
6872     "zspider" => array(
6873     "icon" => "robot",
6874 matthys 209 "title" => "Zspider",
6875 joku 63 "rule" => array(
6876     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6877     ),
6878     "uri" => "http://feedback.redkolibri.com/"
6879     ),
6880 matthys 281 "zumbot" => array(
6881     "icon" => "robot",
6882     "title" => "ZUM Search",
6883     "rule" => array(
6884     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6885     ),
6886     "uri" => "http://help.zum.com/inquiry"
6887     ),
6888 joku 63 "zyborg" => array(
6889     "icon" => "zyborg",
6890     "title" => "WiseNutBot",
6891     "rule" => array(
6892     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6893     ),
6894     "uri" => ""
6895     ),
6896     // Catch-up rules for the originals; they have to stay in this order.
6897     "blogbot" => array(
6898     "icon" => "blogbot",
6899     "title" => "BlogBot",
6900     "rule" => array(
6901     "Blog[ \-]?Bot" => ""
6902     ),
6903     "uri" => "http://www.blogbot.com/"
6904     ),
6905     "centrum" => array(
6906     "icon" => "centrum",
6907     "title" => "Centrum",
6908     "rule" => array(
6909     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6910     "^Centrum-checker" => ""
6911     ),
6912     "uri" => ""
6913     ),
6914     "httpclient" => array(
6915     "icon" => "robot",
6916     "title" => "HTTPClient",
6917     "rule" => array(
6918     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6919     "HTTP[ \-]?Client" => ""
6920     ),
6921     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6922     ),
6923     "incywincy" => array(
6924     "icon" => "robot",
6925     "title" => "IncyWincy",
6926     "rule" => array(
6927     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6928     "^IncyWincy" => ""
6929     ),
6930     "uri" => ""
6931     ),
6932     "java" => array(
6933     "icon" => "java",
6934     "title" => "Java",
6935     "rule" => array(
6936     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6937     ),
6938     "uri" => ""
6939     ),
6940     "libfetch" => array(
6941     "icon" => "robot",
6942     "title" => "Libfetch",
6943     "rule" => array(
6944     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6945     ),
6946     "uri" => "http://www.freebsd.org/"
6947     ),
6948     "libwww" => array(
6949     "icon" => "libwww",
6950 matthys 209 "title" => "LibWWW",
6951 joku 63 "rule" => array(
6952     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6953     "^libww(w|w-perl|w-FM)" => "",
6954     "MyApp.*libww(w|w-perl|w-FM)" => ""
6955     ),
6956     "uri" => ""
6957     ),
6958     "litefinder" => array(
6959     "icon" => "litefinder",
6960     "title" => "LiteFinder",
6961     "rule" => array(
6962     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6963     ),
6964     "uri" => "http://www.litefinder.net/about.html"
6965     ),
6966     "nutchorg" => array(
6967     "icon" => "nutchorg",
6968     "title" => "Nutch",
6969     "rule" => array(
6970     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6971     "Nutch" => ""
6972     ),
6973     "uri" => "http://lucene.apache.org/nutch/"
6974     ),
6975     "pythonurl" => array(
6976     "icon" => "pythonurl",
6977     "title" => "Python-url",
6978     "rule" => array(
6979     "Python[ \-]?urllib" => ""
6980     ),
6981     "uri" => ""
6982     ),
6983     // Robots known to be spam bots
6984     "SPAM" => array(
6985     "icon" => "robot",
6986     "title" => "SPAM",
6987     "rule" => array(
6988     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
6989     "^PHOTO CHECK" => "",
6990     "^FOTOCHECKER" => "",
6991     "^IPTC CHECK" => "",
6992     "^DataCha0s" => "",
6993     "^Mac Finder" => "",
6994     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
6995     "^Missouri College Browse" => "",
6996     "Email[ \-]?Siphon" => "",
6997     "atSpider" => "",
6998     "autoemailspider" => "",
6999     "^Demo Bot" => "",
7000     "^Program Shareware" => "",
7001     "^Snapbot" => "",
7002     "^snap.com" => "",
7003     "^Guestbook Auto Submitter" => "",
7004     "panscient.com" => "",
7005     ),
7006     "uri" => ""
7007     ),
7008     // Anything we do not recognize yet
7009     "robot" => array(
7010     "icon" => "robot",
7011     "title" => "Robot",
7012     "rule" => array(
7013     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7014     )
7015     )
7016     );
7017 joku 261 ?>

Properties

Name Value
svn:keywords Id