ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 337
Committed: Wed Dec 24 13:24:56 2014 UTC (9 years, 11 months ago) by joku
File size: 157083 byte(s)
Log Message:
added Owler

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 joku 312 * Copyright (C) 2001-2015, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192\.comAgent" => "" // dot escaped: match a literal "." only, as other entries in this table do
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array(
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www\.ackerm\.com" => "" // dots escaped so only the literal host name matches
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293     "^NutchEC2Test" => ""
294     ),
295     "uri" => "http://www.amazon.com/"
296     ),
297     "amidalla" => array(
298     "icon" => "amidalla",
299     "title" => "Amidalla",
300     "rule" => array(
301     "^amibot" => ""
302     ),
303     "uri" => ""
304     ),
305     "amfibi" => array(
306     "icon" => "amfibi",
307     "title" => "Amfibi",
308     "rule" => array(
309     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310     "Amfibibot" => ""
311     ),
312     "uri" => ""
313     ),
314     "amphetadesk" => array(
315     "icon" => "robot",
316     "title" => "AmphetaDesk",
317     "rule" => array(
318     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319     ),
320     "uri" => ""
321     ),
322     "amphetameme" => array(
323     "icon" => "robot",
324     "title" => "Amphetameme",
325     "rule" => array(
326     "amphetameme[ \-]?crawler" => ""
327     ),
328     "uri" => ""
329     ),
330     "annomille" => array(
331     "icon" => "robot",
332     "title" => "AnnoMille",
333     "rule" => array(
334     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335     ),
336     "uri" => "http://www.annomille.it"
337     ),
338     "anonymouse" => array(
339     "icon" => "anonymouse",
340     "title" => "Anonymouse.org",
341     "rule" => array(
342     "http://Anonymouse.org" => ""
343     ),
344     "uri" => "http://anonymouse.org"
345     ),
346     "ansearch" => array(
347     "icon" => "robot",
348     "title" => "Ansearch",
349     "rule" => array(
350     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351     ),
352     "uri" => ""
353     ),
354     "answerchase" => array(
355     "icon" => "answerchase",
356     "title" => "AnswerChase",
357     "rule" => array(
358     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359     ),
360     "uri" => "http://www.answerchase.com/"
361     ),
362     "antibot" => array(
363     "icon" => "robot",
364 matthys 205 "title" => "Antibot",
365 joku 63 "rule" => array(
366     "antibot-V([0-9.]{1,10})" => "\\1"
367     ),
368     "uri" => ""
369     ),
370     "aonde" => array(
371     "icon" => "aonde",
372     "title" => "Aonde",
373     "rule" => array(
374     "^AONDE-Spider" => ""
375     ),
376     "uri" => ""
377     ),
378     "aonline" => array(
379     "icon" => "robot",
380     "title" => "A-Online.at",
381     "rule" => array(
382     "^A-Online Search" => ""
383     ),
384     "uri" => "http://www.a-online.at/"
385     ),
386     "aol" => array(
387     "icon" => "aol",
388     "title" => "AOLserver",
389     "rule" => array(
390     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391     "^AOLserver" => ""
392     ),
393     "uri" => ""
394     ),
395     "apachebench" => array(
396     "icon" => "robot",
397     "title" => "ApacheBench",
398     "rule" => array(
399     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => ""
402     ),
403     "apassion4jazz" => array(
404     "icon" => "robot",
405     "title" => "Passion 4 Jazz",
406     "rule" => array(
407     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410     ),
411     "apexoo" => array(
412     "icon" => "robot",
413     "title" => "Apexoo",
414     "rule" => array(
415     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apexoo.com/"
418     ),
419     "apnoti" => array(
420     "icon" => "apnoti",
421 matthys 205 "title" => "Apnoti",
422 joku 63 "rule" => array(
423     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424     ),
425     "uri" => "http://www.apnoti.com/"
426     ),
427     "aport" => array(
428     "icon" => "aport",
429     "title" => "Aport",
430     "rule" => array(
431     "^Aport" => ""
432     ),
433     "uri" => ""
434     ),
435     "appie" => array(
436     "icon" => "walhello",
437     "title" => "Walhello",
438     "rule" => array(
439     "appie[ /]([0-9.]{1,10})" => "\\1"
440     ),
441     "uri" => ""
442     ),
443     "arachmo" => array(
444     "icon" => "arachmo",
445     "title" => "Arachmo",
446     "rule" => array(
447     "compatible; Arachmo" => ""
448     ),
449     "uri" => ""
450     ),
451     "arexera" => array(
452     "icon" => "arexera",
453     "title" => "Arexera",
454     "rule" => array(
455     "^X-Crawler" => "",
456     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
457     ),
458     "uri" => "http://www.arexera.de/"
459     ),
460     "arianna" => array(
461     "icon" => "arianna",
462     "title" => "Arianna",
463     "rule" => array(
464     "^www\.arianna\.it" => "" // dots escaped so only the literal host name matches
465     ),
466     "uri" => "http://www.arianna.it/"
467     ),
468     "artface" => array(
469     "icon" => "robot",
470     "title" => "Artface",
471     "rule" => array(
472     "^ArtfaceBot" => ""
473     ),
474     "uri" => ""
475     ),
476     "artviper" => array(
477     "icon" => "artviper",
478     "title" => "artViper",
479     "rule" => array(
480     "artViper" => ""
481     ),
482     "uri" => "http://www.artviper.net/"
483     ),
484     "asinfo" => array(
485     "icon" => "robot",
486     "title" => "Any Search Info",
487     "rule" => array(
488     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
489     ),
490     "uri" => "http://search-info.com/"
491     ),
492     "ask" => array(
493     "icon" => "askjeeves",
494     "title" => "Ask Jeeves",
495     "rule" => array(
496     "Ask[ \-]?Jeeves" => "",
497     "teomaagent" => ""
498     ),
499     "uri" => ""
500     ),
501     "askaboutoil" => array(
502     "icon" => "robot",
503     "title" => "AskAboutOil", // was "ASPseek", copied from the aspseek entry; rule and uri identify AskAboutOil
504     "rule" => array(
505     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
506     ),
507     "uri" => "http://askaboutoil.com/"
508     ),
509     "asked" => array(
510     "icon" => "robot",
511 matthys 205 "title" => "AskEd!",
512 joku 63 "rule" => array(
513     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
514     ),
515     "uri" => "http://asked.jp"
516     ),
517     "aspseek" => array(
518     "icon" => "robot",
519     "title" => "ASPseek",
520     "rule" => array(
521     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
522     ),
523     "uri" => ""
524     ),
525     "atlocal" => array(
526     "icon" => "robot",
527     "title" => "At Local",
528     "rule" => array(
529     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
530     ),
531     "uri" => "http://www.atlocal.com/"
532     ),
533     "atomz" => array(
534     "icon" => "atomz",
535     "title" => "Atomz",
536     "rule" => array(
537     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
538     ),
539     "uri" => ""
540     ),
541     "axel" => array(
542     "icon" => "robot",
543     "title" => "Axel",
544     "rule" => array(
545     "^axel" => ""
546     ),
547     "uri" => ""
548     ),
549     "axmo" => array(
550     "icon" => "axmo",
551     "title" => "Axmo",
552     "rule" => array(
553     "AxmoRobot" => ""
554     ),
555     "uri" => ""
556     ),
557     "answerbus" => array(
558     "icon" => "answerbus",
559     "title" => "AnswerBus",
560     "rule" => array(
561     "answerbus" => ""
562     ),
563     "uri" => ""
564     ),
565     "automapit" => array(
566     "icon" => "robot",
567     "title" => "AutoMapIt",
568     "rule" => array(
569     "AutoMapIt[ /](Bot)?" => ""
570     ),
571     "uri" => "http://www.automapit.com/bot.html"
572     ),
573     "augurnfind" => array(
574     "icon" => "robot",
575     "title" => "Augurnfind",
576     "rule" => array(
577     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
578     ),
579     "uri" => ""
580     ),
581     "awasu" => array(
582     "icon" => "awasu",
583     "title" => "Awasu",
584     "rule" => array(
585     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
586     ),
587     "uri" => ""
588     ),
589     "axxus" => array(
590     "icon" => "axxus",
591     "title" => "axxus.de",
592     "rule" => array(
593     "whoiam" => ""
594     ),
595     "uri" => "http://www.axxus.de/"
596     ),
597     "ayell" => array(
598     "icon" => "ayell",
599     "title" => "Ayell",
600     "rule" => array(
601     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
602     ),
603     "uri" => "http://eurobot.ayell.eu"
604     ),
605     "babaloo" => array(
606     "icon" => "babaloo",
607     "title" => "Babaloo",
608     "rule" => array(
609     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
610     ),
611     "uri" => "http://www.babaloo.si"
612     ),
613     "babe" => array(
614     "icon" => "robot",
615     "title" => "ba.be",
616     "rule" => array(
617     "BACS http://www.ba.be" => ""
618     ),
619     "uri" => "http://www.ba.be/"
620     ),
621     "baidu" => array(
622     "icon" => "baidu",
623     "title" => "Baidu",
624     "rule" => array(
625     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
626     "Baiduspider" => ""
627     ),
628     "uri" => "http://www.baidu.com/search/spider.html"
629     ),
630     "bananatree" => array(
631     "icon" => "robot",
632     "title" => "BananaTree",
633     "rule" => array(
634     "www\.thebananatree\.org" => ""
635     ),
636     "uri" => "http://www.thebananatree.org/"
637     ),
638     "bdcindexer" => array(
639     "icon" => "robot",
640     "title" => "bdcindexer",
641     "rule" => array(
642     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
643     ),
644     "uri" => "http://www.business.com/"
645     ),
646     "bdfetch" => array(
647     "icon" => "robot",
648     "title" => "BDFetch",
649     "rule" => array(
650     "^BDFetch" => ""
651     ),
652     "uri" => ""
653     ),
654     "bdncentral" => array(
655     "icon" => "robot",
656     "title" => "Bdncentral",
657     "rule" => array(
658     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
659     ),
660     "uri" => "http://www.bdncentral.com/robot.html"
661     ),
662     "beammachine" => array(
663     "icon" => "robot",
664     "title" => "BeamMachine",
665     "rule" => array(
666     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
667     ),
668     "uri" => "http://www.beammachine.net/"
669     ),
670     "become" => array(
671     "icon" => "become",
672     "title" => "Become",
673     "rule" => array(
674     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
675     "(BecomeBot|Exabot)@exava\.com\)$" => ""
676     ),
677     "uri" => "http://www.become.com/"
678     ),
679     "beebware" => array(
680     "icon" => "robot",
681     "title" => "Beebware",
682     "rule" => array(
683     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // pattern has a single capture group; "\\2" never yielded a version
684     ),
685     "uri" => ""
686     ),
687     "bigbrother" => array(
688     "icon" => "robot",
689     "title" => "Big Brother",
690     "rule" => array(
691     "^Big Brother" => ""
692     ),
693     "uri" => "http://pauillac.inria.fr/~fpottier/"
694     ),
695     "bigclique" => array(
696     "icon" => "robot",
697     "title" => "BigClique",
698     "rule" => array(
699     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
700     ),
701     "uri" => "http://www.bigclique.com"
702     ),
703     "biglotron" => array(
704     "icon" => "robot",
705     "title" => "Biglotron",
706     "rule" => array(
707     "^BIGLOTRON" => ""
708     ),
709     "uri" => "http://www.bigclique.com"
710     ),
711     "bigsearch" => array(
712     "icon" => "bigsearch",
713     "title" => "Bigsearch",
714     "rule" => array(
715     "Bigsearch.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1"
716     ),
717     "uri" => ""
718     ),
719     "bilbo" => array(
720     "icon" => "robot",
721     "title" => "Bilbo",
722     "rule" => array(
723     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
724     ),
725     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
726     ),
727     "bilgi" => array(
728     "icon" => "bilgi",
729     "title" => "Bilgi",
730     "rule" => array(
731     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" tag; the version is group 2
732     ),
733     "uri" => "http://www.bilgi.com/"
734     ),
735     "bitacle" => array(
736     "icon" => "bitacle",
737     "title" => "Bitacle",
738     "rule" => array(
739     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
740     ),
741     "uri" => "http://bitacle.org/"
742     ),
743     "bitbeamer" => array(
744     "icon" => "bitbeamer",
745     "title" => "BitBeamer",
746     "rule" => array(
747     "BitBeamer/([0-9.]{1,10})" => "\\1"
748     ),
749     "uri" => ""
750     ),
751     "biz360" => array(
752     "icon" => "biz360",
753     "title" => "Biz360",
754     "rule" => array(
755     "^Biz360 spider" => ""
756     ),
757     "uri" => ""
758     ),
759     "backlinktest" => array(
760     "icon" => "backlinktest",
761     "title" => "BacklinkCrawler",
762     "rule" => array(
763     "BacklinkCrawler" => ""
764     ),
765     "uri" => "http://www.backlinktest.com/crawler.html"
766     ),
767     "blaizbee" => array(
768     "icon" => "blaiz-bee",
769     "title" => "Blaiz-Bee",
770     "rule" => array(
771     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // emit the captured version instead of discarding it, like sibling entries
772     ),
773     "uri" => ""
774     ),
775     "blogbeat" => array(
776     "icon" => "robot",
777     "title" => "BlogBeat",
778     "rule" => array(
779     "BlogBeat/?([0-9.]{1,10})" => "\\1",
780     ),
781     "uri" => "http://www.blogbeat.nl"
782     ),
783     "blogbotde" => array(
784     "icon" => "robot",
785     "title" => "blogbot.de",
786     "rule" => array(
787     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
788     ),
789     "uri" => "http://blogbot.de/"
790     ),
791     "blogcensus" => array(
792     "icon" => "blogcensus",
793     "title" => "Blogcensus",
794     "rule" => array(
795     "^Blogcensus" => "",
796     ),
797     "uri" => "http://blogcensus.de/bot/"
798     ),
799     "blogdex" => array(
800     "icon" => "robot",
801     "title" => "Blogdex",
802     "rule" => array(
803     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
804     ),
805     "uri" => ""
806     ),
807     "blogg" => array(
808     "icon" => "blogg",
809     "title" => "Blogg",
810     "rule" => array(
811     "^blogg\.de" => ""
812     ),
813     "uri" => ""
814     ),
815     "blogland" => array(
816     "icon" => "robot",
817     "title" => "BlogLand",
818     "rule" => array(
819     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
820     ),
821     "uri" => ""
822     ),
823     "bloglines" => array(
824     "icon" => "bloglines",
825     "title" => "Bloglines",
826     "rule" => array(
827     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
828     "Bloglines" => ""
829     ),
830     "uri" => ""
831     ),
832     "blogmap" => array(
833     "icon" => "robot",
834     "title" => "Blogmap",
835     "rule" => array(
836     "blogmap" => ""
837     ),
838     "uri" => ""
839     ),
840     "blogosphere" => array(
841     "icon" => "robot",
842     "title" => "Blogosphere",
843     "rule" => array(
844     "Blogosphere" => ""
845     ),
846     "uri" => ""
847     ),
848     "blogpeople" => array(
849     "icon" => "robot",
850     "title" => "BlogPeople",
851     "rule" => array(
852     "BlogPeople" => ""
853     ),
854     "uri" => ""
855     ),
856     "blogpulse" => array(
857     "icon" => "blogpulse",
858     "title" => "Blogpulse",
859     "rule" => array(
860     "Blogpulse" => ""
861     ),
862     "uri" => ""
863     ),
864     "blogranking" => array(
865     "icon" => "blogranking",
866     "title" => "BlogRanking",
867     "rule" => array(
868     "^BlogRanking(/RSS checker)?" => ""
869     ),
870     "uri" => ""
871     ),
872     "blogs" => array(
873     "icon" => "blogs",
874     "title" => "Blo.gs",
875     "rule" => array(
876     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
877     "blo\.gs" => ""
878     ),
879     "uri" => ""
880     ),
881     "blogshares" => array(
882     "icon" => "blogshares",
883     "title" => "BlogShares",
884     "rule" => array(
885     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
886     "(^| |\()Blogshares(\.com| |\))" => ""
887     ),
888     "uri" => ""
889     ),
890     "blogslife" => array(
891     "icon" => "robot",
892     "title" => "BlogsLife",
893     "rule" => array(
894     "Blogslive" => ""
895     ),
896     "uri" => ""
897     ),
898     "blogsnow" => array(
899     "icon" => "blogsnow",
900     "title" => "BlogsNow",
901     "rule" => array(
902     "blogsnowbot" => "",
903     "BlogsNow" => ""
904     ),
905     "uri" => ""
906     ),
907     "blogstreet" => array(
908     "icon" => "blogstreet",
909     "title" => "BlogStreet",
910     "rule" => array(
911     "^BlogStreetBot" => ""
912     ),
913     "uri" => ""
914     ),
915     "blogsurf" => array(
916     "icon" => "robot",
917     "title" => "BlogSurf",
918     "rule" => array(
919     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
920     ),
921     "uri" => ""
922     ),
923     "blogtick" => array(
924     "icon" => "robot",
925     "title" => "BlogTick",
926     "rule" => array(
927     "BlogTickServer" => ""
928     ),
929     "uri" => ""
930     ),
931     "blogwatcher" => array(
932     "icon" => "blogwatcher",
933     "title" => "Blogwatcher",
934     "rule" => array(
935     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
936     ),
937     "uri" => ""
938     ),
939     "blogwise" => array(
940     "icon" => "blogwise",
941     "title" => "Blogwise",
942     "rule" => array(
943     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
944     ),
945     "uri" => ""
946     ),
947     "boardreader" => array(
948     "icon" => "boardreader",
949     "title" => "BoardReader",
950     "rule" => array(
951     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
952     ),
953     "uri" => "http://www.boardreader.com"
954     ),
955     "bobby" => array(
956     "icon" => "bobby",
957     "title" => "Bobby",
958     "rule" => array(
959     "bobby[ /]([0-9.]{1,10})" => "\\1"
960     ),
961     "uri" => ""
962     ),
963     "boitho" => array(
964     "icon" => "robot",
965     "title" => "Boitho",
966     "rule" => array(
967     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
968     ),
969     "uri" => ""
970     ),
971     "booch" => array(
972     "icon" => "robot",
973     "title" => "Booch",
974     "rule" => array(
975     "^booch[_ /]([0-9.]{1,10})" => "\\1"
976     ),
977     "uri" => ""
978     ),
979     "book" => array(
980     "icon" => "book",
981     "title" => "Bookmark",
982     "rule" => array(
983     "http://www\.bookmark\.ne\.jp" => ""
984     ),
985     "uri" => ""
986     ),
987     "bookdog" => array(
988     "icon" => "bookdog",
989     "title" => "Bookdog",
990     "rule" => array(
991     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
992     ),
993     "uri" => ""
994     ),
995     "bordermanager" => array(
996     "icon" => "bordermanager",
997     "title" => "Border Manager",
998     "rule" => array(
999     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1000     ),
1001     "uri" => ""
1002     ),
1003     "botonparade" => array(
1004     "icon" => "botonparade",
1005     "title" => "Bot on Parade",
1006     "rule" => array(
1007     "BotOnParade" => ""
1008     ),
1009     "uri" => "http://www.bots-on-para.de/bot.html"
1010     ),
1011     "botje" => array(
1012     "icon" => "botje",
1013     "title" => "Botje",
1014     "rule" => array(
1015     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1016     ),
1017     "uri" => "http://www.botje.com/"
1018     ),
1019     "bottomfeeder" => array(
1020     "icon" => "bottomfeeder",
1021     "title" => "BottomFeeder",
1022     "rule" => array(
1023     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1024     ),
1025     "uri" => ""
1026     ),
1027     "browseremulator" => array(
1028     "icon" => "browseremulator",
1029     "title" => "BrowserEmulator",
1030     "rule" => array(
1031     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1032     ),
1033     "uri" => "http://www.dejavu.org/emulator.htm"
1034     ),
1035     "browsershots" => array(
1036     "icon" => "browsershots",
1037     "title" => "Browsershots",
1038     "rule" => array(
1039     "Browsershots URL Check" => ""
1040     ),
1041     "uri" => "http://browsershots.org"
1042     ),
1043     "browserspy" => array(
1044     "icon" => "robot",
1045     "title" => "BrowserSpy",
1046     "rule" => array(
1047     "BrowserSpy" => ""
1048     ),
1049     "uri" => ""
1050     ),
1051     "bruinbot" => array(
1052     "icon" => "robot",
1053     "title" => "BruinBot",
1054     "rule" => array(
1055     "BruinBot" => ""
1056     ),
1057     "uri" => ""
1058     ),
1059     "bruno" => array(
1060     "icon" => "robot",
1061     "title" => "Bruno",
1062     "rule" => array(
1063     "^Bruno" => ""
1064     ),
1065     "uri" => ""
1066     ),
1067     "btbot" => array(
1068     "icon" => "btbot",
1069     "title" => "BitTorrent",
1070     "rule" => array(
1071     "BTbot/([0-9.]{1,10})" => "\\1"
1072     ),
1073     "uri" => ""
1074     ),
1075     "builtwith" => array(
1076     "icon" => "builtwith",
1077     "title" => "BuiltWith",
1078     "rule" => array(
1079     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1080     ),
1081     "uri" => "http://builtwith.com/bot.html"
1082     ),
1083     "bulkfeeds" => array(
1084     "icon" => "robot",
1085     "title" => "Bulkfeeds",
1086     "rule" => array(
1087     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1088     ),
1089     "uri" => ""
1090     ),
1091     "burf" => array(
1092     "icon" => "burf",
1093     "title" => "Burf.com",
1094     "rule" => array(
1095     "^Norbert the Spider" => ""
1096     ),
1097     "uri" => "http://www.burf.com/"
1098     ),
1099     "butch" => array(
1100     "icon" => "robot",
1101     "title" => "Butch",
1102     "rule" => array(
1103     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1104     ),
1105     "uri" => ""
1106     ),
1107     "buzzlogic" => array(
1108     "icon" => "buzzlogic",
1109     "title" => "Buzzlogic",
1110     "rule" => array(
1111     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1112     ),
1113     "uri" => "http://www.buzzlogic.com"
1114     ),
1115     "catchbot" => array(
1116     "icon" => "catchbot",
1117     "title" => "CatchBot",
1118     "rule" => array(
1119     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1120     ),
1121     "uri" => "http://www.catchbot.com"
1122     ),
1123     "camdiscover" => array(
1124     "icon" => "robot",
1125     "title" => "Camdiscover",
1126     "rule" => array(
1127     "^Camcrawler" => ""
1128     ),
1129     "uri" => ""
1130     ),
1131     "cazoodle" => array(
1132     "icon" => "cazoodle",
1133     "title" => "Cazoodle",
1134     "rule" => array(
1135     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1136     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1137     ),
1138     "uri" => "http://www.cazoodle.com/cazoodlebot"
1139     ),
1140     "ccbot" => array(
1141     "icon" => "robot",
1142     "title" => "ccBot",
1143     "rule" => array(
1144     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.commoncrawl.org/bot.html"
1147     ),
1148     "ccgcrawl" => array(
1149     "icon" => "robot",
1150     "title" => "CCGCrawl",
1151     "rule" => array(
1152     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1153     ),
1154     "uri" => "http://www.myworkbase.com/bot.html"
1155     ),
1156     "cerberian" => array(
1157     "icon" => "robot",
1158     "title" => "Cerberian Drtrs",
1159     "rule" => array(
1160     "^Cerberian Drtrs" => ""
1161     ),
1162     "uri" => ""
1163     ),
1164     "cfnetwork" => array(
1165     "icon" => "robot",
1166     "title" => "CFNetwork", // was "Cerberian Drtrs", copied from the preceding cerberian entry
1167     "rule" => array(
1168     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1169     ),
1170     "uri" => "http://www.cfnetwork.be/"
1171     ),
1172     "charlotte" => array(
1173     "icon" => "charlotte",
1174     "title" => "Charlotte",
1175     "rule" => array(
1176     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1177     ),
1178     "uri" => ""
1179     ),
1180     "cirilizator" => array(
1181     "icon" => "cirilizator",
1182     "title" => "Cirilizator",
1183     "rule" => array(
1184     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1185     ),
1186     "uri" => ""
1187     ),
1188     "claria" => array(
1189     "icon" => "robot",
1190     "title" => "Claria",
1191     "rule" => array(
1192     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1193     "(Claria|Diamond)(Bot)" => ""
1194     ),
1195     "uri" => ""
1196     ),
1197     "claymont" => array(
1198     "icon" => "claymont",
1199     "title" => "Claymont",
1200     "rule" => array(
1201     "claymont\.com" => "",
1202     "OliverPerry" => ""
1203     ),
1204     "uri" => "http://www.claymont.com"
1205     ),
1206     "clush" => array(
1207     "icon" => "clush",
1208     "title" => "Clush",
1209     "rule" => array(
1210     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1211     ),
1212     "uri" => ""
1213     ),
1214     "cmsworldmap" => array(
1215     "icon" => "cmsworldmap",
1216     "title" => "CMS World Map",
1217     "rule" => array(
1218     "cmsworldmap" => ""
1219     ),
1220     "uri" => "http://www.cmsworldmap.com/"
1221     ),
1222     "cobion" => array(
1223     "icon" => "robot",
1224     "title" => "Cobion",
1225     "rule" => array(
1226     " (QXW03018|obot)\)" => ""
1227     ),
1228     "uri" => ""
1229     ),
1230     "coccoc" => array(
1231 matthys 287 "icon" => "coccoc",
1232 matthys 209 "title" => "Coccoc",
1233 joku 63 "rule" => array(
1234     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1235     ),
1236 matthys 287 "uri" => "http://help.coccoc.com"
1237 joku 63 ),
1238     "coldfusion" => array(
1239     "icon" => "coldfusion",
1240     "title" => "ColdFusion",
1241     "rule" => array(
1242     "^coldfusion" => ""
1243     ),
1244     "uri" => ""
1245     ),
1246     "combine" => array(
1247     "icon" => "robot",
1248     "title" => "Combine",
1249     "rule" => array(
1250     "Combine[ /]([0-9.]{1,10})" => "\\1"
1251     ),
1252     "uri" => ""
1253     ),
1254     "combot" => array(
1255     "icon" => "robot",
1256     "title" => "comBot",
1257     "rule" => array(
1258     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1259     ),
1260     "uri" => ""
1261     ),
1262     "comet" => array(
1263     "icon" => "comet",
1264     "title" => "Comet",
1265     "rule" => array(
1266     "cometsearch@cometsystems" => ""
1267     ),
1268     "uri" => ""
1269     ),
1270     "commerobo" => array(
1271     "icon" => "robot",
1272     "title" => "Commerobo",
1273     "rule" => array(
1274     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1275     ),
1276     "uri" => ""
1277     ),
1278     "comrite" => array(
1279     "icon" => "robot",
1280     "title" => "ComRite",
1281     "rule" => array(
1282     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1283     ),
1284     "uri" => "http://www.comrite.com/"
1285     ),
1286     "convera" => array(
1287     "icon" => "convera",
1288     "title" => "Convera",
1289     "rule" => array(
1290     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1291     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1292     ),
1293     "uri" => ""
1294     ),
1295     "coolbot" => array(
1296     "icon" => "robot",
1297     "title" => "CoolBot",
1298     "rule" => array(
1299     "^CoolBot" => ""
1300     ),
1301     "uri" => ""
1302     ),
1303     "cosmix" => array(
1304     "icon" => "robot",
1305     "title" => "Cosmix",
1306     "rule" => array(
1307     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1308     ),
1309     "uri" => ""
1310     ),
1311     "cosmos" => array(
1312     "icon" => "robot",
1313     "title" => "Cosmos",
1314     "rule" => array(
1315     "^cosmos" => ""
1316     ),
1317     "uri" => ""
1318     ),
1319     "cosmoty" => array(
1320     "icon" => "robot",
1321     "title" => "Cosmoty",
1322     "rule" => array(
1323     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1324     ),
1325     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1326     ),
1327     "covario" => array(
1328     "icon" => "covario",
1329     "title" => "Covario",
1330     "rule" => array(
1331     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1332     ),
1333     "uri" => "http://www.covario.com/ids/"
1334     ),
1335     "creativecommons" => array(
1336     "icon" => "creativecommons",
1337     "title" => "Creative Commons",
1338     "rule" => array(
1339     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1340     ),
1341     "uri" => ""
1342     ),
1343     "cscrawler" => array(
1344     "icon" => "robot",
1345     "title" => "CsCrawler",
1346     "rule" => array(
1347     "CsCrawler" => ""
1348     ),
1349     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1350     ),
1351 joku 111 "jigsaw" => array(
1352     "icon" => "jigsaw",
1353     "title" => "Jigsaw",
1354     "rule" => array(
1355     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1356     ),
1357     "uri" => "http://jigsaw.w3.org/css-validator/"
1358     ),
1359 joku 63 "csscheck" => array(
1360     "icon" => "w3c",
1361     "title" => "W3C CSS Validator",
1362     "rule" => array(
1363     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1364     ),
1365     "uri" => "http://jigsaw.w3.org/css-validator/"
1366     ),
1367     "custo" => array(
1368     "icon" => "robot",
1369     "title" => "Custo",
1370     "rule" => array(
1371     "Custo[ /]([0-9.]{1,10})" => "\\1"
1372     ),
1373     "uri" => ""
1374     ),
1375     "cybernavi" => array(
1376     "icon" => "robot",
1377     "title" => "CyberNavi",
1378     "rule" => array(
1379     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1380     ),
1381     "uri" => ""
1382     ),
1383     "cyberpatrol" => array(
1384     "icon" => "cyberpatrol",
1385     "title" => "CyberPatrol",
1386     "rule" => array(
1387     "^CyberPatrol" => ""
1388     ),
1389     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1390     ),
1391     "cyberz" => array(
1392     "icon" => "cyberz",
1393     "title" => "Cyberz",
1394     "rule" => array(
1395     "Cyberz Communication Agent" => ""
1396     ),
1397     "uri" => ""
1398     ),
1399     "cydral" => array(
1400     "icon" => "robot",
1401     "title" => "Cydral",
1402     "rule" => array(
1403     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1404     ),
1405     "uri" => ""
1406     ),
1407     "cynthia" => array(
1408     "icon" => "cynthia",
1409     "title" => "Cynthia Says",
1410     "rule" => array(
1411     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1412     ),
1413     "uri" => ""
1414     ),
1415     "d4x" => array(
1416     "icon" => "d4x",
1417     "title" => "Downloader for X",
1418     "rule" => array(
1419     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1420     ),
1421     "uri" => ""
1422     ),
1423     "da" => array(
1424     "icon" => "da",
1425     "title" => "DA",
1426     "rule" => array(
1427     "^DA[ /]([0-9.]{1,10})" => "\\1"
1428     ),
1429     "uri" => ""
1430     ),
1431     "daum" => array(
1432     "icon" => "daum",
1433     "title" => "DAUM",
1434     "rule" => array(
1435     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1436     "DAUM Web Robot" => "",
1437     "Daum Communications Corp" => "",
1438     "EDI[ /]([0-9.]{1,10})" => "\\1",
1439     "Edacious.*Intelligent Web Robot" => "",
1440     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1441     ),
1442     "uri" => "http://ws.daum.net/"
1443     ),
1444     "daypop" => array(
1445     "icon" => "robot",
1446     "title" => "Daypop",
1447     "rule" => array(
1448     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1449     ),
1450     "uri" => ""
1451     ),
1452     "delfi" => array(
1453     "icon" => "delfi",
1454     "title" => "Delfi",
1455     "rule" => array(
1456     "crawl at delfi dot lt" => ""
1457     ),
1458     "uri" => ""
1459     ),
1460     "depspid" => array(
1461     "icon" => "depspid",
1462     "title" => "DepSpid",
1463     "rule" => array(
1464     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1465     ),
1466     "uri" => ""
1467     ),
1468     "devonagent" => array(
1469     "icon" => "devonagent",
1470     "title" => "DEVONagent",
1471     "rule" => array(
1472     "DEVONtech" => ""
1473     ),
1474     "uri" => ""
1475     ),
1476     "diffbot" => array(
1477     "icon" => "diffbot",
1478     "title" => "Diffbot",
1479     "rule" => array(
1480     " Diffbot" => ""
1481     ),
1482     "uri" => "http://www.diffbot.com"
1483     ),
1484     "diribot" => array(
1485     "icon" => "diribot",
1486     "title" => "Diri",
1487     "rule" => array(
1488     "diribot" => ""
1489     ),
1490     "uri" => "http://www.diri.bg"
1491     ),
1492     "directhit" => array(
1493     "icon" => "robot",
1494     "title" => "Direct Hit",
1495     "rule" => array(
1496     "EZResult -- Internet Search Engine" => ""
1497     ),
1498     "uri" => "http://www.directhit.com"
1499     ),
// Entry for the Disco crawler: matches "disco/Nutch" or "discobot" followed
// by a version number, or the crawler's contact address.
// NOTE(review): rule values of "\\1" presumably select the captured version
// and "" means "no version" - confirm against the matcher.
"disco" => array(
    "icon" => "disco",
    "title" => "Disco",
    "rule" => array(
        "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
        "discobot[/ -]([0-9.]{1,10})" => "\\1",
        // The dot is escaped so it only matches a literal "." in the
        // address, consistent with other host-name rules in this array.
        "disco-crawl@discoveryengine\.com" => ""
    ),
    "uri" => "http://www.discoveryengine.com/"
),
1510     "discopump" => array(
1511     "icon" => "robot",
1512     "title" => "DISCo Pump",
1513     "rule" => array(
1514     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1515     ),
1516     "uri" => ""
1517     ),
1518     "dkimreputation" => array(
1519     "icon" => "dkimreputation",
1520     "title" => "DKIM Reputation",
1521     "rule" => array(
1522     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1523     ),
1524     "uri" => "http://www.dkim-reputation.org"
1525     ),
1526     "dnsdigger" => array(
1527     "icon" => "dnsdigger",
1528     "title" => "DNS-Digger",
1529     "rule" => array(
1530     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1531     ),
1532     "uri" => "http://www.dnsdigger.com"
1533     ),
1534     "dnsvalidation" => array(
1535     "icon" => "dnsvalidation",
1536     "title" => "DNS Validation",
1537     "rule" => array(
1538     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1539     ),
1540     "uri" => "http://www.dnsvalidation.com/"
1541     ),
1542     "doctorhtml" => array(
1543     "icon" => "robot",
1544     "title" => "DoctorHTML",
1545     "rule" => array(
1546     "Doctor[ \-]?HTML" => ""
1547     ),
1548     "uri" => ""
1549     ),
1550     "dolphin" => array(
1551     "icon" => "dolphin",
1552     "title" => "Dolphin",
1553     "rule" => array(
1554     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1555     ),
1556     "uri" => "http://telehouse.ru/crawler.html"
1557     ),
1558     "domaindatei" => array(
1559     "icon" => "robot",
1560     "title" => "Domaindatei",
1561     "rule" => array(
1562     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1563     ),
1564     "uri" => ""
1565     ),
1566     "dontbuylists" => array(
1567     "icon" => "dontbuylists",
1568     "title" => "Dontbuylists",
1569     "rule" => array(
1570     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1571     ),
1572     "uri" => "http://www.dontbuylists.com"
1573     ),
1574     "dotbot" => array(
1575     "icon" => "robot",
1576     "title" => "DotBot",
1577     "rule" => array(
1578     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1579     ),
1580     "uri" => "http://www.dotnetdotcom.org"
1581     ),
// Entry for user agents that begin with the host name "www.doweb.co.uk".
// NOTE(review): the empty rule value presumably means "no version to
// extract" - confirm against the matcher.
"doweb" => array(
    "icon" => "doweb",
    "title" => "DoWeb",
    "rule" => array(
        // Dots are escaped so they match only a literal "." rather than any
        // character, consistent with other host-name rules in this array.
        "^www\.doweb\.co\.uk" => ""
    ),
    "uri" => "http://www.doweb.co.uk/"
),
1590     "downforeveryoneorjustme" => array(
1591     "icon" => "downforeveryoneorjustme",
1592     "title" => "Down for everyone or just me",
1593     "rule" => array(
1594     "downforeveryoneorjustme" => ""
1595     ),
1596     "uri" => "http://www.downforeveryoneorjustme.com"
1597     ),
1598     "downloadninja" => array(
1599     "icon" => "robot",
1600     "title" => "Download Ninja",
1601     "rule" => array(
1602     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1603     ),
1604     "uri" => ""
1605     ),
1606     "drupal" => array(
1607     "icon" => "drupal",
1608     "title" => "Drupal",
1609     "rule" => array(
1610     "^Drupal" => ""
1611     ),
1612     "uri" => ""
1613     ),
1614     "dsns" => array(
1615     "icon" => "robot",
1616     "title" => "DSNS Scanner",
1617     "rule" => array(
1618     "^DSNS" => ""
1619     ),
1620     "uri" => ""
1621     ),
1622     "dtsagent" => array(
1623     "icon" => "robot",
1624     "title" => "DTS Agent",
1625     "rule" => array(
1626     "DTS Agent" => ""
1627     ),
1628     "uri" => ""
1629     ),
1630     "earthcom" => array(
1631     "icon" => "earthcom",
1632     "title" => "Earthcom",
1633     "rule" => array(
1634     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1635     ),
1636     "uri" => ""
1637     ),
1638     "ebay" => array(
1639     "icon" => "ebay",
1640     "title" => "eBay",
1641     "rule" => array(
1642     "eBay Relevance Ad Crawler" => ""
1643     ),
1644     "uri" => ""
1645     ),
1646     "echo" => array(
1647     "icon" => "robot",
1648     "title" => "Echo.com",
1649     "rule" => array(
1650     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1651     ),
1652     "uri" => "http://www.echo.com/"
1653     ),
1654     "eert" => array(
1655     "icon" => "robot",
1656 matthys 209 "title" => "Eert",
1657 joku 63 "rule" => array(
1658     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1659     ),
1660     "uri" => "http://bot.eert.net"
1661     ),
1662     "eknip" => array(
1663     "icon" => "eknip",
1664     "title" => "E-Knip",
1665     "rule" => array(
1666     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1667     ),
1668     "uri" => ""
1669     ),
1670     "zoominfo" => array(
1671     "icon" => "zoominfo",
1672 matthys 209 "title" => "ZoomInfo", //Previous called Eliyon
1673 joku 63 "rule" => array(
1674     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1675     ),
1676     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1677     ),
1678     "emeraldshield" => array(
1679     "icon" => "emeraldshield",
1680     "title" => "EmeraldShield",
1681     "rule" => array(
1682     "^EmeraldShield" => ""
1683     ),
1684     "uri" => ""
1685     ),
1686     "empas" => array(
1687     "icon" => "empas",
1688     "title" => "Empas",
1689     "rule" => array(
1690     "DigExt; empas\)$" => "",
1691     "^EMPAS[_\-]ROBOT" => ""
1692     ),
1693     "uri" => ""
1694     ),
1695     "entireweb" => array(
1696     "icon" => "entireweb",
1697     "title" => "Entireweb",
1698     "rule" => array(
1699     "Speedy[ ]?Spider" => ""
1700     ),
1701     "uri" => ""
1702     ),
1703     "envolk" => array(
1704     "icon" => "envolk",
1705     "title" => "Envolk",
1706     "rule" => array(
1707     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1708     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1709     ),
1710     "uri" => ""
1711     ),
// Entry for the "ES.NET Crawler" user agent, followed by "/" or a space and
// a dotted version number (captured as group 1).
// NOTE(review): the rule value "\\1" presumably selects the captured
// version - confirm against the matcher.
"esnet" => array(
    "icon" => "robot",
    "title" => "ES.NET",
    "rule" => array(
        // The dot in "ES.NET" is escaped so it matches only a literal ".".
        "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
1720     "estyle" => array(
1721     "icon" => "estyle",
1722     "title" => "eStyle Search",
1723     "rule" => array(
1724     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1725     ),
1726     "uri" => ""
1727     ),
1728     "eurip" => array(
1729     "icon" => "robot",
1730     "title" => "Eurip",
1731     "rule" => array(
1732     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1733     ),
1734     "uri" => "http://www.eurip.com"
1735     ),
1736     "eurodirectory" => array(
1737     "icon" => "robot",
1738     "title" => "Euro Directory",
1739     "rule" => array(
1740     "www\.euro-directory\.com" => ""
1741     ),
1742     "uri" => "http://www.euro-directory.com/"
1743     ),
1744     "euroseek" => array(
1745     "icon" => "euroseek",
1746     "title" => "EuroSeek",
1747     "rule" => array(
1748     "Arachnoidea" => ""
1749     ),
1750     "uri" => ""
1751     ),
1752     "evaal" => array(
1753     "icon" => "evaal",
1754     "title" => "Evaal",
1755     "rule" => array(
1756     "^EvaalSE" => ""
1757     ),
1758     "uri" => "http://www.evaal.com/"
1759     ),
1760     "eventax" => array(
1761     "icon" => "eventax",
1762     "title" => "Eventax",
1763     "rule" => array(
1764     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1765     ),
1766     "uri" => "http://www.eventax.de/"
1767     ),
1768     "everbee" => array(
1769     "icon" => "everbee",
1770     "title" => "Everbee",
1771     "rule" => array(
1772     "EverbeeCrawler" => ""
1773     ),
1774     "uri" => ""
1775     ),
// Entry for the "Everest-Vulcan Inc." user agent, followed by "/" or a space
// and a dotted version number (captured as group 1).
// NOTE(review): the rule value "\\1" presumably selects the captured
// version - confirm against the matcher.
"everest" => array(
    "icon" => "everest",
    "title" => "Everest",
    "rule" => array(
        // The trailing dot of "Inc." is escaped so it matches only a
        // literal "." instead of any character.
        "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
1784     "exabot" => array(
1785     "icon" => "exabot",
1786     "title" => "ExaBot",
1787     "rule" => array(
1788     "^NG[ /]([0-9.]{1,10})" => "\\1",
1789     "Exabot/([0-9.]{1,10})" => "\\1",
1790     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1791     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1792     "ExaBot-Thumbnails" => ""
1793     ),
1794     "uri" => "http://www.exabot.com/go/robot"
1795     ),
1796     "exactseek" => array(
1797     "icon" => "exactseek",
1798     "title" => "ExactSeek",
1799     "rule" => array(
1800     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1801     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1802     ),
1803     "uri" => "http://www.exactseek.com/"
1804     ),
1805     "excite" => array(
1806     "icon" => "excite",
1807     "title" => "Excite",
1808     "rule" => array(
1809     "Architext[ \-]?Spider" => ""
1810     ),
1811     "uri" => ""
1812     ),
1813     "execrawl" => array(
1814     "icon" => "robot",
1815     "title" => "Execrawl",
1816     "rule" => array(
1817     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1818     "Execrawl" => ""
1819     ),
1820     "uri" => ""
1821     ),
1822     "expertmonitor" => array(
1823     "icon" => "robot",
1824     "title" => "ExpertMonitor",
1825     "rule" => array(
1826     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1827     ),
1828     "uri" => ""
1829     ),
1830     "explorerrss" => array(
1831     "icon" => "robot",
1832     "title" => "Explorer RSS",
1833     "rule" => array(
1834     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1835     ),
1836     "uri" => ""
1837     ),
1838     "ezooms" => array(
1839     "icon" => "robot",
1840     "title" => "Ezooms",
1841     "rule" => array(
1842     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1843     ),
1844     "uri" => ""
1845     ),
1846     "facebook" => array(
1847     "icon" => "facebook",
1848     "title" => "Facebook",
1849     "rule" => array(
1850     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1851     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1852     "^facebook" => ""
1853     ),
1854     "uri" => "http://www.facebook.com/"
1855     ),
1856     "fast" => array(
1857     "icon" => "fast",
1858     "title" => "Fast",
1859     "rule" => array(
1860     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1861     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1862     "^Fast Crawler" => "",
1863     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1864     ),
1865     "uri" => "http://www.alltheweb.com/"
1866     ),
1867     "fastbuzz" => array(
1868     "icon" => "fastbuzz",
1869     "title" => "Fastbuzz",
1870     "rule" => array(
1871     "^fastbuzz\.com" => ""
1872     ),
1873     "uri" => ""
1874     ),
1875     "favorg" => array(
1876     "icon" => "robot",
1877     "title" => "FavOrg",
1878     "rule" => array(
1879     "^FavOrg" => ""
1880     ),
1881     "uri" => ""
1882     ),
1883     "favorstar" => array(
1884     "icon" => "favorstar",
1885 matthys 209 "title" => "Favorstar",
1886 joku 63 "rule" => array(
1887     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1888     ),
1889     "uri" => "http://favorstar.com/bot.html"
1890     ),
1891     "faxo" => array(
1892     "icon" => "robot",
1893     "title" => "Faxo",
1894     "rule" => array(
1895     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1896     ),
1897     "uri" => "http://www.faxo.com/"
1898     ),
1899     "fdse" => array(
1900     "icon" => "robot",
1901     "title" => "FDSE Robot",
1902     "rule" => array(
1903     "FDSE[ \-]?robot" => ""
1904     ),
1905     "uri" => ""
1906     ),
1907     "feedback" => array(
1908     "icon" => "robot",
1909     "title" => "FeedBack",
1910     "rule" => array(
1911     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1912     ),
1913     "uri" => ""
1914     ),
1915     "feedburner" => array(
1916     "icon" => "feedburner",
1917     "title" => "FeedBurner",
1918     "rule" => array(
1919     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1920     ),
1921     "uri" => ""
1922     ),
1923     "feeddemon" => array(
1924     "icon" => "feeddemon",
1925     "title" => "FeedDemon",
1926     "rule" => array(
1927     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1928     ),
1929     "uri" => ""
1930     ),
1931     "feedfind" => array(
1932     "icon" => "feedfind",
1933     "title" => "FeedFind",
1934     "rule" => array(
1935     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1936     ),
1937     "uri" => ""
1938     ),
1939     "feedonfeeds" => array(
1940     "icon" => "robot",
1941     "title" => "Feed On Feeds",
1942     "rule" => array(
1943     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1944     ),
1945     "uri" => ""
1946     ),
1947     "feedparser" => array(
1948     "icon" => "robot",
1949     "title" => "Feedparser",
1950     "rule" => array(
1951     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1952     "FeedParser" => ""
1953     ),
1954     "uri" => ""
1955     ),
1956     "feedreader" => array(
1957     "icon" => "feedreader",
1958     "title" => "Feedreader",
1959     "rule" => array(
1960     "^Feedreader" => ""
1961     ),
1962     "uri" => ""
1963     ),
1964     "feedserver" => array(
1965     "icon" => "robot",
1966     "title" => "FeedServer",
1967     "rule" => array(
1968     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
1969     ),
1970     "uri" => ""
1971     ),
1972     "feedster" => array(
1973     "icon" => "feedster",
1974     "title" => "Feedster",
1975     "rule" => array(
1976     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
1977     ),
1978     "uri" => ""
1979     ),
1980     "feedvalidator" => array(
1981     "icon" => "feedvalidator",
1982     "title" => "Feed Validator",
1983     "rule" => array(
1984     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
1985     ),
1986     "uri" => ""
1987     ),
1988     "fdm" => array(
1989     "icon" => "robot",
1990     "title" => "Free Download Manager",
1991     "rule" => array(
1992     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
1993     ),
1994     "uri" => ""
1995     ),
1996     "filangy" => array(
1997     "icon" => "robot",
1998     "title" => "Filangy",
1999     "rule" => array(
2000     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2001     ),
2002     "uri" => "http://www.filangy.com/"
2003     ),
2004     "findanisp" => array(
2005     "icon" => "robot",
2006     "title" => "FindAnISP",
2007     "rule" => array(
2008     "FindAnISP" => ""
2009     ),
2010     "uri" => "http://www.findanisp.com/"
2011     ),
2012     "findengines" => array(
2013     "icon" => "findengines",
2014     "title" => "FindEngines",
2015     "rule" => array(
2016     "FindEngines! Bot" => ""
2017     ),
2018     "uri" => ""
2019     ),
2020     "findexa" => array(
2021     "icon" => "findexa",
2022     "title" => "Findexa",
2023     "rule" => array(
2024     "Findexa Crawler" => ""
2025     ),
2026     "uri" => ""
2027     ),
2028     "findlinks" => array(
2029     "icon" => "findlinks",
2030     "title" => "FindLinks",
2031     "rule" => array(
2032     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2033     "^FindLinks" => ""
2034     ),
2035     "uri" => ""
2036     ),
// Entry for user agents that begin with "findoor", optionally followed by
// the literal suffix "-Bot".
"findoor" => array(
    "icon" => "findoor",
    "title" => "Findoor",
    "rule" => array(
        // The only capture group holds the literal "-Bot" suffix, not a
        // version number, so the rule value is left empty like the other
        // version-less rules in this array.
        // NOTE(review): assumes the rule value is meant to carry a version
        // string - confirm against the matcher.
        "^findoor(-Bot)?" => ""
    ),
    "uri" => ""
),
2045     "firefly" => array(
2046     "icon" => "firefly",
2047     "title" => "Firefly",
2048     "rule" => array(
2049     "Firefly" => ""
2050     ),
2051     "uri" => ""
2052     ),
2053     "flashget" => array(
2054     "icon" => "flashget",
2055     "title" => "FlashGet",
2056     "rule" => array(
2057     "^FlashGet" => ""
2058     ),
2059     "uri" => ""
2060     ),
2061     "flatland" => array(
2062     "icon" => "flatland",
2063     "title" => "Flatland",
2064     "rule" => array(
2065     "^flatlandbot" => ""
2066     ),
2067     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2068     ),
2069     "flickbot" => array(
2070     "icon" => "flickbot",
2071     "title" => "FlickBot",
2072     "rule" => array(
2073     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2074     ),
2075     "uri" => ""
2076     ),
2077     "flightdeckreports" => array(
2078     "icon" => "flightdeckreports",
2079     "title" => "Flight Deck Reports",
2080     "rule" => array(
2081     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2082     ),
2083     "uri" => "http://www.flightdeckreports.com/"
2084     ),
2085     "forex" => array(
2086     "icon" => "robot",
2087     "title" => "Forex",
2088     "rule" => array(
2089     "^Forex Trading Network Organization" => ""
2090     ),
2091     "uri" => "http://www.netforex.org/"
2092     ),
// Entry for the Freshmeat URL validator, announced either as
// "fmII URL validator" or "freshmeat.net URL validator", followed by "/" or
// a space and a dotted version number (captured as group 1).
// NOTE(review): the rule value "\\1" presumably selects the captured
// version - confirm against the matcher.
"freshmeat" => array(
    "icon" => "freshmeat",
    "title" => "Freshmeat",
    "rule" => array(
        "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
        // The dot in the host name is escaped so it matches only a
        // literal ".".
        "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => "http://www.freshmeat.net/"
),
2102     "friend" => array(
2103     "icon" => "friend",
2104     "title" => "Friend",
2105     "rule" => array(
2106     "www\.friend\.fr" => ""
2107     ),
2108     "uri" => "http://www.friend.fr/"
2109     ),
2110     "frontier" => array(
2111     "icon" => "frontier",
2112     "title" => "Frontier",
2113     "rule" => array(
2114     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2115     ),
2116     "uri" => ""
2117     ),
2118     "fyberspider" => array(
2119     "icon" => "robot",
2120     "title" => "FyberSpider",
2121     "rule" => array(
2122     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2123     ),
2124     "uri" => "http://www.fyberspider.com/"
2125     ),
2126     "gaisbot" => array(
2127     "icon" => "gais",
2128     "title" => "Gaisbot",
2129     "rule" => array(
2130     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2131     ),
2132     "uri" => ""
2133     ),
// Entry for Galaxy: matches "GalaxyBot" followed by a version number, or
// any user agent containing the host name "www.galaxy.com".
// NOTE(review): "\\1" presumably selects the captured version and "" means
// "no version" - confirm against the matcher.
"galaxy" => array(
    "icon" => "galaxy",
    "title" => "Galaxy",
    "rule" => array(
        "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
        // Dots are escaped so they match only a literal "." rather than any
        // character, consistent with other host-name rules in this array.
        "www\.galaxy\.com" => ""
    ),
    "uri" => "http://www.galaxy.com/"
),
2143     "gamespy" => array(
2144     "icon" => "gamespy",
2145     "title" => "GameSpy",
2146     "rule" => array(
2147     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2148     ),
2149     "uri" => ""
2150     ),
2151     "garlik" => array(
2152     "icon" => "garlik",
2153     "title" => "Garlik",
2154     "rule" => array(
2155     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2156     ),
2157     "uri" => "http://garlik.com/"
2158     ),
2159     "gdesktop" => array(
2160     "icon" => "gdesktop",
2161     "title" => "Google Desktop",
2162     "rule" => array(
2163     "compatible; Google Desktop" => ""
2164     ),
2165     "uri" => ""
2166     ),
2167     "genome" => array(
2168     "icon" => "robot",
2169     "title" => "Genome Machine",
2170     "rule" => array(
2171     "Genome[ \-]?Machine" => ""
2172     ),
2173     "uri" => ""
2174     ),
2175     "geohash" => array(
2176     "icon" => "geohash",
2177     "title" => "Geohash",
2178     "rule" => array(
2179     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2180     ),
2181     "uri" => "http://geohash.org/"
2182     ),
2183     "geona" => array(
2184     "icon" => "robot",
2185     "title" => "Geona",
2186     "rule" => array(
2187     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2188     ),
2189     "uri" => ""
2190     ),
2191     "geoblog" => array(
2192     "icon" => "robot",
2193     "title" => "The World as a Blog",
2194     "rule" => array(
2195     "The World as a Blog" => ""
2196     ),
2197     "uri" => ""
2198     ),
2199     "geourl" => array(
2200     "icon" => "geourl",
2201     "title" => "GeoUrl",
2202     "rule" => array(
2203     "geourl[ /]([0-9.]{1,10})" => "\\1",
2204     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2205     ),
2206     "uri" => ""
2207     ),
2208     "getnetwise" => array(
2209     "icon" => "robot",
2210     "title" => "GetNetWise",
2211     "rule" => array(
2212     " Crayon Crawler" => ""
2213     ),
2214     "uri" => ""
2215     ),
2216     "getright" => array(
2217     "icon" => "getright",
2218     "title" => "GetRight",
2219     "rule" => array(
2220     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2221     ),
2222     "uri" => ""
2223     ),
2224     "getsmart" => array(
2225     "icon" => "getsmart",
2226     "title" => "GetSmart",
2227     "rule" => array(
2228     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2229     ),
2230     "uri" => ""
2231     ),
2232     "gigabot" => array(
2233     "icon" => "gigablast",
2234     "title" => "Gigablast",
2235     "rule" => array(
2236     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2237     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2238 joku 336 "GigablastOpenSource" => ""
2239 joku 63 ),
2240     "uri" => ""
2241 matthys 328 ),
2242     "gimme" => array(
2243     "icon" => "gimme",
2244     "title" => "gimmeUSA",
2245     "rule" => array(
2246     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2247     ),
2248     "uri" => "http://gimme60.com"
2249 joku 63 ),
2250 matthys 328 "ginger" => array(
2251     "icon" => "ginger",
2252     "title" => "GingerCrawler",
2253     "rule" => array(
2254     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2255     ),
2256     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2257     ),
2258 joku 63 "girafabot" => array(
2259     "icon" => "girafa",
2260     "title" => "Girafa",
2261     "rule" => array(
2262     "Girafabot" => ""
2263     ),
2264     "uri" => ""
2265     ),
2266     "globalspec" => array(
2267     "icon" => "globalspec",
2268     "title" => "GlobalSpec",
2269     "rule" => array(
2270     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2271     ),
2272     "uri" => ""
2273     ),
2274     "glucose" => array(
2275     "icon" => "glucose",
2276     "title" => "Glucose",
2277     "rule" => array(
2278     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2279     ),
2280     "uri" => ""
2281     ),
2282     "gnomit" => array(
2283     "icon" => "gnomit",
2284     "title" => "Gnomit",
2285     "rule" => array(
2286     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2287     ),
2288     "uri" => "http://www.gnomit.com/",
2289     ),
2290     "goforit" => array(
2291     "icon" => "goforit",
2292     "title" => "GoForIt",
2293     "rule" => array(
2294     "^GoForIt\.com" => "",
2295     "^GOFORITBOT" => ""
2296     ),
2297     "uri" => ""
2298     ),
2299     "goguides" => array(
2300     "icon" => "robot",
2301     "title" => "GoGuides",
2302     "rule" => array(
2303     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2304     ),
2305     "uri" => "http://www.goguides.org/"
2306     ),
2307     // Needs to be before google for correct detection
2308     "mediapartners" => array(
2309     "icon" => "google",
2310     "title" => "Mediapartners",
2311     "rule" => array (
2312     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2313     "Mediapartners-Google" => ""
2314     ),
2315     "uri" => ""
2316     ),
2317     "google" => array(
2318     "icon" => "google",
2319     "title" => "Google",
2320     "rule" => array (
2321     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2322     "Googl(e|ebot)(-Image)?/" => "",
2323     "^gsa-crawler" => "",
2324     "Google Web Preview" => ""
2325     ),
2326     "uri" => "http://www.google.com/"
2327     ),
2328     "googlesitemaps" => array(
2329     "icon" => "google",
2330     "title" => "Google-Sitemaps",
2331     "rule" => array (
2332     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2333     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2334     "Googl(e|ebot)(-Sitemaps)?/" => ""
2335     ),
2336     "uri" => ""
2337     ),
2338     "googlemobile" => array(
2339     "icon" => "google",
2340     "title" => "Google-Mobile",
2341     "rule" => array (
2342     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2343     "Googl(e|ebot)(-Mobile)?/" => ""
2344     ),
2345     "uri" => ""
2346     ),
2347     "googleads" => array(
2348     "icon" => "google",
2349     "title" => "Google-AdsBot",
2350     "rule" => array (
2351     "^AdsBot-Google" => "",
2352     ),
2353     "uri" => ""
2354     ),
2355     "googlefeeds" => array(
2356     "icon" => "google",
2357     "title" => "Google-Feedfetcher",
2358     "rule" => array (
2359     "^Feedfetcher-Google" => "",
2360     ),
2361     "uri" => ""
2362     ),
2363     "googlverification" => array(
2364     "icon" => "google",
2365     "title" => "Google-Site-Verification",
2366     "rule" => array (
2367     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2368     ),
2369     "uri" => ""
2370     ),
2371 matthys 207 // Needs to be AFTER Google detection
2372     "goo" => array(
2373     "icon" => "goo",
2374     "title" => "Goo",
2375     "rule" => array (
2376     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2377     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2378     ),
2379     "uri" => ""
2380     ),
2381 joku 63 "goongee" => array(
2382     "icon" => "robot",
2383     "title" => "GoonGee",
2384     "rule" => array (
2385     "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // version is the pattern's only capture group
2386     ),
2387     "uri" => "http://www.goongee.com/"
2388     ),
2389     "gpost" => array(
2390     "icon" => "gpost",
2391     "title" => "GPost",
2392     "rule" => array(
2393     "^GPostbot" => ""
2394     ),
2395     "uri" => ""
2396     ),
2397 matthys 309 "grapeshot" => array(
2398     "icon" => "grapeshot",
2399     "title" => "Grapeshot",
2400     "rule" => array(
2401     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2402     ),
2403     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2404     ),
2405 joku 63 "gregarius" => array(
2406     "icon" => "robot",
2407     "title" => "Gregarius",
2408     "rule" => array(
2409     "^Gregarius[/ ]([0-9.]{1,10})" => ""
2410     ),
2411     "uri" => ""
2412     ),
2413     "grub" => array(
2414     "icon" => "grub",
2415     "title" => "Grub",
2416     "rule" => array(
2417     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2418     "grub crawler" => "",
2419     "grub[/ ]([0-9.]{1,10})" => "\\1",
2420     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2421     ),
2422     "uri" => "http://www.grub.org/"
2423     ),
2424     "gulliver" => array(
2425     "icon" => "robot",
2426     "title" => "Gulliver",
2427     "rule" => array(
2428     "Gulliver" => ""
2429     ),
2430     "uri" => ""
2431     ),
2432     "guruji" => array(
2433     "icon" => "guruji",
2434     "title" => "Guruji",
2435     "rule" => array(
2436     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2437     ),
2438     "uri" => "http://www.guruji.com/"
2439     ),
2440     "gush" => array(
2441     "icon" => "robot",
2442     "title" => "Gush",
2443     "rule" => array(
2444     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2445     ),
2446     "uri" => ""
2447     ),
2448     "gziptester" => array(
2449     "icon" => "robot",
2450     "title" => "Gzip Tester",
2451     "rule" => array(
2452     "g(id)?zip[ \-]?test(er)?" => ""
2453     ),
2454     "uri" => ""
2455     ),
2456     "hanzoweb" => array(
2457     "icon" => "hanzoweb",
2458     "title" => "Hanzoweb",
2459     "rule" => array(
2460     "^Hanzoweb" => ""
2461     ),
2462     "uri" => ""
2463     ),
2464     "harbot" => array(
2465     "icon" => "harbot",
2466     "title" => "Harbot",
2467     "rule" => array(
2468     "^Harbot GateStation" => ""
2469     ),
2470     "uri" => ""
2471     ),
2472     "hatena" => array(
2473     "icon" => "hatena",
2474     "title" => "Hatena",
2475     "rule" => array(
2476     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2477     ),
2478     "uri" => ""
2479     ),
2480     "htmlparser" => array(
2481     "icon" => "htmlparser",
2482     "title" => "HTMLParser",
2483     "rule" => array(
2484     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2485     ),
2486     "uri" => "http://htmlparser.sourceforge.net/"
2487     ),
2488     "helix" => array(
2489     "icon" => "helix",
2490     "title" => "Helix", // separate crawler from the "heritrix" entry that follows
2491     "rule" => array(
2492     "^helix[ /]([0-9.]{1,10})" => "\\1"
2493     ),
2494     "uri" => "http://www.sitesearch.ca/helix/"
2495     ),
2496     "heritrix" => array(
2497     "icon" => "heritrix",
2498     "title" => "Heritrix",
2499     "rule" => array(
2500     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2501     "archive.org_bot" => "",
2502     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2503     ),
2504     "uri" => "http://archive.org"
2505     ),
2506     "hiddenmarket" => array(
2507     "icon" => "robot",
2508     "title" => "HiddenMarket",
2509     "rule" => array(
2510     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2511     ),
2512     "uri" => ""
2513     ),
2514     "honda" => array(
2515     "icon" => "robot",
2516     "title" => "Honda",
2517     "rule" => array(
2518     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2519     ),
2520     "uri" => "http://www.honda-search.com"
2521     ),
2522     "hoowwwer" => array(
2523     "icon" => "hoowwwer",
2524     "title" => "HooWWWer",
2525     "rule" => array(
2526     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2527     ),
2528     "uri" => ""
2529     ),
2530     "hotzonu" => array(
2531     "icon" => "hotzonu",
2532     "title" => "Hotzonu",
2533     "rule" => array(
2534     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2535     ),
2536     "uri" => ""
2537     ),
2538     "houxou" => array(
2539     "icon" => "robot",
2540     "title" => "Houxou",
2541     "rule" => array(
2542     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2543     "HouxouCrawler" => ""
2544     ),
2545     "uri" => ""
2546     ),
2547     "htdig" => array(
2548     "icon" => "htdig",
2549     "title" => "ht://Dig",
2550     "rule" => array(
2551     "htdig[ /]([0-9.]{1,10})" => "\\1",
2552     "htdig" => "" // version-less fallback: no capture group to reference
2553     ),
2554     "uri" => ""
2555     ),
2556     "html2jpg" => array(
2557     "icon" => "html2jpg",
2558     "title" => "HTML2JPG",
2559     "rule" => array(
2560     "^HTML2JPG" => ""
2561     ),
2562     "uri" => ""
2563     ),
2564     "httperf" => array(
2565     "icon" => "robot",
2566     "title" => "HTTPerf",
2567     "rule" => array(
2568     "httperf[ /]([0-9.]{1,10})" => "\\1"
2569     ),
2570     "uri" => ""
2571     ),
2572     "httpunit" => array(
2573     "icon" => "httpunit",
2574     "title" => "HttpUnit",
2575     "rule" => array(
2576     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2577     ),
2578     "uri" => ""
2579     ),
2580     "httrack" => array(
2581     "icon" => "httrack",
2582     "title" => "HTTrack",
2583     "rule" => array(
2584     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2585     ),
2586     "uri" => ""
2587     ),
2588     "huaweisymantec" => array(
2589     "icon" => "huaweisymantec",
2590     "title" => "HuaweiSymantec",
2591     "rule" => array(
2592     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2593     ),
2594     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2595     ),
2596     "hungary" => array(
2597     "icon" => "hungary",
2598     "title" => "Hungary",
2599     "rule" => array(
2600     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2601     ),
2602     "uri" => ""
2603     ),
2604 joku 261 "i18n" => array(
2605     "icon" => "w3c",
2606     "title" => "W3C I18n Checker",
2607     "rule" => array(
2608     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2609 joku 169 ),
2610 joku 261 "uri" => "http://validator.w3.org/services"
2611     ),
2612 joku 63 "iakke" => array(
2613     "icon" => "iakke",
2614 matthys 209 "title" => "Iakké",
2615 joku 63 "rule" => array(
2616     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2617     ),
2618     "uri" => "http://fr.iakke.com/"
2619     ),
2620     "iask" => array(
2621     "icon" => "iask",
2622     "title" => "IAsk",
2623     "rule" => array(
2624     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2625     "^iaskspider" => ""
2626     ),
2627     "uri" => "http://iask.com"
2628     ),
2629     "icc" => array(
2630     "icon" => "icc",
2631     "title" => "ICC-Crawler",
2632     "rule" => array(
2633     "^ICC-Crawler" => ""
2634     ),
2635     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2636     ),
2637     "icerocket" => array(
2638     "icon" => "icerocket",
2639     "title" => "Icerocket",
2640     "rule" => array(
2641     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2642     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2643     ),
2644     "uri" => ""
2645     ),
2646     "icjobs" => array(
2647     "icon" => "icjobs",
2648     "title" => "iCjobs",
2649     "rule" => array(
2650     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2651     ),
2652     "uri" => "http://www.icjobs.de/"
2653     ),
2654     "icra" => array(
2655     "icon" => "icra",
2656     "title" => "ICRA",
2657     "rule" => array(
2658     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2659     ),
2660     "uri" => "http://www.icra.org"
2661     ),
2662     "iknow" => array(
2663     "icon" => "robot",
2664     "title" => "I know",
2665     "rule" => array(
2666     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2667     ),
2668     "uri" => ""
2669     ),
2670     "ilial" => array(
2671     "icon" => "robot",
2672     "title" => "Ilial",
2673     "rule" => array(
2674     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2675     ),
2676     "uri" => ""
2677     ),
2678     "ilocal" => array(
2679     "icon" => "ilocal",
2680     "title" => "ilocal",
2681     "rule" => array(
2682     "^ilocal" => "",
2683     ),
2684     "uri" => "http://www.ilocal.nl"
2685     ),
2686     "ilse" => array(
2687     "icon" => "ilse",
2688     "title" => "Ilse",
2689     "rule" => array(
2690     "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot name, group 2 the version
2691     ),
2692     "uri" => "http://ilse.nl/"
2693     ),
2694     "iltrovatore" => array(
2695     "icon" => "iltrovatore",
2696     "title" => "IlTrovatore",
2697     "rule" => array(
2698     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2699     "Iltrovatore-Setaccio" => "",
2700     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2701     ),
2702     "uri" => ""
2703     ),
2704     "indylibrary" => array(
2705     "icon" => "robot",
2706     "title" => "Indy Library",
2707     "rule" => array(
2708     "Indy[ \-]?Library" => ""
2709     ),
2710     "uri" => ""
2711     ),
2712     "inela" => array(
2713     "icon" => "robot",
2714     "title" => "Inela",
2715     "rule" => array(
2716     "InelaBot[ /]([0-9.]{1,10})" => ""
2717     ),
2718     "uri" => "http://inelegant.org/bot"
2719     ),
2720     "ineturl" => array(
2721     "icon" => "robot",
2722     "title" => "InetURL",
2723     "rule" => array(
2724     "InetURL.?[ /]([0-9.]{1,10})" => ""
2725     ),
2726     "uri" => ""
2727     ),
2728     "infoart" => array(
2729     "icon" => "robot",
2730     "title" => "InfoArt",
2731     "rule" => array(
2732     "InfoArt crawler" => ""
2733     ),
2734     "uri" => ""
2735     ),
2736     "infomine" => array(
2737     "icon" => "infomine",
2738     "title" => "INFOMINE",
2739     "rule" => array(
2740     "^DataFountains/DMOZ" => "",
2741     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2742     ),
2743     "uri" => "http://infomine.ucr.edu/"
2744     ),
2745     "infoseek" => array(
2746     "icon" => "infoseek",
2747     "title" => "Infoseek",
2748     "rule" => array(
2749     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2750     "Infoseek" => ""
2751     ),
2752     "uri" => ""
2753     ),
2754     "inktomi" => array(
2755     "icon" => "inktomi",
2756     "title" => "Inktomi",
2757     "rule" => array(
2758     "slurp@inktomi\.com" => ""
2759     ),
2760     "uri" => ""
2761     ),
2762     "innerprise" => array(
2763     "icon" => "robot",
2764     "title" => "Innerprise",
2765     "rule" => array(
2766     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2767     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2768     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2769     ),
2770     "uri" => "http://www.innerprise.com/"
2771     ),
2772     "inria" => array(
2773     "icon" => "inria",
2774     "title" => "Inria",
2775     "rule" => array(
2776     "^xyro_" => ""
2777     ),
2778     "uri" => ""
2779     ),
2780     "insitor" => array(
2781     "icon" => "insitor",
2782     "title" => "Insitor",
2783     "rule" => array(
2784     "^Insitor(,|\.|naut)" => ""
2785     ),
2786     "uri" => "http://www.insitor.com/"
2787     ),
2788     "internetninja" => array(
2789     "icon" => "robot",
2790     "title" => "Internet Ninja",
2791     "rule" => array(
2792     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2793     ),
2794     "uri" => ""
2795     ),
2796     "internetseer" => array(
2797     "icon" => "internetseer",
2798     "title" => "InternetSeer",
2799     "rule" => array(
2800     "^InternetSeer\.com" => ""
2801     ),
2802     "uri" => ""
2803     ),
2804     "interseek" => array(
2805     "icon" => "interseek",
2806     "title" => "Interseek",
2807     "rule" => array(
2808     "Interseek.com" => ""
2809     ),
2810     "uri" => "http://www.interseek.com"
2811     ),
2812     "intravnews" => array(
2813     "icon" => "intravnews",
2814     "title" => "IntraVnews",
2815     "rule" => array(
2816     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2817     ),
2818     "uri" => "http://www.intravnews.com/"
2819     ),
2820     "ip2location" => array(
2821     "icon" => "ip2location",
2822     "title" => "IP2LocationBot",
2823     "rule" => array(
2824     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2825     ),
2826     "uri" => "http://www.ip2location.com"
2827     ),
2828     "ipworks" => array(
2829     "icon" => "ipworks",
2830     "title" => "IP*Works",
2831     "rule" => array(
2832     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2833     ),
2834     "uri" => "http://www.nsoftware.com/ipworks/"
2835     ),
2836     "irca" => array(
2837     "icon" => "robot",
2838     "title" => "Novell iChain Cool Solutions caching",
2839     "rule" => array(
2840 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2841     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2842 joku 63 ),
2843     "uri" => "http://www.icra.org"
2844     ),
2845     "irvine" => array(
2846     "icon" => "robot",
2847     "title" => "Irvine",
2848     "rule" => array(
2849     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2850     ),
2851     "uri" => ""
2852     ),
2853     "ips-agent" => array(
2854     "icon" => "robot",
2855 matthys 209 "title" => "IPS-agent",
2856 joku 63 "rule" => array(
2857     "ips-agent" => ""
2858     ),
2859     "uri" => ""
2860     ),
2861     "isara" => array(
2862     "icon" => "isara",
2863 matthys 209 "title" => "Isara",
2864 joku 63 "rule" => array(
2865     "Isara[ -]([0-9.]{1,10})" => "\\1"
2866     ),
2867     "uri" => "http://www.isara.org/"
2868     ),
2869     "isspider" => array(
2870     "icon" => "robot",
2871     "title" => "ISSpider",
2872     "rule" => array(
2873     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2874     ),
2875     "uri" => ""
2876     ),
2877     "it2media" => array(
2878     "icon" => "it2media",
2879     "title" => "IT2media",
2880     "rule" => array(
2881     "www.adressendeutschland.de" => ""
2882     ),
2883     "uri" => "http://www.adressendeutschland.de/"
2884     ),
2885     "ivia" => array(
2886     "icon" => "robot",
2887     "title" => "iVia",
2888     "rule" => array(
2889     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2890     ),
2891     "uri" => ""
2892     ),
2893     "jeteye" => array(
2894     "icon" => "jeteye",
2895     "title" => "Jeteye",
2896     "rule" => array(
2897     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2898     ),
2899     "uri" => ""
2900     ),
2901     "jobsde" => array(
2902     "icon" => "jobsde",
2903     "title" => "jobs.de",
2904     "rule" => array(
2905     "www\.jobs\.de" => "",
2906     "jobs.de-Robot" => ""
2907     ),
2908     "uri" => "http://www.jobs.de/"
2909     ),
2910     "jpluck" => array(
2911     "icon" => "robot",
2912     "title" => "Jpluck",
2913     "rule" => array(
2914     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2915     ),
2916     "uri" => ""
2917     ),
2918     "jxta" => array(
2919     "icon" => "robot",
2920     "title" => "Jxta",
2921     "rule" => array(
2922     "falcon[ /]([0-9.]{1,10})" => "\\1"
2923     ),
2924     "uri" => ""
2925     ),
2926     "jyte" => array(
2927     "icon" => "jyte",
2928     "title" => "Jyte",
2929     "rule" => array(
2930     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2931     ),
2932     "uri" => ""
2933     ),
2934     "jyxo" => array(
2935     "icon" => "jyxo",
2936     "title" => "Jyxo",
2937     "rule" => array(
2938     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2939     ),
2940     "uri" => ""
2941     ),
2942     "kalooga" => array(
2943     "icon" => "kalooga",
2944     "title" => "Kalooga",
2945     "rule" => array(
2946     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2947     "^kalooga" => "",
2948     "KaloogaBot" => ""
2949     ),
2950     "uri" => "http://www.kalooga.com"
2951     ),
2952     "keywen" => array(
2953     "icon" => "keywen",
2954     "title" => "Keywen",
2955     "rule" => array(
2956     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
2957     ),
2958     "uri" => ""
2959     ),
2960     "kilomonkey" => array(
2961     "icon" => "robot",
2962     "title" => "Kilomonkey",
2963     "rule" => array(
2964     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
2965     ),
2966     "uri" => "http://www.kilomonkey.com/notabot.txt"
2967     ),
2968     "kinja" => array(
2969     "icon" => "kinja",
2970     "title" => "Kinja",
2971     "rule" => array(
2972     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
2973     "^kinjabot" => ""
2974     ),
2975     "uri" => ""
2976     ),
2977     "kiwi" => array(
2978     "icon" => "robot",
2979     "title" => "KiwiStatus",
2980     "rule" => array(
2981     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
2982     "KiwiStatus" => ""
2983     ),
2984     "uri" => "http://www.nzs.com/kiei-status/"
2985     ),
2986     "lachesis" => array(
2987     "icon" => "robot",
2988     "title" => "Lachesis",
2989     "rule" => array(
2990     "lachesis" => ""
2991     ),
2992     "uri" => ""
2993     ),
2994     "lanshan" => array(
2995     "icon" => "robot",
2996     "title" => "Lanshan", // named after the lanshanbot agent matched below
2997     "rule" => array(
2998     "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
2999     ),
3000     "uri" => ""
3001     ),
3002     "lapozz" => array(
3003     "icon" => "lapozz",
3004     "title" => "Lapozz",
3005     "rule" => array(
3006     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3007     ),
3008     "uri" => ""
3009     ),
3010     "larbin" => array(
3011     "icon" => "robot",
3012     "title" => "Larbin",
3013     "rule" => array(
3014     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3015     ),
3016     "uri" => ""
3017     ),
3018     "laurion" => array(
3019     "icon" => "robot",
3020     "title" => "Laurion",
3021     "rule" => array(
3022     "^IPiumBot" => ""
3023     ),
3024     "uri" => "http://www.laurion.com/"
3025     ),
3026     "leechget" => array(
3027     "icon" => "leechget",
3028     "title" => "LeechGet",
3029     "rule" => array(
3030     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3031     ),
3032     "uri" => ""
3033     ),
3034     "linguaseek" => array(
3035     "icon" => "linguaseek",
3036     "title" => "Linguaseek",
3037     "rule" => array(
3038     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3039     ),
3040     "uri" => "http://www.linguaseek.com/"
3041     ),
3042     "linguee" => array(
3043     "icon" => "linguee",
3044     "title" => "Linguee",
3045     "rule" => array(
3046     "^Linguee Bot" => ""
3047     ),
3048     "uri" => "http://www.linguee.com/"
3049     ),
3050     "linkguard" => array(
3051     "icon" => "robot",
3052     "title" => "Linkguard",
3053     "rule" => array(
3054     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3055     ),
3056     "uri" => "http://www.linkguard.com/"
3057     ),
3058     "linklint" => array(
3059     "icon" => "linklint",
3060     "title" => "Linklint",
3061     "rule" => array(
3062     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3063     ),
3064     "uri" => "http://www.linklint.org/"
3065     ),
3066     "linkman" => array(
3067     "icon" => "linkman",
3068     "title" => "Linkman",
3069     "rule" => array(
3070     "\(compatible; Linkman\)" => ""
3071     ),
3072     "uri" => ""
3073     ),
3074     // Needs to be before linkcheck for correct detection
3075     "linkchecker" => array(
3076     "icon" => "w3c",
3077     "title" => "W3C Link Checker",
3078     "rule" => array(
3079     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3080     ),
3081     "uri" => "http://validator.w3.org/checklink"
3082     ),
3083     "linkcheck" => array(
3084     "icon" => "linkcheck",
3085     "title" => "Linkcheck",
3086     "rule" => array(
3087     "checklink[ /]([0-9.]{1,10})" => "\\1",
3088     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3089     "Adaxas Spider" => "",
3090     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3091     "NetMechanic V([0-9.]{1,10})" => "\\1",
3092     "^InfoLink" => "",
3093     "InternetLinkAgent" => "",
3094     "; SPENG\)" => "",
3095     "SharewarePlazaFileCheckBot" => "",
3096     "fileboost.net" => "",
3097     "^billbot" => ""
3098     ),
3099     "uri" => ""
3100     ),
3101     "linkru" => array(
3102     "icon" => "robot",
3103     "title" => "Link.RU",
3104     "rule" => array(
3105     "^Link.RU bot" => ""
3106     ),
3107     "uri" => ""
3108     ),
3109     "linkssql" => array(
3110     "icon" => "robot",
3111     "title" => "Links SQL",
3112     "rule" => array(
3113     "links sql" => ""
3114     ),
3115     "uri" => ""
3116     ),
3117     "linksweeper" => array(
3118     "icon" => "robot",
3119     "title" => "Link Sweeper",
3120     "rule" => array(
3121     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3122     ),
3123     "uri" => ""
3124     ),
3125     "linkwalker" => array(
3126     "icon" => "robot",
3127     "title" => "Link Walker",
3128     "rule" => array(
3129     "^LinkWalker" => ""
3130     ),
3131     "uri" => ""
3132     ),
3133     "lipperhey" => array(
3134     "icon" => "lipperhey",
3135     "title" => "Lipperhey",
3136     "rule" => array(
3137     "Lipperhey Spider" => ""
3138     ),
3139     "uri" => "http://www.lipperhey.com"
3140     ),
3141     "livedoor" => array(
3142     "icon" => "livedoor",
3143     "title" => "Livedoor",
3144     "rule" => array(
3145     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3146     ),
3147     "uri" => ""
3148     ),
3149     "livejournal" => array(
3150     "icon" => "livejournal",
3151     "title" => "Live Journal",
3152     "rule" => array(
3153     "^LiveJournal\.com" => ""
3154     ),
3155     "uri" => "http://www.livejournal.com"
3156     ),
3157     "ljpic" => array(
3158     "icon" => "ljpic",
3159     "title" => "ljpic",
3160     "rule" => array(
3161     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3162     ),
3163     "uri" => "http://www.ljpic.com"
3164     ),
3165     "lmspider" => array(
3166     "icon" => "robot",
3167     "title" => "Lmspider",
3168     "rule" => array(
3169     "^lmspider" => ""
3170     ),
3171     "uri" => ""
3172     ),
3173     "locators" => array(
3174     "icon" => "robot",
3175     "title" => "Locaters",
3176     "rule" => array(
3177     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3178     ),
3179     "uri" => ""
3180     ),
3181     "look" => array(
3182     "icon" => "look",
3183     "title" => "Look",
3184     "rule" => array(
3185     "www\.look\.com" => "",
3186     "Lookbot" => ""
3187     ),
3188     "uri" => ""
3189     ),
3190     "looksmart" => array(
3191     "icon" => "looksmart",
3192     "title" => "LookSmart",
3193     "rule" => array(
3194     "^Martini" => "",
3195     "^MantraAgent" => "",
3196     "FurlBot" => "",
3197     "looksmart-sv-fw" => ""
3198     ),
3199     "uri" => ""
3200     ),
3201     "loop" => array(
3202     "icon" => "loop",
3203     "title" => "LOOP",
3204     "rule" => array(
3205     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3206     ),
3207     "uri" => ""
3208     ),
3209     "lotkyll" => array(
3210     "icon" => "robot",
3211     "title" => "Lotkyll",
3212     "rule" => array(
3213     "Lotkyll" => ""
3214     ),
3215     "uri" => ""
3216     ),
3217 joku 335 "ltx71" => array(
3218     "icon" => "robot",
3219     "title" => "LTX71",
3220     "rule" => array(
3221     "ltx71" => ""
3222     ),
3223     "uri" => "http://ltx71.com/"
3224     ),
3225 joku 63 "lwp" => array(
3226     "icon" => "robot",
3227     "title" => "lwp",
3228     "rule" => array(
3229     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3230     ),
3231     "uri" => ""
3232     ),
3233     "lycos" => array(
3234     "icon" => "lycos",
3235     "title" => "Lycos",
3236     "rule" => array(
3237     "Lycos_Spider_" => ""
3238     ),
3239     "uri" => ""
3240     ),
3241     "magpierss" => array(
3242     "icon" => "rss",
3243     "title" => "MagpieRSS",
3244     "rule" => array(
3245     "MagpieRSS" => ""
3246     ),
3247     "uri" => "http://magpierss.sourceforge.net/"
3248     ),
3249     "mailru" => array(
3250     "icon" => "mailru",
3251 matthys 209 "title" => "Mail.Ru",
3252 joku 63 "rule" => array(
3253 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3254     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3255 joku 63 ),
3256 matthys 209 "uri" => "http://www.mail.ru/"
3257 joku 63 ),
3258     "mailsweeper" => array(
3259     "icon" => "robot",
3260     "title" => "Mail Sweeper",
3261     "rule" => array(
3262     "Mail[ \-]?Sweeper" => ""
3263     ),
3264     "uri" => ""
3265     ),
3266     "marvin" => array(
3267     "icon" => "robot",
3268     "title" => "Marvin",
3269     "rule" => array(
3270     "^Marvin" => ""
3271     ),
3272     "uri" => ""
3273     ),
3274     "matkurja" => array(
3275     "icon" => "matkurja",
3276     "title" => "Mat'Kurja",
3277     "rule" => array(
3278     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3279     ),
3280     "uri" => ""
3281     ),
3282     "mavicanet" => array(
3283     "icon" => "mavicanet",
3284     "title" => "Mavicanet",
3285     "rule" => array(
3286     "Mavicanet robot" => ""
3287     ),
3288     "uri" => ""
3289     ),
3290 matthys 292 "meanpath" => array(
3291     "icon" => "meanpath",
3292 matthys 290 "title" => "Meanpath",
3293 matthys 280 "rule" => array(
3294     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3295     ),
3296     "uri" => "http://www.meanpath.com/meanpathbot.html"
3297 matthys 275 ),
3298 matthys 280 "mediater" => array(
3299 joku 63 "icon" => "robot",
3300     "title" => "Mediater",
3301     "rule" => array (
3302     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3303 matthys 280 ),
3304     "uri" => ""
3305 joku 63 ),
3306 matthys 305 "memory" => array(
3307     "icon" => "memory",
3308     "title" => "internet Memory",
3309     "rule" => array (
3310     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3311     ),
3312     "uri" => "http://internetmemory.org/en/"
3313     ),
3314 joku 63 "mercator" => array(
3315     "icon" => "robot",
3316     "title" => "Mercator",
3317     "rule" => array(
3318     "Mercator" => ""
3319     ),
3320     "uri" => ""
3321     ),
3322     "metacarta" => array(
3323     "icon" => "robot",
3324     "title" => "Metacarta",
3325     "rule" => array(
3326     "^RRC \(crawler_admin@bigfoot.com\)" => "", // parentheses escaped so they match literally
3327     "^flunky" => "",
3328     "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3329     ),
3330     "uri" => "http://www.metacarta.com"
3331     ),
3332     "metager" => array(
3333     "icon" => "metager",
3334     "title" => "MetaGer",
3335     "rule" => array(
3336     "MetaGer" => ""
3337     ),
3338     "uri" => ""
3339     ),
3340     "metamark" => array(
3341     "icon" => "robot",
3342     "title" => "Metamark",
3343     "rule" => array(
3344     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3345     ),
3346     "uri" => "http://metamark.net"
3347     ),
3348     "metamedic" => array(
3349     "icon" => "metamedic",
3350     "title" => "MetaMedic",
3351     "rule" => array(
3352     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3353     ),
3354     "uri" => ""
3355     ),
3356     "mirago" => array(
3357     "icon" => "mirago",
3358     "title" => "Mirago",
3359     "rule" => array(
3360     "Mirago" => ""
3361     ),
3362     "uri" => ""
3363     ),
3364     "misterwong" => array(
3365     "icon" => "misterwong",
3366     "title" => "Mister Wong",
3367     "rule" => array(
3368     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3369     ),
3370     "uri" => "http://www.mister-wong.de/"
3371     ),
3372     "miva" => array(
3373     "icon" => "miva",
3374     "title" => "Miva",
3375     "rule" => array(
3376     "AlgoFeedback@miva\.com" => ""
3377     ),
3378     "uri" => "http://www.miva.com/"
3379     ),
3380     "mj12" => array(
3381     "icon" => "mj12",
3382     "title" => "Majestic-12",
3383     "rule" => array(
3384     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3385     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3386     ),
3387     "uri" => "http://majestic12.co.uk/bot.php"
3388     ),
3389     "mlbot" => array(
3390     "icon" => "robot",
3391     "title" => "MLBot",
3392     "rule" => array(
3393     "^MLBot" => ""
3394     ),
3395     "uri" => "http://www.metadatalabs.com/mlbot"
3396     ),
3397     "mnogo" => array(
3398     "icon" => "mnogo",
3399     "title" => "mnoGoSearch",
3400     "rule" => array(
3401     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3402     ),
3403     "uri" => "http://www.mnogosearch.org/"
3404     ),
3405     "mobileok" => array(
3406     "icon" => "mobileok",
3407     "title" => "W3C mobileOK",
3408     "rule" => array(
3409     "^W3C-mobileOK" => ""
3410     ),
3411     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3412     ),
3413 matthys 296 "mojeek" => array(
3414     "icon" => "mojeek",
3415     "title" => "Mojeek",
3416 joku 63 "rule" => array(
3417     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3418     ),
3419 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3420 joku 63 ),
3421     "momspider" => array(
3422     "icon" => "robot",
3423     "title" => "MOM Spider",
3424     "rule" => array(
3425     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3426     ),
3427     "uri" => ""
3428     ),
3429     "moreover" => array(
3430     "icon" => "moreover",
3431     "title" => "Moreover",
3432     "rule" => array(
3433     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3434     ),
3435     "uri" => ""
3436     ),
3437     "movabletype" => array(
3438     "icon" => "movabletype",
3439     "title" => "Movable Type",
3440     "rule" => array(
3441     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3442     ),
3443     "uri" => ""
3444     ),
3445     "mozdex" => array(
3446     "icon" => "mozdex",
3447     "title" => "MozDex",
3448     "rule" => array(
3449     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3450     ),
3451     "uri" => ""
3452     ),
3453     "mqbot" => array(
3454     "icon" => "robot",
3455     "title" => "MQbot",
3456     "rule" => array(
3457     "MQbot" => ""
3458     ),
3459     "uri" => ""
3460     ),
3461     "msnbot" => array(
3462     "icon" => "bing",
3463 matthys 205 "title" => "Bing",
3464 joku 63 "rule" => array(
3465     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3466     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3467     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3468     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3469     ),
3470     "uri" => ""
3471     ),
3472     "msnbot-mobile" => array(
3473     "icon" => "msn",
3474     "title" => "MSN Mobile",
3475     "rule" => array(
3476     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3477     "MSNBOT_Mobile" => "",
3478     "MSMOBOT" => ""
3479     ),
3480     "uri" => ""
3481     ),
3482     "mslivebot" => array(
3483     "icon" => "livesearch",
3484     "title" => "MS Live Search",
3485     "rule" => array(
3486     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3487     ),
3488     "uri" => ""
3489     ),
3490     "msproxy" => array(
3491     "icon" => "robot",
3492     "title" => "MSProxy",
3493     "rule" => array(
3494     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3495     ),
3496     "uri" => ""
3497     ),
3498     "msrbot" => array(
3499     "icon" => "robot",
3500     "title" => "MSRBOT",
3501     "rule" => array(
3502     "^MSRBOT" => ""
3503     ),
3504     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3505     ),
3506     "mswebdav" => array(
3507     "icon" => "robot",
3508     "title" => "MS-WebDAV",
3509     "rule" => array(
3510     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3511     ),
3512     "uri" => ""
3513     ),
3514     "mticon" => array(
3515     "icon" => "robot",
3516     "title" => "MTIcon",
3517     "rule" => array(
3518     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3519     ),
3520     "uri" => ""
3521     ),
3522     "multipage-validator" => array(
3523     "icon" => "multipage-validator",
3524     "title" => "Multipage Validator",
3525     "rule" => array(
3526     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3527     ),
3528     "uri" => "http://www.validator.ca/"
3529     ),
3530     "myrss" => array(
3531     "icon" => "rss",
3532     "title" => "MyRSS",
3533     "rule" => array(
3534     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3535     ),
3536     "uri" => ""
3537     ),
3538     "multimap" => array(
3539     "icon" => "robot",
3540     "title" => "Multimap",
3541     "rule" => array(
3542     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3543     ),
3544     "uri" => ""
3545     ),
3546     "najdi" => array(
3547     "icon" => "najdi",
3548     "title" => "Najdi.si",
3549     "rule" => array(
3550     "Najdi.si" => ""
3551     ),
3552     "uri" => "http://www.najdi.si"
3553     ),
3554     "nameprotect" => array(
3555     "icon" => "nameprotect",
3556     "title" => "Name Protect",
3557     "rule" => array(
3558     "NPBot" => ""
3559     ),
3560     "uri" => ""
3561     ),
3562     "nationaldirectory" => array(
3563     "icon" => "robot",
3564     "title" => "National Directory",
3565     "rule" => array(
3566     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3567     ),
3568     "uri" => ""
3569     ),
3570     "natsumican" => array(
3571     "icon" => "robot",
3572     "title" => "Natsu Mican",
3573     "rule" => array(
3574     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3575     ),
3576     "uri" => ""
3577     ),
3578     "naverbot" => array(
3579     "icon" => "naverbot",
3580     "title" => "Naver",
3581     "rule" => array(
3582     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3583     "Naver(Bot)?" => "",
3584     "^nabot" => ""
3585     ),
3586     "uri" => ""
3587     ),
3588     "navisso" => array(
3589     "icon" => "navisso",
3590     "title" => "Navisso",
3591     "rule" => array(
3592     "Navisso(Bot)?" => ""
3593     ),
3594     "uri" => "http://www.navisso.com"
3595     ),
3596     "neofonie" => array(
3597     "icon" => "robot",
3598 matthys 205 "title" => "Neofonie",
3599 joku 63 "rule" => array(
3600     "www.neofonie.de" => ""
3601     ),
3602     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3603     ),
3604     "neomo" => array(
3605     "icon" => "robot",
3606     "title" => "Neomo",
3607     "rule" => array(
3608     "Francis[ /]([0-9.]{1,10})" => "\\1"
3609     ),
3610     "uri" => ""
3611     ),
3612     "nessus" => array(
3613     "icon" => "nessus",
3614     "title" => "Nessus",
3615     "rule" => array(
3616     "Nessus\)$" => ""
3617     ),
3618     "uri" => ""
3619     ),
3620 matthys 279 "nerdybot" => array(
3621 matthys 280 "icon" => "robot",
3622     "title" => "NerdyBot",
3623     "rule" => array(
3624     "NerdyBot" => ""
3625     ),
3626     "uri" => "http://nerdybot.com/"
3627 matthys 279 ),
3628 joku 63 "nerdbynature" => array(
3629     "icon" => "nerdbynature",
3630     "title" => "NerdByNature",
3631     "rule" => array(
3632     "NerdByNature.Bot" => ""
3633     ),
3634     "uri" => "http://www.nerdbynature.net/bot"
3635     ),
3636     "netants" => array(
3637     "icon" => "netants",
3638     "title" => "NetAnts",
3639     "rule" => array(
3640     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3641     ),
3642     "uri" => ""
3643     ),
3644     "netcraft" => array(
3645     "icon" => "netcraft",
3646     "title" => "Netcraft",
3647     "rule" => array(
3648     "netcraft" => ""
3649     ),
3650     "uri" => ""
3651     ),
3652     "netinfo" => array(
3653     "icon" => "netinfo",
3654     "title" => "Netinfo",
3655     "rule" => array(
3656     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3657     ),
3658     "uri" => "http://netinfo.bg/"
3659     ),
3660     "netluchs" => array(
3661     "icon" => "netluchs",
3662     "title" => "Netluchs",
3663     "rule" => array(
3664     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3665     ),
3666     "uri" => "http://www.netluchs.de/"
3667     ),
3668     "netmechanic" => array(
3669     "icon" => "netmechanic",
3670     "title" => "NetMechanic",
3671     "rule" => array(
3672     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3673     ),
3674     "uri" => ""
3675     ),
3676     "netnose" => array(
3677     "icon" => "netnose",
3678     "title" => "NetNose",
3679     "rule" => array(
3680     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3681     ),
3682     "uri" => ""
3683     ),
3684     "netoskop" => array(
3685     "icon" => "robot",
3686     "title" => "Netoskop",
3687     "rule" => array(
3688     "netoskop" => ""
3689     ),
3690     "uri" => ""
3691     ),
3692     "netpromoter" => array(
3693     "icon" => "netpromoter",
3694     "title" => "NetPromoter",
3695     "rule" => array(
3696     "NetPromoter Spider" => ""
3697     ),
3698     "uri" => "http://www.net-promoter.com/"
3699     ),
3700     "netprospector" => array(
3701     "icon" => "robot",
3702     "title" => "Netprospector",
3703     "rule" => array(
3704     "^netprospector" => ""
3705     )
3706     ),
3707     "netpumper" => array(
3708     "icon" => "robot",
3709     "title" => "Netpumper",
3710     "rule" => array(
3711     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3712     ),
3713     "uri" => ""
3714     ),
3715     "netscapeproxy" => array(
3716     "icon" => "netscape",
3717     "title" => "Netscape Proxy",
3718     "rule" => array(
3719     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3720     ),
3721     "uri" => ""
3722     ),
3723     "netspective" => array(
3724     "icon" => "robot",
3725     "title" => "NetSpective",
3726     "rule" => array(
3727     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3728     ),
3729     "uri" => ""
3730     ),
3731     "netvibes" => array(
3732     "icon" => "netvibes",
3733     "title" => "Netvibes", // display name; the stray leading space was removed
3734     "rule" => array(
3735     "^Netvibes" => "" // pattern has no capture group, so a "\\1" note would reference nothing
3736     ),
3737     "uri" => ""
3738     ),
3739     "newsfire" => array(
3740     "icon" => "newsfire",
3741     "title" => "NewsFire",
3742     "rule" => array(
3743     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3744     ),
3745     "uri" => ""
3746     ),
3747     "newsgator" => array(
3748     "icon" => "newsgator",
3749     "title" => "NewsGator",
3750     "rule" => array(
3751     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3752     ),
3753     "uri" => ""
3754     ),
3755     "newzcrawler" => array(
3756     "icon" => "newzcrawler",
3757     "title" => "NewzCrawler",
3758     "rule" => array(
3759     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3760     ),
3761     "uri" => ""
3762     ),
3763     "nextopia" => array(
3764     "icon" => "robot", // generic icon; "newzcrawler" was copy-pasted from the entry above
3765     "title" => "Nextopia", // was "NewzCrawler" (copy-paste), which mislabelled NextopiaBOT hits
3766     "rule" => array(
3767     "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
3768     ),
3769     "uri" => ""
3770     ),
3771     "ngsearch" => array(
3772     "icon" => "ngsearch",
3773     "title" => "NG Search",
3774     "rule" => array(
3775     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3776     ),
3777     "uri" => ""
3778     ),
3779     "nimble" => array(
3780     "icon" => "robot",
3781     "title" => "Nimble",
3782     "rule" => array(
3783     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3784     ),
3785     "uri" => ""
3786     ),
3787     "nmap" => array(
3788     "icon" => "nmap",
3789     "title" => "Nmap",
3790     "rule" => array(
3791     "Nmap Scripting Engine" => ""
3792     ),
3793     "uri" => "http://nmap.org/book/nse.html"
3794     ),
3795     "nusearch" => array(
3796     "icon" => "robot",
3797     "title" => "NuSearch",
3798     "rule" => array(
3799     "^nuSearch" => ""
3800     ),
3801     "uri" => "http://www.nusearch.com/"
3802     ),
3803     "noago" => array(
3804     "icon" => "noago",
3805     "title" => "Noago",
3806     "rule" => array(
3807     "Noago Spider" => ""
3808     ),
3809     "uri" => "http://www.noago.com/"
3810     ),
3811     "noviforum" => array(
3812     "icon" => "noviforum",
3813     "title" => "Noviforum",
3814     "rule" => array(
3815     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3816     ),
3817     "uri" => ""
3818     ),
3819     "noxtrum" => array(
3820     "icon" => "noxtrum",
3821     "title" => "noXtrum",
3822     "rule" => array(
3823     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3824     ),
3825     "uri" => ""
3826     ),
3827     "noyona" => array(
3828     "icon" => "robot",
3829     "title" => "Noyona",
3830     "rule" => array(
3831     "noyona.([0-9._]{1,10})" => "\\1"
3832     ),
3833     "uri" => "http://noyona.com/"
3834     ),
3835     "nsauditor" => array(
3836     "icon" => "nsauditor",
3837     "title" => "Nsauditor",
3838     "rule" => array(
3839     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3840     ),
3841     "uri" => "http://www.nsauditor.com/"
3842     ),
3843     "obidosbot" => array(
3844     "icon" => "robot",
3845     "title" => "Bookwatch",
3846     "rule" => array(
3847     "obidos[ \-]?bot" => ""
3848     ),
3849     "uri" => ""
3850     ),
3851     "objectssearch" => array(
3852     "icon" => "robot",
3853     "title" => "Objects Search",
3854     "rule" => array(
3855     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3856     ),
3857     "uri" => ""
3858     ),
3859     "obot" => array(
3860 matthys 297 "icon" => "ibm",
3861     "title" => "IBM (ONLY) Crawler",
3862 joku 63 "rule" => array(
3863 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3864 joku 63 ),
3865 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3866     // Previously from "ONLY Solutions GmbH" – that is what the O stands for
3867 joku 63 ),
3868     "ocawa" => array(
3869     "icon" => "ocawa",
3870     "title" => "Ocawa",
3871     "rule" => array(
3872     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3873     "Ocawa" => ""
3874     ),
3875     "uri" => "http://www.ocawa.com/"
3876     ),
3877     "octora" => array(
3878     "icon" => "octora",
3879     "title" => "Octora",
3880     "rule" => array(
3881     "^Octora (Beta)?" => ""
3882     ),
3883     "uri" => "http://www.octora.com/"
3884     ),
3885     "offlineexplorer" => array(
3886     "icon" => "robot",
3887     "title" => "OfflineExplorer",
3888     "rule" => array(
3889     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3890     ),
3891     "uri" => ""
3892     ),
3893     "omea" => array(
3894     "icon" => "omea",
3895     "title" => "Omea Reader",
3896     "rule" => array(
3897     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3898     ),
3899     "uri" => ""
3900     ),
3901     "onet" => array(
3902     "icon" => "onet",
3903     "title" => "Onet",
3904     "rule" => array(
3905     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3906     "Onet\.pl" => "",
3907     "inktomi.search.onet" => ""
3908     ),
3909     "uri" => "http://www.onet.pl"
3910     ),
3911     "online24" => array(
3912     "icon" => "robot",
3913 matthys 209 "title" => "Online24",
3914 joku 63 "rule" => array(
3915     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3916     ),
3917     "uri" => "http://www.online24.de"
3918     ),
3919     "onlinewebcheck" => array(
3920     "icon" => "csehtmlvalidator",
3921     "title" => "CSE HTML Validator",
3922     "rule" => array(
3923     "onlinewebcheck" => ""
3924     ),
3925     "uri" => "http://www.onlinewebcheck.com"
3926     ),
3927     "onsearch" => array(
3928     "icon" => "onsearch",
3929 matthys 209 "title" => "OnSearch",
3930 joku 63 "rule" => array(
3931     "^onCHECK-Robot" => ""
3932     ),
3933     "uri" => "http://www.onsearch.de"
3934     ),
3935     "onto" => array(
3936     "icon" => "robot",
3937     "title" => "OntoSpider",
3938     "rule" => array(
3939     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
3940     ),
3941     "uri" => "http://ontospider.i-n.info/"
3942     ),
3943     "openacoon" => array(
3944     "icon" => "robot",
3945     "title" => "OpenAcoon",
3946     "rule" => array(
3947     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
3948     ),
3949     "uri" => "http://www.openacoon.de/"
3950     ),
3951     "openfind" => array(
3952     "icon" => "openfind",
3953     "title" => "Openfind",
3954     "rule" => array(
3955     "openbot[ /]([0-9.]{1,10})" => "\\1",
3956     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
3957     ),
3958     "uri" => ""
3959     ),
3960     "opentagger" => array(
3961     "icon" => "robot",
3962     "title" => "OpenTagger",
3963     "rule" => array(
3964     "^OpenTaggerBot" => ""
3965     ),
3966     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
3967     ),
3968     "opentext" => array(
3969     "icon" => "opentext",
3970     "title" => "OpenText",
3971     "rule" => array(
3972     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
3973     ),
3974     "uri" => "http://www.opentext.net/"
3975     ),
3976     "openweb" => array(
3977     "icon" => "robot",
3978     "title" => "OpenWebSpider",
3979     "rule" => array(
3980     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
3981     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
3982     ),
3983     "uri" => "http://www.openwebspider.org"
3984     ),
3985     "openx" => array(
3986     "icon" => "openx",
3987     "title" => "OpenX Spider",
3988     "rule" => array(
3989     "OpenX" => ""
3990     ),
3991     "uri" => "http://www.openx.org"
3992     ),
3993     "orange" => array(
3994     "icon" => "orange",
3995     "title" => "Orange",
3996     "rule" => array(
3997     "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1"
3998     ),
3999     "uri" => "http://orange.com/"
4000     ),
4001     "organica" => array(
4002     "icon" => "robot",
4003     "title" => "Organica",
4004     "rule" => array(
4005     "crawler@organica\.us" => ""
4006     ),
4007     "uri" => ""
4008     ),
4009     "outfox" => array(
4010     "icon" => "robot",
4011     "title" => "Outfox Melon",
4012     "rule" => array(
4013     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4014     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4015     ),
4016     "uri" => ""
4017     ),
4018     "overture" => array(
4019     "icon" => "overture",
4020     "title" => "Overture",
4021     "rule" => array(
4022     "Overture[ \-]?WebCrawler" => ""
4023     ),
4024     "uri" => ""
4025     ),
4026 joku 337 "owler" => array(
4027     "icon" => "robot",
4028     "title" => "Owler",
4029     "rule" => array(
4030     "Owler[ /]([0-9.]{1,10})" => "\\1",
4031     "Owler" => ""
4032     ),
4033     "uri" => ""
4034     ),
4035 joku 63 "page2rss" => array(
4036     "icon" => "page2rss",
4037     "title" => "Page2RSS",
4038     "rule" => array(
4039     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4040     ),
4041     "uri" => "http://page2rss.com"
4042     ),
4043     "pagebytes" => array(
4044     "icon" => "robot",
4045     "title" => "PageBites",
4046     "rule" => array(
4047     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4048     ),
4049     "uri" => ""
4050     ),
4051 matthys 282 "pagesinventory" => array(
4052     "icon" => "pagesinventory",
4053     "title" => "PagesInventory",
4054     "rule" => array(
4055     "^PagesInventory" => ""
4056     ),
4057     "uri" => "http://www.pagesinventory.com"
4058     ),
4059 joku 63 "pagesjaunes" => array(
4060     "icon" => "pagesjaunes",
4061     "title" => "Pages Jaunes",
4062     "rule" => array(
4063     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4064     ),
4065     "uri" => "http://www.pagesjaunes.fr/"
4066     ),
4067     "pagevalet" => array(
4068     "icon" => "wdg",
4069     "title" => "WDG Page Valet",
4070     "rule" => array(
4071     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4072     ),
4073     "uri" => "http://www.htmlhelp.com/tools/validator/"
4074     ),
4075     "panopeabot" => array(
4076     "icon" => "robot",
4077     "title" => "PanopeaBot",
4078     "rule" => array(
4079     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4080     ),
4081     "uri" => ""
4082     ),
4083     "parchmenthill" => array(
4084     "icon" => "robot",
4085     "title" => "Parchment Hill",
4086     "rule" => array(
4087     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4088     ),
4089     "uri" => "http://www.parchmenthill.com/search.htm"
4090     ),
4091     "pascient" => array(
4092     "icon" => "pascient", // key and icon keep the historical spelling; they are identifiers
4093     "title" => "Panscient", // display name spelled as in the rule and uri below
4094     "rule" => array(
4095     "panscient.com" => ""
4096     ),
4097     "uri" => "http://www.panscient.com/"
4098     ),
4099     "peerbot" => array(
4100     "icon" => "peerbot",
4101     "title" => "Peerbot",
4102     "rule" => array(
4103     "^PEERbot" => ""
4104     ),
4105     "uri" => ""
4106     ),
4107     "php" => array(
4108     "icon" => "php",
4109     "title" => "PHP",
4110     "rule" => array(
4111     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4112     ),
4113     "uri" => ""
4114     ),
4115     "phpcrawl" => array(
4116     "icon" => "robot",
4117     "title" => "PHPCrawl",
4118     "rule" => array(
4119     "^PHPCrawl" => ""
4120     ),
4121     "uri" => "http://phpcrawl.cuab.de/"
4122     ),
4123     "phpdig" => array(
4124     "icon" => "robot",
4125     "title" => "PhpDig",
4126     "rule" => array(
4127     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4128     ),
4129     "uri" => "http://www.finbot.com/"
4130     ),
4131     "phpversiontracker" => array(
4132     "icon" => "phpversiontracker",
4133     "title" => "PHP version tracker",
4134     "rule" => array(
4135     "^PHP version tracker" => ""
4136     ),
4137     "uri" => "http://www.nexen.net/phpversion/bot.php"
4138     ),
4139     "pictureofinternet" => array(
4140     "icon" => "robot",
4141     "title" => "PictureOfInternet",
4142     "rule" => array(
4143     "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // use the captured number, as sibling entries with a capture group do
4144     ),
4145     "uri" => ""
4146     ),
4147     "pingdom" => array(
4148     "icon" => "pingdom",
4149     "title" => "Pingdom",
4150     "rule" => array(
4151     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4152     "^Pingdom" => ""
4153     ),
4154     "uri" => "http://www.pingdom.com/"
4155     ),
4156     "pinseri" => array(
4157     "icon" => "pinseri",
4158     "title" => "Pinseri",
4159     "rule" => array(
4160     "www\.pinseri\.com/bloglist" => ""
4161     ),
4162     "uri" => ""
4163     ),
4164     "plagger" => array(
4165     "icon" => "plagger",
4166     "title" => "Plagger",
4167     "rule" => array(
4168     "Plagger[ /]([0-9.]{1,10})" => "\\1"
4169     ),
4170     "uri" => "http://plagger.org/" // was misspelled "plugger.org"
4171     ),
4172     "planet" => array(
4173     "icon" => "planet",
4174     "title" => "Planet",
4175     "rule" => array(
4176     "Planet[ /]([0-9.]{1,10})" => "\\1"
4177     ),
4178     "uri" => ""
4179     ),
4180     "plantynet" => array(
4181     "icon" => "robot",
4182     "title" => "PlantyNet",
4183     "rule" => array(
4184     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4185     ),
4186     "uri" => ""
4187     ),
4188     "pluck" => array(
4189     "icon" => "pluck",
4190     "title" => "Pluck",
4191     "rule" => array(
4192     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4193     ),
4194     "uri" => ""
4195     ),
4196     "plsearch" => array(
4197     "icon" => "plsearch",
4198     "title" => "PlanetSearch",
4199     "rule" => array(
4200     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4201     ),
4202     "uri" => ""
4203     ),
4204     "poe" => array(
4205     "icon" => "robot",
4206     "title" => "POE-Component",
4207     "rule" => array(
4208     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4209     ),
4210     "uri" => ""
4211     ),
4212     "pogodak" => array(
4213     "icon" => "pogodak",
4214     "title" => "Pogodak",
4215     "rule" => array(
4216     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4217     ),
4218     "uri" => ""
4219     ),
4220     "poodle" => array(
4221     "icon" => "robot",
4222     "title" => "Poodle predictor",
4223     "rule" => array(
4224     "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is (oo|ooo); the number is group 2
4225     "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when no number follows the name
4226     ),
4227     "uri" => "http://www.gritechnologies.com/tools/spider.go"
4228     ),
4229     "pompos" => array(
4230     "icon" => "pompos",
4231     "title" => "Pompos",
4232     "rule" => array(
4233     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4234     ),
4235     "uri" => ""
4236     ),
4237     "popdex" => array(
4238     "icon" => "robot",
4239     "title" => "Popdexter",
4240     "rule" => array(
4241     "Popdexter" => ""
4242     ),
4243     "uri" => ""
4244     ),
4245     "postrank" => array(
4246     "icon" => "postrank",
4247     "title" => "PostRank",
4248     "rule" => array(
4249     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4250     ),
4251     "uri" => "http://www.postrank.com/"
4252     ),
4253     "powermarks" => array(
4254     "icon" => "robot",
4255     "title" => "Powermarks",
4256     "rule" => array(
4257     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4258     ),
4259     "uri" => ""
4260     ),
4261     "probe" => array(
4262     "icon" => "robot",
4263     "title" => "PROBE!",
4264     "rule" => array(
4265     "^PROBE!" => ""
4266     ),
4267     "uri" => ""
4268     ),
4269     "projecthoneypot" => array(
4270     "icon" => "projecthoneypot",
4271     "title" => "Project Honeypot",
4272     "rule" => array(
4273     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4274     "projecthoneypot" => ""
4275     ),
4276     "uri" => "http://www.projecthoneypot.org"
4277     ),
4278     "proxycache" => array(
4279     "icon" => "robot",
4280     "title" => "Proxy Cache",
4281     "rule" => array(
4282     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4283     ),
4284     "uri" => ""
4285     ),
4286     "proxyhunter" => array(
4287     "icon" => "robot",
4288     "title" => "ProxyHunter",
4289     "rule" => array(
4290     "ProxyHunter" => ""
4291     ),
4292     "uri" => ""
4293     ),
4294     "psbot" => array(
4295     "icon" => "picsearch",
4296     "title" => "PicSearch",
4297     "rule" => array(
4298     "^psbot" => ""
4299     ),
4300     "uri" => ""
4301     ),
4302     "pubsub" => array(
4303     "icon" => "pubsub",
4304     "title" => "PubSub",
4305     "rule" => array(
4306     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4307     "^PubSub\.com" => ""
4308     ),
4309     "uri" => ""
4310     ),
4311 joku 330 "pubarch" => array(
4312 joku 334 "icon" => "robot",
4313 joku 330 "title" => "PubArchive",
4314     "rule" => array(
4315     "publiclibraryarchive.org" => ""
4316     ),
4317     "uri" => ""
4318     ),
4319 joku 63 "pukiwiki" => array(
4320     "icon" => "pukiwiki",
4321     "title" => "PukiWiki",
4322     "rule" => array(
4323     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4324     ),
4325     "uri" => ""
4326     ),
4327     "pwebotxy" => array(
4328     "icon" => "pwebotxy",
4329     "title" => "PWeBot/X.Y",
4330     "rule" => array(
4331     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4332     ),
4333     "uri" => "http://www.programacionweb.net/robot.php"
4334     ),
4335     "pxys" => array(
4336     "icon" => "robot",
4337     "title" => "PXYS",
4338     "rule" => array(
4339     "^pxys" => ""
4340     ),
4341     "uri" => ""
4342     ),
4343     "qango" => array(
4344     "icon" => "qango",
4345     "title" => "Qango",
4346     "rule" => array(
4347     "^Qango.com" => ""
4348     ),
4349     "uri" => "http://www.qango.com/" // was "quango.com", which does not match the name in the rule above
4350     ),
4351     "qihoo" => array(
4352     "icon" => "qihoo",
4353     "title" => "Qihoo",
4354     "rule" => array(
4355     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4356     ),
4357     "uri" => "http://www.qihoo.com/"
4358     ),
4359     "qseero" => array(
4360     "icon" => "robot",
4361     "title" => "Qseero",
4362     "rule" => array(
4363     "Qseero v([0-9.]{1,10})" => "\\1"
4364     ),
4365     "uri" => "http://www.q0.com/"
4366     ),
4367     "quantcast" => array(
4368     "icon" => "robot",
4369     "title" => "Quantcast",
4370     "rule" => array(
4371     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4372     ),
4373     "uri" => "http://www.quantcast.com/"
4374     ),
4375     "quepasa" => array(
4376     "icon" => "quepasa",
4377     "title" => "Quepasa",
4378     "rule" => array(
4379     "Quepasa[ \-]?Creep" => ""
4380     ),
4381     "uri" => ""
4382     ),
4383     "questfinder" => array(
4384     "icon" => "robot",
4385     "title" => "QuestFinder",
4386     "rule" => array(
4387     "www\.questfinder\.com" => ""
4388     ),
4389     "uri" => ""
4390     ),
4391     "qweery" => array(
4392     "icon" => "robot",
4393     "title" => "Qweery",
4394     "rule" => array(
4395     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4396     ),
4397     "uri" => "http://qweerybot.qweery.nl"
4398     ),
4399     "racaicrawler" => array(
4400     "icon" => "robot",
4401     "title" => "RacaiCrawler",
4402     "rule" => array(
4403     "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
4404     )
4405     ),
4406     "radian6" => array(
4407     "icon" => "robot",
4408     "title" => "Radian6",
4409     "rule" => array(
4410     "www\.radian6\.com" => ""
4411     ),
4412     "uri" => "http://www.radian6.com"
4413     ),
4414     "rambler" => array(
4415     "icon" => "rambler",
4416     "title" => "Rambler",
4417     "rule" => array(
4418     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4419     ),
4420     "uri" => ""
4421     ),
4422     "ramiba" => array(
4423     "icon" => "robot",
4424 matthys 209 "title" => "Ramiba",
4425 joku 63 "rule" => array(
4426     "^ramiba(-bot)?" => "" // the only group is the optional "-bot" suffix, not a number, so nothing is reported
4427     ),
4428     "uri" => ""
4429     ),
4430     "rankur" => array(
4431     "icon" => "rankur",
4432     "title" => "Rankur",
4433     "rule" => array(
4434     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4435     ),
4436     "uri" => "http://rankur.com/",
4437     ),
4438 joku 261 "red" => array(
4439     "icon" => "red",
4440     "title" => "RED",
4441     "rule" => array(
4442     "RED[ /]([0-9.]{1,10})" => "\\1"
4443     ),
4444     "uri" => "http://redbot.org/"
4445 joku 181 ),
4446 joku 63 "rediff" => array(
4447     "icon" => "rediff",
4448 matthys 209 "title" => "Rediff",
4449 joku 63 "rule" => array(
4450     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4451     ),
4452     "uri" => "http://www.rediff.com",
4453     ),
4454     "repia" => array(
4455     "icon" => "robot",
4456     "title" => "Repia",
4457     "rule" => array(
4458     "webmaster@repia\.com" => ""
4459     ),
4460     "uri" => ""
4461     ),
4462     "robotgenius" => array(
4463     "icon" => "robot",
4464     "title" => "Robot Genius",
4465     "rule" => array(
4466     "^robotgenius" => ""
4467     ),
4468     "uri" => "http://robotgenius.net",
4469     ),
4470     "robozilla" => array(
4471     "icon" => "robot",
4472     "title" => "Robozilla",
4473     "rule" => array(
4474     "Robozilla" => ""
4475     ),
4476     "uri" => ""
4477     ),
4478 matthys 302 "rogerbot" => array(
4479 matthys 306 "icon" => "moz",
4480     "title" => "Moz Rogerbot",
4481 matthys 302 "rule" => array(
4482     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4483     ),
4484     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4485     ),
4486 joku 63 "rojo" => array(
4487     "icon" => "rojo",
4488     "title" => "Rojo",
4489     "rule" => array(
4490     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4491     ),
4492     "uri" => ""
4493     ),
4494     "rss-atom" => array(
4495     "icon" => "rss",
4496     "title" => "RSS / Atom",
4497     "rule" => array(
4498     "^Apple-PubSub" => "",
4499     "^AppleSyndication" => ""
4500     ),
4501     "uri" => ""
4502     ),
4503     "rssbot" => array(
4504     "icon" => "rss",
4505 matthys 209 "title" => "RSS-bot",
4506 joku 63 "rule" => array(
4507     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4508     ),
4509     "uri" => ""
4510     ),
4511     "rssbandit" => array(
4512     "icon" => "rssbandit",
4513     "title" => "RssBandit",
4514     "rule" => array(
4515     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4516     ),
4517     "uri" => ""
4518     ),
4519     "rssimages" => array(
4520     "icon" => "rss",
4521 matthys 209 "title" => "RssImages",
4522 joku 63 "rule" => array(
4523     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4524     ),
4525     "uri" => ""
4526     ),
4527     "rssmicro" => array(
4528     "icon" => "rssmicro",
4529     "title" => "RSSMicro",
4530     "rule" => array(
4531     "RSSMicro\.com" => ""
4532     ),
4533     "uri" => "http://www.rssmicro.com"
4534     ),
4535     "rssowl" => array(
4536     "icon" => "rssowl",
4537     "title" => "RSSOwl",
4538     "rule" => array(
4539     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4540     ),
4541     "uri" => ""
4542     ),
4543     "rssreader" => array(
4544     "icon" => "rss",
4545     "title" => "RssReader",
4546     "rule" => array(
4547     "RssReader[ /]([0-9.]{1,10})" => "\\1" // use the captured number, as sibling entries with a capture group do
4548     ),
4549     "uri" => ""
4550     ),
4551     "rtgi" => array(
4552     "icon" => "rtgi",
4553 matthys 209 "title" => "Rtgi",
4554 joku 63 "rule" => array(
4555     "RTGI" => ""
4556     ),
4557     "uri" => "http://rtgi.fr/"
4558     ),
4559     "rufusbot" => array(
4560     "icon" => "robot",
4561     "title" => "RufusBot",
4562     "rule" => array(
4563     "RufusBot" => ""
4564     ),
4565     "uri" => ""
4566     ),
4567 matthys 304 "runet" => array(
4568     "icon" => "runet",
4569     "title" => "iTrack RuNet Crawler",
4570     "rule" => array(
4571     "Runet-Research-Crawler" => ""
4572     ),
4573     "uri" => "http://www.itrack.ru/research/cmsrate/"
4574     ),
4575 joku 63 "runnk" => array(
4576     "icon" => "robot",
4577     "title" => "Runnk",
4578     "rule" => array(
4579     "Runnk RSS finder" => ""
4580     ),
4581     "uri" => "http://www.runnk.com/il/law"
4582     ),
4583     "sagool" => array(
4584     "icon" => "robot",
4585     "title" => "Sagool",
4586     "rule" => array(
4587     "MaSagool" => ""
4588     ),
4589     "uri" => "http://sagool.jp/"
4590     ),
4591     "sanszbot" => array(
4592     "icon" => "robot",
4593     "title" => "Sansz",
4594     "rule" => array(
4595     "SanszBot" => ""
4596     ),
4597     "uri" => ""
4598     ),
4599     "saucereader" => array(
4600     "icon" => "saucereader",
4601     "title" => "Sauce Reader",
4602     "rule" => array(
4603     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4604     ),
4605     "uri" => ""
4606     ),
4607     "sbider" => array(
4608     "icon" => "sbider",
4609     "title" => "SBIder",
4610     "rule" => array(
4611     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4612     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4613     ),
4614     "uri" => ""
4615     ),
4616     "scirus" => array(
4617     "icon" => "robot",
4618     "title" => "Scirus",
4619     "rule" => array(
4620     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4621     ),
4622     "uri" => ""
4623     ),
4624     "scoutjet" => array(
4625     "icon" => "scoutjet",
4626     "title" => "ScoutJet",
4627     "rule" => array(
4628     "ScoutJet" => ""
4629     ),
4630     "uri" => "http://www.scoutjet.com/"
4631     ),
4632 joku 261 "scrapy" => array(
4633     "icon" => "scrapy",
4634     "title" => "Scrapy",
4635     "rule" => array(
4636     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4637     ),
4638     "uri" => "http://scrapy.org"
4639     ),
4640 joku 63 "scrubby" => array(
4641     "icon" => "scrubby",
4642     "title" => "Scrubby",
4643     "rule" => array(
4644     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4645     ),
4646     "uri" => ""
4647     ),
4648     "sdm" => array(
4649     "icon" => "sdm",
4650     "title" => "SUN Download Manager",
4651     "rule" => array(
4652     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4653     ),
4654     "uri" => ""
4655     ),
4656     "sealinks" => array(
4657     "icon" => "robot",
4658     "title" => "Sea Links",
4659     "rule" => array(
4660     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4661     ),
4662     "uri" => ""
4663     ),
4664     "search17" => array(
4665     "icon" => "robot",
4666     "title" => "Search 17",
4667     "rule" => array(
4668     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4669     ),
4670     "uri" => "http://www.search17.com/bot.php"
4671     ),
4672     "search2" => array(
4673     "icon" => "search2",
4674     "title" => "Search2.net",
4675     "rule" => array(
4676     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4677     ),
4678     "uri" => "http://search2.net/"
4679     ),
4680     "searchbot" => array(
4681     "icon" => "robot",
4682     "title" => "Searchbot",
4683     "rule" => array(
4684     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4685     ),
4686     "uri" => ""
4687     ),
4688     "searchch" => array(
4689     "icon" => "robot",
4690     "title" => "Search.ch",
4691     "rule" => array(
4692     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4693     ),
4694     "uri" => ""
4695     ),
4696     "searchengineworld" => array(
4697     "icon" => "robot",
4698     "title" => "SearchEngineWorld",
4699     "rule" => array(
4700     "searchengineworld" => ""
4701     ),
4702     "uri" => "http://www.searchengineworld.com/"
4703     ),
4704     "searchhippo" => array(
4705     "icon" => "searchhippo",
4706     "title" => "Searchhippo",
4707     "rule" => array(
4708     "searchhippo" => ""
4709     ),
4710     "uri" => "http://www.searchhippo.com/"
4711     ),
4712     "searchthruus" => array(
4713     "icon" => "robot",
4714     "title" => "SearchThruUs",
4715     "rule" => array(
4716     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4717     ),
4718     "uri" => ""
4719     ),
4720     "securecomputing" => array(
4721     "icon" => "robot",
4722     "title" => "Secure Computing",
4723     "rule" => array(
4724     "securecomputing" => ""
4725     ),
4726     "uri" => ""
4727     ),
4728     "seekport" => array(
4729     "icon" => "seekport",
4730     "title" => "Seekport",
4731     "rule" => array(
4732     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4733     ),
4734     "uri" => ""
4735     ),
4736     "semanticdiscovery" => array(
4737     "icon" => "robot",
4738     "title" => "Semantic Discovery",
4739     "rule" => array(
4740     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4741     ),
4742     "uri" => ""
4743     ),
4744 matthys 319 "semrush" => array(
4745     "icon" => "semrush",
4746     "title" => "SEMrush",
4747     "rule" => array(
4748     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4749     ),
4750     "uri" => "http://www.semrush.com/bot.html"
4751     ),
4752 joku 63 "sengine" => array(
4753     "icon" => "sengine",
4754     "title" => "Sengine",
4755     "rule" => array(
4756     "netEstate NE Crawler" => ""
4757     ),
4758     "uri" => "http://www.sengine.info/"
4759     ),
4760     "sensis" => array(
4761     "icon" => "sensis",
4762     "title" => "Sensis",
4763     "rule" => array(
4764     "^Sensis(.com.au)? Web Crawler" => ""
4765     ),
4766     "uri" => "http://sensis.com.au"
4767     ),
4768     "seokicks" => array(
4769     "icon" => "seokicks",
4770     "title" => "SEOkicks",
4771     "rule" => array(
4772     "SEOkicks-Robot" => ""
4773     ),
4774     "uri" => "http://www.seokicks.de/"
4775     ),
4776     "seoprofiler" => array(
4777     "icon" => "seoprofiler",
4778     "title" => "SEOprofiler",
4779     "rule" => array(
4780     "spbot[ /]([0-9.]{1,10})" => "\\1"
4781     ),
4782     "uri" => "http://www.seoprofiler.com/"
4783     ),
4784     "setooz" => array(
4785     "icon" => "setooz",
4786     "title" => "Setooz",
4787     "rule" => array(
4788     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4789     ),
4790     "uri" => "http://www.setooz.com/oozbot.html"
4791     ),
4792     "seznam" => array(
4793     "icon" => "seznam",
4794     "title" => "Seznam",
4795     "rule" => array(
4796     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4797     "Seznam" => ""
4798     ),
4799     "uri" => "http://www.seznam.cz"
4800     ),
4801     "sharpreader" => array(
4802     "icon" => "sharpreader",
4803     "title" => "SharpReader",
4804     "rule" => array(
4805     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4806     ),
4807     "uri" => ""
4808     ),
// Shelob crawler (the uri points at GMX). The title previously read
// "Sherlock Spider", which is the title of the separate "sherlockspider"
// entry below and made the two robots indistinguishable by title.
// NOTE(review): "Shelob" is taken from the key/icon/rule of this entry;
// confirm the preferred display name.
"shelob" => array(
  "icon" => "shelob",
  "title" => "Shelob",
  "rule" => array(
    "^Shelob" => ""
  ),
  "uri" => "http://www.gmx.net"
),
4817     "sherlockspider" => array(
4818     "icon" => "robot",
4819     "title" => "Sherlock Spider",
4820     "rule" => array(
4821     "sherlock_spider" => ""
4822     ),
4823     "uri" => ""
4824     ),
4825     "shim" => array(
4826     "icon" => "robot",
4827     "title" => "Shim Crawler",
4828     "rule" => array(
4829     "shim[ \-]crawler" => ""
4830     ),
4831     "uri" => ""
4832     ),
4833     "shopwiki" => array(
4834     "icon" => "shopwiki",
4835     "title" => "ShopWiki",
4836     "rule" => array(
4837     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4838     ),
4839     "uri" => ""
4840     ),
4841     "shoula" => array(
4842     "icon" => "robot",
4843     "title" => "Shoula",
4844     "rule" => array(
4845     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4846     ),
4847     "uri" => "http://www.shoula.com"
4848     ),
4849     "siege" => array(
4850     "icon" => "robot",
4851     "title" => "Siege",
4852     "rule" => array(
4853     "Siege[ /]([0-9.]{1,10})" => "\\1"
4854     ),
4855     "uri" => ""
4856     ),
4857     "siets" => array(
4858     "icon" => "robot",
4859     "title" => "Siets",
4860     "rule" => array(
4861     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4862     ),
4863     "uri" => ""
4864     ),
4865     "simpy" => array(
4866     "icon" => "simpy",
4867     "title" => "Simpy",
4868     "rule" => array(
4869     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4870     ),
4871     "uri" => ""
4872     ),
4873     "singingfish" => array(
4874     "icon" => "singingfish",
4875     "title" => "SingingFish",
4876     "rule" => array(
4877     "asterias[ /]([0-9.]{1,10})" => "\\1",
4878     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4879     "asterias" => ""
4880     ),
4881     "uri" => ""
4882     ),
4883     "sirketce" => array(
4884     "icon" => "robot",
4885     "title" => "Sirketce",
4886     "rule" => array(
4887     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4888     ),
4889     "uri" => "http://www.sirketce.com/bot.html"
4890     ),
4891     "sirobot" => array(
4892     "icon" => "robot",
4893     "title" => "SiroBot",
4894     "rule" => array(
4895     "sirobot" => ""
4896     ),
4897     "uri" => ""
4898     ),
4899     "sistrix" => array(
4900     "icon" => "sistrix",
4901     "title" => "SISTRIX",
4902     "rule" => array(
4903     "SISTRIX Crawler" => ""
4904     ),
4905     "uri" => "http://crawler.sistrix.net/"
4906     ),
4907     "sitebar" => array(
4908     "icon" => "sitebar",
4909     "title" => "SiteBar",
4910     "rule" => array(
4911     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
4912     ),
4913     "uri" => ""
4914     ),
4915     "sitebot" => array(
4916     "icon" => "sitebot",
4917     "title" => "SiteBot",
4918     "rule" => array(
4919     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
4920     ),
4921     "uri" => "http://www.sitebot.org/robot/"
4922     ),
4923 matthys 273 "siteexplorer" => array(
4924     "icon" => "siteexplorer",
4925     "title" => "SiteExplorer",
4926     "rule" => array(
4927     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
4928     ),
4929     "uri" => "http://siteexplorer.info/"
4930     ),
4931 joku 63 "sitesell" => array(
4932     "icon" => "sitesell",
4933     "title" => "SiteSell",
4934     "rule" => array(
4935     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
4936     ),
4937     "uri" => ""
4938     ),
4939     "sitespider" => array(
4940     "icon" => "robot",
4941     "title" => "SiteSpider",
4942     "rule" => array(
4943     "^SiteSpider" => ""
4944     ),
4945     "uri" => ""
4946     ),
4947     "sitesucker" => array(
4948     "icon" => "sitesucker",
4949     "title" => "SiteSucker",
4950     "rule" => array(
4951     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
4952     ),
4953     "uri" => "http://www.sitesucker.us/"
4954     ),
4955     "sitidi" => array(
4956     "icon" => "robot",
4957     "title" => "SitiDi",
4958     "rule" => array(
4959     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
4960     ),
4961     "uri" => ""
4962     ),
4963 joku 329 "sixy" => array(
4964     "icon" => "robot",
4965     "title" => "Sixy.ch",
4966     "rule" => array(
4967     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
4968     ),
4969     "uri" => "http://sixy.ch"
4970     ),
4971 joku 63 "skaffe" => array(
4972     "icon" => "robot",
4973     "title" => "Skaffe",
4974     "rule" => array(
4975     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
4976     ),
4977     "uri" => "http://www.skaffe.com"
4978     ),
4979     "skizzle" => array(
4980     "icon" => "skizzle",
4981     "title" => "Skizzle",
4982     "rule" => array(
4983     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
4984     ),
4985     "uri" => "http://www.skizzle.com"
4986     ),
4987     "slider" => array(
4988     "icon" => "robot",
4989     "title" => "Slider",
4990     "rule" => array(
4991     "^Slider[ /]([0-9.]{1,10})" => "\\1"
4992     ),
4993     "uri" => ""
4994     ),
4995     "slugch" => array(
4996     "icon" => "robot",
4997 matthys 209 "title" => "Slugch",
4998 joku 63 "rule" => array(
4999     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5000     ),
5001     "uri" => ""
5002     ),
5003     "smartware" => array(
5004     "icon" => "robot",
5005     "title" => "SmartWareSoft",
5006     "rule" => array(
5007     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5008     ),
5009     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5010     ),
5011     "snookit" => array(
5012     "icon" => "snookit",
5013     "title" => "Snookit",
5014     "rule" => array(
5015     "^snookit" => ""
5016     ),
5017     "uri" => "http://www.snookit.com/"
5018     ),
// Snoopy (PHP HTTP client class).
// Rule values are backreference templates into the pattern's capture groups
// (presumably the reported version; confirm against the matcher).
"snoopy" => array(
  "icon" => "robot",
  "title" => "Snoopy",
  "rule" => array(
    // The separator used to be a greedy ".+", which swallowed everything up
    // to the final digit/dot so group 1 held only the last character of the
    // version. "[^0-9]*" stops at the first digit, so the full version
    // string lands in group 1. Works in both POSIX and PCRE syntax.
    "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1",
    "sna-([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://snoopy.sourceforge.net/"
),
5028     "snyke" => array(
5029     "icon" => "robot",
5030     "title" => "Snyke",
5031     "rule" => array(
5032     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5033     ),
5034     "uri" => "http://www.snyke.com"
5035     ),
5036     "socialradar" => array(
5037     "icon" => "socialradar",
5038     "title" => "Social Radar",
5039     "rule" => array(
5040     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5041     ),
5042     "uri" => "http://infegy.com/"
5043     ),
5044     "soegning" => array(
5045     "icon" => "soegning",
5046 matthys 209 "title" => "Søgning",
5047 joku 63 "rule" => array(
5048     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5049     ),
5050     "uri" => ""
5051     ),
5052     "soft411" => array(
5053     "icon" => "soft411",
5054     "title" => "Soft411",
5055     "rule" => array(
5056     "SOFT411 Directory" => ""
5057     ),
5058     "uri" => ""
5059     ),
5060     "sogou" => array(
5061     "icon" => "sogou",
5062     "title" => "Sogou",
5063     "rule" => array(
5064     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5065     ),
5066     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5067     ),
5068     "sohu" => array(
5069     "icon" => "robot",
5070     "title" => "Sohu",
5071     "rule" => array(
5072     "sohu[ \-](agent|search)" => ""
5073     ),
5074     "uri" => ""
5075     ),
// Agents identifying themselves as "Mozilla@somewhere.com".
"somewhere" => array(
  "icon" => "robot",
  "title" => "Somewhere.com",
  "rule" => array(
    // The pattern has no capture group, so the former "\\1" template
    // referenced a group that never exists; use the empty template like the
    // other version-less rules in this table.
    "Mozilla\@somewhere\.com" => ""
  ),
  "uri" => "http://www.somewhere.com/"
),
5084     "sopheus" => array(
5085     "icon" => "robot",
5086     "title" => "Sopheus",
5087     "rule" => array(
5088     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5089     ),
5090     "uri" => "http://www.thenetplanet.com"
5091     ),
5092     "soso" => array(
5093     "icon" => "soso",
5094     "title" => "Soso",
5095     "rule" => array(
5096     "^Soso(image)?spider" => ""
5097     ),
5098     "uri" => "http://help.soso.com/soso-image-spider.htm"
5099     ),
5100     "souppot" => array(
5101     "icon" => "robot",
5102     "title" => "SoupPot",
5103     "rule" => array(
5104     "SoupPotBot" => ""
5105     ),
5106     "uri" => ""
5107     ),
5108     "specificmedia" => array(
5109     "icon" => "specificmedia",
5110     "title" => "Specific Media",
5111     "rule" => array(
5112     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5113     ),
5114     "uri" => ""
5115     ),
5116     "sphider" => array(
5117     "icon" => "sphider",
5118     "title" => "Sphider",
5119     "rule" => array(
5120     "Sphider" => ""
5121     ),
5122     "uri" => "http://www.sphider.eu"
5123     ),
5124     "spinn3r" => array(
5125     "icon" => "robot",
5126     "title" => "Spinn3r",
5127     "rule" => array(
5128     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5129     ),
5130     "uri" => "http://spinn3r.com/robot"
5131     ),
5132     "sproose" => array(
5133     "icon" => "robot",
5134 matthys 209 "title" => "Sproose",
5135 joku 63 "rule" => array(
5136     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5137     ),
5138     "uri" => "http://www.sproose.com/bot.html"
5139     ),
5140     "spurlbot" => array(
5141     "icon" => "robot",
5142     "title" => "SpurlBot",
5143     "rule" => array(
5144     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5145     ),
5146     "uri" => ""
5147     ),
5148     "stardownloader" => array(
5149     "icon" => "stardownloader",
5150     "title" => "Star Downloader",
5151     "rule" => array(
5152     "^Star Downloader( Pro)?" => ""
5153     ),
5154     "uri" => ""
5155     ),
5156     "steeler" => array(
5157     "icon" => "robot",
5158     "title" => "Steeler",
5159     "rule" => array(
5160     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5161     ),
5162     "uri" => ""
5163     ),
5164     "strategicboard" => array(
5165     "icon" => "strategicboard",
5166     "title" => "Strategic Board",
5167     "rule" => array(
5168     "Strategic Board Bot" => ""
5169     ),
5170     "uri" => "http://www.strategicboard.com"
5171     ),
5172     "suchbaer" => array(
5173     "icon" => "robot",
5174 matthys 209 "title" => "Suchbaer.de",
5175 joku 63 "rule" => array(
5176     "^suchbaer\.de" => ""
5177     ),
5178     "uri" => "http://www.suchbaer.de/"
5179     ),
5180     "suchbot" => array(
5181     "icon" => "robot",
5182 matthys 209 "title" => "Suchbot",
5183 joku 63 "rule" => array(
5184     "^suchbot" => ""
5185     ),
5186     "uri" => ""
5187     ),
5188     "suchende" => array(
5189     "icon" => "suchende",
5190 matthys 209 "title" => "Suchen.de",
5191 joku 63 "rule" => array(
5192     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5193     "^gonzo/([0-9.]{1,10})" => "\\1"
5194     ),
5195     "uri" => "http://www.suchen.de/"
5196     ),
5197     "suchknecht" => array(
5198     "icon" => "robot",
5199     "title" => "Suchknecht",
5200     "rule" => array(
5201     "^Suchknecht.at-Robot" => ""
5202     ),
5203     "uri" => "http://www.suchknecht.at/"
5204     ),
5205     "suchpad" => array(
5206     "icon" => "robot",
5207 matthys 209 "title" => "Suchpad",
5208 joku 63 "rule" => array(
5209     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5210     ),
5211     "uri" => "http://www.suchpad.de"
5212     ),
5213     "sunrise" => array(
5214     "icon" => "sunrise",
5215     "title" => "Sunrise",
5216     "rule" => array(
5217     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5218     ),
5219     "uri" => ""
5220     ),
5221     "superbot" => array(
5222     "icon" => "superbot",
5223     "title" => "SuperBot",
5224     "rule" => array(
5225     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5226     ),
5227     "uri" => ""
5228     ),
5229     "surfcontrol" => array(
5230     "icon" => "robot",
5231     "title" => "SurfControl",
5232     "rule" => array(
5233     "SurfControl" => "",
5234     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5235     ),
5236     "uri" => ""
5237     ),
5238     "surfnet" => array(
5239     "icon" => "robot",
5240     "title" => "SURFnet",
5241     "rule" => array(
5242     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5243     ),
5244     "uri" => ""
5245     ),
5246     "surfsafely" => array(
5247     "icon" => "robot",
5248     "title" => "Surfsafely",
5249     "rule" => array(
5250     "Submission Spider at surfsafely.com" => ""
5251     ),
5252     "uri" => "http://www.surfsafely.com"
5253     ),
// Surphace crawler, previously called Sphere Scout (hence the icon name).
"surphace" => array(
  "icon" => "spherescout",
  "title" => "Surphace",
  "rule" => array(
    // Previously called Sphere Scout. The separator used to be a greedy
    // ".+", which left only the last digit/dot of the agent string in
    // group 1; "[^0-9]*" stops at the first digit so the whole version is
    // captured.
    "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1",
    "Surphace.+v([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.surphace.com"
),
5263     "surveybot" => array(
5264     "icon" => "surveybot",
5265     "title" => "Whois Survey",
5266     "rule" => array(
5267     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5268     ),
5269     "uri" => ""
5270     ),
5271     "swoogle" => array(
5272     "icon" => "robot",
5273     "title" => "Swoogle",
5274     "rule" => array(
5275     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5276     ),
5277     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5278     ),
5279     "swse" => array(
5280     "icon" => "robot",
5281     "title" => "SWSE",
5282     "rule" => array(
5283     "sw\.deri\.org" => ""
5284     ),
5285     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5286     ),
5287     "swish-e" => array(
5288     "icon" => "swish-e",
5289     "title" => "Swish-e",
5290     "rule" => array(
5291     "^swish-e" => ""
5292     ),
5293     "uri" => "http://swish-e.org/"
5294     ),
5295     "sygol" => array(
5296     "icon" => "sygol",
5297     "title" => "Sygol",
5298     "rule" => array(
5299     "www.sygol.(com|net)" => ""
5300     ),
5301     "uri" => "http://www.sygol.com"
5302     ),
5303     "syllabs" => array(
5304     "icon" => "syllabs",
5305     "title" => "Syllabs",
5306     "rule" => array(
5307     "Focal[-]([0-9.]{1,10})" => "\\1"
5308     ),
5309     "uri" => "http://www.syllabs.com/crawler.html"
5310     ),
5311     "synapse" => array(
5312     "icon" => "robot",
5313     "title" => "Synapse",
5314     "rule" => array(
5315     " Synapse\)" => ""
5316     ),
5317     "uri" => "http://ws.apache.org/synapse/"
5318     ),
5319     "sync2it" => array(
5320     "icon" => "robot",
5321 matthys 209 "title" => "Sync2it",
5322 joku 63 "rule" => array(
5323     "^\!Susie" => ""
5324     ),
5325     "uri" => "http://www.sync2it.com/bms/susie.php"
5326     ),
5327     "syncit" => array(
5328     "icon" => "robot",
5329 matthys 209 "title" => "Syncit",
5330 joku 63 "rule" => array(
5331     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5332     ),
5333     "uri" => "http://www.syncit.com/"
5334     ),
5335     "syndic8" => array(
5336     "icon" => "syndic8",
5337     "title" => "Syndic8",
5338     "rule" => array(
5339     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5340     ),
5341     "uri" => "http://www.syndic8.com/"
5342     ),
5343     "syndicatie" => array(
5344     "icon" => "robot",
5345     "title" => "Syndicatie.nl",
5346     "rule" => array(
5347     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5348     "Syndicatie\.nl robot;" => ""
5349     ),
5350     "uri" => ""
5351     ),
5352     "synomia" => array(
5353     "icon" => "robot",
5354     "title" => "Synomia",
5355     "rule" => array(
5356     "^SynoBot" => ""
5357     ),
5358     "uri" => ""
5359     ),
5360     "synoo" => array(
5361     "icon" => "robot",
5362     "title" => "SynooBot",
5363     "rule" => array(
5364     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5365     ),
5366     "uri" => ""
5367     ),
5368     "szukacz" => array(
5369     "icon" => "szukacz",
5370     "title" => "Szukacz",
5371     "rule" => array(
5372     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5373     ),
5374     "uri" => ""
5375     ),
5376     "tagoo" => array(
5377     "icon" => "tagoobot",
5378     "title" => "Tagoo",
5379     "rule" => array(
5380     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5381     ),
5382     "uri" => "http://www.tagoo.ru"
5383     ),
5384     "tagword" => array(
5385     "icon" => "tagword",
5386     "title" => "Tagword",
5387     "rule" => array(
5388     "^Tagword" => ""
5389     ),
5390     "uri" => "http://tagword.com/dmoz_survey.php"
5391     ),
5392     "trailfire" => array(
5393     "icon" => "trailfire",
5394     "title" => "Trailfire",
5395     "rule" => array(
5396     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5397     ),
5398     "uri" => "http://trailfire.com"
5399     ),
5400     "tamu" => array(
5401     "icon" => "tamu",
5402     "title" => "Tamu Crawler",
5403     "rule" => array(
5404     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5405     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5406     ),
5407     "uri" => "http://irl.cs.tamu.edu/crawler/"
5408     ),
5409     "taptubot" => array(
5410     "icon" => "taptubot",
5411     "title" => "Taptu",
5412     "rule" => array(
5413     "taptubot" => ""
5414     ),
5415     "uri" => "http://www.taptu.com/corp/taptubot"
5416     ),
5417     "targetseek" => array(
5418     "icon" => "robot",
5419     "title" => "TargetSeek",
5420     "rule" => array(
5421     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5422     ),
5423     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5424     ),
5425     "taw" => array(
5426     "icon" => "taw",
5427     "title" => "TAW",
5428     "rule" => array(
5429     "TAW[ /]([0-9.]{1,10})" => "\\1"
5430     ),
5431     "uri" => "http://www.tawdis.net"
5432     ),
5433     "tcd" => array(
5434     "icon" => "tcd",
5435     "title" => "Trinity College Dublin",
5436     "rule" => array(
5437     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5438     ),
5439     "uri" => "http://www.tcd.ie"
5440     ),
5441     "technorati" => array(
5442     "icon" => "technorati",
5443     "title" => "Technorati",
5444     "rule" => array(
5445     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5446     ),
5447     "uri" => ""
5448     ),
5449     "teleport" => array(
5450     "icon" => "teleport",
5451     "title" => "Teleport",
5452     "rule" => array(
5453     "Teleport[ \-]?Pro" => ""
5454     ),
5455     "uri" => ""
5456     ),
5457     "terrar" => array(
5458     "icon" => "robot",
5459     "title" => "Terrar",
5460     "rule" => array(
5461     "^Fresh Search :: Terrar" => ""
5462     ),
5463     "uri" => ""
5464     ),
5465     "theophrastus" => array(
5466     "icon" => "robot",
5467     "title" => "Theophrastus",
5468     "rule" => array(
5469     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5470     ),
5471     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5472     ),
5473     "thumbnailscz" => array(
5474     "icon" => "robot",
5475 matthys 209 "title" => "Thumbnails.cz",
5476 joku 63 "rule" => array(
5477     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5478     ),
5479     "uri" => ""
5480     ),
// Thumbshots thumbnail crawler.
"thumbshot" => array(
  "icon" => "robot",
  "title" => "Thumbshots",
  "rule" => array(
    // Group 1 is the literal "Version: " / "v" prefix; the version number
    // itself is group 2, so the template must reference \\2 (same layout as
    // the "sealinks" and "tutorgig" rules, which also skip a leading group).
    "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2",
    "^thumbshots-de" => ""
  ),
  "uri" => "http://www.thumbshots.de"
),
5490     "thunderstone" => array(
5491     "icon" => "thunderstone",
5492     "title" => "Thunderstone",
5493     "rule" => array(
5494     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5495     "search.thunderstone.com" => ""
5496     ),
5497     "uri" => "http://search.thunderstone.com/"
5498     ),
5499     "timbobot" => array(
5500     "icon" => "robot",
5501 matthys 209 "title" => "TimboBot",
5502 joku 63 "rule" => array(
5503     "timboBot" => ""
5504     ),
5505     "uri" => ""
5506     ),
5507     "topsy" => array(
5508     "icon" => "topsy",
5509     "title" => "Topsy",
5510     "rule" => array(
5511     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5512     ),
5513     "uri" => "http://labs.topsy.com/butterfly.html"
5514     ),
5515     "trayce" => array(
5516     "icon" => "robot",
5517 matthys 209 "title" => "Trayce",
5518 joku 63 "rule" => array(
5519     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5520     ),
5521     "uri" => ""
5522     ),
5523     "tricus" => array(
5524     "icon" => "robot",
5525     "title" => "Tricus",
5526     "rule" => array(
5527     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5528     ),
5529     "uri" => ""
5530     ),
5531     "topicblogs" => array(
5532     "icon" => "robot",
5533     "title" => "Topicblogs",
5534     "rule" => array(
5535     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5536     ),
5537     "uri" => ""
5538     ),
5539     "touche" => array(
5540     "icon" => "touche",
5541 matthys 209 "title" => "Touché",
5542 joku 63 "rule" => array(
5543     "^Touche" => ""
5544     ),
5545     "uri" => "http://touche.com.ve"
5546     ),
// Tuezilla ODP entries agent.
// The title was stored double-encoded ("TÃœzilla"); restored to the intended
// "Ü" so it renders like the other non-ASCII titles in this table.
"tuezilla" => array(
  "icon" => "robot",
  "title" => "TÜzilla",
  "rule" => array(
    "tuezilla.de" => ""
  ),
  "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
),
5555     "turnitin" => array(
5556     "icon" => "turnitin",
5557     "title" => "Turnitin",
5558     "rule" => array(
5559     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5560     ),
5561     "uri" => ""
5562     ),
5563     "tutorgig" => array(
5564     "icon" => "robot",
5565     "title" => "TutorGig",
5566     "rule" => array(
5567     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5568     ),
5569     "uri" => ""
5570     ),
5571     "twiceler" => array(
5572     "icon" => "cuill",
5573 matthys 209 "title" => "Cuill",
5574 joku 63 "rule" => array(
5575     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5576     "Twiceler" => ""
5577     ),
5578     "uri" => "http://www.cuill.com/twiceler/robot.html"
5579     ),
5580     "twingly" => array(
5581     "icon" => "twingly",
5582     "title" => "Twingly",
5583     "rule" => array(
5584     "Twingly Recon" => ""
5585     ),
5586     "uri" => "http://www.twingly.com/"
5587     ),
5588 matthys 320 "twitter" => array(
5589     "icon" => "twitter",
5590     "title" => "Twitter",
5591     "rule" => array(
5592     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5593     ),
5594     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5595     ),
5596 joku 63 "typepad" => array(
5597     "icon" => "typepad",
5598     "title" => "TypePad",
5599     "rule" => array(
5600     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5601     ),
5602     "uri" => ""
5603     ),
5604     "udmsearch" => array(
5605     "icon" => "robot",
5606     "title" => "UdmSearch",
5607     "rule" => array(
5608     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5609     ),
5610     "uri" => ""
5611     ),
5612     "ukwizz" => array(
5613     "icon" => "ukwizz",
5614     "title" => "UKWizz",
5615     "rule" => array(
5616     "^Mackster.*ukwizz" => ""
5617     ),
5618     "uri" => "http://www.ukwizz.com"
5619     ),
5620     "ultraseek" => array(
5621     "icon" => "robot",
5622     "title" => "Ultraseek",
5623     "rule" => array(
5624     "Ultraseek" => ""
5625     ),
5626     "uri" => ""
5627     ),
5628     "ultraspider" => array(
5629     "icon" => "robot",
5630     "title" => "UltraSpider",
5631     "rule" => array(
5632     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5633     ),
5634     "uri" => "http://www.search.ch"
5635     ),
5636     "umai" => array(
5637     "icon" => "robot",
5638 matthys 209 "title" => "Umai",
5639 joku 63 "rule" => array(
5640     "umai[/ ]([0-9.]{1,10})" => "\\1"
5641     ),
5642     "uri" => ""
5643     ),
5644     "unchaos" => array(
5645     "icon" => "robot",
5646     "title" => "Unchaos",
5647     "rule" => array(
5648     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5649     "unchaos" => ""
5650     ),
5651     "uri" => ""
5652     ),
// UNIdo bot (University of Dortmund, per the uri).
"unido" => array(
  "icon" => "robot",
  "title" => "UNIdo",
  "rule" => array(
    // No capture group in the pattern, so the former "\\1" template pointed
    // at a non-existent group; version-less rules use the empty template.
    "^unido-bot" => ""
  ),
  "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
),
5661     "updated" => array(
5662     "icon" => "robot",
5663     "title" => "Updated",
5664     "rule" => array(
5665     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5666     ),
5667     "uri" => ""
5668     ),
5669     "uptimebot" => array(
5670     "icon" => "robot",
5671     "title" => "UptimeBot",
5672     "rule" => array(
5673     "^UptimeBot" => ""
5674     ),
5675     "uri" => "http://www.uptimebot.com/"
5676     ),
5677     "urifetch" => array(
5678     "icon" => "robot",
5679     "title" => "URI::Fetch",
5680     "rule" => array(
5681     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5682     ),
5683     "uri" => ""
5684     ),
5685     "urlbase" => array(
5686     "icon" => "robot",
5687     "title" => "URLBase",
5688     "rule" => array(
5689     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5690     ),
5691     "uri" => ""
5692     ),
5693     "urlblaze" => array(
5694     "icon" => "robot",
5695     "title" => "URLBlaze",
5696     "rule" => array(
5697     "^URLBlaze" => ""
5698     ),
5699     "uri" => ""
5700     ),
5701     "urlcontr" => array(
5702     "icon" => "robot",
5703     "title" => "MS URL Control",
5704     "rule" => array(
5705     "Microsoft URL[ \-]?Control" => ""
5706     ),
5707     "uri" => ""
5708     ),
5709     "urlgetfile" => array(
5710     "icon" => "robot",
5711     "title" => "URLGetFile",
5712     "rule" => array(
5713     "^URLGetFile" => ""
5714     ),
5715     "uri" => ""
5716     ),
5717     "urlscope" => array(
5718     "icon" => "robot",
5719     "title" => "UrlScope",
5720     "rule" => array(
5721     "UrlScope" => ""
5722     ),
5723     "uri" => ""
5724     ),
5725     "urltrends" => array(
5726     "icon" => "urltrends",
5727 matthys 209 "title" => "UrlTrends",
5728 joku 63 "rule" => array(
5729     "Snappy/([0-9.]{1,10})" => "\\1",
5730     ),
5731     "uri" => ""
5732     ),
5733     "usww" => array(
5734     "icon" => "usww",
5735 matthys 209 "title" => "USWW",
5736 joku 63 "rule" => array(
5737     "usww\.com" => "",
5738     "Mozilla/5\.0 URL-Spider" => ""
5739     ),
5740     "uri" => "http://www.usww.com/"
5741     ),
5742     "usyd" => array(
5743     "icon" => "robot",
5744     "title" => "USyd-NLP-Spider",
5745     "rule" => array(
5746     "^USyd-NLP-Spider" => ""
5747     ),
5748     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5749     ),
5750     "vagabondo" => array(
5751     "icon" => "wiseguys",
5752     "title" => "WiseGuys",
5753     "rule" => array(
5754     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5755     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5756     ),
5757     "uri" => ""
5758     ),
5759     "unicorn" => array(
5760     "icon" => "w3c",
5761     "title" => "W3C Unicorn",
5762     "rule" => array(
5763     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5764     ),
5765     "uri" => "http://validator.w3.org/unicorn/"
5766     ),
5767     "validator" => array(
5768     "icon" => "w3c",
5769     "title" => "W3C Validator",
5770     "rule" => array(
5771     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5772     ),
5773     "uri" => "http://validator.w3.org/"
5774     ),
5775     "validator.nu" => array( // Validator.nu signatures
5776     "icon" => "validatornu",
5777     "title" => "Validator.nu",
5778     "rule" => array(
5779     "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5780     "^Validator.nu/LV" => "" // pattern has no capture group, so there is no version to reference
5781     ),
5782     "uri" => "http://validator.nu/"
5783     ),
5784     "verity" => array(
5785     "icon" => "robot",
5786     "title" => "Verity",
5787     "rule" => array(
5788     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5789     "^vspider" => ""
5790     ),
5791     "uri" => "http://www.verity.com/"
5792     ),
5793     "versionsproject" => array(
5794     "icon" => "robot",
5795     "title" => "Versions-project",
5796     "rule" => array(
5797     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5798     ),
5799     "uri" => "http://www.versions-project.org/"
5800     ),
5801     "verticalmatch" => array(
5802     "icon" => "robot",
5803     "title" => "VerticalMatch",
5804     "rule" => array(
5805     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5806     ),
5807     "uri" => "http://www.VerticalMatch.com/"
5808     ),
5809     "verzamelgids" => array(
5810     "icon" => "robot",
5811     "title" => "Verzamelgids",
5812     "rule" => array(
5813     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5814     ),
5815     "uri" => "http://www.verzamelgids.nl/"
5816     ),
5817     "vestris" => array(
5818     "icon" => "vestris",
5819     "title" => "Vestris",
5820     "rule" => array(
5821     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5822     ),
5823     "uri" => "http://alkaline.vestris.com/"
5824     ),
5825     "vindex" => array(
5826     "icon" => "vindex",
5827     "title" => "Vindex",
5828     "rule" => array(
5829     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5830     ),
5831     "uri" => ""
5832     ),
5833     "visvo" => array(
5834     "icon" => "robot",
5835     "title" => "Visvo",
5836     "rule" => array(
5837     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5838     ),
5839     "uri" => "http://www.visvo.com"
5840     ),
5841     "voila" => array(
5842     "icon" => "voila",
5843     "title" => "Voila",
5844     "rule" => array(
5845     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5846     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5847     ),
5848     "uri" => ""
5849     ),
5850     "vonna" => array(
5851     "icon" => "robot",
5852     "title" => "Vonna",
5853     "rule" => array(
5854     "Vonna.com b o t" => ""
5855     ),
5856     "uri" => ""
5857     ),
5858     "vortex" => array(
5859     "icon" => "robot",
5860     "title" => "Vortex",
5861     "rule" => array(
5862     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5863     ),
5864     "uri" => "http://marty.anstey.ca/robots/vortex/"
5865     ),
5866     "w3sitesearch" => array(
5867     "icon" => "w3sitesearch",
5868     "title" => "W3SiteSearch",
5869     "rule" => array(
5870     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5871     ),
5872     "uri" => "http://www.w3sitesearch.de"
5873     ),
5874     "wagger" => array(
5875     "icon" => "robot",
5876     "title" => "Wagger",
5877     "rule" => array(
5878     "^Waggr" => ""
5879     ),
5880     "uri" => "http://www.waggr.com/"
5881     ),
5882     "wanadoo" => array(
5883     "icon" => "robot",
5884     "title" => "Wanadoo",
5885     "rule" => array(
5886     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5887     ),
5888     "uri" => "http://www.wanadoo.fr/"
5889     ),
5890     "wapalizer" => array(
5891     "icon" => "robot",
5892     "title" => "Wapalizer",
5893     "rule" => array(
5894     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5895     ),
5896     "uri" => "http://www.wapdrive.com/"
5897     ),
5898     "watson" => array(
5899     "icon" => "addy",
5900     "title" => "Dr.Watson",
5901     "rule" => array(
5902     "Watson[ /]([0-9.]{1,10})" => "\\1",
5903     "watson\.addy\.com" => ""
5904     ),
5905     "uri" => ""
5906     ),
5907     "wavefire" => array(
5908     "icon" => "robot",
5909     "title" => "Wavefire",
5910     "rule" => array(
5911     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
5912     ),
5913     "uri" => ""
5914     ),
5915     "waypath" => array(
5916     "icon" => "waypath",
5917     "title" => "Waypath",
5918     "rule" => array(
5919     "Waypath[ \-]?Scout" => "",
5920     "Waypath (development )?crawler" => ""
5921     ),
5922     "uri" => ""
5923     ),
5924     "wauuu" => array( // Wauuu signatures
5925     "icon" => "wauuu",
5926     "title" => "Wauuu",
5927     "rule" => array(
5928     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the version is the only capture group (was \\2, which does not exist)
5929     ),
5930     "uri" => "http://www.wauuu.com"
5931     ),
5932     "wdg" => array(
5933     "icon" => "wdg",
5934     "title" => "WDG Validator",
5935     "rule" => array(
5936     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
5937     ),
5938     "uri" => "http://www.htmlhelp.com/tools/validator/"
5939     ),
5940     "webagogo" => array(
5941     "icon" => "webagogo",
5942     "title" => "Webagogo",
5943     "rule" => array(
5944     "^Webagogo" => ""
5945     ),
5946     "uri" => "http://www.webagogo.be/"
5947     ),
5948     "webalta" => array(
5949     "icon" => "webalta",
5950     "title" => "WebAlta",
5951     "rule" => array(
5952     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
5953     ),
5954     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
5955     ),
5956     "webdigity" => array(
5957     "icon" => "robot",
5958     "title" => "Webdigity Whois Service",
5959     "rule" => array(
5960     "^webdigity whois service" => ""
5961     ),
5962     "uri" => "http://www.webdigity.com/ws"
5963     ),
5964     "webelixir" => array(
5965     "icon" => "webelixir",
5966     "title" => "Webelixir",
5967     "rule" => array(
5968     "^webelixir" => ""
5969     ),
5970     "uri" => "http://www.webelixir.net/"
5971     ),
5972     "webbotru" => array(
5973     "icon" => "robot",
5974     "title" => "Webbot.ru",
5975     "rule" => array(
5976     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
5977     ),
5978     "uri" => "http://www.webbot.ru/bot.html"
5979     ),
5980     "webcapture" => array(
5981     "icon" => "robot",
5982     "title" => "WebCapture",
5983     "rule" => array(
5984     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
5985     ),
5986     "uri" => ""
5987     ),
5988     "webcollage" => array(
5989     "icon" => "robot",
5990     "title" => "Webcollage",
5991     "rule" => array(
5992     "webcollage" => ""
5993     ),
5994     "uri" => ""
5995     ),
5996     "webcopier" => array(
5997     "icon" => "webcopier",
5998     "title" => "WebCopier",
5999     "rule" => array(
6000     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6001     ),
6002     "uri" => ""
6003     ),
6004     "webcorp" => array(
6005     "icon" => "webcorp",
6006     "title" => "WebCorp",
6007     "rule" => array(
6008     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6009     ),
6010     "uri" => "http://www.webcorp.org.uk/"
6011     ),
6012     "webcrawl" => array(
6013     "icon" => "robot",
6014     "title" => "WebCrawl",
6015     "rule" => array(
6016     "webcrawl\.net" => ""
6017     ),
6018     "uri" => ""
6019     ),
6020     "webdownloader" => array(
6021     "icon" => "robot",
6022     "title" => "Web Downloader",
6023     "rule" => array(
6024     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6025     ),
6026     "uri" => ""
6027     ),
6028     "webfetch" => array(
6029     "icon" => "robot",
6030 matthys 209 "title" => "WebFetch",
6031 joku 63 "rule" => array(
6032     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6033     ),
6034     "uri" => ""
6035     ),
6036     "webfind" => array(
6037     "icon" => "robot",
6038 matthys 209 "title" => "WebFind",
6039 joku 63 "rule" => array(
6040     "^WebFindBot" => ""
6041     ),
6042     "uri" => "http://www.web-find.com"
6043     ),
6044     "webglimpse" => array(
6045     "icon" => "robot",
6046     "title" => "Webglimpse",
6047     "rule" => array(
6048     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6049     ),
6050     "uri" => "http://webglimpse.net"
6051     ),
6052     "webgobbler" => array(
6053     "icon" => "robot",
6054     "title" => "webGobbler",
6055     "rule" => array(
6056     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6057     ),
6058     "uri" => ""
6059     ),
6060     "webimages" => array(
6061     "icon" => "webimages",
6062     "title" => "WebImages",
6063     "rule" => array(
6064     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6065     ),
6066     "uri" => "http://herbert.groot.jebbink.nl/"
6067     ),
6068     "weblight" => array(
6069     "icon" => "robot",
6070     "title" => "WebLight",
6071     "rule" => array(
6072     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6073     ),
6074     "uri" => "http://www.illumit.com/Products/weblight/"
6075     ),
6076     "weblinks" => array(
6077     "icon" => "robot",
6078     "title" => "WebLink's",
6079     "rule" => array(
6080     "^Weblink.s checker" => ""
6081     ),
6082     "uri" => ""
6083     ),
6084     "webmeasurement" => array(
6085     "icon" => "robot",
6086     "title" => "Webmeasurement",
6087     "rule" => array(
6088     "^webmeasurement-bot" => ""
6089     ),
6090     "uri" => "http://rvs.informatik.uni-leipzig.de"
6091     ),
6092     "webminer" => array(
6093     "icon" => "robot",
6094     "title" => "WebMiner",
6095     "rule" => array(
6096     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6097     ),
6098     "uri" => ""
6099     ),
6100     "webmin" => array(
6101     "icon" => "webmin",
6102     "title" => "Webmin",
6103     "rule" => array(
6104     "^webmin" => ""
6105     ),
6106     "uri" => ""
6107     ),
6108     "webmon" => array(
6109     "icon" => "webmon",
6110     "title" => "Webmon",
6111     "rule" => array(
6112     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6113     ),
6114     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6115     ),
6116     "webox" => array( // WeBoX signatures
6117     "icon" => "robot",
6118     "title" => "WeBoX", // stray leading space removed so the title matches the other entries
6119     "rule" => array(
6120     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6121     ),
6122     "uri" => ""
6123     ),
6124     "webpatrol" => array(
6125     "icon" => "webpatrol",
6126     "title" => "WebPatrol",
6127     "rule" => array(
6128     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6129     ),
6130     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6131     ),
6132     "webpix" => array(
6133     "icon" => "webpix",
6134     "title" => "WebPix",
6135     "rule" => array(
6136     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6137     ),
6138     "uri" => ""
6139     ),
6140     "webrace" => array(
6141     "icon" => "robot",
6142     "title" => "WebRACE",
6143     "rule" => array(
6144     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6145     ),
6146     "uri" => ""
6147     ),
6148     "webreaper" => array(
6149     "icon" => "webreaper",
6150     "title" => "WebReaper",
6151     "rule" => array(
6152     "^WebReaper " => ""
6153     ),
6154     "uri" => "http://www.webreaper.net/"
6155     ),
6156     "webresult" => array(
6157     "icon" => "robot",
6158     "title" => "Webresult",
6159     "rule" => array(
6160     "Der webresult\.de Robot" => ""
6161     ),
6162     "uri" => ""
6163     ),
6164     "webring" => array(
6165     "icon" => "robot",
6166     "title" => "Webring Checker",
6167     "rule" => array(
6168     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6169     ),
6170     "uri" => ""
6171     ),
6172     "webripper" => array(
6173     "icon" => "webripper",
6174     "title" => "WebRipper",
6175     "rule" => array(
6176     "^WebRipper" => ""
6177     ),
6178     "uri" => "http://calluna-software.com"
6179     ),
6180     "webscaled" => array(
6181     "icon" => "webscaled",
6182     "title" => "Webscaled",
6183     "rule" => array(
6184     "Swarm" => ""
6185     ),
6186     "uri" => "http://webscaled.com/"
6187     ),
6188     "websearchau" => array(
6189     "icon" => "websearchau",
6190     "title" => "WebSearch.COM.AU",
6191     "rule" => array(
6192     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6193     ),
6194     "uri" => "http://WebSearch.com.au/"
6195     ),
6196     "websearchbench" => array(
6197     "icon" => "robot",
6198     "title" => "WebSearchBench",
6199     "rule" => array(
6200     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6201     ),
6202     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6203     ),
6204     "websense" => array(
6205     "icon" => "websense",
6206     "title" => "Websense",
6207     "rule" => array(
6208     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6209     ),
6210     "uri" => ""
6211     ),
6212     "websiteshadow" => array(
6213     "icon" => "websiteshadow",
6214     "title" => "Websiteshadow",
6215     "rule" => array(
6216     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6217     ),
6218     "uri" => "http://websiteshadow.com"
6219     ),
6220     "websiteworth" => array(
6221     "icon" => "robot",
6222     "title" => "WebsiteWorth",
6223     "rule" => array(
6224     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6225     ),
6226     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6227     ),
6228     "websquash" => array(
6229     "icon" => "websquash",
6230     "title" => "Websquash",
6231     "rule" => array(
6232     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6233     ),
6234     "uri" => ""
6235     ),
6236     "webstripper" => array(
6237     "icon" => "robot",
6238     "title" => "WebStripper",
6239     "rule" => array(
6240     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6241     ),
6242     "uri" => ""
6243     ),
6244     "webzip" => array(
6245     "icon" => "webzip",
6246     "title" => "WebZIP",
6247     "rule" => array(
6248     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6249     ),
6250     "uri" => ""
6251     ),
6252     "wep" => array(
6253     "icon" => "robot",
6254     "title" => "WEP Search",
6255     "rule" => array(
6256     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6257     ),
6258     "uri" => ""
6259     ),
6260     "westwind" => array(
6261     "icon" => "robot",
6262     "title" => "West Wind Internet Protocols",
6263     "rule" => array(
6264     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6265     ),
6266     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6267     ),
6268     "wget" => array(
6269     "icon" => "wget",
6270     "title" => "Wget",
6271     "rule" => array(
6272 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6273     "Wget" => ""
6274 joku 63 ),
6275     "uri" => ""
6276     ),
6277     "whizbang" => array(
6278     "icon" => "whizbang",
6279     "title" => "WhizBang",
6280     "rule" => array(
6281     "WhizBang" => ""
6282     ),
6283     "uri" => "http://www.whizbang.com/crawler/"
6284     ),
6285     "whois" => array(
6286     "icon" => "whois",
6287     "title" => "Who.is",
6288     "rule" => array(
6289     "Who.is Bot" => ""
6290     ),
6291     "uri" => "http://www.who.is/"
6292     ),
6293     "wikiwix" => array(
6294     "icon" => "wikiwix",
6295     "title" => "Wikiwix",
6296     "rule" => array(
6297     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6298     ),
6299     "uri" => "http://www.wikiwix.com/"
6300     ),
6301     "wingflyer" => array(
6302     "icon" => "robot",
6303     "title" => "WingFlyer",
6304     "rule" => array(
6305     "^WebFetch" => ""
6306     ),
6307     "uri" => "http://www.wingflyer.com/"
6308     ),
6309     "wininet" => array(
6310     "icon" => "robot",
6311     "title" => "WinInet",
6312     "rule" => array(
6313     "TeamSoft WinInet Component" => ""
6314     ),
6315     "uri" => "http://www.winsoft.sk/wininet.htm"
6316     ),
6317     "winhttp" => array(
6318     "icon" => "robot",
6319     "title" => "WinHTTP",
6320     "rule" => array(
6321     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6322     ),
6323     "uri" => ""
6324     ),
6325     "wire" => array(
6326     "icon" => "robot",
6327     "title" => "WIRE",
6328     "rule" => array(
6329     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6330     ),
6331     "uri" => ""
6332     ),
6333     "wmp" => array(
6334     "icon" => "robot",
6335     "title" => "WMP",
6336     "rule" => array(
6337     "^WMP" => ""
6338     ),
6339     "uri" => ""
6340     ),
6341     "woozweb" => array(
6342     "icon" => "woozweb",
6343     "title" => "Woozweb",
6344     "rule" => array(
6345     "woozweb" => ""
6346     ),
6347     "uri" => "http://www.woozweb.com/"
6348     ),
6349     "wordchamp" => array(
6350     "icon" => "robot",
6351     "title" => "WordChamp",
6352     "rule" => array(
6353     "^WordChampBot" => ""
6354     ),
6355     "uri" => "http://www.wordchamp.com/"
6356     ),
6357     "wordpress" => array(
6358     "icon" => "wordpress",
6359     "title" => "WordPress",
6360     "rule" => array(
6361     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6362     ),
6363     "uri" => ""
6364     ),
6365     "worio" => array(
6366     "icon" => "worio",
6367     "title" => "Worio",
6368     "rule" => array(
6369     "woriobot" => ""
6370     ),
6371     "uri" => "http://worio.com/"
6372     ),
6373     "worldlight" => array(
6374     "icon" => "worldlight",
6375     "title" => "WorldLight",
6376     "rule" => array(
6377     "^WorldLight" => ""
6378     ),
6379     "uri" => ""
6380     ),
6381     "worqmada" => array(
6382     "icon" => "robot",
6383     "title" => "WorQmada",
6384     "rule" => array(
6385     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6386     ),
6387     "uri" => ""
6388     ),
6389     "wotbox" => array(
6390     "icon" => "wotbox",
6391     "title" => "Wotbox",
6392     "rule" => array(
6393     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6394     ),
6395     "uri" => ""
6396     ),
6397     "wp" => array(
6398     "icon" => "wp",
6399     "title" => "Wirtualna Polska",
6400     "rule" => array(
6401     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6402     ),
6403     "uri" => "http://wp.pl"
6404     ),
6405     "wsb" => array(
6406     "icon" => "robot",
6407     "title" => "WebSearchBench",
6408     "rule" => array(
6409     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6410     "WSB " => ""
6411     ),
6412     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6413     ),
6414     "wume" => array(
6415     "icon" => "robot",
6416     "title" => "WUME Lab's",
6417     "rule" => array(
6418     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6419     ),
6420     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6421     ),
6422     "wusage" => array(
6423     "icon" => "wusage",
6424     "title" => "Wusage",
6425     "rule" => array(
6426     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6427     ),
6428     "uri" => "http://www.boutell.com/wusage/"
6429     ),
6430     "wwgrapevine" => array(
6431     "icon" => "wwgrapevine",
6432     "title" => "WWgrapevine",
6433     "rule" => array(
6434     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6435     ),
6436     "uri" => ""
6437     ),
6438     "wws" => array(
6439     "icon" => "robot",
6440     "title" => "WWSBOT",
6441     "rule" => array(
6442     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6443     ),
6444     "uri" => "http://www.analyzer.nu"
6445     ),
6446     "www4mail" => array(
6447     "icon" => "robot",
6448 matthys 209 "title" => "WWW4mail",
6449 joku 63 "rule" => array(
6450     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6451     ),
6452     "uri" => "http://www.www4mail.org/"
6453     ),
6454     "wwwc" => array(
6455     "icon" => "wwwc",
6456     "title" => "WWWC",
6457     "rule" => array(
6458     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6459     ),
6460     "uri" => ""
6461     ),
6462     "wwwd" => array(
6463     "icon" => "robot",
6464     "title" => "WWWD",
6465     "rule" => array(
6466     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6467     ),
6468     "uri" => ""
6469     ),
6470     "wwweasel" => array(
6471     "icon" => "wwweasel",
6472     "title" => "WWWeasel",
6473     "rule" => array(
6474     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6475     ),
6476     "uri" => ""
6477     ),
6478     "wwwfi" => array(
6479     "icon" => "wwwfi",
6480     "title" => "www.fi",
6481     "rule" => array(
6482     "www\.fi crawler" => ""
6483     ),
6484     "uri" => "http://www.fi/"
6485     ),
6486     "wwwmechanize" => array(
6487     "icon" => "robot",
6488     "title" => "WWW-Mechanize",
6489     "rule" => array(
6490     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6491     ),
6492     "uri" => ""
6493     ),
6494     "wwwoffle" => array(
6495     "icon" => "robot",
6496     "title" => "WWWoffle",
6497     "rule" => array(
6498     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6499     ),
6500     "uri" => ""
6501     ),
6502     "wwwster" => array(
6503     "icon" => "robot",
6504     "title" => "WWWster",
6505     "rule" => array(
6506     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6507     ),
6508     "uri" => ""
6509     ),
6510     "wysigot" => array(
6511     "icon" => "wysigot",
6512     "title" => "Wysigot",
6513     "rule" => array(
6514     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6515     ),
6516     "uri" => ""
6517     ),
6518     "xaldon" => array(
6519     "icon" => "xaldon",
6520     "title" => "Xaldon",
6521     "rule" => array(
6522     "Xaldon WebSpider" => ""
6523     ),
6524     "uri" => "http://www.xaldon.de/"
6525     ),
6526     "xenu" => array( // Xenu Link Sleuth signatures
6527     "icon" => "xenu",
6528     "title" => "Xenu Link Sleuth",
6529     "rule" => array(
6530     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6531     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional possessive; the version is group 2
6532     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6533     ),
6534     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6535     ),
6536     "xerka" => array(
6537     "icon" => "xerka",
6538     "title" => "Xerka",
6539     "rule" => array(
6540     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6541     ),
6542     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6543     ),
6544     "xirq" => array(
6545     "icon" => "robot",
6546     "title" => "XIRQ",
6547     "rule" => array(
6548     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6549     ),
6550     "uri" => "http://www.xirq.com"
6551     ),
6552     "xmlslurp" => array(
6553     "icon" => "robot",
6554     "title" => "XMLSlurp",
6555     "rule" => array(
6556     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6557     ),
6558     "uri" => ""
6559     ),
6560     "xml-sitemaps" => array(
6561     "icon" => "xml-sitemaps",
6562     "title" => "XML-Sitemaps",
6563     "rule" => array(
6564     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6565     ),
6566     "uri" => ""
6567     ),
6568     "xmlrpc" => array(
6569     "icon" => "robot",
6570     "title" => "Trackback",
6571     "rule" => array(
6572     "XMLRPC" => ""
6573     ),
6574     "uri" => ""
6575     ),
6576 matthys 294 "xovi" => array(
6577     "icon" => "xovi",
6578     "title" => "Xovi",
6579     "rule" => array(
6580     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6581     ),
6582     "uri" => "http://www.xovibot.net"
6583     ),
6584 joku 63 "yacy" => array(
6585     "icon" => "yacy",
6586     "title" => "Yacy",
6587     "rule" => array(
6588     "yacy\.net" => ""
6589     ),
6590     "uri" => ""
6591     ),
6592     "yahoo" => array(
6593     "icon" => "yahoo",
6594     "title" => "Yahoo",
6595     "rule" => array(
6596     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6597     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6598     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6599     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6600     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6601     "Y!OASIS/TEST" => "",
6602     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6603     "Y!J; for robot study" => "",
6604     "Yahoo Japan; for robot study" => ""
6605     ),
6606     "uri" => "http://www.yahoo.com"
6607     ),
6608     "yahoo-feed" => array(
6609     "icon" => "yahoo",
6610     "title" => "Yahoo Feedseeker",
6611     "rule" => array(
6612     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6613     ),
6614     "uri" => "http://www.yahoo.com"
6615     ),
6616     "yandex" => array(
6617     "icon" => "yandex",
6618     "title" => "Yandex",
6619     "rule" => array(
6620     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6621     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6622     ),
6623     "uri" => "http://yandex.com/bots"
6624     ),
6625     "yanga" => array(
6626     "icon" => "yanga",
6627     "title" => "Yanga",
6628     "rule" => array (
6629     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6630     ),
6631     "uri" => "http://www.yanga.co.uk/"
6632     ),
6633     "yap" => array(
6634     "icon" => "yap",
6635     "title" => "Yap",
6636     "rule" => array(
6637     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6638     ),
6639     "uri" => "http://www.yapinc.com/"
6640     ),
6641     "yarienavoir" => array(
6642     "icon" => "robot",
6643     "title" => "Yarienavoir",
6644     "rule" => array(
6645     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6646     ),
6647     "uri" => "http://www.yarienavoir.net/"
6648     ),
6649     "yell" => array(
6650     "icon" => "yell",
6651     "title" => "Yell",
6652     "rule" => array(
6653     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6654     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6655     ),
6656     "uri" => ""
6657     ),
6658     "youdao" => array(
6659     "icon" => "youdao",
6660     "title" => "Youdao",
6661     "rule" => array(
6662     "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6663     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6664     ),
6665     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6666     ),
6667     "yoogli" => array(
6668     "icon" => "yoogli",
6669     "title" => "Yoogli",
6670     "rule" => array(
6671     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6672     ),
6673     "uri" => "http://www.yoogli.com"
6674     ),
6675     "yotta" => array(
6676     "icon" => "robot",
6677     "title" => "Yotta",
6678     "rule" => array(
6679     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6680     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6681     ),
6682     "uri" => "http://www.yottacars.com"
6683     ),
6684     "yoono" => array(
6685     "icon" => "yoono",
6686     "title" => "Yoono",
6687     "rule" => array(
6688     "Yoono" => ""
6689     ),
6690     "uri" => "http://www.yoono.com/"
6691     ),
6692     "yowedo" => array(
6693     "icon" => "robot",
6694     "title" => "Yowedo",
6695     "rule" => array(
6696     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6697     ),
6698     "uri" => "http://yowedo.com/en/partners.html"
6699     ),
6700     "yuntis" => array(
6701     "icon" => "robot",
6702 matthys 209 "title" => "Yuntis",
6703 joku 63 "rule" => array(
6704     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6705     ),
6706     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6707     ),
6708     "zao" => array(
6709     "icon" => "robot",
6710     "title" => "Zao",
6711     "rule" => array(
6712     "Zao[ /]([0-9.]{1,10})" => "\\1",
6713     "Zao-crawler" => ""
6714     ),
6715     "uri" => ""
6716     ),
6717     "zealbot" => array(
6718     "icon" => "zeal",
6719     "title" => "ZealBot",
6720     "rule" => array(
6721     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6722     ),
6723     "uri" => ""
6724     ),
6725     "zearchit" => array(
6726     "icon" => "zearchit",
6727     "title" => "Zearchit",
6728     "rule" => array(
6729     "Zearchit" => ""
6730     ),
6731     "uri" => "http://www.zearchit.de/"
6732     ),
6733     "zebz" => array(
6734     "icon" => "robot",
6735     "title" => "ze.bz",
6736     "rule" => array(
6737     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6738     ),
6739     "uri" => "http://www.ze.bz/"
6740     ),
6741     "zedzo" => array(
6742     "icon" => "robot",
6743     "title" => "Zedzo",
6744     "rule" => array(
6745     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6746     ),
6747     "uri" => "http://www.zedzo.com/"
6748     ),
6749     "zerx" => array(
6750     "icon" => "zerx",
6751     "title" => "Zerx",
6752     "rule" => array(
6753     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6754     ),
6755     "uri" => "http://www.zerx.com/"
6756     ),
6757     "zeus" => array(
6758     "icon" => "zeus",
6759     "title" => "Zeus",
6760     "rule" => array(
6761     "Zeus" => ""
6762     ),
6763     "uri" => "http://www.zeus.com"
6764     ),
6765     "zippp" => array(
6766     "icon" => "robot",
6767     "title" => "Zippp",
6768     "rule" => array(
6769     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6770     ),
6771     "uri" => ""
6772     ),
6773     "zippy" => array(
6774     "icon" => "robot",
6775     "title" => "Zippy",
6776     "rule" => array(
6777     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6778     ),
6779     "uri" => "http://www.zippyfinder.com"
6780     ),
6781     "zoeky" => array(
6782     "icon" => "robot",
6783     "title" => "Zoeky",
6784     "rule" => array(
6785     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6786     ),
6787     "uri" => ""
6788     ),
6789     "zoom" => array(
6790     "icon" => "zoom",
6791 matthys 209 "title" => "ZoomSpider",
6792 joku 63 "rule" => array(
6793     "^ZoomSpider" => ""
6794     ),
6795     "uri" => "http://www.wrensoft.com/"
6796     ),
6797     "zspider" => array(
6798     "icon" => "robot",
6799 matthys 209 "title" => "Zspider",
6800 joku 63 "rule" => array(
6801     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6802     ),
6803     "uri" => "http://feedback.redkolibri.com/"
6804     ),
6805 matthys 281 "zumbot" => array(
6806     "icon" => "robot",
6807     "title" => "ZUM Search",
6808     "rule" => array(
6809     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6810     ),
6811     "uri" => "http://help.zum.com/inquiry"
6812     ),
6813 joku 63 "zyborg" => array(
6814     "icon" => "zyborg",
6815     "title" => "WiseNutBot",
6816     "rule" => array(
6817     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6818     ),
6819     "uri" => ""
6820     ),
6821     // Catch-alls for the originals; they have to stay in this order.
6822     "blogbot" => array(
6823     "icon" => "blogbot",
6824     "title" => "BlogBot",
6825     "rule" => array(
6826     "Blog[ \-]?Bot" => ""
6827     ),
6828     "uri" => "http://www.blogbot.com/"
6829     ),
6830     "centrum" => array(
6831     "icon" => "centrum",
6832     "title" => "Centrum",
6833     "rule" => array(
6834     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6835     "^Centrum-checker" => ""
6836     ),
6837     "uri" => ""
6838     ),
6839     "httpclient" => array(
6840     "icon" => "robot",
6841     "title" => "HTTPClient",
6842     "rule" => array(
6843     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6844     "HTTP[ \-]?Client" => ""
6845     ),
6846     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6847     ),
6848     "incywincy" => array(
6849     "icon" => "robot",
6850     "title" => "IncyWincy",
6851     "rule" => array(
6852     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6853     "^IncyWincy" => ""
6854     ),
6855     "uri" => ""
6856     ),
6857     "java" => array(
6858     "icon" => "java",
6859     "title" => "Java",
6860     "rule" => array(
6861     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6862     ),
6863     "uri" => ""
6864     ),
6865     "libfetch" => array(
6866     "icon" => "robot",
6867     "title" => "Libfetch",
6868     "rule" => array(
6869     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6870     ),
6871     "uri" => "http://www.freebsd.org/"
6872     ),
6873     "libwww" => array(
6874     "icon" => "libwww",
6875 matthys 209 "title" => "LibWWW",
6876 joku 63 "rule" => array(
6877     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6878     "^libww(w|w-perl|w-FM)" => "",
6879     "MyApp.*libww(w|w-perl|w-FM)" => ""
6880     ),
6881     "uri" => ""
6882     ),
6883     "litefinder" => array(
6884     "icon" => "litefinder",
6885     "title" => "LiteFinder",
6886     "rule" => array(
6887     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6888     ),
6889     "uri" => "http://www.litefinder.net/about.html"
6890     ),
6891     "nutchorg" => array(
6892     "icon" => "nutchorg",
6893     "title" => "Nutch",
6894     "rule" => array(
6895     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6896     "Nutch" => ""
6897     ),
6898     "uri" => "http://lucene.apache.org/nutch/"
6899     ),
6900     "pythonurl" => array(
6901     "icon" => "pythonurl",
6902     "title" => "Python-url",
6903     "rule" => array(
6904     "Python[ \-]?urllib" => ""
6905     ),
6906     "uri" => ""
6907     ),
6908     // Robots known as spam bots
6909     "SPAM" => array(
6910     "icon" => "robot",
6911     "title" => "SPAM",
6912     "rule" => array(
6913     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
6914     "^PHOTO CHECK" => "",
6915     "^FOTOCHECKER" => "",
6916     "^IPTC CHECK" => "",
6917     "^DataCha0s" => "",
6918     "^Mac Finder" => "",
6919     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
6920     "^Missouri College Browse" => "",
6921     "Email[ \-]?Siphon" => "",
6922     "atSpider" => "",
6923     "autoemailspider" => "",
6924     "^Demo Bot" => "",
6925     "^Program Shareware" => "",
6926     "^Snapbot" => "",
6927     "^snap.com" => "",
6928     "^Guestbook Auto Submitter" => "",
6929     "panscient.com" => "",
6930     ),
6931     "uri" => ""
6932     ),
6933     // Things we don't know yet
6934     "robot" => array(
6935     "icon" => "robot",
6936     "title" => "Robot",
6937     "rule" => array(
6938     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
6939     )
6940     )
6941     );
6942 joku 261 ?>

Properties

Name Value
svn:keywords Id