ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/branches/0.6.4-RC1/lib/robot.php
Revision: 296
Committed: Wed Sep 3 09:45:25 2014 UTC (10 years, 2 months ago) by matthys
Original Path: trunk/lib/robot.php
File size: 154577 byte(s)
Log Message:
Renamed mojeekbot to mojeek

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6     * Copyright (C) 2001-2014, the BBClone Team (see doc/authors.txt for details)
7     *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192\.comAgent" => "" // dot escaped so only a literal "." matches
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59     "2dehands" => array(
60     "icon" => "2dehands",
61     "title" => "2deHands",
62     "rule" => array(
63     "2dehands\.nl" => ""
64     ),
65     "uri" => ""
66     ),
67     "80legs" => array(
68     "icon" => "80legs",
69     "title" => "80legs",
70     "rule" => array(
71     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
72     ),
73     "uri" => "http://www.80legs.com/"
74     ),
75     "a1sitemap" => array(
76     "icon" => "a1sitemap",
77     "title" => "A1 Sitemap",
78     "rule" => array(
79     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
80     "miggibot[ /]([0-9.]{1,10})" => "\\1"
81     ),
82     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
83     ),
84     "a2b" => array(
85     "icon" => "a2b",
86     "title" => "A2B",
87     "rule" => array(
88     "www\.a2b\.cc" => ""
89     ),
90     "uri" => "http://www.a2b.cc"
91     ),
92     "abacho" => array(
93     "icon" => "robot",
94     "title" => "Abacho",
95     "rule" => array(
96     "^ABACHOBot" => ""
97     ),
98     "uri" => ""
99     ),
100     "abcdatos" => array(
101     "icon" => "abcdatos",
102     "title" => "ABCdatos",
103     "rule" => array(
104     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
105     ),
106     "uri" => "http://www.abcdatos.com/"
107     ),
108     "abot" => array(
109     "icon" => "abot",
110     "title" => "aBot",
111     "rule" => array(
112     "^abot[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => ""
115     ),
116     "about" => array(
117     "icon" => "about",
118     "title" => "About",
119     "rule" => array(
120     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
121     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
122     ),
123     "uri" => ""
124     ),
125     "aboutus" => array(
126     "icon" => "aboutus",
127     "title" => "AboutUs",
128     "rule" => array(
129     "AboutUsBot" => ""
130     ),
131     "uri" => "http://www.aboutus.org/"
132     ),
133     "ackerm" => array(
134     "icon" => "robot",
135     "title" => "Ackerm",
136     "rule" => array(
137     "www\.ackerm\.com" => "" // dots escaped so only the literal host name matches
138     ),
139     "uri" => "http://www.ackerm.com/"
140     ),
141     "acoi" => array(
142     "icon" => "acoi",
143     "title" => "AcoiRobot",
144     "rule" => array(
145     "^AcoiRobot" => ""
146     ),
147     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
148     ),
149     "acoon" => array(
150     "icon" => "acoon",
151     "title" => "Acoon",
152     "rule" => array(
153     "Acoon[ \-]?Robot" => ""
154     ),
155     "uri" => ""
156     ),
157     "accoona" => array(
158     "icon" => "accoona",
159     "title" => "Accoona",
160     "rule" => array(
161     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
162     "^accoona" => ""
163     ),
164     "uri" => ""
165     ),
166     "acme" => array(
167     "icon" => "acme",
168     "title" => "Acme",
169     "rule" => array(
170     "^Acme\.Spider" => ""
171     ),
172     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
173     ),
174     "active" => array(
175     "icon" => "robot",
176     "title" => "ActiveBookmark",
177     "rule" => array(
178     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
179     ),
180     "uri" => ""
181     ),
182     "admuncher" => array(
183     "icon" => "robot",
184     "title" => "Ad Muncher",
185     "rule" => array(
186     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "aesop" => array(
191     "icon" => "robot",
192     "title" => "Aesop",
193     "rule" => array(
194     "^AESOP_com_SpiderMan" => ""
195     ),
196     "uri" => "http://www.aesop.com"
197     ),
198     "agada" => array(
199     "icon" => "robot",
200     "title" => "Agada",
201     "rule" => array(
202     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
203     ),
204     "uri" => ""
205     ),
206     "ahrefs" => array(
207     "icon" => "ahrefs",
208     "title" => "Ahrefs",
209     "rule" => array(
210     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => "http://ahrefs.com/"
213     ),
214     "aibot" => array(
215     "icon" => "robot",
216     "title" => "Aibot",
217     "rule" => array(
218     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => ""
221     ),
222     "aihitbot" => array(
223     "icon" => "robot",
224     "title" => "aiHit",
225     "rule" => array(
226     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => "http://www.aihit.com/"
229     ),
230     "aipbot" => array(
231     "icon" => "robot",
232     "title" => "Aipbot",
233     "rule" => array(
234     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => ""
237     ),
238     "aleksika" => array(
239     "icon" => "aleksika",
240     "title" => "Aleksika",
241     "rule" => array(
242     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "alertsite" => array(
247     "icon" => "alertsite",
248     "title" => "AlertSite",
249     "rule" => array(
250     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
251     ),
252     "uri" => "http://www.alertsite.com/index.html"
253     ),
254     "alexa" => array(
255     "icon" => "alexa",
256     "title" => "Alexa",
257     "rule" => array(
258     "^ia_archive" => ""
259     ),
260     "uri" => "http://www.alexa.com/"
261     ),
262     "almaden" => array(
263     "icon" => "almaden",
264     "title" => "IBM Crawler",
265     "rule" => array(
266     "www\.almaden\.ibm\.com/cs/crawler" => ""
267     ),
268     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
269     ),
270     "altavista" => array(
271     "icon" => "altavista",
272     "title" => "Altavista",
273     "rule" => array(
274     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
275     "AltaVista V([0-9.]{1,10})" => "\\1",
276     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
277     ),
278     "uri" => "http://www.altavista.com/"
279     ),
280     "amazon" => array(
281     "icon" => "amazon",
282     "title" => "Amazon",
283     "rule" => array(
284     "^(aranhabot|amzn_assoc)" => "",
285     "^NutchEC2Test" => ""
286     ),
287     "uri" => "http://www.amazon.com/"
288     ),
289     "amidalla" => array(
290     "icon" => "amidalla",
291     "title" => "Amidalla",
292     "rule" => array(
293     "^amibot" => ""
294     ),
295     "uri" => ""
296     ),
297     "amfibi" => array(
298     "icon" => "amfibi",
299     "title" => "Amfibi",
300     "rule" => array(
301     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
302     "Amfibibot" => ""
303     ),
304     "uri" => ""
305     ),
306     "amphetadesk" => array(
307     "icon" => "robot",
308     "title" => "AmphetaDesk",
309     "rule" => array(
310     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
311     ),
312     "uri" => ""
313     ),
314     "amphetameme" => array(
315     "icon" => "robot",
316     "title" => "Amphetameme",
317     "rule" => array(
318     "amphetameme[ \-]?crawler" => ""
319     ),
320     "uri" => ""
321     ),
322     "annomille" => array(
323     "icon" => "robot",
324     "title" => "AnnoMille",
325     "rule" => array(
326     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
327     ),
328     "uri" => "http://www.annomille.it"
329     ),
330     "anonymouse" => array(
331     "icon" => "anonymouse",
332     "title" => "Anonymouse.org",
333     "rule" => array(
334     "http://Anonymouse\.org" => "" // dot escaped so only a literal "." matches
335     ),
336     "uri" => "http://anonymouse.org"
337     ),
338     "ansearch" => array(
339     "icon" => "robot",
340     "title" => "Ansearch",
341     "rule" => array(
342     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
343     ),
344     "uri" => ""
345     ),
346     "answerchase" => array(
347     "icon" => "answerchase",
348     "title" => "AnswerChase",
349     "rule" => array(
350     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
351     ),
352     "uri" => "http://www.answerchase.com/"
353     ),
354     "antibot" => array(
355     "icon" => "robot",
356 matthys 205 "title" => "Antibot",
357 joku 63 "rule" => array(
358     "antibot-V([0-9.]{1,10})" => "\\1"
359     ),
360     "uri" => ""
361     ),
362     "aonde" => array(
363     "icon" => "aonde",
364     "title" => "Aonde",
365     "rule" => array(
366     "^AONDE-Spider" => ""
367     ),
368     "uri" => ""
369     ),
370     "aonline" => array(
371     "icon" => "robot",
372     "title" => "A-Online.at",
373     "rule" => array(
374     "^A-Online Search" => ""
375     ),
376     "uri" => "http://www.a-online.at/"
377     ),
378     "aol" => array(
379     "icon" => "aol",
380     "title" => "AOLserver",
381     "rule" => array(
382     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
383     "^AOLserver" => ""
384     ),
385     "uri" => ""
386     ),
387     "apachebench" => array(
388     "icon" => "robot",
389     "title" => "ApacheBench",
390     "rule" => array(
391     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
392     ),
393     "uri" => ""
394     ),
395     "apassion4jazz" => array(
396     "icon" => "robot",
397     "title" => "Passion 4 Jazz",
398     "rule" => array(
399     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
402     ),
403     "apexoo" => array(
404     "icon" => "robot",
405     "title" => "Apexoo",
406     "rule" => array(
407     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apexoo.com/"
410     ),
411     "apnoti" => array(
412     "icon" => "apnoti",
413 matthys 205 "title" => "Apnoti",
414 joku 63 "rule" => array(
415     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apnoti.com/"
418     ),
419     "aport" => array(
420     "icon" => "aport",
421     "title" => "Aport",
422     "rule" => array(
423     "^Aport" => ""
424     ),
425     "uri" => ""
426     ),
427     "appie" => array(
428     "icon" => "walhello",
429     "title" => "Walhello",
430     "rule" => array(
431     "appie[ /]([0-9.]{1,10})" => "\\1"
432     ),
433     "uri" => ""
434     ),
435     "arachmo" => array(
436     "icon" => "arachmo",
437     "title" => "Arachmo",
438     "rule" => array(
439     "compatible; Arachmo" => ""
440     ),
441     "uri" => ""
442     ),
443     "arexera" => array(
444     "icon" => "arexera",
445     "title" => "Arexera",
446     "rule" => array(
447     "^X-Crawler" => "",
448     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
449     ),
450     "uri" => "http://www.arexera.de/"
451     ),
452     "arianna" => array(
453     "icon" => "arianna",
454     "title" => "Arianna",
455     "rule" => array(
456     "^www\.arianna\.it" => "" // dots escaped so only the literal host name matches
457     ),
458     "uri" => "http://www.arianna.it/"
459     ),
460     "artface" => array(
461     "icon" => "robot",
462     "title" => "Artface",
463     "rule" => array(
464     "^ArtfaceBot" => ""
465     ),
466     "uri" => ""
467     ),
468     "artviper" => array(
469     "icon" => "artviper",
470     "title" => "artViper",
471     "rule" => array(
472     "artViper" => ""
473     ),
474     "uri" => "http://www.artviper.net/"
475     ),
476     "asinfo" => array(
477     "icon" => "robot",
478     "title" => "Any Search Info",
479     "rule" => array(
480     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
481     ),
482     "uri" => "http://search-info.com/"
483     ),
484     "ask" => array(
485     "icon" => "askjeeves",
486     "title" => "Ask Jeeves",
487     "rule" => array(
488     "Ask[ \-]?Jeeves" => "",
489     "teomaagent" => ""
490     ),
491     "uri" => ""
492     ),
493     "askaboutoil" => array(
494     "icon" => "robot",
495     "title" => "AskAboutOil", // title follows this entry's own key and rule
496     "rule" => array(
497     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
498     ),
499     "uri" => "http://askaboutoil.com/"
500     ),
501     "asked" => array(
502     "icon" => "robot",
503 matthys 205 "title" => "AskEd!",
504 joku 63 "rule" => array(
505     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
506     ),
507     "uri" => "http://asked.jp"
508     ),
509     "aspseek" => array(
510     "icon" => "robot",
511     "title" => "ASPseek",
512     "rule" => array(
513     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
514     ),
515     "uri" => ""
516     ),
517     "atlocal" => array(
518     "icon" => "robot",
519     "title" => "At Local",
520     "rule" => array(
521     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
522     ),
523     "uri" => "http://www.atlocal.com/"
524     ),
525     "atomz" => array(
526     "icon" => "atomz",
527     "title" => "Atomz",
528     "rule" => array(
529     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
530     ),
531     "uri" => ""
532     ),
533     "axel" => array(
534     "icon" => "robot",
535     "title" => "Axel",
536     "rule" => array(
537     "^axel" => ""
538     ),
539     "uri" => ""
540     ),
541     "axmo" => array(
542     "icon" => "axmo",
543     "title" => "Axmo",
544     "rule" => array(
545     "AxmoRobot" => ""
546     ),
547     "uri" => ""
548     ),
549     "answerbus" => array(
550     "icon" => "answerbus",
551     "title" => "AnswerBus",
552     "rule" => array(
553     "answerbus" => ""
554     ),
555     "uri" => ""
556     ),
557     "automapit" => array(
558     "icon" => "robot",
559     "title" => "AutoMapIt",
560     "rule" => array(
561     "AutoMapIt[ /](Bot)?" => ""
562     ),
563     "uri" => "http://www.automapit.com/bot.html"
564     ),
565     "augurnfind" => array(
566     "icon" => "robot",
567     "title" => "Augurnfind",
568     "rule" => array(
569     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
570     ),
571     "uri" => ""
572     ),
573     "awasu" => array(
574     "icon" => "awasu",
575     "title" => "Awasu",
576     "rule" => array(
577     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
578     ),
579     "uri" => ""
580     ),
581     "axxus" => array(
582     "icon" => "axxus",
583     "title" => "axxus.de",
584     "rule" => array(
585     "whoiam" => ""
586     ),
587     "uri" => "http://www.axxus.de/"
588     ),
589     "ayell" => array(
590     "icon" => "ayell",
591     "title" => "Ayell",
592     "rule" => array(
593     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
594     ),
595     "uri" => "http://eurobot.ayell.eu"
596     ),
597     "babaloo" => array(
598     "icon" => "babaloo",
599     "title" => "Babaloo",
600     "rule" => array(
601     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
602     ),
603     "uri" => "http://www.babaloo.si"
604     ),
605     "babe" => array(
606     "icon" => "robot",
607     "title" => "ba.be",
608     "rule" => array(
609     "BACS http://www\.ba\.be" => "" // dots escaped so only the literal host name matches
610     ),
611     "uri" => "http://www.ba.be/"
612     ),
613     "baidu" => array(
614     "icon" => "baidu",
615     "title" => "Baidu",
616     "rule" => array(
617     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
618     "Baiduspider" => ""
619     ),
620     "uri" => "http://www.baidu.com/search/spider.html"
621     ),
622     "bananatree" => array(
623     "icon" => "robot",
624     "title" => "BananaTree",
625     "rule" => array(
626     "www\.thebananatree\.org" => ""
627     ),
628     "uri" => "http://www.thebananatree.org/"
629     ),
630     "bdcindexer" => array(
631     "icon" => "robot",
632     "title" => "bdcindexer",
633     "rule" => array(
634     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
635     ),
636     "uri" => "http://www.business.com/"
637     ),
638     "bdfetch" => array(
639     "icon" => "robot",
640     "title" => "BDFetch",
641     "rule" => array(
642     "^BDFetch" => ""
643     ),
644     "uri" => ""
645     ),
646     "bdncentral" => array(
647     "icon" => "robot",
648     "title" => "Bdncentral",
649     "rule" => array(
650     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
651     ),
652     "uri" => "http://www.bdncentral.com/robot.html"
653     ),
654     "beammachine" => array(
655     "icon" => "robot",
656     "title" => "BeamMachine",
657     "rule" => array(
658     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
659     ),
660     "uri" => "http://www.beammachine.net/"
661     ),
662     "become" => array(
663     "icon" => "become",
664     "title" => "Become",
665     "rule" => array(
666     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
667     "(BecomeBot|Exabot)@exava\.com\)$" => ""
668     ),
669     "uri" => "http://www.become.com/"
670     ),
671     "beebware" => array(
672     "icon" => "robot",
673     "title" => "Beebware",
674     "rule" => array(
675     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the pattern has a single capture group (the version); "v?" is not a group
676     ),
677     "uri" => ""
678     ),
679     "bigbrother" => array(
680     "icon" => "robot",
681     "title" => "Big Brother",
682     "rule" => array(
683     "^Big Brother" => ""
684     ),
685     "uri" => "http://pauillac.inria.fr/~fpottier/"
686     ),
687     "bigclique" => array(
688     "icon" => "robot",
689     "title" => "BigClique",
690     "rule" => array(
691     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
692     ),
693     "uri" => "http://www.bigclique.com"
694     ),
695     "biglotron" => array(
696     "icon" => "robot",
697     "title" => "Biglotron",
698     "rule" => array(
699     "^BIGLOTRON" => ""
700     ),
701     "uri" => "http://www.bigclique.com"
702     ),
703     "bigsearch" => array(
704     "icon" => "bigsearch",
705     "title" => "Bigsearch",
706     "rule" => array(
707     "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped so only a literal "." matches
708     ),
709     "uri" => ""
710     ),
711     "bilbo" => array(
712     "icon" => "robot",
713     "title" => "Bilbo",
714     "rule" => array(
715     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
716     ),
717     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
718     ),
719     "bilgi" => array(
720     "icon" => "bilgi",
721     "title" => "Bilgi",
722     "rule" => array(
723     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version digits are group 2
724     ),
725     "uri" => "http://www.bilgi.com/"
726     ),
727     "bitacle" => array(
728     "icon" => "bitacle",
729     "title" => "Bitacle",
730     "rule" => array(
731     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
732     ),
733     "uri" => "http://bitacle.org/"
734     ),
735     "bitbeamer" => array(
736     "icon" => "bitbeamer",
737     "title" => "BitBeamer",
738     "rule" => array(
739     "BitBeamer/([0-9.]{1,10})" => "\\1"
740     ),
741     "uri" => ""
742     ),
743     "biz360" => array(
744     "icon" => "biz360",
745     "title" => "Biz360",
746     "rule" => array(
747     "^Biz360 spider" => ""
748     ),
749     "uri" => ""
750     ),
751     "backlinktest" => array(
752     "icon" => "backlinktest",
753     "title" => "BacklinkCrawler",
754     "rule" => array(
755     "BacklinkCrawler" => ""
756     ),
757     "uri" => "http://www.backlinktest.com/crawler.html"
758     ),
759     "blaizbee" => array(
760     "icon" => "blaiz-bee",
761     "title" => "Blaiz-Bee",
762     "rule" => array(
763     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // pass the captured version through instead of discarding it
764     ),
765     "uri" => ""
766     ),
767     "blogbeat" => array(
768     "icon" => "robot",
769     "title" => "BlogBeat",
770     "rule" => array(
771     "BlogBeat/?([0-9.]{1,10})" => "\\1",
772     ),
773     "uri" => "http://www.blogbeat.nl"
774     ),
775     "blogbotde" => array(
776     "icon" => "robot",
777     "title" => "blogbot.de",
778     "rule" => array(
779     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
780     ),
781     "uri" => "http://blogbot.de/"
782     ),
783     "blogcensus" => array(
784     "icon" => "blogcensus",
785     "title" => "Blogcensus",
786     "rule" => array(
787     "^Blogcensus" => "",
788     ),
789     "uri" => "http://blogcensus.de/bot/"
790     ),
791     "blogdex" => array(
792     "icon" => "robot",
793     "title" => "Blogdex",
794     "rule" => array(
795     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
796     ),
797     "uri" => ""
798     ),
799     "blogg" => array(
800     "icon" => "blogg",
801     "title" => "Blogg",
802     "rule" => array(
803     "^blogg\.de" => ""
804     ),
805     "uri" => ""
806     ),
807     "blogland" => array(
808     "icon" => "robot",
809     "title" => "BlogLand",
810     "rule" => array(
811     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
812     ),
813     "uri" => ""
814     ),
815     "bloglines" => array(
816     "icon" => "bloglines",
817     "title" => "Bloglines",
818     "rule" => array(
819     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
820     "Bloglines" => ""
821     ),
822     "uri" => ""
823     ),
824     "blogmap" => array(
825     "icon" => "robot",
826     "title" => "Blogmap",
827     "rule" => array(
828     "blogmap" => ""
829     ),
830     "uri" => ""
831     ),
832     "blogosphere" => array(
833     "icon" => "robot",
834     "title" => "Blogosphere",
835     "rule" => array(
836     "Blogosphere" => ""
837     ),
838     "uri" => ""
839     ),
840     "blogpeople" => array(
841     "icon" => "robot",
842     "title" => "BlogPeople",
843     "rule" => array(
844     "BlogPeople" => ""
845     ),
846     "uri" => ""
847     ),
848     "blogpulse" => array(
849     "icon" => "blogpulse",
850     "title" => "Blogpulse",
851     "rule" => array(
852     "Blogpulse" => ""
853     ),
854     "uri" => ""
855     ),
856     "blogranking" => array(
857     "icon" => "blogranking",
858     "title" => "BlogRanking",
859     "rule" => array(
860     "^BlogRanking(/RSS checker)?" => ""
861     ),
862     "uri" => ""
863     ),
864     "blogs" => array(
865     "icon" => "blogs",
866     "title" => "Blo.gs",
867     "rule" => array(
868     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
869     "blo\.gs" => ""
870     ),
871     "uri" => ""
872     ),
873     "blogshares" => array(
874     "icon" => "blogshares",
875     "title" => "BlogShares",
876     "rule" => array(
877     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
878     "(^| |\()Blogshares(\.com| |\))" => ""
879     ),
880     "uri" => ""
881     ),
882     "blogslife" => array(
883     "icon" => "robot",
884     "title" => "BlogsLife",
885     "rule" => array(
886     "Blogslive" => ""
887     ),
888     "uri" => ""
889     ),
890     "blogsnow" => array(
891     "icon" => "blogsnow",
892     "title" => "BlogsNow",
893     "rule" => array(
894     "blogsnowbot" => "",
895     "BlogsNow" => ""
896     ),
897     "uri" => ""
898     ),
899     "blogstreet" => array(
900     "icon" => "blogstreet",
901     "title" => "BlogStreet",
902     "rule" => array(
903     "^BlogStreetBot" => ""
904     ),
905     "uri" => ""
906     ),
907     "blogsurf" => array(
908     "icon" => "robot",
909     "title" => "BlogSurf",
910     "rule" => array(
911     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
912     ),
913     "uri" => ""
914     ),
915     "blogtick" => array(
916     "icon" => "robot",
917     "title" => "BlogTick",
918     "rule" => array(
919     "BlogTickServer" => ""
920     ),
921     "uri" => ""
922     ),
923     "blogwatcher" => array(
924     "icon" => "blogwatcher",
925     "title" => "Blogwatcher",
926     "rule" => array(
927     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
928     ),
929     "uri" => ""
930     ),
931     "blogwise" => array(
932     "icon" => "blogwise",
933     "title" => "Blogwise",
934     "rule" => array(
935     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
936     ),
937     "uri" => ""
938     ),
939     "boardreader" => array(
940     "icon" => "boardreader",
941     "title" => "BoardReader",
942     "rule" => array(
943     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
944     ),
945     "uri" => "http://www.boardreader.com"
946     ),
947     "bobby" => array(
948     "icon" => "bobby",
949     "title" => "Bobby",
950     "rule" => array(
951     "bobby[ /]([0-9.]{1,10})" => "\\1"
952     ),
953     "uri" => ""
954     ),
955     "boitho" => array(
956     "icon" => "robot",
957     "title" => "Boitho",
958     "rule" => array(
959     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
960     ),
961     "uri" => ""
962     ),
963     "booch" => array(
964     "icon" => "robot",
965     "title" => "Booch",
966     "rule" => array(
967     "^booch[_ /]([0-9.]{1,10})" => "\\1"
968     ),
969     "uri" => ""
970     ),
971     "book" => array(
972     "icon" => "book",
973     "title" => "Bookmark",
974     "rule" => array(
975     "http://www\.bookmark\.ne\.jp" => ""
976     ),
977     "uri" => ""
978     ),
979     "bookdog" => array(
980     "icon" => "bookdog",
981     "title" => "Bookdog",
982     "rule" => array(
983     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
984     ),
985     "uri" => ""
986     ),
987     "bordermanager" => array(
988     "icon" => "bordermanager",
989     "title" => "Border Manager",
990     "rule" => array(
991     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
992     ),
993     "uri" => ""
994     ),
995     "botonparade" => array(
996     "icon" => "botonparade",
997     "title" => "Bot on Parade",
998     "rule" => array(
999     "BotOnParade" => ""
1000     ),
1001     "uri" => "http://www.bots-on-para.de/bot.html"
1002     ),
1003     "botje" => array(
1004     "icon" => "botje",
1005     "title" => "Botje",
1006     "rule" => array(
1007     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1008     ),
1009     "uri" => "http://www.botje.com/"
1010     ),
1011     "bottomfeeder" => array(
1012     "icon" => "bottomfeeder",
1013     "title" => "BottomFeeder",
1014     "rule" => array(
1015     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1016     ),
1017     "uri" => ""
1018     ),
1019     "browseremulator" => array(
1020     "icon" => "browseremulator",
1021     "title" => "BrowserEmulator",
1022     "rule" => array(
1023     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1024     ),
1025     "uri" => "http://www.dejavu.org/emulator.htm"
1026     ),
1027     "browsershots" => array(
1028     "icon" => "browsershots",
1029     "title" => "Browsershots",
1030     "rule" => array(
1031     "Browsershots URL Check" => ""
1032     ),
1033     "uri" => "http://browsershots.org"
1034     ),
1035     "browserspy" => array(
1036     "icon" => "robot",
1037     "title" => "BrowserSpy",
1038     "rule" => array(
1039     "BrowserSpy" => ""
1040     ),
1041     "uri" => ""
1042     ),
1043     "bruinbot" => array(
1044     "icon" => "robot",
1045     "title" => "BruinBot",
1046     "rule" => array(
1047     "BruinBot" => ""
1048     ),
1049     "uri" => ""
1050     ),
1051     "bruno" => array(
1052     "icon" => "robot",
1053     "title" => "Bruno",
1054     "rule" => array(
1055     "^Bruno" => ""
1056     ),
1057     "uri" => ""
1058     ),
1059     "btbot" => array(
1060     "icon" => "btbot",
1061     "title" => "BitTorrent",
1062     "rule" => array(
1063     "BTbot/([0-9.]{1,10})" => "\\1"
1064     ),
1065     "uri" => ""
1066     ),
1067     "builtwith" => array(
1068     "icon" => "builtwith",
1069     "title" => "BuiltWith",
1070     "rule" => array(
1071     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1072     ),
1073     "uri" => "http://builtwith.com/bot.html"
1074     ),
1075     "bulkfeeds" => array(
1076     "icon" => "robot",
1077     "title" => "Bulkfeeds",
1078     "rule" => array(
1079     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1080     ),
1081     "uri" => ""
1082     ),
1083     "burf" => array(
1084     "icon" => "burf",
1085     "title" => "Burf.com",
1086     "rule" => array(
1087     "^Norbert the Spider" => ""
1088     ),
1089     "uri" => "http://www.burf.com/"
1090     ),
1091     "butch" => array(
1092     "icon" => "robot",
1093     "title" => "Butch",
1094     "rule" => array(
1095     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1096     ),
1097     "uri" => ""
1098     ),
1099     "buzzlogic" => array(
1100     "icon" => "buzzlogic",
1101     "title" => "Buzzlogic",
1102     "rule" => array(
1103     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1104     ),
1105     "uri" => "http://www.buzzlogic.com"
1106     ),
1107     "catchbot" => array(
1108     "icon" => "catchbot",
1109     "title" => "CatchBot",
1110     "rule" => array(
1111     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1112     ),
1113     "uri" => "http://www.catchbot.com"
1114     ),
1115     "camdiscover" => array(
1116     "icon" => "robot",
1117     "title" => "Camdiscover",
1118     "rule" => array(
1119     "^Camcrawler" => ""
1120     ),
1121     "uri" => ""
1122     ),
1123     "cazoodle" => array(
1124     "icon" => "cazoodle",
1125     "title" => "Cazoodle",
1126     "rule" => array(
1127     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1128     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1129     ),
1130     "uri" => "http://www.cazoodle.com/cazoodlebot"
1131     ),
1132     "ccbot" => array(
1133     "icon" => "robot",
1134     "title" => "ccBot",
1135     "rule" => array(
1136     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1137     ),
1138     "uri" => "http://www.commoncrawl.org/bot.html"
1139     ),
1140     "ccgcrawl" => array(
1141     "icon" => "robot",
1142     "title" => "CCGCrawl",
1143     "rule" => array(
1144     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.myworkbase.com/bot.html"
1147     ),
1148     "cerberian" => array(
1149     "icon" => "robot",
1150     "title" => "Cerberian Drtrs",
1151     "rule" => array(
1152     "^Cerberian Drtrs" => ""
1153     ),
1154     "uri" => ""
1155     ),
1156     "cfnetwork" => array(
1157     "icon" => "robot",
1158     "title" => "CFNetwork", // title follows this entry's own key and rule
1159     "rule" => array(
1160     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1161     ),
1162     "uri" => "http://www.cfnetwork.be/"
1163     ),
1164     "charlotte" => array(
1165     "icon" => "charlotte",
1166     "title" => "Charlotte",
1167     "rule" => array(
1168     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1169     ),
1170     "uri" => ""
1171     ),
1172     "cirilizator" => array(
1173     "icon" => "cirilizator",
1174     "title" => "Cirilizator",
1175     "rule" => array(
1176     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1177     ),
1178     "uri" => ""
1179     ),
1180     "claria" => array(
1181     "icon" => "robot",
1182     "title" => "Claria",
1183     "rule" => array(
1184     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1185     "(Claria|Diamond)(Bot)" => ""
1186     ),
1187     "uri" => ""
1188     ),
1189     "claymont" => array(
1190     "icon" => "claymont",
1191     "title" => "Claymont",
1192     "rule" => array(
1193     "claymont\.com" => "",
1194     "OliverPerry" => ""
1195     ),
1196     "uri" => "http://www.claymont.com"
1197     ),
1198     "clush" => array(
1199     "icon" => "clush",
1200     "title" => "Clush",
1201     "rule" => array(
1202     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1203     ),
1204     "uri" => ""
1205     ),
1206     "cmsworldmap" => array(
1207     "icon" => "cmsworldmap",
1208     "title" => "CMS World Map",
1209     "rule" => array(
1210     "cmsworldmap" => ""
1211     ),
1212     "uri" => "http://www.cmsworldmap.com/"
1213     ),
1214     "cobion" => array(
1215     "icon" => "robot",
1216     "title" => "Cobion",
1217     "rule" => array(
1218     " (QXW03018|obot)\)" => ""
1219     ),
1220     "uri" => ""
1221     ),
1222     "coccoc" => array(
1223 matthys 287 "icon" => "coccoc",
1224 matthys 209 "title" => "Coccoc",
1225 joku 63 "rule" => array(
1226     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1227     ),
1228 matthys 287 "uri" => "http://help.coccoc.com"
1229 joku 63 ),
1230     "coldfusion" => array(
1231     "icon" => "coldfusion",
1232     "title" => "ColdFusion",
1233     "rule" => array(
1234     "^coldfusion" => ""
1235     ),
1236     "uri" => ""
1237     ),
1238     "combine" => array(
1239     "icon" => "robot",
1240     "title" => "Combine",
1241     "rule" => array(
1242     "Combine[ /]([0-9.]{1,10})" => "\\1"
1243     ),
1244     "uri" => ""
1245     ),
1246     "combot" => array(
1247     "icon" => "robot",
1248     "title" => "comBot",
1249     "rule" => array(
1250     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1251     ),
1252     "uri" => ""
1253     ),
1254     "comet" => array(
1255     "icon" => "comet",
1256     "title" => "Comet",
1257     "rule" => array(
1258     "cometsearch@cometsystems" => ""
1259     ),
1260     "uri" => ""
1261     ),
1262     "commerobo" => array(
1263     "icon" => "robot",
1264     "title" => "Commerobo",
1265     "rule" => array(
1266     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1267     ),
1268     "uri" => ""
1269     ),
1270     "comrite" => array(
1271     "icon" => "robot",
1272     "title" => "ComRite",
1273     "rule" => array(
1274     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1275     ),
1276     "uri" => "http://www.comrite.com/"
1277     ),
1278     "convera" => array(
1279     "icon" => "convera",
1280     "title" => "Convera",
1281     "rule" => array(
1282     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1283     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1284     ),
1285     "uri" => ""
1286     ),
1287     "coolbot" => array(
1288     "icon" => "robot",
1289     "title" => "CoolBot",
1290     "rule" => array(
1291     "^CoolBot" => ""
1292     ),
1293     "uri" => ""
1294     ),
1295     "cosmix" => array(
1296     "icon" => "robot",
1297     "title" => "Cosmix",
1298     "rule" => array(
1299     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1300     ),
1301     "uri" => ""
1302     ),
1303     "cosmos" => array(
1304     "icon" => "robot",
1305     "title" => "Cosmos",
1306     "rule" => array(
1307     "^cosmos" => ""
1308     ),
1309     "uri" => ""
1310     ),
1311     "cosmoty" => array(
1312     "icon" => "robot",
1313     "title" => "Cosmoty",
1314     "rule" => array(
1315     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1316     ),
1317     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1318     ),
1319     "covario" => array(
1320     "icon" => "covario",
1321     "title" => "Covario",
1322     "rule" => array(
1323     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1324     ),
1325     "uri" => "http://www.covario.com/ids/"
1326     ),
1327     "creativecommons" => array(
1328     "icon" => "creativecommons",
1329     "title" => "Creative Commons",
1330     "rule" => array(
1331     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1332     ),
1333     "uri" => ""
1334     ),
1335     "cscrawler" => array(
1336     "icon" => "robot",
1337     "title" => "CsCrawler",
1338     "rule" => array(
1339     "CsCrawler" => ""
1340     ),
1341     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1342     ),
1343 joku 111 "jigsaw" => array(
1344     "icon" => "jigsaw",
1345     "title" => "Jigsaw",
1346     "rule" => array(
1347     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1348     ),
1349     "uri" => "http://jigsaw.w3.org/css-validator/"
1350     ),
1351 joku 63 "csscheck" => array(
1352     "icon" => "w3c",
1353     "title" => "W3C CSS Validator",
1354     "rule" => array(
1355     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1356     ),
1357     "uri" => "http://jigsaw.w3.org/css-validator/"
1358     ),
1359     "custo" => array(
1360     "icon" => "robot",
1361     "title" => "Custo",
1362     "rule" => array(
1363     "Custo[ /]([0-9.]{1,10})" => "\\1"
1364     ),
1365     "uri" => ""
1366     ),
1367     "cybernavi" => array(
1368     "icon" => "robot",
1369     "title" => "CyberNavi",
1370     "rule" => array(
1371     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1372     ),
1373     "uri" => ""
1374     ),
1375     "cyberpatrol" => array(
1376     "icon" => "cyberpatrol",
1377     "title" => "CyberPatrol",
1378     "rule" => array(
1379     "^CyberPatrol" => ""
1380     ),
1381     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1382     ),
1383     "cyberz" => array(
1384     "icon" => "cyberz",
1385     "title" => "Cyberz",
1386     "rule" => array(
1387     "Cyberz Communication Agent" => ""
1388     ),
1389     "uri" => ""
1390     ),
1391     "cydral" => array(
1392     "icon" => "robot",
1393     "title" => "Cydral",
1394     "rule" => array(
1395     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1396     ),
1397     "uri" => ""
1398     ),
1399     "cynthia" => array(
1400     "icon" => "cynthia",
1401     "title" => "Cynthia Says",
1402     "rule" => array(
1403     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1404     ),
1405     "uri" => ""
1406     ),
1407     "d4x" => array(
1408     "icon" => "d4x",
1409     "title" => "Downloader for X",
1410     "rule" => array(
1411     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1412     ),
1413     "uri" => ""
1414     ),
1415     "da" => array(
1416     "icon" => "da",
1417     "title" => "DA",
1418     "rule" => array(
1419     "^DA[ /]([0-9.]{1,10})" => "\\1"
1420     ),
1421     "uri" => ""
1422     ),
1423     "daum" => array(
1424     "icon" => "daum",
1425     "title" => "DAUM",
1426     "rule" => array(
1427     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1428     "DAUM Web Robot" => "",
1429     "Daum Communications Corp" => "",
1430     "EDI[ /]([0-9.]{1,10})" => "\\1",
1431     "Edacious.*Intelligent Web Robot" => "",
1432     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1433     ),
1434     "uri" => "http://ws.daum.net/"
1435     ),
1436     "daypop" => array(
1437     "icon" => "robot",
1438     "title" => "Daypop",
1439     "rule" => array(
1440     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1441     ),
1442     "uri" => ""
1443     ),
1444     "delfi" => array(
1445     "icon" => "delfi",
1446     "title" => "Delfi",
1447     "rule" => array(
1448     "crawl at delfi dot lt" => ""
1449     ),
1450     "uri" => ""
1451     ),
1452     "depspid" => array(
1453     "icon" => "depspid",
1454     "title" => "DepSpid",
1455     "rule" => array(
1456     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1457     ),
1458     "uri" => ""
1459     ),
1460     "devonagent" => array(
1461     "icon" => "devonagent",
1462     "title" => "DEVONagent",
1463     "rule" => array(
1464     "DEVONtech" => ""
1465     ),
1466     "uri" => ""
1467     ),
1468     "diffbot" => array(
1469     "icon" => "diffbot",
1470     "title" => "Diffbot",
1471     "rule" => array(
1472     " Diffbot" => ""
1473     ),
1474     "uri" => "http://www.diffbot.com"
1475     ),
1476     "diribot" => array(
1477     "icon" => "diribot",
1478     "title" => "Diri",
1479     "rule" => array(
1480     "diribot" => ""
1481     ),
1482     "uri" => "http://www.diri.bg"
1483     ),
1484     "directhit" => array(
1485     "icon" => "robot",
1486     "title" => "Direct Hit",
1487     "rule" => array(
1488     "EZResult -- Internet Search Engine" => ""
1489     ),
1490     "uri" => "http://www.directhit.com"
1491     ),
1492     "disco" => array(
1493     "icon" => "disco",
1494 matthys 209 "title" => "Disco",
1495 joku 63 "rule" => array(
1496     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1497     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1498     "disco-crawl@discoveryengine.com" => ""
1499     ),
1500     "uri" => "http://www.discoveryengine.com/"
1501     ),
1502     "discopump" => array(
1503     "icon" => "robot",
1504     "title" => "DISCo Pump",
1505     "rule" => array(
1506     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1507     ),
1508     "uri" => ""
1509     ),
1510     "dkimreputation" => array(
1511     "icon" => "dkimreputation",
1512     "title" => "DKIM Reputation",
1513     "rule" => array(
1514     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1515     ),
1516     "uri" => "http://www.dkim-reputation.org"
1517     ),
1518     "dnsdigger" => array(
1519     "icon" => "dnsdigger",
1520     "title" => "DNS-Digger",
1521     "rule" => array(
1522     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1523     ),
1524     "uri" => "http://www.dnsdigger.com"
1525     ),
1526     "dnsvalidation" => array(
1527     "icon" => "dnsvalidation",
1528     "title" => "DNS Validation",
1529     "rule" => array(
1530     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1531     ),
1532     "uri" => "http://www.dnsvalidation.com/"
1533     ),
1534     "doctorhtml" => array(
1535     "icon" => "robot",
1536     "title" => "DoctorHTML",
1537     "rule" => array(
1538     "Doctor[ \-]?HTML" => ""
1539     ),
1540     "uri" => ""
1541     ),
1542     "dolphin" => array(
1543     "icon" => "dolphin",
1544     "title" => "Dolphin",
1545     "rule" => array(
1546     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1547     ),
1548     "uri" => "http://telehouse.ru/crawler.html"
1549     ),
1550     "domaindatei" => array(
1551     "icon" => "robot",
1552     "title" => "Domaindatei",
1553     "rule" => array(
1554     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1555     ),
1556     "uri" => ""
1557     ),
1558     "dontbuylists" => array(
1559     "icon" => "dontbuylists",
1560     "title" => "Dontbuylists",
1561     "rule" => array(
1562     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1563     ),
1564     "uri" => "http://www.dontbuylists.com"
1565     ),
1566     "dotbot" => array(
1567     "icon" => "robot",
1568     "title" => "DotBot",
1569     "rule" => array(
1570     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1571     ),
1572     "uri" => "http://www.dotnetdotcom.org"
1573     ),
// DoWeb: matches user agents that begin with the literal host name
// "www.doweb.co.uk". No version is captured, so the note is empty.
"doweb" => array(
  "icon" => "doweb",
  "title" => "DoWeb",
  "rule" => array(
    // Dots are escaped so they match a literal "." only; an unescaped "."
    // is a regex wildcard and would accept any character in that position.
    "^www\.doweb\.co\.uk" => ""
  ),
  "uri" => "http://www.doweb.co.uk/"
),
1582     "downforeveryoneorjustme" => array(
1583     "icon" => "downforeveryoneorjustme",
1584     "title" => "Down for everyone or just me",
1585     "rule" => array(
1586     "downforeveryoneorjustme" => ""
1587     ),
1588     "uri" => "http://www.downforeveryoneorjustme.com"
1589     ),
1590     "downloadninja" => array(
1591     "icon" => "robot",
1592     "title" => "Download Ninja",
1593     "rule" => array(
1594     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1595     ),
1596     "uri" => ""
1597     ),
1598     "drupal" => array(
1599     "icon" => "drupal",
1600     "title" => "Drupal",
1601     "rule" => array(
1602     "^Drupal" => ""
1603     ),
1604     "uri" => ""
1605     ),
1606     "dsns" => array(
1607     "icon" => "robot",
1608     "title" => "DSNS Scanner",
1609     "rule" => array(
1610     "^DSNS" => ""
1611     ),
1612     "uri" => ""
1613     ),
1614     "dtsagent" => array(
1615     "icon" => "robot",
1616     "title" => "DTS Agent",
1617     "rule" => array(
1618     "DTS Agent" => ""
1619     ),
1620     "uri" => ""
1621     ),
1622     "earthcom" => array(
1623     "icon" => "earthcom",
1624     "title" => "Earthcom",
1625     "rule" => array(
1626     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1627     ),
1628     "uri" => ""
1629     ),
1630     "ebay" => array(
1631     "icon" => "ebay",
1632     "title" => "eBay",
1633     "rule" => array(
1634     "eBay Relevance Ad Crawler" => ""
1635     ),
1636     "uri" => ""
1637     ),
1638     "echo" => array(
1639     "icon" => "robot",
1640     "title" => "Echo.com",
1641     "rule" => array(
1642     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1643     ),
1644     "uri" => "http://www.echo.com/"
1645     ),
1646     "eert" => array(
1647     "icon" => "robot",
1648 matthys 209 "title" => "Eert",
1649 joku 63 "rule" => array(
1650     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1651     ),
1652     "uri" => "http://bot.eert.net"
1653     ),
1654     "eknip" => array(
1655     "icon" => "eknip",
1656     "title" => "E-Knip",
1657     "rule" => array(
1658     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1659     ),
1660     "uri" => ""
1661     ),
1662     "zoominfo" => array(
1663     "icon" => "zoominfo",
1664 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1665 joku 63 "rule" => array(
1666     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1667     ),
1668     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1669     ),
1670     "emeraldshield" => array(
1671     "icon" => "emeraldshield",
1672     "title" => "EmeraldShield",
1673     "rule" => array(
1674     "^EmeraldShield" => ""
1675     ),
1676     "uri" => ""
1677     ),
1678     "empas" => array(
1679     "icon" => "empas",
1680     "title" => "Empas",
1681     "rule" => array(
1682     "DigExt; empas\)$" => "",
1683     "^EMPAS[_\-]ROBOT" => ""
1684     ),
1685     "uri" => ""
1686     ),
1687     "entireweb" => array(
1688     "icon" => "entireweb",
1689     "title" => "Entireweb",
1690     "rule" => array(
1691     "Speedy[ ]?Spider" => ""
1692     ),
1693     "uri" => ""
1694     ),
1695     "envolk" => array(
1696     "icon" => "envolk",
1697     "title" => "Envolk",
1698     "rule" => array(
1699     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1700     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1701     ),
1702     "uri" => ""
1703     ),
1704     "esnet" => array(
1705     "icon" => "robot",
1706     "title" => "ES.NET",
1707     "rule" => array(
1708     "ES.NET Crawler[ /]([0-9.]{1,10})" => "\\1"
1709     ),
1710     "uri" => ""
1711     ),
1712     "estyle" => array(
1713     "icon" => "estyle",
1714     "title" => "eStyle Search",
1715     "rule" => array(
1716     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1717     ),
1718     "uri" => ""
1719     ),
1720     "eurip" => array(
1721     "icon" => "robot",
1722     "title" => "Eurip",
1723     "rule" => array(
1724     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1725     ),
1726     "uri" => "http://www.eurip.com"
1727     ),
1728     "eurodirectory" => array(
1729     "icon" => "robot",
1730     "title" => "Euro Directory",
1731     "rule" => array(
1732     "www\.euro-directory\.com" => ""
1733     ),
1734     "uri" => "http://www.euro-directory.com/"
1735     ),
1736     "euroseek" => array(
1737     "icon" => "euroseek",
1738     "title" => "EuroSeek",
1739     "rule" => array(
1740     "Arachnoidea" => ""
1741     ),
1742     "uri" => ""
1743     ),
1744     "evaal" => array(
1745     "icon" => "evaal",
1746     "title" => "Evaal",
1747     "rule" => array(
1748     "^EvaalSE" => ""
1749     ),
1750     "uri" => "http://www.evaal.com/"
1751     ),
1752     "eventax" => array(
1753     "icon" => "eventax",
1754     "title" => "Eventax",
1755     "rule" => array(
1756     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1757     ),
1758     "uri" => "http://www.eventax.de/"
1759     ),
1760     "everbee" => array(
1761     "icon" => "everbee",
1762     "title" => "Everbee",
1763     "rule" => array(
1764     "EverbeeCrawler" => ""
1765     ),
1766     "uri" => ""
1767     ),
// Everest: matches "Everest-Vulcan Inc." followed by "/" or a space and a
// dotted version number, which is captured as group 1.
"everest" => array(
  "icon" => "everest",
  "title" => "Everest",
  "rule" => array(
    // The "." after "Inc" is escaped so it matches a literal period rather
    // than acting as a single-character wildcard.
    "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
1776     "exabot" => array(
1777     "icon" => "exabot",
1778     "title" => "ExaBot",
1779     "rule" => array(
1780     "^NG[ /]([0-9.]{1,10})" => "\\1",
1781     "Exabot/([0-9.]{1,10})" => "\\1",
1782     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1783     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1784     "ExaBot-Thumbnails" => ""
1785     ),
1786     "uri" => "http://www.exabot.com/go/robot"
1787     ),
1788     "exactseek" => array(
1789     "icon" => "exactseek",
1790     "title" => "ExactSeek",
1791     "rule" => array(
1792     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1793     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1794     ),
1795     "uri" => "http://www.exactseek.com/"
1796     ),
1797     "excite" => array(
1798     "icon" => "excite",
1799     "title" => "Excite",
1800     "rule" => array(
1801     "Architext[ \-]?Spider" => ""
1802     ),
1803     "uri" => ""
1804     ),
1805     "execrawl" => array(
1806     "icon" => "robot",
1807     "title" => "Execrawl",
1808     "rule" => array(
1809     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1810     "Execrawl" => ""
1811     ),
1812     "uri" => ""
1813     ),
1814     "expertmonitor" => array(
1815     "icon" => "robot",
1816     "title" => "ExpertMonitor",
1817     "rule" => array(
1818     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1819     ),
1820     "uri" => ""
1821     ),
1822     "explorerrss" => array(
1823     "icon" => "robot",
1824     "title" => "Explorer RSS",
1825     "rule" => array(
1826     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1827     ),
1828     "uri" => ""
1829     ),
1830     "ezooms" => array(
1831     "icon" => "robot",
1832     "title" => "Ezooms",
1833     "rule" => array(
1834     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1835     ),
1836     "uri" => ""
1837     ),
1838     "facebook" => array(
1839     "icon" => "facebook",
1840     "title" => "Facebook",
1841     "rule" => array(
1842     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1843     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1844     "^facebook" => ""
1845     ),
1846     "uri" => "http://www.facebook.com/"
1847     ),
1848     "fast" => array(
1849     "icon" => "fast",
1850     "title" => "Fast",
1851     "rule" => array(
1852     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1853     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1854     "^Fast Crawler" => "",
1855     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1856     ),
1857     "uri" => "http://www.alltheweb.com/"
1858     ),
1859     "fastbuzz" => array(
1860     "icon" => "fastbuzz",
1861     "title" => "Fastbuzz",
1862     "rule" => array(
1863     "^fastbuzz\.com" => ""
1864     ),
1865     "uri" => ""
1866     ),
1867     "favorg" => array(
1868     "icon" => "robot",
1869     "title" => "FavOrg",
1870     "rule" => array(
1871     "^FavOrg" => ""
1872     ),
1873     "uri" => ""
1874     ),
1875     "favorstar" => array(
1876     "icon" => "favorstar",
1877 matthys 209 "title" => "Favorstar",
1878 joku 63 "rule" => array(
1879     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1880     ),
1881     "uri" => "http://favorstar.com/bot.html"
1882     ),
1883     "faxo" => array(
1884     "icon" => "robot",
1885     "title" => "Faxo",
1886     "rule" => array(
1887     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1888     ),
1889     "uri" => "http://www.faxo.com/"
1890     ),
1891     "fdse" => array(
1892     "icon" => "robot",
1893     "title" => "FDSE Robot",
1894     "rule" => array(
1895     "FDSE[ \-]?robot" => ""
1896     ),
1897     "uri" => ""
1898     ),
1899     "feedback" => array(
1900     "icon" => "robot",
1901     "title" => "FeedBack",
1902     "rule" => array(
1903     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1904     ),
1905     "uri" => ""
1906     ),
1907     "feedburner" => array(
1908     "icon" => "feedburner",
1909     "title" => "FeedBurner",
1910     "rule" => array(
1911     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1912     ),
1913     "uri" => ""
1914     ),
1915     "feeddemon" => array(
1916     "icon" => "feeddemon",
1917     "title" => "FeedDemon",
1918     "rule" => array(
1919     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1920     ),
1921     "uri" => ""
1922     ),
1923     "feedfind" => array(
1924     "icon" => "feedfind",
1925     "title" => "FeedFind",
1926     "rule" => array(
1927     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1928     ),
1929     "uri" => ""
1930     ),
1931     "feedonfeeds" => array(
1932     "icon" => "robot",
1933     "title" => "Feed On Feeds",
1934     "rule" => array(
1935     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1936     ),
1937     "uri" => ""
1938     ),
1939     "feedparser" => array(
1940     "icon" => "robot",
1941     "title" => "Feedparser",
1942     "rule" => array(
1943     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1944     "FeedParser" => ""
1945     ),
1946     "uri" => ""
1947     ),
1948     "feedreader" => array(
1949     "icon" => "feedreader",
1950     "title" => "Feedreader",
1951     "rule" => array(
1952     "^Feedreader" => ""
1953     ),
1954     "uri" => ""
1955     ),
1956     "feedserver" => array(
1957     "icon" => "robot",
1958     "title" => "FeedServer",
1959     "rule" => array(
1960     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
1961     ),
1962     "uri" => ""
1963     ),
1964     "feedster" => array(
1965     "icon" => "feedster",
1966     "title" => "Feedster",
1967     "rule" => array(
1968     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
1969     ),
1970     "uri" => ""
1971     ),
1972     "feedvalidator" => array(
1973     "icon" => "feedvalidator",
1974     "title" => "Feed Validator",
1975     "rule" => array(
1976     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
1977     ),
1978     "uri" => ""
1979     ),
1980     "fdm" => array(
1981     "icon" => "robot",
1982     "title" => "Free Download Manager",
1983     "rule" => array(
1984     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
1985     ),
1986     "uri" => ""
1987     ),
1988     "filangy" => array(
1989     "icon" => "robot",
1990     "title" => "Filangy",
1991     "rule" => array(
1992     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
1993     ),
1994     "uri" => "http://www.filangy.com/"
1995     ),
1996     "findanisp" => array(
1997     "icon" => "robot",
1998     "title" => "FindAnISP",
1999     "rule" => array(
2000     "FindAnISP" => ""
2001     ),
2002     "uri" => "http://www.findanisp.com/"
2003     ),
2004     "findengines" => array(
2005     "icon" => "findengines",
2006     "title" => "FindEngines",
2007     "rule" => array(
2008     "FindEngines! Bot" => ""
2009     ),
2010     "uri" => ""
2011     ),
2012     "findexa" => array(
2013     "icon" => "findexa",
2014     "title" => "Findexa",
2015     "rule" => array(
2016     "Findexa Crawler" => ""
2017     ),
2018     "uri" => ""
2019     ),
2020     "findlinks" => array(
2021     "icon" => "findlinks",
2022     "title" => "FindLinks",
2023     "rule" => array(
2024     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2025     "^FindLinks" => ""
2026     ),
2027     "uri" => ""
2028     ),
// Findoor: matches user agents that begin with "findoor", optionally
// followed by "-Bot". The pattern contains no version group.
"findoor" => array(
  "icon" => "findoor",
  "title" => "Findoor",
  "rule" => array(
    // The only group is the optional "-Bot" suffix, not a version, and it is
    // unset when the suffix is absent. The note is therefore left empty
    // instead of referencing \1.
    "^findoor(-Bot)?" => ""
  ),
  "uri" => ""
),
2037     "firefly" => array(
2038     "icon" => "firefly",
2039     "title" => "Firefly",
2040     "rule" => array(
2041     "Firefly" => ""
2042     ),
2043     "uri" => ""
2044     ),
2045     "flashget" => array(
2046     "icon" => "flashget",
2047     "title" => "FlashGet",
2048     "rule" => array(
2049     "^FlashGet" => ""
2050     ),
2051     "uri" => ""
2052     ),
2053     "flatland" => array(
2054     "icon" => "flatland",
2055     "title" => "Flatland",
2056     "rule" => array(
2057     "^flatlandbot" => ""
2058     ),
2059     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2060     ),
2061     "flickbot" => array(
2062     "icon" => "flickbot",
2063     "title" => "FlickBot",
2064     "rule" => array(
2065     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2066     ),
2067     "uri" => ""
2068     ),
2069     "flightdeckreports" => array(
2070     "icon" => "flightdeckreports",
2071     "title" => "Flight Deck Reports",
2072     "rule" => array(
2073     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2074     ),
2075     "uri" => "http://www.flightdeckreports.com/"
2076     ),
2077     "forex" => array(
2078     "icon" => "robot",
2079     "title" => "Forex",
2080     "rule" => array(
2081     "^Forex Trading Network Organization" => ""
2082     ),
2083     "uri" => "http://www.netforex.org/"
2084     ),
// Freshmeat: matches the two URL-validator user agents ("fmII URL validator"
// and "freshmeat.net URL validator"), each followed by "/" or a space and a
// dotted version number captured as group 1.
"freshmeat" => array(
  "icon" => "freshmeat",
  "title" => "Freshmeat",
  "rule" => array(
    "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
    // The dot in the host name is escaped so it only matches a literal ".".
    "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.freshmeat.net/"
),
2094     "friend" => array(
2095     "icon" => "friend",
2096     "title" => "Friend",
2097     "rule" => array(
2098     "www\.friend\.fr" => ""
2099     ),
2100     "uri" => "http://www.friend.fr/"
2101     ),
2102     "frontier" => array(
2103     "icon" => "frontier",
2104     "title" => "Frontier",
2105     "rule" => array(
2106     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2107     ),
2108     "uri" => ""
2109     ),
2110     "fyberspider" => array(
2111     "icon" => "robot",
2112     "title" => "FyberSpider",
2113     "rule" => array(
2114     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2115     ),
2116     "uri" => "http://www.fyberspider.com/"
2117     ),
2118     "gaisbot" => array(
2119     "icon" => "gais",
2120     "title" => "Gaisbot",
2121     "rule" => array(
2122     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2123     ),
2124     "uri" => ""
2125     ),
// Galaxy: matches either "GalaxyBot" with a version (captured as group 1) or
// any user agent that mentions the literal host name "www.galaxy.com".
"galaxy" => array(
  "icon" => "galaxy",
  "title" => "Galaxy",
  "rule" => array(
    "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
    // Dots are escaped; unescaped they would match any character, so look-alike
    // strings such as "wwwXgalaxyYcom" would be accepted as well.
    "www\.galaxy\.com" => ""
  ),
  "uri" => "http://www.galaxy.com/"
),
2135     "gamespy" => array(
2136     "icon" => "gamespy",
2137     "title" => "GameSpy",
2138     "rule" => array(
2139     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2140     ),
2141     "uri" => ""
2142     ),
2143     "garlik" => array(
2144     "icon" => "garlik",
2145     "title" => "Garlik",
2146     "rule" => array(
2147     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2148     ),
2149     "uri" => "http://garlik.com/"
2150     ),
2151     "gdesktop" => array(
2152     "icon" => "gdesktop",
2153     "title" => "Google Desktop",
2154     "rule" => array(
2155     "compatible; Google Desktop" => ""
2156     ),
2157     "uri" => ""
2158     ),
2159     "genome" => array(
2160     "icon" => "robot",
2161     "title" => "Genome Machine",
2162     "rule" => array(
2163     "Genome[ \-]?Machine" => ""
2164     ),
2165     "uri" => ""
2166     ),
2167     "geohash" => array(
2168     "icon" => "geohash",
2169     "title" => "Geohash",
2170     "rule" => array(
2171     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2172     ),
2173     "uri" => "http://geohash.org/"
2174     ),
2175     "geona" => array(
2176     "icon" => "robot",
2177     "title" => "Geona",
2178     "rule" => array(
2179     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2180     ),
2181     "uri" => ""
2182     ),
2183     "geoblog" => array(
2184     "icon" => "robot",
2185     "title" => "The World as a Blog",
2186     "rule" => array(
2187     "The World as a Blog" => ""
2188     ),
2189     "uri" => ""
2190     ),
2191     "geourl" => array(
2192     "icon" => "geourl",
2193     "title" => "GeoUrl",
2194     "rule" => array(
2195     "geourl[ /]([0-9.]{1,10})" => "\\1",
2196     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2197     ),
2198     "uri" => ""
2199     ),
2200     "getnetwise" => array(
2201     "icon" => "robot",
2202     "title" => "GetNetWise",
2203     "rule" => array(
2204     " Crayon Crawler" => ""
2205     ),
2206     "uri" => ""
2207     ),
2208     "getright" => array(
2209     "icon" => "getright",
2210     "title" => "GetRight",
2211     "rule" => array(
2212     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2213     ),
2214     "uri" => ""
2215     ),
2216     "getsmart" => array(
2217     "icon" => "getsmart",
2218     "title" => "GetSmart",
2219     "rule" => array(
2220     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2221     ),
2222     "uri" => ""
2223     ),
2224     "ginger" => array(
2225     "icon" => "ginger",
2226     "title" => "GingerCrawler",
2227     "rule" => array(
2228     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2229     ),
2230     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2231     ),
2232     "gigabot" => array(
2233     "icon" => "gigablast",
2234     "title" => "Gigablast",
2235     "rule" => array(
2236     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2237     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2238     ),
2239     "uri" => ""
2240     ),
2241     "girafabot" => array(
2242     "icon" => "girafa",
2243     "title" => "Girafa",
2244     "rule" => array(
2245     "Girafabot" => ""
2246     ),
2247     "uri" => ""
2248     ),
2249     "globalspec" => array(
2250     "icon" => "globalspec",
2251     "title" => "GlobalSpec",
2252     "rule" => array(
2253     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2254     ),
2255     "uri" => ""
2256     ),
2257     "glucose" => array(
2258     "icon" => "glucose",
2259     "title" => "Glucose",
2260     "rule" => array(
2261     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2262     ),
2263     "uri" => ""
2264     ),
2265     "gnomit" => array(
2266     "icon" => "gnomit",
2267     "title" => "Gnomit",
2268     "rule" => array(
2269     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2270     ),
2271     "uri" => "http://www.gnomit.com/",
2272     ),
2273     "goforit" => array(
2274     "icon" => "goforit",
2275     "title" => "GoForIt",
2276     "rule" => array(
2277     "^GoForIt\.com" => "",
2278     "^GOFORITBOT" => ""
2279     ),
2280     "uri" => ""
2281     ),
2282     "goguides" => array(
2283     "icon" => "robot",
2284     "title" => "GoGuides",
2285     "rule" => array(
2286     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2287     ),
2288     "uri" => "http://www.goguides.org/"
2289     ),
2290     // Needs to be before google for correct detection
2291     "mediapartners" => array(
2292     "icon" => "google",
2293     "title" => "Mediapartners",
2294     "rule" => array (
2295     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2296     "Mediapartners-Google" => ""
2297     ),
2298     "uri" => ""
2299     ),
2300     "google" => array(
2301     "icon" => "google",
2302     "title" => "Google",
2303     "rule" => array (
2304     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2305     "Googl(e|ebot)(-Image)?/" => "",
2306     "^gsa-crawler" => "",
2307     "Google Web Preview" => ""
2308     ),
2309     "uri" => "http://www.google.com/"
2310     ),
2311     "googlesitemaps" => array(
2312     "icon" => "google",
2313     "title" => "Google-Sitemaps",
2314     "rule" => array (
2315     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2316     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2317     "Googl(e|ebot)(-Sitemaps)?/" => ""
2318     ),
2319     "uri" => ""
2320     ),
2321     "googlemobile" => array(
2322     "icon" => "google",
2323     "title" => "Google-Mobile",
2324     "rule" => array (
2325     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2326     "Googl(e|ebot)(-Mobile)?/" => ""
2327     ),
2328     "uri" => ""
2329     ),
2330     "googleads" => array(
2331     "icon" => "google",
2332     "title" => "Google-AdsBot",
2333     "rule" => array (
2334     "^AdsBot-Google" => "",
2335     ),
2336     "uri" => ""
2337     ),
2338     "googlefeeds" => array(
2339     "icon" => "google",
2340     "title" => "Google-Feedfetcher",
2341     "rule" => array (
2342     "^Feedfetcher-Google" => "",
2343     ),
2344     "uri" => ""
2345     ),
2346     "googlverification" => array(
2347     "icon" => "google",
2348     "title" => "Google-Site-Verification",
2349     "rule" => array (
2350     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2351     ),
2352     "uri" => ""
2353     ),
2354 matthys 207 // Needs to be AFTER Google detection
2355     "goo" => array(
2356     "icon" => "goo",
2357     "title" => "Goo",
2358     "rule" => array (
2359     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2360     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2361     ),
2362     "uri" => ""
2363     ),
// GoonGee: matches agents starting with "Big Fish".
// The pattern has exactly one capture group (the version after an optional
// "v"), so the version is back-reference 1; group 2 does not exist.
"goongee" => array(
  "icon" => "robot",
  "title" => "GoonGee",
  "rule" => array (
    "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.goongee.com/"
),
2372     "gpost" => array(
2373     "icon" => "gpost",
2374     "title" => "GPost",
2375     "rule" => array(
2376     "^GPostbot" => ""
2377     ),
2378     "uri" => ""
2379     ),
// Gregarius: matches agents starting with "Gregarius" followed by a version.
// The version is captured in group 1, so it is reported via "\\1" like the
// other versioned entries in this table instead of being dropped.
"gregarius" => array(
  "icon" => "robot",
  "title" => "Gregarius",
  "rule" => array(
    "^Gregarius[/ ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
2388     "grub" => array(
2389     "icon" => "grub",
2390     "title" => "Grub",
2391     "rule" => array(
2392     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2393     "grub crawler" => "",
2394     "grub[/ ]([0-9.]{1,10})" => "\\1",
2395     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2396     ),
2397     "uri" => "http://www.grub.org/"
2398     ),
2399     "gulliver" => array(
2400     "icon" => "robot",
2401     "title" => "Gulliver",
2402     "rule" => array(
2403     "Gulliver" => ""
2404     ),
2405     "uri" => ""
2406     ),
2407     "guruji" => array(
2408     "icon" => "guruji",
2409     "title" => "Guruji",
2410     "rule" => array(
2411     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2412     ),
2413     "uri" => "http://www.guruji.com/"
2414     ),
2415     "gush" => array(
2416     "icon" => "robot",
2417     "title" => "Gush",
2418     "rule" => array(
2419     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2420     ),
2421     "uri" => ""
2422     ),
2423     "gziptester" => array(
2424     "icon" => "robot",
2425     "title" => "Gzip Tester",
2426     "rule" => array(
2427     "g(id)?zip[ \-]?test(er)?" => ""
2428     ),
2429     "uri" => ""
2430     ),
2431     "hanzoweb" => array(
2432     "icon" => "hanzoweb",
2433     "title" => "Hanzoweb",
2434     "rule" => array(
2435     "^Hanzoweb" => ""
2436     ),
2437     "uri" => ""
2438     ),
2439     "harbot" => array(
2440     "icon" => "harbot",
2441     "title" => "Harbot",
2442     "rule" => array(
2443     "^Harbot GateStation" => ""
2444     ),
2445     "uri" => ""
2446     ),
2447     "hatena" => array(
2448     "icon" => "hatena",
2449     "title" => "Hatena",
2450     "rule" => array(
2451     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2452     ),
2453     "uri" => ""
2454     ),
2455     "htmlparser" => array(
2456     "icon" => "htmlparser",
2457     "title" => "HTMLParser",
2458     "rule" => array(
2459     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2460     ),
2461     "uri" => "http://htmlparser.sourceforge.net/"
2462     ),
// Helix: matches agents starting with "helix" followed by a version (group 1).
// The title is "Helix" to agree with the key, icon, rule and uri of this
// entry; "Heritrix" belongs to the separate "heritrix" entry.
"helix" => array(
  "icon" => "helix",
  "title" => "Helix",
  "rule" => array(
    "^helix[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.sitesearch.ca/helix/"
),
2471     "heritrix" => array(
2472     "icon" => "heritrix",
2473     "title" => "Heritrix",
2474     "rule" => array(
2475     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2476     "archive.org_bot" => "",
2477     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2478     ),
2479     "uri" => "http://archive.org"
2480     ),
2481     "hiddenmarket" => array(
2482     "icon" => "robot",
2483     "title" => "HiddenMarket",
2484     "rule" => array(
2485     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2486     ),
2487     "uri" => ""
2488     ),
2489     "honda" => array(
2490     "icon" => "robot",
2491     "title" => "Honda",
2492     "rule" => array(
2493     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2494     ),
2495     "uri" => "http://www.honda-search.com"
2496     ),
2497     "hoowwwer" => array(
2498     "icon" => "hoowwwer",
2499     "title" => "HooWWWer",
2500     "rule" => array(
2501     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2502     ),
2503     "uri" => ""
2504     ),
2505     "hotzonu" => array(
2506     "icon" => "hotzonu",
2507     "title" => "Hotzonu",
2508     "rule" => array(
2509     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2510     ),
2511     "uri" => ""
2512     ),
2513     "houxou" => array(
2514     "icon" => "robot",
2515     "title" => "Houxou",
2516     "rule" => array(
2517     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2518     "HouxouCrawler" => ""
2519     ),
2520     "uri" => ""
2521     ),
// ht://Dig: the first rule reports the version (group 1); the second is a
// version-less fallback. The fallback pattern has no capture group, so its
// value must be the empty string rather than a back-reference.
"htdig" => array(
  "icon" => "htdig",
  "title" => "ht://Dig",
  "rule" => array(
    "htdig[ /]([0-9.]{1,10})" => "\\1",
    "htdig" => ""
  ),
  "uri" => ""
),
2531     "html2jpg" => array(
2532     "icon" => "html2jpg",
2533     "title" => "HTML2JPG",
2534     "rule" => array(
2535     "^HTML2JPG" => ""
2536     ),
2537     "uri" => ""
2538     ),
2539     "httperf" => array(
2540     "icon" => "robot",
2541     "title" => "HTTPerf",
2542     "rule" => array(
2543     "httperf[ /]([0-9.]{1,10})" => "\\1"
2544     ),
2545     "uri" => ""
2546     ),
2547     "httpunit" => array(
2548     "icon" => "httpunit",
2549     "title" => "HttpUnit",
2550     "rule" => array(
2551     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2552     ),
2553     "uri" => ""
2554     ),
2555     "httrack" => array(
2556     "icon" => "httrack",
2557     "title" => "HTTrack",
2558     "rule" => array(
2559     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2560     ),
2561     "uri" => ""
2562     ),
2563     "huaweisymantec" => array(
2564     "icon" => "huaweisymantec",
2565     "title" => "HuaweiSymantec",
2566     "rule" => array(
2567     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2568     ),
2569     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2570     ),
2571     "hungary" => array(
2572     "icon" => "hungary",
2573     "title" => "Hungary",
2574     "rule" => array(
2575     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2576     ),
2577     "uri" => ""
2578     ),
2579 joku 261 "i18n" => array(
2580     "icon" => "w3c",
2581     "title" => "W3C I18n Checker",
2582     "rule" => array(
2583     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2584 joku 169 ),
2585 joku 261 "uri" => "http://validator.w3.org/services"
2586     ),
2587 joku 63 "iakke" => array(
2588     "icon" => "iakke",
2589 matthys 209 "title" => "Iakké",
2590 joku 63 "rule" => array(
2591     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2592     ),
2593     "uri" => "http://fr.iakke.com/"
2594     ),
2595     "iask" => array(
2596     "icon" => "iask",
2597     "title" => "IAsk",
2598     "rule" => array(
2599     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2600     "^iaskspider" => ""
2601     ),
2602     "uri" => "http://iask.com"
2603     ),
2604     "icc" => array(
2605     "icon" => "icc",
2606     "title" => "ICC-Crawler",
2607     "rule" => array(
2608     "^ICC-Crawler" => ""
2609     ),
2610     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2611     ),
2612     "icerocket" => array(
2613     "icon" => "icerocket",
2614     "title" => "Icerocket",
2615     "rule" => array(
2616     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2617     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2618     ),
2619     "uri" => ""
2620     ),
2621     "icjobs" => array(
2622     "icon" => "icjobs",
2623     "title" => "iCjobs",
2624     "rule" => array(
2625     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2626     ),
2627     "uri" => "http://www.icjobs.de/"
2628     ),
2629     "icra" => array(
2630     "icon" => "icra",
2631     "title" => "ICRA",
2632     "rule" => array(
2633     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2634     ),
2635     "uri" => "http://www.icra.org"
2636     ),
2637     "iknow" => array(
2638     "icon" => "robot",
2639     "title" => "I know",
2640     "rule" => array(
2641     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2642     ),
2643     "uri" => ""
2644     ),
2645     "ilial" => array(
2646     "icon" => "robot",
2647     "title" => "Ilial",
2648     "rule" => array(
2649     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2650     ),
2651     "uri" => ""
2652     ),
2653     "ilocal" => array(
2654     "icon" => "ilocal",
2655     "title" => "ilocal",
2656     "rule" => array(
2657     "^ilocal" => "",
2658     ),
2659     "uri" => "http://www.ilocal.nl"
2660     ),
// Ilse: matches INGRID, IlseRobot or IlseBot followed by a version.
// Group 1 is the bot-name alternation and group 2 is the version, so the
// version is back-reference 2 (same layout as the "hatena" and
// "ip2location" entries).
"ilse" => array(
  "icon" => "ilse",
  "title" => "Ilse",
  "rule" => array(
    "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2"
  ),
  "uri" => "http://ilse.nl/"
),
2669     "iltrovatore" => array(
2670     "icon" => "iltrovatore",
2671     "title" => "IlTrovatore",
2672     "rule" => array(
2673     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2674     "Iltrovatore-Setaccio" => "",
2675     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2676     ),
2677     "uri" => ""
2678     ),
2679     "indylibrary" => array(
2680     "icon" => "robot",
2681     "title" => "Indy Library",
2682     "rule" => array(
2683     "Indy[ \-]?Library" => ""
2684     ),
2685     "uri" => ""
2686     ),
// Inela: matches "InelaBot" followed by a version.
// The version is captured in group 1 and reported via "\\1", consistent with
// the other versioned entries in this table.
"inela" => array(
  "icon" => "robot",
  "title" => "Inela",
  "rule" => array(
    "InelaBot[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://inelegant.org/bot"
),
// InetURL: matches "InetURL", an optional extra character, then a version.
// The version is captured in group 1 and reported via "\\1", consistent with
// the other versioned entries in this table.
"ineturl" => array(
  "icon" => "robot",
  "title" => "InetURL",
  "rule" => array(
    "InetURL.?[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
2703     "infoart" => array(
2704     "icon" => "robot",
2705     "title" => "InfoArt",
2706     "rule" => array(
2707     "InfoArt crawler" => ""
2708     ),
2709     "uri" => ""
2710     ),
2711     "infomine" => array(
2712     "icon" => "infomine",
2713     "title" => "INFOMINE",
2714     "rule" => array(
2715     "^DataFountains/DMOZ" => "",
2716     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2717     ),
2718     "uri" => "http://infomine.ucr.edu/"
2719     ),
2720     "infoseek" => array(
2721     "icon" => "infoseek",
2722     "title" => "Infoseek",
2723     "rule" => array(
2724     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2725     "Infoseek" => ""
2726     ),
2727     "uri" => ""
2728     ),
2729     "inktomi" => array(
2730     "icon" => "inktomi",
2731     "title" => "Inktomi",
2732     "rule" => array(
2733     "slurp@inktomi\.com" => ""
2734     ),
2735     "uri" => ""
2736     ),
2737     "innerprise" => array(
2738     "icon" => "robot",
2739     "title" => "Innerprise",
2740     "rule" => array(
2741     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2742     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2743     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2744     ),
2745     "uri" => "http://www.innerprise.com/"
2746     ),
2747     "inria" => array(
2748     "icon" => "inria",
2749     "title" => "Inria",
2750     "rule" => array(
2751     "^xyro_" => ""
2752     ),
2753     "uri" => ""
2754     ),
2755     "insitor" => array(
2756     "icon" => "insitor",
2757     "title" => "Insitor",
2758     "rule" => array(
2759     "^Insitor(,|\.|naut)" => ""
2760     ),
2761     "uri" => "http://www.insitor.com/"
2762     ),
2763     "internetninja" => array(
2764     "icon" => "robot",
2765     "title" => "Internet Ninja",
2766     "rule" => array(
2767     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2768     ),
2769     "uri" => ""
2770     ),
2771     "internetseer" => array(
2772     "icon" => "internetseer",
2773     "title" => "InternetSeer",
2774     "rule" => array(
2775     "^InternetSeer\.com" => ""
2776     ),
2777     "uri" => ""
2778     ),
2779     "interseek" => array(
2780     "icon" => "interseek",
2781     "title" => "Interseek",
2782     "rule" => array(
2783     "Interseek.com" => ""
2784     ),
2785     "uri" => "http://www.interseek.com"
2786     ),
2787     "intravnews" => array(
2788     "icon" => "intravnews",
2789     "title" => "IntraVnews",
2790     "rule" => array(
2791     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2792     ),
2793     "uri" => "http://www.intravnews.com/"
2794     ),
2795     "ip2location" => array(
2796     "icon" => "ip2location",
2797     "title" => "IP2LocationBot",
2798     "rule" => array(
2799     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2800     ),
2801     "uri" => "http://www.ip2location.com"
2802     ),
2803     "ipworks" => array(
2804     "icon" => "ipworks",
2805     "title" => "IP*Works",
2806     "rule" => array(
2807     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2808     ),
2809     "uri" => "http://www.nsoftware.com/ipworks/"
2810     ),
2811     "irca" => array(
2812     "icon" => "robot",
2813     "title" => "Novell iChain Cool Solutions caching",
2814     "rule" => array(
2815 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2816     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2817 joku 63 ),
2818     "uri" => "http://www.icra.org"
2819     ),
2820     "irvine" => array(
2821     "icon" => "robot",
2822     "title" => "Irvine",
2823     "rule" => array(
2824     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2825     ),
2826     "uri" => ""
2827     ),
2828     "ips-agent" => array(
2829     "icon" => "robot",
2830 matthys 209 "title" => "IPS-agent",
2831 joku 63 "rule" => array(
2832     "ips-agent" => ""
2833     ),
2834     "uri" => ""
2835     ),
2836     "isara" => array(
2837     "icon" => "isara",
2838 matthys 209 "title" => "Isara",
2839 joku 63 "rule" => array(
2840     "Isara[ -]([0-9.]{1,10})" => "\\1"
2841     ),
2842     "uri" => "http://www.isara.org/"
2843     ),
2844     "isspider" => array(
2845     "icon" => "robot",
2846     "title" => "ISSpider",
2847     "rule" => array(
2848     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2849     ),
2850     "uri" => ""
2851     ),
2852     "it2media" => array(
2853     "icon" => "it2media",
2854     "title" => "IT2media",
2855     "rule" => array(
2856     "www.adressendeutschland.de" => ""
2857     ),
2858     "uri" => "http://www.adressendeutschland.de/"
2859     ),
2860     "ivia" => array(
2861     "icon" => "robot",
2862     "title" => "iVia",
2863     "rule" => array(
2864     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2865     ),
2866     "uri" => ""
2867     ),
2868     "jeteye" => array(
2869     "icon" => "jeteye",
2870     "title" => "Jeteye",
2871     "rule" => array(
2872     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2873     ),
2874     "uri" => ""
2875     ),
2876     "jobsde" => array(
2877     "icon" => "jobsde",
2878     "title" => "jobs.de",
2879     "rule" => array(
2880     "www\.jobs\.de" => "",
2881     "jobs.de-Robot" => ""
2882     ),
2883     "uri" => "http://www.jobs.de/"
2884     ),
2885     "jpluck" => array(
2886     "icon" => "robot",
2887     "title" => "Jpluck",
2888     "rule" => array(
2889     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2890     ),
2891     "uri" => ""
2892     ),
2893     "jxta" => array(
2894     "icon" => "robot",
2895     "title" => "Jxta",
2896     "rule" => array(
2897     "falcon[ /]([0-9.]{1,10})" => "\\1"
2898     ),
2899     "uri" => ""
2900     ),
2901     "jyte" => array(
2902     "icon" => "jyte",
2903     "title" => "Jyte",
2904     "rule" => array(
2905     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2906     ),
2907     "uri" => ""
2908     ),
2909     "jyxo" => array(
2910     "icon" => "jyxo",
2911     "title" => "Jyxo",
2912     "rule" => array(
2913     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2914     ),
2915     "uri" => ""
2916     ),
2917     "kalooga" => array(
2918     "icon" => "kalooga",
2919     "title" => "Kalooga",
2920     "rule" => array(
2921     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2922     "^kalooga" => "",
2923     "KaloogaBot" => ""
2924     ),
2925     "uri" => "http://www.kalooga.com"
2926     ),
2927     "keywen" => array(
2928     "icon" => "keywen",
2929     "title" => "Keywen",
2930     "rule" => array(
2931     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
2932     ),
2933     "uri" => ""
2934     ),
2935     "kilomonkey" => array(
2936     "icon" => "robot",
2937     "title" => "Kilomonkey",
2938     "rule" => array(
2939     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
2940     ),
2941     "uri" => "http://www.kilomonkey.com/notabot.txt"
2942     ),
2943     "kinja" => array(
2944     "icon" => "kinja",
2945     "title" => "Kinja",
2946     "rule" => array(
2947     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
2948     "^kinjabot" => ""
2949     ),
2950     "uri" => ""
2951     ),
2952     "kiwi" => array(
2953     "icon" => "robot",
2954     "title" => "KiwiStatus",
2955     "rule" => array(
2956     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
2957     "KiwiStatus" => ""
2958     ),
2959     "uri" => "http://www.nzs.com/kiei-status/"
2960     ),
2961     "lachesis" => array(
2962     "icon" => "robot",
2963     "title" => "Lachesis",
2964     "rule" => array(
2965     "lachesis" => ""
2966     ),
2967     "uri" => ""
2968     ),
// Lanshan: matches "lanshanbot" followed by a version (group 1).
// The title follows this entry's own key; "Lachesis" is the title of the
// separate "lachesis" entry.
"lanshan" => array(
  "icon" => "robot",
  "title" => "Lanshan",
  "rule" => array(
    "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
2977     "lapozz" => array(
2978     "icon" => "lapozz",
2979     "title" => "Lapozz",
2980     "rule" => array(
2981     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
2982     ),
2983     "uri" => ""
2984     ),
2985     "larbin" => array(
2986     "icon" => "robot",
2987     "title" => "Larbin",
2988     "rule" => array(
2989     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
2990     ),
2991     "uri" => ""
2992     ),
2993     "laurion" => array(
2994     "icon" => "robot",
2995     "title" => "Laurion",
2996     "rule" => array(
2997     "^IPiumBot" => ""
2998     ),
2999     "uri" => "http://www.laurion.com/"
3000     ),
3001     "leechget" => array(
3002     "icon" => "leechget",
3003     "title" => "LeechGet",
3004     "rule" => array(
3005     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3006     ),
3007     "uri" => ""
3008     ),
3009     "linguaseek" => array(
3010     "icon" => "linguaseek",
3011     "title" => "Linguaseek",
3012     "rule" => array(
3013     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3014     ),
3015     "uri" => "http://www.linguaseek.com/"
3016     ),
3017     "linguee" => array(
3018     "icon" => "linguee",
3019     "title" => "Linguee",
3020     "rule" => array(
3021     "^Linguee Bot" => ""
3022     ),
3023     "uri" => "http://www.linguee.com/"
3024     ),
3025     "linkguard" => array(
3026     "icon" => "robot",
3027     "title" => "Linkguard",
3028     "rule" => array(
3029     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3030     ),
3031     "uri" => "http://www.linkguard.com/"
3032     ),
3033     "linklint" => array(
3034     "icon" => "linklint",
3035     "title" => "Linklint",
3036     "rule" => array(
3037     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3038     ),
3039     "uri" => "http://www.linklint.org/"
3040     ),
3041     "linkman" => array(
3042     "icon" => "linkman",
3043     "title" => "Linkman",
3044     "rule" => array(
3045     "\(compatible; Linkman\)" => ""
3046     ),
3047     "uri" => ""
3048     ),
3049     // Needs to be before linkcheck for correct detection
3050     "linkchecker" => array(
3051     "icon" => "w3c",
3052     "title" => "W3C Link Checker",
3053     "rule" => array(
3054     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3055     ),
3056     "uri" => "http://validator.w3.org/checklink"
3057     ),
3058     "linkcheck" => array(
3059     "icon" => "linkcheck",
3060     "title" => "Linkcheck",
3061     "rule" => array(
3062     "checklink[ /]([0-9.]{1,10})" => "\\1",
3063     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3064     "Adaxas Spider" => "",
3065     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3066     "NetMechanic V([0-9.]{1,10})" => "\\1",
3067     "^InfoLink" => "",
3068     "InternetLinkAgent" => "",
3069     "; SPENG\)" => "",
3070     "SharewarePlazaFileCheckBot" => "",
3071     "fileboost.net" => "",
3072     "^billbot" => ""
3073     ),
3074     "uri" => ""
3075     ),
3076     "linkru" => array(
3077     "icon" => "robot",
3078     "title" => "Link.RU",
3079     "rule" => array(
3080     "^Link.RU bot" => ""
3081     ),
3082     "uri" => ""
3083     ),
3084     "linkssql" => array(
3085     "icon" => "robot",
3086     "title" => "Links SQL",
3087     "rule" => array(
3088     "links sql" => ""
3089     ),
3090     "uri" => ""
3091     ),
3092     "linksweeper" => array(
3093     "icon" => "robot",
3094     "title" => "Link Sweeper",
3095     "rule" => array(
3096     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3097     ),
3098     "uri" => ""
3099     ),
3100     "linkwalker" => array(
3101     "icon" => "robot",
3102     "title" => "Link Walker",
3103     "rule" => array(
3104     "^LinkWalker" => ""
3105     ),
3106     "uri" => ""
3107     ),
3108     "lipperhey" => array(
3109     "icon" => "lipperhey",
3110     "title" => "Lipperhey",
3111     "rule" => array(
3112     "Lipperhey Spider" => ""
3113     ),
3114     "uri" => "http://www.lipperhey.com"
3115     ),
3116     "livedoor" => array(
3117     "icon" => "livedoor",
3118     "title" => "Livedoor",
3119     "rule" => array(
3120     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3121     ),
3122     "uri" => ""
3123     ),
3124     "livejournal" => array(
3125     "icon" => "livejournal",
3126     "title" => "Live Journal",
3127     "rule" => array(
3128     "^LiveJournal\.com" => ""
3129     ),
3130     "uri" => "http://www.livejournal.com"
3131     ),
3132     "ljpic" => array(
3133     "icon" => "ljpic",
3134     "title" => "ljpic",
3135     "rule" => array(
3136     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3137     ),
3138     "uri" => "http://www.ljpic.com"
3139     ),
3140     "lmspider" => array(
3141     "icon" => "robot",
3142     "title" => "Lmspider",
3143     "rule" => array(
3144     "^lmspider" => ""
3145     ),
3146     "uri" => ""
3147     ),
3148     "locators" => array(
3149     "icon" => "robot",
3150     "title" => "Locaters",
3151     "rule" => array(
3152     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3153     ),
3154     "uri" => ""
3155     ),
3156     "look" => array(
3157     "icon" => "look",
3158     "title" => "Look",
3159     "rule" => array(
3160     "www\.look\.com" => "",
3161     "Lookbot" => ""
3162     ),
3163     "uri" => ""
3164     ),
3165     "looksmart" => array(
3166     "icon" => "looksmart",
3167     "title" => "LookSmart",
3168     "rule" => array(
3169     "^Martini" => "",
3170     "^MantraAgent" => "",
3171     "FurlBot" => "",
3172     "looksmart-sv-fw" => ""
3173     ),
3174     "uri" => ""
3175     ),
3176     "loop" => array(
3177     "icon" => "loop",
3178     "title" => "LOOP",
3179     "rule" => array(
3180     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3181     ),
3182     "uri" => ""
3183     ),
3184     "lotkyll" => array(
3185     "icon" => "robot",
3186     "title" => "Lotkyll",
3187     "rule" => array(
3188     "Lotkyll" => ""
3189     ),
3190     "uri" => ""
3191     ),
3192     "lwp" => array(
3193     "icon" => "robot",
3194     "title" => "lwp",
3195     "rule" => array(
3196     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3197     ),
3198     "uri" => ""
3199     ),
3200     "lycos" => array(
3201     "icon" => "lycos",
3202     "title" => "Lycos",
3203     "rule" => array(
3204     "Lycos_Spider_" => ""
3205     ),
3206     "uri" => ""
3207     ),
3208     "magpierss" => array(
3209     "icon" => "rss",
3210     "title" => "MagpieRSS",
3211     "rule" => array(
3212     "MagpieRSS" => ""
3213     ),
3214     "uri" => "http://magpierss.sourceforge.net/"
3215     ),
3216     "mailru" => array(
3217     "icon" => "mailru",
3218 matthys 209 "title" => "Mail.Ru",
3219 joku 63 "rule" => array(
3220 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3221     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3222 joku 63 ),
3223 matthys 209 "uri" => "http://www.mail.ru/"
3224 joku 63 ),
3225     "mailsweeper" => array(
3226     "icon" => "robot",
3227     "title" => "Mail Sweeper",
3228     "rule" => array(
3229     "Mail[ \-]?Sweeper" => ""
3230     ),
3231     "uri" => ""
3232     ),
3233     "marvin" => array(
3234     "icon" => "robot",
3235     "title" => "Marvin",
3236     "rule" => array(
3237     "^Marvin" => ""
3238     ),
3239     "uri" => ""
3240     ),
3241     "matkurja" => array(
3242     "icon" => "matkurja",
3243     "title" => "Mat'Kurja",
3244     "rule" => array(
3245     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3246     ),
3247     "uri" => ""
3248     ),
3249     "mavicanet" => array(
3250     "icon" => "mavicanet",
3251     "title" => "Mavicanet",
3252     "rule" => array(
3253     "Mavicanet robot" => ""
3254     ),
3255     "uri" => ""
3256     ),
3257 matthys 292 "meanpath" => array(
3258     "icon" => "meanpath",
3259 matthys 290 "title" => "Meanpath",
3260 matthys 280 "rule" => array(
3261     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3262     ),
3263     "uri" => "http://www.meanpath.com/meanpathbot.html"
3264 matthys 275 ),
3265 matthys 280 "mediater" => array(
3266 joku 63 "icon" => "robot",
3267     "title" => "Mediater",
3268     "rule" => array (
3269     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3270 matthys 280 ),
3271     "uri" => ""
3272 joku 63 ),
3273     "mercator" => array(
3274     "icon" => "robot",
3275     "title" => "Mercator",
3276     "rule" => array(
3277     "Mercator" => ""
3278     ),
3279     "uri" => ""
3280     ),
// Metacarta: three version-less rules.
// The parentheses in the first rule are escaped so they match the literal
// "(crawler_admin@bigfoot.com)" in the agent string; unescaped they would
// form a capture group and require the address to follow "RRC " directly.
// The third rule already escapes its parentheses the same way.
"metacarta" => array(
  "icon" => "robot",
  "title" => "Metacarta",
  "rule" => array(
    "^RRC \(crawler_admin@bigfoot.com\)" => "",
    "^flunky" => "",
    "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
  ),
  "uri" => "http://www.metacarta.com"
),
3291     "metager" => array(
3292     "icon" => "metager",
3293     "title" => "MetaGer",
3294     "rule" => array(
3295     "MetaGer" => ""
3296     ),
3297     "uri" => ""
3298     ),
3299     "metamark" => array(
3300     "icon" => "robot",
3301     "title" => "Metamark",
3302     "rule" => array(
3303     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3304     ),
3305     "uri" => "http://metamark.net"
3306     ),
3307     "metamedic" => array(
3308     "icon" => "metamedic",
3309     "title" => "MetaMedic",
3310     "rule" => array(
3311     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3312     ),
3313     "uri" => ""
3314     ),
3315     "mirago" => array(
3316     "icon" => "mirago",
3317     "title" => "Mirago",
3318     "rule" => array(
3319     "Mirago" => ""
3320     ),
3321     "uri" => ""
3322     ),
3323     "misterwong" => array(
3324     "icon" => "misterwong",
3325     "title" => "Mister Wong",
3326     "rule" => array(
3327     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3328     ),
3329     "uri" => "http://www.mister-wong.de/"
3330     ),
3331     "miva" => array(
3332     "icon" => "miva",
3333     "title" => "Miva",
3334     "rule" => array(
3335     "AlgoFeedback@miva\.com" => ""
3336     ),
3337     "uri" => "http://www.miva.com/"
3338     ),
3339     "mj12" => array(
3340     "icon" => "mj12",
3341     "title" => "Majestic-12",
3342     "rule" => array(
3343     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3344     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3345     ),
3346     "uri" => "http://majestic12.co.uk/bot.php"
3347     ),
3348     "mlbot" => array(
3349     "icon" => "robot",
3350     "title" => "MLBot",
3351     "rule" => array(
3352     "^MLBot" => ""
3353     ),
3354     "uri" => "http://www.metadatalabs.com/mlbot"
3355     ),
3356     "mnogo" => array(
3357     "icon" => "mnogo",
3358     "title" => "mnoGoSearch",
3359     "rule" => array(
3360     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3361     ),
3362     "uri" => "http://www.mnogosearch.org/"
3363     ),
3364     "mobileok" => array(
3365     "icon" => "mobileok",
3366     "title" => "W3C mobileOK",
3367     "rule" => array(
3368     "^W3C-mobileOK" => ""
3369     ),
3370     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3371     ),
3372 matthys 296 "mojeek" => array(
3373     "icon" => "mojeek",
3374     "title" => "Mojeek",
3375 joku 63 "rule" => array(
3376     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3377     ),
3378 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3379 joku 63 ),
3380     "momspider" => array(
3381     "icon" => "robot",
3382     "title" => "MOM Spider",
3383     "rule" => array(
3384     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3385     ),
3386     "uri" => ""
3387     ),
3388     "moreover" => array(
3389     "icon" => "moreover",
3390     "title" => "Moreover",
3391     "rule" => array(
3392     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3393     ),
3394     "uri" => ""
3395     ),
3396     "movabletype" => array(
3397     "icon" => "movabletype",
3398     "title" => "Movable Type",
3399     "rule" => array(
3400     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3401     ),
3402     "uri" => ""
3403     ),
3404     "mozdex" => array(
3405     "icon" => "mozdex",
3406     "title" => "MozDex",
3407     "rule" => array(
3408     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3409     ),
3410     "uri" => ""
3411     ),
3412     "mqbot" => array(
3413     "icon" => "robot",
3414     "title" => "MQbot",
3415     "rule" => array(
3416     "MQbot" => ""
3417     ),
3418     "uri" => ""
3419     ),
3420     "msnbot" => array(
3421     "icon" => "bing",
3422 matthys 205 "title" => "Bing",
3423 joku 63 "rule" => array(
3424     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3425     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3426     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3427     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3428     ),
3429     "uri" => ""
3430     ),
3431     "msnbot-mobile" => array(
3432     "icon" => "msn",
3433     "title" => "MSN Mobile",
3434     "rule" => array(
3435     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3436     "MSNBOT_Mobile" => "",
3437     "MSMOBOT" => ""
3438     ),
3439     "uri" => ""
3440     ),
3441     "mslivebot" => array(
3442     "icon" => "livesearch",
3443     "title" => "MS Live Search",
3444     "rule" => array(
3445     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3446     ),
3447     "uri" => ""
3448     ),
3449     "msproxy" => array(
3450     "icon" => "robot",
3451     "title" => "MSProxy",
3452     "rule" => array(
3453     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3454     ),
3455     "uri" => ""
3456     ),
3457     "msrbot" => array(
3458     "icon" => "robot",
3459     "title" => "MSRBOT",
3460     "rule" => array(
3461     "^MSRBOT" => ""
3462     ),
3463     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3464     ),
3465     "mswebdav" => array(
3466     "icon" => "robot",
3467     "title" => "MS-WebDAV",
3468     "rule" => array(
3469     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3470     ),
3471     "uri" => ""
3472     ),
3473     "mticon" => array(
3474     "icon" => "robot",
3475     "title" => "MTIcon",
3476     "rule" => array(
3477     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3478     ),
3479     "uri" => ""
3480     ),
3481     "multipage-validator" => array(
3482     "icon" => "multipage-validator",
3483     "title" => "Multipage Validator",
3484     "rule" => array(
3485     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3486     ),
3487     "uri" => "http://www.validator.ca/"
3488     ),
3489     "myrss" => array(
3490     "icon" => "rss",
3491     "title" => "MyRSS",
3492     "rule" => array(
3493     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3494     ),
3495     "uri" => ""
3496     ),
3497     "multimap" => array(
3498     "icon" => "robot",
3499     "title" => "Multimap",
3500     "rule" => array(
3501     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3502     ),
3503     "uri" => ""
3504     ),
3505     "najdi" => array(
3506     "icon" => "najdi",
3507     "title" => "Najdi.si",
3508     "rule" => array(
3509     "Najdi.si" => ""
3510     ),
3511     "uri" => "http://www.najdi.si"
3512     ),
3513     "nameprotect" => array(
3514     "icon" => "nameprotect",
3515     "title" => "Name Protect",
3516     "rule" => array(
3517     "NPBot" => ""
3518     ),
3519     "uri" => ""
3520     ),
3521     "nationaldirectory" => array(
3522     "icon" => "robot",
3523     "title" => "National Directory",
3524     "rule" => array(
3525     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3526     ),
3527     "uri" => ""
3528     ),
3529     "natsumican" => array(
3530     "icon" => "robot",
3531     "title" => "Natsu Mican",
3532     "rule" => array(
3533     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3534     ),
3535     "uri" => ""
3536     ),
3537     "naverbot" => array(
3538     "icon" => "naverbot",
3539     "title" => "Naver",
3540     "rule" => array(
3541     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3542     "Naver(Bot)?" => "",
3543     "^nabot" => ""
3544     ),
3545     "uri" => ""
3546     ),
3547     "navisso" => array(
3548     "icon" => "navisso",
3549     "title" => "Navisso",
3550     "rule" => array(
3551     "Navisso(Bot)?" => ""
3552     ),
3553     "uri" => "http://www.navisso.com"
3554     ),
3555     "neofonie" => array(
3556     "icon" => "robot",
3557 matthys 205 "title" => "Neofonie",
3558 joku 63 "rule" => array(
3559     "www.neofonie.de" => ""
3560     ),
3561     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3562     ),
3563     "neomo" => array(
3564     "icon" => "robot",
3565     "title" => "Neomo",
3566     "rule" => array(
3567     "Francis[ /]([0-9.]{1,10})" => "\\1"
3568     ),
3569     "uri" => ""
3570     ),
3571     "nessus" => array(
3572     "icon" => "nessus",
3573     "title" => "Nessus",
3574     "rule" => array(
3575     "Nessus\)$" => ""
3576     ),
3577     "uri" => ""
3578     ),
3579 matthys 279 "nerdybot" => array(
3580 matthys 280 "icon" => "robot",
3581     "title" => "NerdyBot",
3582     "rule" => array(
3583     "NerdyBot" => ""
3584     ),
3585     "uri" => "http://nerdybot.com/"
3586 matthys 279 ),
3587 joku 63 "nerdbynature" => array(
3588     "icon" => "nerdbynature",
3589     "title" => "NerdByNature",
3590     "rule" => array(
3591     "NerdByNature.Bot" => ""
3592     ),
3593     "uri" => "http://www.nerdbynature.net/bot"
3594     ),
3595     "netants" => array(
3596     "icon" => "netants",
3597     "title" => "NetAnts",
3598     "rule" => array(
3599     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3600     ),
3601     "uri" => ""
3602     ),
3603     "netcraft" => array(
3604     "icon" => "netcraft",
3605     "title" => "Netcraft",
3606     "rule" => array(
3607     "netcraft" => ""
3608     ),
3609     "uri" => ""
3610     ),
3611     "netinfo" => array(
3612     "icon" => "netinfo",
3613     "title" => "Netinfo",
3614     "rule" => array(
3615     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3616     ),
3617     "uri" => "http://netinfo.bg/"
3618     ),
3619     "netluchs" => array(
3620     "icon" => "netluchs",
3621     "title" => "Netluchs",
3622     "rule" => array(
3623     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3624     ),
3625     "uri" => "http://www.netluchs.de/"
3626     ),
3627     "netmechanic" => array(
3628     "icon" => "netmechanic",
3629     "title" => "NetMechanic",
3630     "rule" => array(
3631     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3632     ),
3633     "uri" => ""
3634     ),
3635     "netnose" => array(
3636     "icon" => "netnose",
3637     "title" => "NetNose",
3638     "rule" => array(
3639     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3640     ),
3641     "uri" => ""
3642     ),
3643     "netoskop" => array(
3644     "icon" => "robot",
3645     "title" => "Netoskop",
3646     "rule" => array(
3647     "netoskop" => ""
3648     ),
3649     "uri" => ""
3650     ),
3651     "netpromoter" => array(
3652     "icon" => "netpromoter",
3653     "title" => "NetPromoter",
3654     "rule" => array(
3655     "NetPromoter Spider" => ""
3656     ),
3657     "uri" => "http://www.net-promoter.com/"
3658     ),
3659     "netprospector" => array(
3660     "icon" => "robot",
3661     "title" => "Netprospector",
3662     "rule" => array(
3663     "^netprospector" => ""
3664     )
3665     ),
3666     "netpumper" => array(
3667     "icon" => "robot",
3668     "title" => "Netpumper",
3669     "rule" => array(
3670     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3671     ),
3672     "uri" => ""
3673     ),
3674     "netscapeproxy" => array(
3675     "icon" => "netscape",
3676     "title" => "Netscape Proxy",
3677     "rule" => array(
3678     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3679     ),
3680     "uri" => ""
3681     ),
3682     "netspective" => array(
3683     "icon" => "robot",
3684     "title" => "NetSpective",
3685     "rule" => array(
3686     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3687     ),
3688     "uri" => ""
3689     ),
3690     "netvibes" => array( // Netvibes: matched on user agents that start with "Netvibes"
3691     "icon" => "netvibes",
3692     "title" => "Netvibes", // no leading blank, unlike the earlier " Netvibes"
3693     "rule" => array(
3694     "^Netvibes" => "" // the pattern has no capture group, so there is no version to report
3695     ),
3696     "uri" => ""
3697     ),
3698     "newsfire" => array(
3699     "icon" => "newsfire",
3700     "title" => "NewsFire",
3701     "rule" => array(
3702     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3703     ),
3704     "uri" => ""
3705     ),
3706     "newsgator" => array(
3707     "icon" => "newsgator",
3708     "title" => "NewsGator",
3709     "rule" => array(
3710     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3711     ),
3712     "uri" => ""
3713     ),
3714     "newzcrawler" => array(
3715     "icon" => "newzcrawler",
3716     "title" => "NewzCrawler",
3717     "rule" => array(
3718     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3719     ),
3720     "uri" => ""
3721     ),
3722     "nextopia" => array( // matched on user agents that start with "NextopiaBOT"
3723     "icon" => "robot", // generic icon; the entry used to borrow NewzCrawler's icon
3724     "title" => "Nextopia", // was "NewzCrawler", copied from the preceding entry
3725     "rule" => array(
3726     "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1" // group 1 is the version number
3727     ),
3728     "uri" => ""
3729     ),
3730     "ngsearch" => array(
3731     "icon" => "ngsearch",
3732     "title" => "NG Search",
3733     "rule" => array(
3734     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3735     ),
3736     "uri" => ""
3737     ),
3738     "nimble" => array(
3739     "icon" => "robot",
3740     "title" => "Nimble",
3741     "rule" => array(
3742     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3743     ),
3744     "uri" => ""
3745     ),
3746     "nmap" => array(
3747     "icon" => "nmap",
3748     "title" => "Nmap",
3749     "rule" => array(
3750     "Nmap Scripting Engine" => ""
3751     ),
3752     "uri" => "http://nmap.org/book/nse.html"
3753     ),
3754     "nusearch" => array(
3755     "icon" => "robot",
3756     "title" => "NuSearch",
3757     "rule" => array(
3758     "^nuSearch" => ""
3759     ),
3760     "uri" => "http://www.nusearch.com/"
3761     ),
3762     "noago" => array(
3763     "icon" => "noago",
3764     "title" => "Noago",
3765     "rule" => array(
3766     "Noago Spider" => ""
3767     ),
3768     "uri" => "http://www.noago.com/"
3769     ),
3770     "noviforum" => array(
3771     "icon" => "noviforum",
3772     "title" => "Noviforum",
3773     "rule" => array(
3774     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3775     ),
3776     "uri" => ""
3777     ),
3778     "noxtrum" => array(
3779     "icon" => "noxtrum",
3780     "title" => "noXtrum",
3781     "rule" => array(
3782     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3783     ),
3784     "uri" => ""
3785     ),
3786     "noyona" => array(
3787     "icon" => "robot",
3788     "title" => "Noyona",
3789     "rule" => array(
3790     "noyona.([0-9._]{1,10})" => "\\1"
3791     ),
3792     "uri" => "http://noyona.com/"
3793     ),
3794     "nsauditor" => array(
3795     "icon" => "nsauditor",
3796     "title" => "Nsauditor",
3797     "rule" => array(
3798     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3799     ),
3800     "uri" => "http://www.nsauditor.com/"
3801     ),
3802     "obidosbot" => array(
3803     "icon" => "robot",
3804     "title" => "Bookwatch",
3805     "rule" => array(
3806     "obidos[ \-]?bot" => ""
3807     ),
3808     "uri" => ""
3809     ),
3810     "objectssearch" => array(
3811     "icon" => "robot",
3812     "title" => "Objects Search",
3813     "rule" => array(
3814     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3815     ),
3816     "uri" => ""
3817     ),
3818     "obot" => array(
3819     "icon" => "obot",
3820     "title" => "oBot",
3821     "rule" => array(
3822     "^oBot " => ""
3823     ),
3824     "uri" => "http://www.onlysolutions.de/"
3825     ),
3826     "ocawa" => array(
3827     "icon" => "ocawa",
3828     "title" => "Ocawa",
3829     "rule" => array(
3830     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3831     "Ocawa" => ""
3832     ),
3833     "uri" => "http://www.ocawa.com/"
3834     ),
3835     "octora" => array(
3836     "icon" => "octora",
3837     "title" => "Octora",
3838     "rule" => array(
3839     "^Octora (Beta)?" => ""
3840     ),
3841     "uri" => "http://www.octora.com/"
3842     ),
3843     "offlineexplorer" => array(
3844     "icon" => "robot",
3845     "title" => "OfflineExplorer",
3846     "rule" => array(
3847     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3848     ),
3849     "uri" => ""
3850     ),
3851     "omea" => array(
3852     "icon" => "omea",
3853     "title" => "Omea Reader",
3854     "rule" => array(
3855     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3856     ),
3857     "uri" => ""
3858     ),
3859     "onet" => array(
3860     "icon" => "onet",
3861     "title" => "Onet",
3862     "rule" => array(
3863     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3864     "Onet\.pl" => "",
3865     "inktomi.search.onet" => ""
3866     ),
3867     "uri" => "http://www.onet.pl"
3868     ),
3869     "online24" => array(
3870     "icon" => "robot",
3871 matthys 209 "title" => "Online24",
3872 joku 63 "rule" => array(
3873     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3874     ),
3875     "uri" => "http://www.online24.de"
3876     ),
3877     "onlinewebcheck" => array(
3878     "icon" => "csehtmlvalidator",
3879     "title" => "CSE HTML Validator",
3880     "rule" => array(
3881     "onlinewebcheck" => ""
3882     ),
3883     "uri" => "http://www.onlinewebcheck.com"
3884     ),
3885     "onsearch" => array(
3886     "icon" => "onsearch",
3887 matthys 209 "title" => "OnSearch",
3888 joku 63 "rule" => array(
3889     "^onCHECK-Robot" => ""
3890     ),
3891     "uri" => "http://www.onsearch.de"
3892     ),
3893     "onto" => array(
3894     "icon" => "robot",
3895     "title" => "OntoSpider",
3896     "rule" => array(
3897     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
3898     ),
3899     "uri" => "http://ontospider.i-n.info/"
3900     ),
3901     "openacoon" => array(
3902     "icon" => "robot",
3903     "title" => "OpenAcoon",
3904     "rule" => array(
3905     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
3906     ),
3907     "uri" => "http://www.openacoon.de/"
3908     ),
3909     "openfind" => array(
3910     "icon" => "openfind",
3911     "title" => "Openfind",
3912     "rule" => array(
3913     "openbot[ /]([0-9.]{1,10})" => "\\1",
3914     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
3915     ),
3916     "uri" => ""
3917     ),
3918     "opentagger" => array(
3919     "icon" => "robot",
3920     "title" => "OpenTagger",
3921     "rule" => array(
3922     "^OpenTaggerBot" => ""
3923     ),
3924     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
3925     ),
3926     "opentext" => array(
3927     "icon" => "opentext",
3928     "title" => "OpenText",
3929     "rule" => array(
3930     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
3931     ),
3932     "uri" => "http://www.opentext.net/"
3933     ),
3934     "openweb" => array(
3935     "icon" => "robot",
3936     "title" => "OpenWebSpider",
3937     "rule" => array(
3938     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
3939     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
3940     ),
3941     "uri" => "http://www.openwebspider.org"
3942     ),
3943     "openx" => array(
3944     "icon" => "openx",
3945     "title" => "OpenX Spider",
3946     "rule" => array(
3947     "OpenX" => ""
3948     ),
3949     "uri" => "http://www.openx.org"
3950     ),
3951     "orange" => array(
3952     "icon" => "orange",
3953     "title" => "Orange",
3954     "rule" => array(
3955     "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1"
3956     ),
3957     "uri" => "http://orange.com/"
3958     ),
3959     "organica" => array(
3960     "icon" => "robot",
3961     "title" => "Organica",
3962     "rule" => array(
3963     "crawler@organica\.us" => ""
3964     ),
3965     "uri" => ""
3966     ),
3967     "outfox" => array(
3968     "icon" => "robot",
3969     "title" => "Outfox Melon",
3970     "rule" => array(
3971     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
3972     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
3973     ),
3974     "uri" => ""
3975     ),
3976     "overture" => array(
3977     "icon" => "overture",
3978     "title" => "Overture",
3979     "rule" => array(
3980     "Overture[ \-]?WebCrawler" => ""
3981     ),
3982     "uri" => ""
3983     ),
3984     "page2rss" => array(
3985     "icon" => "page2rss",
3986     "title" => "Page2RSS",
3987     "rule" => array(
3988     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
3989     ),
3990     "uri" => "http://page2rss.com"
3991     ),
3992     "pagebytes" => array(
3993     "icon" => "robot",
3994     "title" => "PageBites",
3995     "rule" => array(
3996     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
3997     ),
3998     "uri" => ""
3999     ),
4000 matthys 282 "pagesinventory" => array(
4001     "icon" => "pagesinventory",
4002     "title" => "PagesInventory",
4003     "rule" => array(
4004     "^PagesInventory" => ""
4005     ),
4006     "uri" => "http://www.pagesinventory.com"
4007     ),
4008 joku 63 "pagesjaunes" => array(
4009     "icon" => "pagesjaunes",
4010     "title" => "Pages Jaunes",
4011     "rule" => array(
4012     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4013     ),
4014     "uri" => "http://www.pagesjaunes.fr/"
4015     ),
4016     "pagevalet" => array(
4017     "icon" => "wdg",
4018     "title" => "WDG Page Valet",
4019     "rule" => array(
4020     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4021     ),
4022     "uri" => "http://www.htmlhelp.com/tools/validator/"
4023     ),
4024     "panopeabot" => array(
4025     "icon" => "robot",
4026     "title" => "PanopeaBot",
4027     "rule" => array(
4028     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4029     ),
4030     "uri" => ""
4031     ),
4032     "parchmenthill" => array(
4033     "icon" => "robot",
4034     "title" => "Parchment Hill",
4035     "rule" => array(
4036     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4037     ),
4038     "uri" => "http://www.parchmenthill.com/search.htm"
4039     ),
4040     "pascient" => array( // key and icon name keep their historic spelling so existing references still resolve
4041     "icon" => "pascient",
4042     "title" => "Panscient", // displayed name now matches the rule and uri (panscient.com)
4043     "rule" => array(
4044     "panscient.com" => "" // no capture group: no version is reported
4045     ),
4046     "uri" => "http://www.panscient.com/"
4047     ),
4048     "peerbot" => array(
4049     "icon" => "peerbot",
4050     "title" => "Peerbot",
4051     "rule" => array(
4052     "^PEERbot" => ""
4053     ),
4054     "uri" => ""
4055     ),
4056     "php" => array(
4057     "icon" => "php",
4058     "title" => "PHP",
4059     "rule" => array(
4060     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4061     ),
4062     "uri" => ""
4063     ),
4064     "phpcrawl" => array(
4065     "icon" => "robot",
4066     "title" => "PHPCrawl",
4067     "rule" => array(
4068     "^PHPCrawl" => ""
4069     ),
4070     "uri" => "http://phpcrawl.cuab.de/"
4071     ),
4072     "phpdig" => array(
4073     "icon" => "robot",
4074     "title" => "PhpDig",
4075     "rule" => array(
4076     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4077     ),
4078     "uri" => "http://www.finbot.com/"
4079     ),
4080     "phpversiontracker" => array(
4081     "icon" => "phpversiontracker",
4082     "title" => "PHP version tracker",
4083     "rule" => array(
4084     "^PHP version tracker" => ""
4085     ),
4086     "uri" => "http://www.nexen.net/phpversion/bot.php"
4087     ),
4088     "pictureofinternet" => array( // matched on user agents that start with "PictureOfInternet"
4089     "icon" => "robot",
4090     "title" => "PictureOfInternet",
4091     "rule" => array(
4092     "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of dropping it
4093     ),
4094     "uri" => ""
4095     ),
4096     "pingdom" => array(
4097     "icon" => "pingdom",
4098     "title" => "Pingdom",
4099     "rule" => array(
4100     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4101     "^Pingdom" => ""
4102     ),
4103     "uri" => "http://www.pingdom.com/"
4104     ),
4105     "pinseri" => array(
4106     "icon" => "pinseri",
4107     "title" => "Pinseri",
4108     "rule" => array(
4109     "www\.pinseri\.com/bloglist" => ""
4110     ),
4111     "uri" => ""
4112     ),
4113     "plagger" => array( // matched on "Plagger" followed by a version number
4114     "icon" => "plagger",
4115     "title" => "Plagger",
4116     "rule" => array(
4117     "Plagger[ /]([0-9.]{1,10})" => "\\1" // group 1 is the version number
4118     ),
4119     "uri" => "http://plagger.org/" // NOTE(review): was "plugger.org"; spelling aligned with the bot name - confirm the URL
4120     ),
4121     "planet" => array(
4122     "icon" => "planet",
4123     "title" => "Planet",
4124     "rule" => array(
4125     "Planet[ /]([0-9.]{1,10})" => "\\1"
4126     ),
4127     "uri" => ""
4128     ),
4129     "plantynet" => array(
4130     "icon" => "robot",
4131     "title" => "PlantyNet",
4132     "rule" => array(
4133     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4134     ),
4135     "uri" => ""
4136     ),
4137     "pluck" => array(
4138     "icon" => "pluck",
4139     "title" => "Pluck",
4140     "rule" => array(
4141     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4142     ),
4143     "uri" => ""
4144     ),
4145     "plsearch" => array(
4146     "icon" => "plsearch",
4147     "title" => "PlanetSearch",
4148     "rule" => array(
4149     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4150     ),
4151     "uri" => ""
4152     ),
4153     "poe" => array(
4154     "icon" => "robot",
4155     "title" => "POE-Component",
4156     "rule" => array(
4157     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4158     ),
4159     "uri" => ""
4160     ),
4161     "pogodak" => array(
4162     "icon" => "pogodak",
4163     "title" => "Pogodak",
4164     "rule" => array(
4165     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4166     ),
4167     "uri" => ""
4168     ),
4169     "poodle" => array( // Poodle predictor; both the "Poodle" and "Pooodle" spellings are accepted
4170     "icon" => "robot",
4171     "title" => "Poodle predictor",
4172     "rule" => array(
4173     "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2", // group 1 is the "oo"/"ooo" spelling; the version is group 2
4174     "P(oo|ooo)dle[ \-]?predictor" => "" // fallback when the user agent carries no version
4175     ),
4176     "uri" => "http://www.gritechnologies.com/tools/spider.go"
4177     ),
4178     "pompos" => array(
4179     "icon" => "pompos",
4180     "title" => "Pompos",
4181     "rule" => array(
4182     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4183     ),
4184     "uri" => ""
4185     ),
4186     "popdex" => array(
4187     "icon" => "robot",
4188     "title" => "Popdexter",
4189     "rule" => array(
4190     "Popdexter" => ""
4191     ),
4192     "uri" => ""
4193     ),
4194     "postrank" => array(
4195     "icon" => "postrank",
4196     "title" => "PostRank",
4197     "rule" => array(
4198     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4199     ),
4200     "uri" => "http://www.postrank.com/"
4201     ),
4202     "powermarks" => array(
4203     "icon" => "robot",
4204     "title" => "Powermarks",
4205     "rule" => array(
4206     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4207     ),
4208     "uri" => ""
4209     ),
4210     "probe" => array(
4211     "icon" => "robot",
4212     "title" => "PROBE!",
4213     "rule" => array(
4214     "^PROBE!" => ""
4215     ),
4216     "uri" => ""
4217     ),
4218     "projecthoneypot" => array(
4219     "icon" => "projecthoneypot",
4220     "title" => "Project Honeypot",
4221     "rule" => array(
4222     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4223     "projecthoneypot" => ""
4224     ),
4225     "uri" => "http://www.projecthoneypot.org"
4226     ),
4227     "proxycache" => array(
4228     "icon" => "robot",
4229     "title" => "Proxy Cache",
4230     "rule" => array(
4231     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4232     ),
4233     "uri" => ""
4234     ),
4235     "proxyhunter" => array(
4236     "icon" => "robot",
4237     "title" => "ProxyHunter",
4238     "rule" => array(
4239     "ProxyHunter" => ""
4240     ),
4241     "uri" => ""
4242     ),
4243     "psbot" => array(
4244     "icon" => "picsearch",
4245     "title" => "PicSearch",
4246     "rule" => array(
4247     "^psbot" => ""
4248     ),
4249     "uri" => ""
4250     ),
4251     "pubsub" => array(
4252     "icon" => "pubsub",
4253     "title" => "PubSub",
4254     "rule" => array(
4255     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4256     "^PubSub\.com" => ""
4257     ),
4258     "uri" => ""
4259     ),
4260     "pukiwiki" => array(
4261     "icon" => "pukiwiki",
4262     "title" => "PukiWiki",
4263     "rule" => array(
4264     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4265     ),
4266     "uri" => ""
4267     ),
4268     "pwebotxy" => array(
4269     "icon" => "pwebotxy",
4270     "title" => "PWeBot/X.Y",
4271     "rule" => array(
4272     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4273     ),
4274     "uri" => "http://www.programacionweb.net/robot.php"
4275     ),
4276     "pxys" => array(
4277     "icon" => "robot",
4278     "title" => "PXYS",
4279     "rule" => array(
4280     "^pxys" => ""
4281     ),
4282     "uri" => ""
4283     ),
4284     "qango" => array( // matched on user agents that start with "Qango.com"
4285     "icon" => "qango",
4286     "title" => "Qango",
4287     "rule" => array(
4288     "^Qango.com" => "" // no capture group: no version is reported
4289     ),
4290     "uri" => "http://www.qango.com/" // NOTE(review): was "quango.com"; aligned with the key, title and rule - confirm the URL
4291     ),
4292     "qihoo" => array(
4293     "icon" => "qihoo",
4294     "title" => "Qihoo",
4295     "rule" => array(
4296     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4297     ),
4298     "uri" => "http://www.qihoo.com/"
4299     ),
4300     "qseero" => array(
4301     "icon" => "robot",
4302     "title" => "Qseero",
4303     "rule" => array(
4304     "Qseero v([0-9.]{1,10})" => "\\1"
4305     ),
4306     "uri" => "http://www.q0.com/"
4307     ),
4308     "quantcast" => array(
4309     "icon" => "robot",
4310     "title" => "Quantcast",
4311     "rule" => array(
4312     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4313     ),
4314     "uri" => "http://www.quantcast.com/"
4315     ),
4316     "quepasa" => array(
4317     "icon" => "quepasa",
4318     "title" => "Quepasa",
4319     "rule" => array(
4320     "Quepasa[ \-]?Creep" => ""
4321     ),
4322     "uri" => ""
4323     ),
4324     "questfinder" => array(
4325     "icon" => "robot",
4326     "title" => "QuestFinder",
4327     "rule" => array(
4328     "www\.questfinder\.com" => ""
4329     ),
4330     "uri" => ""
4331     ),
4332     "qweery" => array(
4333     "icon" => "robot",
4334     "title" => "Qweery",
4335     "rule" => array(
4336     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4337     ),
4338     "uri" => "http://qweerybot.qweery.nl"
4339     ),
4340     "racaicrawler" => array(
4341     "icon" => "robot",
4342     "title" => "RacaiCrawler",
4343     "rule" => array(
4344     "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
4345     )
4346     ),
4347     "radian6" => array(
4348     "icon" => "robot",
4349     "title" => "Radian6",
4350     "rule" => array(
4351     "www\.radian6\.com" => ""
4352     ),
4353     "uri" => "http://www.radian6.com"
4354     ),
4355     "rambler" => array(
4356     "icon" => "rambler",
4357     "title" => "Rambler",
4358     "rule" => array(
4359     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4360     ),
4361     "uri" => ""
4362     ),
4363     "ramiba" => array( // matched on user agents that start with "ramiba" or "ramiba-bot"
4364     "icon" => "robot",
4365 matthys 209 "title" => "Ramiba",
4366 joku 63 "rule" => array(
4367     "^ramiba(-bot)?" => "" // the only group is the optional "-bot" suffix, not a version, so nothing is reported
4368     ),
4369     "uri" => ""
4370     ),
4371     "rankur" => array(
4372     "icon" => "rankur",
4373     "title" => "Rankur",
4374     "rule" => array(
4375     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4376     ),
4377     "uri" => "http://rankur.com/",
4378     ),
4379 joku 261 "red" => array(
4380     "icon" => "red",
4381     "title" => "RED",
4382     "rule" => array(
4383     "RED[ /]([0-9.]{1,10})" => "\\1"
4384     ),
4385     "uri" => "http://redbot.org/"
4386 joku 181 ),
4387 joku 63 "rediff" => array(
4388     "icon" => "rediff",
4389 matthys 209 "title" => "Rediff",
4390 joku 63 "rule" => array(
4391     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4392     ),
4393     "uri" => "http://www.rediff.com",
4394     ),
4395     "repia" => array(
4396     "icon" => "robot",
4397     "title" => "Repia",
4398     "rule" => array(
4399     "webmaster@repia\.com" => ""
4400     ),
4401     "uri" => ""
4402     ),
4403     "robotgenius" => array(
4404     "icon" => "robot",
4405     "title" => "Robot Genius",
4406     "rule" => array(
4407     "^robotgenius" => ""
4408     ),
4409     "uri" => "http://robotgenius.net",
4410     ),
4411     "robozilla" => array(
4412     "icon" => "robot",
4413     "title" => "Robozilla",
4414     "rule" => array(
4415     "Robozilla" => ""
4416     ),
4417     "uri" => ""
4418     ),
4419     "rojo" => array(
4420     "icon" => "rojo",
4421     "title" => "Rojo",
4422     "rule" => array(
4423     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4424     ),
4425     "uri" => ""
4426     ),
4427     "rss-atom" => array(
4428     "icon" => "rss",
4429     "title" => "RSS / Atom",
4430     "rule" => array(
4431     "^Apple-PubSub" => "",
4432     "^AppleSyndication" => ""
4433     ),
4434     "uri" => ""
4435     ),
4436     "rssbot" => array(
4437     "icon" => "rss",
4438 matthys 209 "title" => "RSS-bot",
4439 joku 63 "rule" => array(
4440     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4441     ),
4442     "uri" => ""
4443     ),
4444     "rssbandit" => array(
4445     "icon" => "rssbandit",
4446     "title" => "RssBandit",
4447     "rule" => array(
4448     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4449     ),
4450     "uri" => ""
4451     ),
4452     "rssimages" => array(
4453     "icon" => "rss",
4454 matthys 209 "title" => "RssImages",
4455 joku 63 "rule" => array(
4456     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4457     ),
4458     "uri" => ""
4459     ),
4460     "rssmicro" => array(
4461     "icon" => "rssmicro",
4462     "title" => "RSSMicro",
4463     "rule" => array(
4464     "RSSMicro\.com" => ""
4465     ),
4466     "uri" => "http://www.rssmicro.com"
4467     ),
4468     "rssowl" => array(
4469     "icon" => "rssowl",
4470     "title" => "RSSOwl",
4471     "rule" => array(
4472     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4473     ),
4474     "uri" => ""
4475     ),
4476     "rssreader" => array( // matched on "RssReader" followed by a version number
4477     "icon" => "rss",
4478     "title" => "RssReader",
4479     "rule" => array(
4480     "RssReader[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of dropping it
4481     ),
4482     "uri" => ""
4483     ),
4484     "rtgi" => array(
4485     "icon" => "rtgi",
4486 matthys 209 "title" => "Rtgi",
4487 joku 63 "rule" => array(
4488     "RTGI" => ""
4489     ),
4490     "uri" => "http://rtgi.fr/"
4491     ),
4492     "rufusbot" => array(
4493     "icon" => "robot",
4494     "title" => "RufusBot",
4495     "rule" => array(
4496     "RufusBot" => ""
4497     ),
4498     "uri" => ""
4499     ),
4500     "runnk" => array(
4501     "icon" => "robot",
4502     "title" => "Runnk",
4503     "rule" => array(
4504     "Runnk RSS finder" => ""
4505     ),
4506     "uri" => "http://www.runnk.com/il/law"
4507     ),
4508     "sagool" => array(
4509     "icon" => "robot",
4510     "title" => "Sagool",
4511     "rule" => array(
4512     "MaSagool" => ""
4513     ),
4514     "uri" => "http://sagool.jp/"
4515     ),
4516     "sanszbot" => array(
4517     "icon" => "robot",
4518     "title" => "Sansz",
4519     "rule" => array(
4520     "SanszBot" => ""
4521     ),
4522     "uri" => ""
4523     ),
4524     "saucereader" => array(
4525     "icon" => "saucereader",
4526     "title" => "Sauce Reader",
4527     "rule" => array(
4528     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4529     ),
4530     "uri" => ""
4531     ),
4532     "sbider" => array(
4533     "icon" => "sbider",
4534     "title" => "SBIder",
4535     "rule" => array(
4536     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4537     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4538     ),
4539     "uri" => ""
4540     ),
4541     "scirus" => array(
4542     "icon" => "robot",
4543     "title" => "Scirus",
4544     "rule" => array(
4545     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4546     ),
4547     "uri" => ""
4548     ),
4549     "scoutjet" => array(
4550     "icon" => "scoutjet",
4551     "title" => "ScoutJet",
4552     "rule" => array(
4553     "ScoutJet" => ""
4554     ),
4555     "uri" => "http://www.scoutjet.com/"
4556     ),
4557 joku 261 "scrapy" => array(
4558     "icon" => "scrapy",
4559     "title" => "Scrapy",
4560     "rule" => array(
4561     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4562     ),
4563     "uri" => "http://scrapy.org"
4564     ),
4565 joku 63 "scrubby" => array(
4566     "icon" => "scrubby",
4567     "title" => "Scrubby",
4568     "rule" => array(
4569     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4570     ),
4571     "uri" => ""
4572     ),
4573     "sdm" => array(
4574     "icon" => "sdm",
4575     "title" => "SUN Download Manager",
4576     "rule" => array(
4577     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4578     ),
4579     "uri" => ""
4580     ),
4581     "sealinks" => array(
4582     "icon" => "robot",
4583     "title" => "Sea Links",
4584     "rule" => array(
4585     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4586     ),
4587     "uri" => ""
4588     ),
4589     "search17" => array(
4590     "icon" => "robot",
4591     "title" => "Search 17",
4592     "rule" => array(
4593     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4594     ),
4595     "uri" => "http://www.search17.com/bot.php"
4596     ),
4597     "search2" => array(
4598     "icon" => "search2",
4599     "title" => "Search2.net",
4600     "rule" => array(
4601     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4602     ),
4603     "uri" => "http://search2.net/"
4604     ),
4605     "searchbot" => array(
4606     "icon" => "robot",
4607     "title" => "Searchbot",
4608     "rule" => array(
4609     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4610     ),
4611     "uri" => ""
4612     ),
4613     "searchch" => array(
4614     "icon" => "robot",
4615     "title" => "Search.ch",
4616     "rule" => array(
4617     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4618     ),
4619     "uri" => ""
4620     ),
4621     "searchengineworld" => array(
4622     "icon" => "robot",
4623     "title" => "SearchEngineWorld",
4624     "rule" => array(
4625     "searchengineworld" => ""
4626     ),
4627     "uri" => "http://www.searchengineworld.com/"
4628     ),
4629     "searchhippo" => array(
4630     "icon" => "searchhippo",
4631     "title" => "Searchhippo",
4632     "rule" => array(
4633     "searchhippo" => ""
4634     ),
4635     "uri" => "http://www.searchhippo.com/"
4636     ),
4637     "searchthruus" => array(
4638     "icon" => "robot",
4639     "title" => "SearchThruUs",
4640     "rule" => array(
4641     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4642     ),
4643     "uri" => ""
4644     ),
4645     "securecomputing" => array(
4646     "icon" => "robot",
4647     "title" => "Secure Computing",
4648     "rule" => array(
4649     "securecomputing" => ""
4650     ),
4651     "uri" => ""
4652     ),
4653     "seekport" => array(
4654     "icon" => "seekport",
4655     "title" => "Seekport",
4656     "rule" => array(
4657     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4658     ),
4659     "uri" => ""
4660     ),
4661     "semanticdiscovery" => array(
4662     "icon" => "robot",
4663     "title" => "Semantic Discovery",
4664     "rule" => array(
4665     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4666     ),
4667     "uri" => ""
4668     ),
4669     "sengine" => array(
4670     "icon" => "sengine",
4671     "title" => "Sengine",
4672     "rule" => array(
4673     "netEstate NE Crawler" => ""
4674     ),
4675     "uri" => "http://www.sengine.info/"
4676     ),
4677     "sensis" => array(
4678     "icon" => "sensis",
4679     "title" => "Sensis",
4680     "rule" => array(
4681     "^Sensis(.com.au)? Web Crawler" => ""
4682     ),
4683     "uri" => "http://sensis.com.au"
4684     ),
4685     "seokicks" => array(
4686     "icon" => "seokicks",
4687     "title" => "SEOkicks",
4688     "rule" => array(
4689     "SEOkicks-Robot" => ""
4690     ),
4691     "uri" => "http://www.seokicks.de/"
4692     ),
4693     "seoprofiler" => array(
4694     "icon" => "seoprofiler",
4695     "title" => "SEOprofiler",
4696     "rule" => array(
4697     "spbot[ /]([0-9.]{1,10})" => "\\1"
4698     ),
4699     "uri" => "http://www.seoprofiler.com/"
4700     ),
4701     "setooz" => array(
4702     "icon" => "setooz",
4703     "title" => "Setooz",
4704     "rule" => array(
4705     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4706     ),
4707     "uri" => "http://www.setooz.com/oozbot.html"
4708     ),
4709     "seznam" => array(
4710     "icon" => "seznam",
4711     "title" => "Seznam",
4712     "rule" => array(
4713     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4714     "Seznam" => ""
4715     ),
4716     "uri" => "http://www.seznam.cz"
4717     ),
4718     "sharpreader" => array(
4719     "icon" => "sharpreader",
4720     "title" => "SharpReader",
4721     "rule" => array(
4722     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4723     ),
4724     "uri" => ""
4725     ),
"shelob" => array(
  // Detection entry for user agents starting with "Shelob".
  // The title used to read "Sherlock Spider", the same label as the separate
  // "sherlockspider" entry, so the two could not be told apart by title.
  // NOTE(review): "Shelob" chosen to match the key/icon/rule - confirm wording.
  "icon" => "shelob",
  "title" => "Shelob",
  "rule" => array(
    "^Shelob" => ""
  ),
  "uri" => "http://www.gmx.net"
),
4734     "sherlockspider" => array(
4735     "icon" => "robot",
4736     "title" => "Sherlock Spider",
4737     "rule" => array(
4738     "sherlock_spider" => ""
4739     ),
4740     "uri" => ""
4741     ),
4742     "shim" => array(
4743     "icon" => "robot",
4744     "title" => "Shim Crawler",
4745     "rule" => array(
4746     "shim[ \-]crawler" => ""
4747     ),
4748     "uri" => ""
4749     ),
4750     "shopwiki" => array(
4751     "icon" => "shopwiki",
4752     "title" => "ShopWiki",
4753     "rule" => array(
4754     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4755     ),
4756     "uri" => ""
4757     ),
4758     "shoula" => array(
4759     "icon" => "robot",
4760     "title" => "Shoula",
4761     "rule" => array(
4762     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4763     ),
4764     "uri" => "http://www.shoula.com"
4765     ),
4766     "siege" => array(
4767     "icon" => "robot",
4768     "title" => "Siege",
4769     "rule" => array(
4770     "Siege[ /]([0-9.]{1,10})" => "\\1"
4771     ),
4772     "uri" => ""
4773     ),
4774     "siets" => array(
4775     "icon" => "robot",
4776     "title" => "Siets",
4777     "rule" => array(
4778     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4779     ),
4780     "uri" => ""
4781     ),
4782     "simpy" => array(
4783     "icon" => "simpy",
4784     "title" => "Simpy",
4785     "rule" => array(
4786     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4787     ),
4788     "uri" => ""
4789     ),
4790     "singingfish" => array(
4791     "icon" => "singingfish",
4792     "title" => "SingingFish",
4793     "rule" => array(
4794     "asterias[ /]([0-9.]{1,10})" => "\\1",
4795     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4796     "asterias" => ""
4797     ),
4798     "uri" => ""
4799     ),
4800     "sirketce" => array(
4801     "icon" => "robot",
4802     "title" => "Sirketce",
4803     "rule" => array(
4804     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4805     ),
4806     "uri" => "http://www.sirketce.com/bot.html"
4807     ),
4808     "sirobot" => array(
4809     "icon" => "robot",
4810     "title" => "SiroBot",
4811     "rule" => array(
4812     "sirobot" => ""
4813     ),
4814     "uri" => ""
4815     ),
4816     "sistrix" => array(
4817     "icon" => "sistrix",
4818     "title" => "SISTRIX",
4819     "rule" => array(
4820     "SISTRIX Crawler" => ""
4821     ),
4822     "uri" => "http://crawler.sistrix.net/"
4823     ),
4824     "sitebar" => array(
4825     "icon" => "sitebar",
4826     "title" => "SiteBar",
4827     "rule" => array(
4828     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
4829     ),
4830     "uri" => ""
4831     ),
4832     "sitebot" => array(
4833     "icon" => "sitebot",
4834     "title" => "SiteBot",
4835     "rule" => array(
4836     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
4837     ),
4838     "uri" => "http://www.sitebot.org/robot/"
4839     ),
4840 matthys 273 "siteexplorer" => array(
4841     "icon" => "siteexplorer",
4842     "title" => "SiteExplorer",
4843     "rule" => array(
4844     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
4845     ),
4846     "uri" => "http://siteexplorer.info/"
4847     ),
4848 joku 63 "sitesell" => array(
4849     "icon" => "sitesell",
4850     "title" => "SiteSell",
4851     "rule" => array(
4852     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
4853     ),
4854     "uri" => ""
4855     ),
4856     "sitespider" => array(
4857     "icon" => "robot",
4858     "title" => "SiteSpider",
4859     "rule" => array(
4860     "^SiteSpider" => ""
4861     ),
4862     "uri" => ""
4863     ),
4864     "sitesucker" => array(
4865     "icon" => "sitesucker",
4866     "title" => "SiteSucker",
4867     "rule" => array(
4868     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
4869     ),
4870     "uri" => "http://www.sitesucker.us/"
4871     ),
4872     "sitidi" => array(
4873     "icon" => "robot",
4874     "title" => "SitiDi",
4875     "rule" => array(
4876     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
4877     ),
4878     "uri" => ""
4879     ),
4880     "skaffe" => array(
4881     "icon" => "robot",
4882     "title" => "Skaffe",
4883     "rule" => array(
4884     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
4885     ),
4886     "uri" => "http://www.skaffe.com"
4887     ),
4888     "skizzle" => array(
4889     "icon" => "skizzle",
4890     "title" => "Skizzle",
4891     "rule" => array(
4892     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
4893     ),
4894     "uri" => "http://www.skizzle.com"
4895     ),
4896     "slider" => array(
4897     "icon" => "robot",
4898     "title" => "Slider",
4899     "rule" => array(
4900     "^Slider[ /]([0-9.]{1,10})" => "\\1"
4901     ),
4902     "uri" => ""
4903     ),
4904     "slugch" => array(
4905     "icon" => "robot",
4906 matthys 209 "title" => "Slugch",
4907 joku 63 "rule" => array(
4908     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
4909     ),
4910     "uri" => ""
4911     ),
4912     "smartware" => array(
4913     "icon" => "robot",
4914     "title" => "SmartWareSoft",
4915     "rule" => array(
4916     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
4917     ),
4918     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
4919     ),
4920     "snookit" => array(
4921     "icon" => "snookit",
4922     "title" => "Snookit",
4923     "rule" => array(
4924     "^snookit" => ""
4925     ),
4926     "uri" => "http://www.snookit.com/"
4927     ),
"snoopy" => array(
  // Detection entry for Snoopy. Each rule maps a user-agent regex to the
  // capture group that holds the version string.
  "icon" => "robot",
  "title" => "Snoopy",
  "rule" => array(
    // [^0-9]* replaces a greedy ".+": the greedy form consumed the version
    // itself and left only its final character for the capture group
    // (e.g. "Snoopy v1.2.3" yielded "3" instead of "1.2.3").
    "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1",
    "sna-([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://snoopy.sourceforge.net/"
),
4937     "snyke" => array(
4938     "icon" => "robot",
4939     "title" => "Snyke",
4940     "rule" => array(
4941     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
4942     ),
4943     "uri" => "http://www.snyke.com"
4944     ),
4945     "socialradar" => array(
4946     "icon" => "socialradar",
4947     "title" => "Social Radar",
4948     "rule" => array(
4949     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
4950     ),
4951     "uri" => "http://infegy.com/"
4952     ),
"soegning" => array(
  // Detection entry for the soegning.dk spider.
  // Title repaired from the mis-decoded byte sequence "SÃ¸gning".
  // NOTE(review): assumes this file is stored and emitted as UTF-8 - confirm.
  "icon" => "soegning",
  "title" => "Søgning",
  "rule" => array(
    "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4961     "soft411" => array(
4962     "icon" => "soft411",
4963     "title" => "Soft411",
4964     "rule" => array(
4965     "SOFT411 Directory" => ""
4966     ),
4967     "uri" => ""
4968     ),
4969     "sogou" => array(
4970     "icon" => "sogou",
4971     "title" => "Sogou",
4972     "rule" => array(
4973     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
4974     ),
4975     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
4976     ),
4977     "sohu" => array(
4978     "icon" => "robot",
4979     "title" => "Sohu",
4980     "rule" => array(
4981     "sohu[ \-](agent|search)" => ""
4982     ),
4983     "uri" => ""
4984     ),
"somewhere" => array(
  // Detection entry for agents identifying as "Mozilla@somewhere.com".
  "icon" => "robot",
  "title" => "Somewhere.com",
  "rule" => array(
    // The pattern defines no capture group, so the note must be empty;
    // it used to be "\\1", which referenced a group that does not exist.
    "Mozilla\@somewhere\.com" => ""
  ),
  "uri" => "http://www.somewhere.com/"
),
4993     "sopheus" => array(
4994     "icon" => "robot",
4995     "title" => "Sopheus",
4996     "rule" => array(
4997     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
4998     ),
4999     "uri" => "http://www.thenetplanet.com"
5000     ),
5001     "soso" => array(
5002     "icon" => "soso",
5003     "title" => "Soso",
5004     "rule" => array(
5005     "^Soso(image)?spider" => ""
5006     ),
5007     "uri" => "http://help.soso.com/soso-image-spider.htm"
5008     ),
5009     "souppot" => array(
5010     "icon" => "robot",
5011     "title" => "SoupPot",
5012     "rule" => array(
5013     "SoupPotBot" => ""
5014     ),
5015     "uri" => ""
5016     ),
5017     "specificmedia" => array(
5018     "icon" => "specificmedia",
5019     "title" => "Specific Media",
5020     "rule" => array(
5021     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5022     ),
5023     "uri" => ""
5024     ),
5025     "sphider" => array(
5026     "icon" => "sphider",
5027     "title" => "Sphider",
5028     "rule" => array(
5029     "Sphider" => ""
5030     ),
5031     "uri" => "http://www.sphider.eu"
5032     ),
5033     "spinn3r" => array(
5034     "icon" => "robot",
5035     "title" => "Spinn3r",
5036     "rule" => array(
5037     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5038     ),
5039     "uri" => "http://spinn3r.com/robot"
5040     ),
5041     "sproose" => array(
5042     "icon" => "robot",
5043 matthys 209 "title" => "Sproose",
5044 joku 63 "rule" => array(
5045     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5046     ),
5047     "uri" => "http://www.sproose.com/bot.html"
5048     ),
5049     "spurlbot" => array(
5050     "icon" => "robot",
5051     "title" => "SpurlBot",
5052     "rule" => array(
5053     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5054     ),
5055     "uri" => ""
5056     ),
5057     "stardownloader" => array(
5058     "icon" => "stardownloader",
5059     "title" => "Star Downloader",
5060     "rule" => array(
5061     "^Star Downloader( Pro)?" => ""
5062     ),
5063     "uri" => ""
5064     ),
5065     "steeler" => array(
5066     "icon" => "robot",
5067     "title" => "Steeler",
5068     "rule" => array(
5069     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5070     ),
5071     "uri" => ""
5072     ),
5073     "strategicboard" => array(
5074     "icon" => "strategicboard",
5075     "title" => "Strategic Board",
5076     "rule" => array(
5077     "Strategic Board Bot" => ""
5078     ),
5079     "uri" => "http://www.strategicboard.com"
5080     ),
5081     "suchbaer" => array(
5082     "icon" => "robot",
5083 matthys 209 "title" => "Suchbaer.de",
5084 joku 63 "rule" => array(
5085     "^suchbaer\.de" => ""
5086     ),
5087     "uri" => "http://www.suchbaer.de/"
5088     ),
5089     "suchbot" => array(
5090     "icon" => "robot",
5091 matthys 209 "title" => "Suchbot",
5092 joku 63 "rule" => array(
5093     "^suchbot" => ""
5094     ),
5095     "uri" => ""
5096     ),
5097     "suchende" => array(
5098     "icon" => "suchende",
5099 matthys 209 "title" => "Suchen.de",
5100 joku 63 "rule" => array(
5101     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5102     "^gonzo/([0-9.]{1,10})" => "\\1"
5103     ),
5104     "uri" => "http://www.suchen.de/"
5105     ),
5106     "suchknecht" => array(
5107     "icon" => "robot",
5108     "title" => "Suchknecht",
5109     "rule" => array(
5110     "^Suchknecht.at-Robot" => ""
5111     ),
5112     "uri" => "http://www.suchknecht.at/"
5113     ),
5114     "suchpad" => array(
5115     "icon" => "robot",
5116 matthys 209 "title" => "Suchpad",
5117 joku 63 "rule" => array(
5118     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5119     ),
5120     "uri" => "http://www.suchpad.de"
5121     ),
5122     "sunrise" => array(
5123     "icon" => "sunrise",
5124     "title" => "Sunrise",
5125     "rule" => array(
5126     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5127     ),
5128     "uri" => ""
5129     ),
5130     "superbot" => array(
5131     "icon" => "superbot",
5132     "title" => "SuperBot",
5133     "rule" => array(
5134     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5135     ),
5136     "uri" => ""
5137     ),
5138     "surfcontrol" => array(
5139     "icon" => "robot",
5140     "title" => "SurfControl",
5141     "rule" => array(
5142     "SurfControl" => "",
5143     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5144     ),
5145     "uri" => ""
5146     ),
5147     "surfnet" => array(
5148     "icon" => "robot",
5149     "title" => "SURFnet",
5150     "rule" => array(
5151     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5152     ),
5153     "uri" => ""
5154     ),
5155     "surfsafely" => array(
5156     "icon" => "robot",
5157     "title" => "Surfsafely",
5158     "rule" => array(
5159     "Submission Spider at surfsafely.com" => ""
5160     ),
5161     "uri" => "http://www.surfsafely.com"
5162     ),
"surphace" => array(
  // Detection entry for Surphace (previously called Sphere Scout, hence the icon).
  "icon" => "spherescout",
  "title" => "Surphace",
  "rule" => array(
    // [^0-9]* replaces a greedy ".+", which swallowed the version and left
    // only its last character for the capture group.
    "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout
    // Greedy ".+" is fine here: the literal "v" anchors the start of the version.
    "Surphace.+v([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.surphace.com"
),
5172     "surveybot" => array(
5173     "icon" => "surveybot",
5174     "title" => "Whois Survey",
5175     "rule" => array(
5176     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5177     ),
5178     "uri" => ""
5179     ),
5180     "swoogle" => array(
5181     "icon" => "robot",
5182     "title" => "Swoogle",
5183     "rule" => array(
5184     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5185     ),
5186     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5187     ),
5188     "swse" => array(
5189     "icon" => "robot",
5190     "title" => "SWSE",
5191     "rule" => array(
5192     "sw\.deri\.org" => ""
5193     ),
5194     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5195     ),
5196     "swish-e" => array(
5197     "icon" => "swish-e",
5198     "title" => "Swish-e",
5199     "rule" => array(
5200     "^swish-e" => ""
5201     ),
5202     "uri" => "http://swish-e.org/"
5203     ),
5204     "sygol" => array(
5205     "icon" => "sygol",
5206     "title" => "Sygol",
5207     "rule" => array(
5208     "www.sygol.(com|net)" => ""
5209     ),
5210     "uri" => "http://www.sygol.com"
5211     ),
5212     "syllabs" => array(
5213     "icon" => "syllabs",
5214     "title" => "Syllabs",
5215     "rule" => array(
5216     "Focal[-]([0-9.]{1,10})" => "\\1"
5217     ),
5218     "uri" => "http://www.syllabs.com/crawler.html"
5219     ),
5220     "synapse" => array(
5221     "icon" => "robot",
5222     "title" => "Synapse",
5223     "rule" => array(
5224     " Synapse\)" => ""
5225     ),
5226     "uri" => "http://ws.apache.org/synapse/"
5227     ),
5228     "sync2it" => array(
5229     "icon" => "robot",
5230 matthys 209 "title" => "Sync2it",
5231 joku 63 "rule" => array(
5232     "^\!Susie" => ""
5233     ),
5234     "uri" => "http://www.sync2it.com/bms/susie.php"
5235     ),
5236     "syncit" => array(
5237     "icon" => "robot",
5238 matthys 209 "title" => "Syncit",
5239 joku 63 "rule" => array(
5240     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5241     ),
5242     "uri" => "http://www.syncit.com/"
5243     ),
5244     "syndic8" => array(
5245     "icon" => "syndic8",
5246     "title" => "Syndic8",
5247     "rule" => array(
5248     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5249     ),
5250     "uri" => "http://www.syndic8.com/"
5251     ),
5252     "syndicatie" => array(
5253     "icon" => "robot",
5254     "title" => "Syndicatie.nl",
5255     "rule" => array(
5256     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5257     "Syndicatie\.nl robot;" => ""
5258     ),
5259     "uri" => ""
5260     ),
5261     "synomia" => array(
5262     "icon" => "robot",
5263     "title" => "Synomia",
5264     "rule" => array(
5265     "^SynoBot" => ""
5266     ),
5267     "uri" => ""
5268     ),
5269     "synoo" => array(
5270     "icon" => "robot",
5271     "title" => "SynooBot",
5272     "rule" => array(
5273     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5274     ),
5275     "uri" => ""
5276     ),
5277     "szukacz" => array(
5278     "icon" => "szukacz",
5279     "title" => "Szukacz",
5280     "rule" => array(
5281     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5282     ),
5283     "uri" => ""
5284     ),
5285     "tagoo" => array(
5286     "icon" => "tagoobot",
5287     "title" => "Tagoo",
5288     "rule" => array(
5289     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5290     ),
5291     "uri" => "http://www.tagoo.ru"
5292     ),
5293     "tagword" => array(
5294     "icon" => "tagword",
5295     "title" => "Tagword",
5296     "rule" => array(
5297     "^Tagword" => ""
5298     ),
5299     "uri" => "http://tagword.com/dmoz_survey.php"
5300     ),
5301     "trailfire" => array(
5302     "icon" => "trailfire",
5303     "title" => "Trailfire",
5304     "rule" => array(
5305     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5306     ),
5307     "uri" => "http://trailfire.com"
5308     ),
5309     "tamu" => array(
5310     "icon" => "tamu",
5311     "title" => "Tamu Crawler",
5312     "rule" => array(
5313     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5314     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5315     ),
5316     "uri" => "http://irl.cs.tamu.edu/crawler/"
5317     ),
5318     "taptubot" => array(
5319     "icon" => "taptubot",
5320     "title" => "Taptu",
5321     "rule" => array(
5322     "taptubot" => ""
5323     ),
5324     "uri" => "http://www.taptu.com/corp/taptubot"
5325     ),
5326     "targetseek" => array(
5327     "icon" => "robot",
5328     "title" => "TargetSeek",
5329     "rule" => array(
5330     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5331     ),
5332     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5333     ),
5334     "taw" => array(
5335     "icon" => "taw",
5336     "title" => "TAW",
5337     "rule" => array(
5338     "TAW[ /]([0-9.]{1,10})" => "\\1"
5339     ),
5340     "uri" => "http://www.tawdis.net"
5341     ),
5342     "tcd" => array(
5343     "icon" => "tcd",
5344     "title" => "Trinity College Dublin",
5345     "rule" => array(
5346     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5347     ),
5348     "uri" => "http://www.tcd.ie"
5349     ),
5350     "technorati" => array(
5351     "icon" => "technorati",
5352     "title" => "Technorati",
5353     "rule" => array(
5354     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5355     ),
5356     "uri" => ""
5357     ),
5358     "teleport" => array(
5359     "icon" => "teleport",
5360     "title" => "Teleport",
5361     "rule" => array(
5362     "Teleport[ \-]?Pro" => ""
5363     ),
5364     "uri" => ""
5365     ),
5366     "terrar" => array(
5367     "icon" => "robot",
5368     "title" => "Terrar",
5369     "rule" => array(
5370     "^Fresh Search :: Terrar" => ""
5371     ),
5372     "uri" => ""
5373     ),
5374     "theophrastus" => array(
5375     "icon" => "robot",
5376     "title" => "Theophrastus",
5377     "rule" => array(
5378     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5379     ),
5380     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5381     ),
5382     "thumbnailscz" => array(
5383     "icon" => "robot",
5384 matthys 209 "title" => "Thumbnails.cz",
5385 joku 63 "rule" => array(
5386     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5387     ),
5388     "uri" => ""
5389     ),
"thumbshot" => array(
  // Detection entry for the thumbshots(-de) robot.
  "icon" => "robot",
  "title" => "Thumbshots",
  "rule" => array(
    // Group 1 is only the "Version: " / "v" prefix; the version digits are in
    // group 2, so the note must be "\\2" (it used to be "\\1").
    "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2",
    "^thumbshots-de" => ""
  ),
  "uri" => "http://www.thumbshots.de"
),
5399     "thunderstone" => array(
5400     "icon" => "thunderstone",
5401     "title" => "Thunderstone",
5402     "rule" => array(
5403     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5404     "search.thunderstone.com" => ""
5405     ),
5406     "uri" => "http://search.thunderstone.com/"
5407     ),
5408     "timbobot" => array(
5409     "icon" => "robot",
5410 matthys 209 "title" => "TimboBot",
5411 joku 63 "rule" => array(
5412     "timboBot" => ""
5413     ),
5414     "uri" => ""
5415     ),
5416     "topsy" => array(
5417     "icon" => "topsy",
5418     "title" => "Topsy",
5419     "rule" => array(
5420     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5421     ),
5422     "uri" => "http://labs.topsy.com/butterfly.html"
5423     ),
5424     "trayce" => array(
5425     "icon" => "robot",
5426 matthys 209 "title" => "Trayce",
5427 joku 63 "rule" => array(
5428     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5429     ),
5430     "uri" => ""
5431     ),
5432     "tricus" => array(
5433     "icon" => "robot",
5434     "title" => "Tricus",
5435     "rule" => array(
5436     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5437     ),
5438     "uri" => ""
5439     ),
5440     "topicblogs" => array(
5441     "icon" => "robot",
5442     "title" => "Topicblogs",
5443     "rule" => array(
5444     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5445     ),
5446     "uri" => ""
5447     ),
"touche" => array(
  // Detection entry for user agents starting with "Touche".
  // Title repaired from the mis-decoded byte sequence "TouchÃ©".
  // NOTE(review): assumes this file is stored and emitted as UTF-8 - confirm.
  "icon" => "touche",
  "title" => "Touché",
  "rule" => array(
    "^Touche" => ""
  ),
  "uri" => "http://touche.com.ve"
),
"tuezilla" => array(
  // Detection entry for the tuezilla.de agent.
  // Title repaired from the mis-decoded byte sequence "TÃœzilla", which
  // decodes to a capital U-umlaut.
  // NOTE(review): the intended spelling may be "Tüzilla" (lowercase umlaut),
  // and this assumes the file is stored/emitted as UTF-8 - confirm both.
  "icon" => "robot",
  "title" => "TÜzilla",
  "rule" => array(
    "tuezilla.de" => ""
  ),
  "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
),
5464     "turnitin" => array(
5465     "icon" => "turnitin",
5466     "title" => "Turnitin",
5467     "rule" => array(
5468     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5469     ),
5470     "uri" => ""
5471     ),
5472     "tutorgig" => array(
5473     "icon" => "robot",
5474     "title" => "TutorGig",
5475     "rule" => array(
5476     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5477     ),
5478     "uri" => ""
5479     ),
5480     "twiceler" => array(
5481     "icon" => "cuill",
5482 matthys 209 "title" => "Cuill",
5483 joku 63 "rule" => array(
5484     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5485     "Twiceler" => ""
5486     ),
5487     "uri" => "http://www.cuill.com/twiceler/robot.html"
5488     ),
5489     "twingly" => array(
5490     "icon" => "twingly",
5491     "title" => "Twingly",
5492     "rule" => array(
5493     "Twingly Recon" => ""
5494     ),
5495     "uri" => "http://www.twingly.com/"
5496     ),
5497     "typepad" => array(
5498     "icon" => "typepad",
5499     "title" => "TypePad",
5500     "rule" => array(
5501     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5502     ),
5503     "uri" => ""
5504     ),
5505     "udmsearch" => array(
5506     "icon" => "robot",
5507     "title" => "UdmSearch",
5508     "rule" => array(
5509     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5510     ),
5511     "uri" => ""
5512     ),
5513     "ukwizz" => array(
5514     "icon" => "ukwizz",
5515     "title" => "UKWizz",
5516     "rule" => array(
5517     "^Mackster.*ukwizz" => ""
5518     ),
5519     "uri" => "http://www.ukwizz.com"
5520     ),
5521     "ultraseek" => array(
5522     "icon" => "robot",
5523     "title" => "Ultraseek",
5524     "rule" => array(
5525     "Ultraseek" => ""
5526     ),
5527     "uri" => ""
5528     ),
5529     "ultraspider" => array(
5530     "icon" => "robot",
5531     "title" => "UltraSpider",
5532     "rule" => array(
5533     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5534     ),
5535     "uri" => "http://www.search.ch"
5536     ),
5537     "umai" => array(
5538     "icon" => "robot",
5539 matthys 209 "title" => "Umai",
5540 joku 63 "rule" => array(
5541     "umai[/ ]([0-9.]{1,10})" => "\\1"
5542     ),
5543     "uri" => ""
5544     ),
5545     "unchaos" => array(
5546     "icon" => "robot",
5547     "title" => "Unchaos",
5548     "rule" => array(
5549     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5550     "unchaos" => ""
5551     ),
5552     "uri" => ""
5553     ),
"unido" => array(
  // Detection entry for user agents starting with "unido-bot".
  "icon" => "robot",
  "title" => "UNIdo",
  "rule" => array(
    // The pattern defines no capture group, so the note must be empty;
    // it used to be "\\1", which referenced a group that does not exist.
    "^unido-bot" => ""
  ),
  "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
),
5562     "updated" => array(
5563     "icon" => "robot",
5564     "title" => "Updated",
5565     "rule" => array(
5566     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5567     ),
5568     "uri" => ""
5569     ),
5570     "uptimebot" => array(
5571     "icon" => "robot",
5572     "title" => "UptimeBot",
5573     "rule" => array(
5574     "^UptimeBot" => ""
5575     ),
5576     "uri" => "http://www.uptimebot.com/"
5577     ),
5578     "urifetch" => array(
5579     "icon" => "robot",
5580     "title" => "URI::Fetch",
5581     "rule" => array(
5582     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5583     ),
5584     "uri" => ""
5585     ),
5586     "urlbase" => array(
5587     "icon" => "robot",
5588     "title" => "URLBase",
5589     "rule" => array(
5590     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5591     ),
5592     "uri" => ""
5593     ),
5594     "urlblaze" => array(
5595     "icon" => "robot",
5596     "title" => "URLBlaze",
5597     "rule" => array(
5598     "^URLBlaze" => ""
5599     ),
5600     "uri" => ""
5601     ),
5602     "urlcontr" => array(
5603     "icon" => "robot",
5604     "title" => "MS URL Control",
5605     "rule" => array(
5606     "Microsoft URL[ \-]?Control" => ""
5607     ),
5608     "uri" => ""
5609     ),
5610     "urlgetfile" => array(
5611     "icon" => "robot",
5612     "title" => "URLGetFile",
5613     "rule" => array(
5614     "^URLGetFile" => ""
5615     ),
5616     "uri" => ""
5617     ),
5618     "urlscope" => array(
5619     "icon" => "robot",
5620     "title" => "UrlScope",
5621     "rule" => array(
5622     "UrlScope" => ""
5623     ),
5624     "uri" => ""
5625     ),
5626     "urltrends" => array(
5627     "icon" => "urltrends",
5628 matthys 209 "title" => "UrlTrends",
5629 joku 63 "rule" => array(
5630     "Snappy/([0-9.]{1,10})" => "\\1",
5631     ),
5632     "uri" => ""
5633     ),
5634     "usww" => array(
5635     "icon" => "usww",
5636 matthys 209 "title" => "USWW",
5637 joku 63 "rule" => array(
5638     "usww\.com" => "",
5639     "Mozilla/5\.0 URL-Spider" => ""
5640     ),
5641     "uri" => "http://www.usww.com/"
5642     ),
5643     "usyd" => array(
5644     "icon" => "robot",
5645     "title" => "USyd-NLP-Spider",
5646     "rule" => array(
5647     "^USyd-NLP-Spider" => ""
5648     ),
5649     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5650     ),
5651     "vagabondo" => array(
5652     "icon" => "wiseguys",
5653     "title" => "WiseGuys",
5654     "rule" => array(
5655     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5656     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5657     ),
5658     "uri" => ""
5659     ),
5660     "unicorn" => array(
5661     "icon" => "w3c",
5662     "title" => "W3C Unicorn",
5663     "rule" => array(
5664     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5665     ),
5666     "uri" => "http://validator.w3.org/unicorn/"
5667     ),
5668     "validator" => array(
5669     "icon" => "w3c",
5670     "title" => "W3C Validator",
5671     "rule" => array(
5672     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5673     ),
5674     "uri" => "http://validator.w3.org/"
5675     ),
"validator.nu" => array(
  // Detection entry for the Validator.nu checker.
  "icon" => "validatornu",
  "title" => "Validator.nu",
  "rule" => array(
    "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
    // The "/LV" form has no capture group, so the note is empty;
    // it used to be "\\1", which referenced a group that does not exist.
    "^Validator.nu/LV" => ""
  ),
  "uri" => "http://validator.nu/"
),
5685     "verity" => array(
5686     "icon" => "robot",
5687     "title" => "Verity",
5688     "rule" => array(
5689     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5690     "^vspider" => ""
5691     ),
5692     "uri" => "http://www.verity.com/"
5693     ),
5694     "versionsproject" => array(
5695     "icon" => "robot",
5696     "title" => "Versions-project",
5697     "rule" => array(
5698     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5699     ),
5700     "uri" => "http://www.versions-project.org/"
5701     ),
5702     "verticalmatch" => array(
5703     "icon" => "robot",
5704     "title" => "VerticalMatch",
5705     "rule" => array(
5706     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5707     ),
5708     "uri" => "http://www.VerticalMatch.com/"
5709     ),
5710     "verzamelgids" => array(
5711     "icon" => "robot",
5712     "title" => "Verzamelgids",
5713     "rule" => array(
5714     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5715     ),
5716     "uri" => "http://www.verzamelgids.nl/"
5717     ),
5718     "vestris" => array(
5719     "icon" => "vestris",
5720     "title" => "Vestris",
5721     "rule" => array(
5722     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5723     ),
5724     "uri" => "http://alkaline.vestris.com/"
5725     ),
5726     "vindex" => array(
5727     "icon" => "vindex",
5728     "title" => "Vindex",
5729     "rule" => array(
5730     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5731     ),
5732     "uri" => ""
5733     ),
5734     "visvo" => array(
5735     "icon" => "robot",
5736     "title" => "Visvo",
5737     "rule" => array(
5738     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5739     ),
5740     "uri" => "http://www.visvo.com"
5741     ),
5742     "voila" => array(
5743     "icon" => "voila",
5744     "title" => "Voila",
5745     "rule" => array(
5746     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5747     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5748     ),
5749     "uri" => ""
5750     ),
5751     "vonna" => array(
5752     "icon" => "robot",
5753     "title" => "Vonna",
5754     "rule" => array(
5755     "Vonna.com b o t" => ""
5756     ),
5757     "uri" => ""
5758     ),
5759     "vortex" => array(
5760     "icon" => "robot",
5761     "title" => "Vortex",
5762     "rule" => array(
5763     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5764     ),
5765     "uri" => "http://marty.anstey.ca/robots/vortex/"
5766     ),
5767     "w3sitesearch" => array(
5768     "icon" => "w3sitesearch",
5769     "title" => "W3SiteSearch",
5770     "rule" => array(
5771     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5772     ),
5773     "uri" => "http://www.w3sitesearch.de"
5774     ),
5775     "wagger" => array(
5776     "icon" => "robot",
5777     "title" => "Wagger",
5778     "rule" => array(
5779     "^Waggr" => ""
5780     ),
5781     "uri" => "http://www.waggr.com/"
5782     ),
5783     "wanadoo" => array(
5784     "icon" => "robot",
5785     "title" => "Wanadoo",
5786     "rule" => array(
5787     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5788     ),
5789     "uri" => "http://www.wanadoo.fr/"
5790     ),
5791     "wapalizer" => array(
5792     "icon" => "robot",
5793     "title" => "Wapalizer",
5794     "rule" => array(
5795     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5796     ),
5797     "uri" => "http://www.wapdrive.com/"
5798     ),
5799     "watson" => array(
5800     "icon" => "addy",
5801     "title" => "Dr.Watson",
5802     "rule" => array(
5803     "Watson[ /]([0-9.]{1,10})" => "\\1",
5804     "watson\.addy\.com" => ""
5805     ),
5806     "uri" => ""
5807     ),
5808     "wavefire" => array(
5809     "icon" => "robot",
5810     "title" => "Wavefire",
5811     "rule" => array(
5812     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
5813     ),
5814     "uri" => ""
5815     ),
5816     "waypath" => array(
5817     "icon" => "waypath",
5818     "title" => "Waypath",
5819     "rule" => array(
5820     "Waypath[ \-]?Scout" => "",
5821     "Waypath (development )?crawler" => ""
5822     ),
5823     "uri" => ""
5824     ),
5825     "wauuu" => array( // Detection entry for the Wauuu robot
5826     "icon" => "wauuu",
5827     "title" => "Wauuu",
5828     "rule" => array( // pattern => version reference (backreference into the pattern's capture groups)
5829     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the version is the pattern's only capture group, so it is \1 (was \2, which does not exist)
5830     ),
5831     "uri" => "http://www.wauuu.com"
5832     ),
5833     "wdg" => array(
5834     "icon" => "wdg",
5835     "title" => "WDG Validator",
5836     "rule" => array(
5837     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
5838     ),
5839     "uri" => "http://www.htmlhelp.com/tools/validator/"
5840     ),
5841     "webagogo" => array(
5842     "icon" => "webagogo",
5843     "title" => "Webagogo",
5844     "rule" => array(
5845     "^Webagogo" => ""
5846     ),
5847     "uri" => "http://www.webagogo.be/"
5848     ),
5849     "webalta" => array(
5850     "icon" => "webalta",
5851     "title" => "WebAlta",
5852     "rule" => array(
5853     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
5854     ),
5855     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
5856     ),
5857     "webdigity" => array(
5858     "icon" => "robot",
5859     "title" => "Webdigity Whois Service",
5860     "rule" => array(
5861     "^webdigity whois service" => ""
5862     ),
5863     "uri" => "http://www.webdigity.com/ws"
5864     ),
5865     "webelixir" => array(
5866     "icon" => "webelixir",
5867     "title" => "Webelixir",
5868     "rule" => array(
5869     "^webelixir" => ""
5870     ),
5871     "uri" => "http://www.webelixir.net/"
5872     ),
5873     "webbotru" => array(
5874     "icon" => "robot",
5875     "title" => "Webbot.ru",
5876     "rule" => array(
5877     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
5878     ),
5879     "uri" => "http://www.webbot.ru/bot.html"
5880     ),
5881     "webcapture" => array(
5882     "icon" => "robot",
5883     "title" => "WebCapture",
5884     "rule" => array(
5885     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
5886     ),
5887     "uri" => ""
5888     ),
5889     "webcollage" => array(
5890     "icon" => "robot",
5891     "title" => "Webcollage",
5892     "rule" => array(
5893     "webcollage" => ""
5894     ),
5895     "uri" => ""
5896     ),
5897     "webcopier" => array(
5898     "icon" => "webcopier",
5899     "title" => "WebCopier",
5900     "rule" => array(
5901     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
5902     ),
5903     "uri" => ""
5904     ),
5905     "webcorp" => array(
5906     "icon" => "webcorp",
5907     "title" => "WebCorp",
5908     "rule" => array(
5909     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
5910     ),
5911     "uri" => "http://www.webcorp.org.uk/"
5912     ),
5913     "webcrawl" => array(
5914     "icon" => "robot",
5915     "title" => "WebCrawl",
5916     "rule" => array(
5917     "webcrawl\.net" => ""
5918     ),
5919     "uri" => ""
5920     ),
5921     "webdownloader" => array(
5922     "icon" => "robot",
5923     "title" => "Web Downloader",
5924     "rule" => array(
5925     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
5926     ),
5927     "uri" => ""
5928     ),
5929     "webfetch" => array(
5930     "icon" => "robot",
5931 matthys 209 "title" => "WebFetch",
5932 joku 63 "rule" => array(
5933     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
5934     ),
5935     "uri" => ""
5936     ),
5937     "webfind" => array(
5938     "icon" => "robot",
5939 matthys 209 "title" => "WebFind",
5940 joku 63 "rule" => array(
5941     "^WebFindBot" => ""
5942     ),
5943     "uri" => "http://www.web-find.com"
5944     ),
5945     "webglimpse" => array(
5946     "icon" => "robot",
5947     "title" => "Webglimpse",
5948     "rule" => array(
5949     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
5950     ),
5951     "uri" => "http://webglimpse.net"
5952     ),
5953     "webgobbler" => array(
5954     "icon" => "robot",
5955     "title" => "webGobbler",
5956     "rule" => array(
5957     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
5958     ),
5959     "uri" => ""
5960     ),
5961     "webimages" => array(
5962     "icon" => "webimages",
5963     "title" => "WebImages",
5964     "rule" => array(
5965     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
5966     ),
5967     "uri" => "http://herbert.groot.jebbink.nl/"
5968     ),
5969     "weblight" => array(
5970     "icon" => "robot",
5971     "title" => "WebLight",
5972     "rule" => array(
5973     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
5974     ),
5975     "uri" => "http://www.illumit.com/Products/weblight/"
5976     ),
5977     "weblinks" => array(
5978     "icon" => "robot",
5979     "title" => "WebLink's",
5980     "rule" => array(
5981     "^Weblink.s checker" => ""
5982     ),
5983     "uri" => ""
5984     ),
5985     "webmeasurement" => array(
5986     "icon" => "robot",
5987     "title" => "Webmeasurement",
5988     "rule" => array(
5989     "^webmeasurement-bot" => ""
5990     ),
5991     "uri" => "http://rvs.informatik.uni-leipzig.de"
5992     ),
5993     "webminer" => array(
5994     "icon" => "robot",
5995     "title" => "WebMiner",
5996     "rule" => array(
5997     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
5998     ),
5999     "uri" => ""
6000     ),
6001     "webmin" => array(
6002     "icon" => "webmin",
6003     "title" => "Webmin",
6004     "rule" => array(
6005     "^webmin" => ""
6006     ),
6007     "uri" => ""
6008     ),
6009     "webmon" => array(
6010     "icon" => "webmon",
6011     "title" => "Webmon",
6012     "rule" => array(
6013     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6014     ),
6015     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6016     ),
6017     "webox" => array( // Detection entry for the WeBoX robot
6018     "icon" => "robot",
6019     "title" => "WeBoX", // stray leading space removed so the title matches the other entries
6020     "rule" => array( // pattern => version reference (backreference into the pattern's capture groups)
6021     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6022     ),
6023     "uri" => ""
6024     ),
6025     "webpatrol" => array(
6026     "icon" => "webpatrol",
6027     "title" => "WebPatrol",
6028     "rule" => array(
6029     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6030     ),
6031     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6032     ),
6033     "webpix" => array(
6034     "icon" => "webpix",
6035     "title" => "WebPix",
6036     "rule" => array(
6037     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6038     ),
6039     "uri" => ""
6040     ),
6041     "webrace" => array(
6042     "icon" => "robot",
6043     "title" => "WebRACE",
6044     "rule" => array(
6045     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6046     ),
6047     "uri" => ""
6048     ),
6049     "webreaper" => array(
6050     "icon" => "webreaper",
6051     "title" => "WebReaper",
6052     "rule" => array(
6053     "^WebReaper " => ""
6054     ),
6055     "uri" => "http://www.webreaper.net/"
6056     ),
6057     "webresult" => array(
6058     "icon" => "robot",
6059     "title" => "Webresult",
6060     "rule" => array(
6061     "Der webresult\.de Robot" => ""
6062     ),
6063     "uri" => ""
6064     ),
6065     "webring" => array(
6066     "icon" => "robot",
6067     "title" => "Webring Checker",
6068     "rule" => array(
6069     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6070     ),
6071     "uri" => ""
6072     ),
6073     "webripper" => array(
6074     "icon" => "webripper",
6075     "title" => "WebRipper",
6076     "rule" => array(
6077     "^WebRipper" => ""
6078     ),
6079     "uri" => "http://calluna-software.com"
6080     ),
6081     "webscaled" => array(
6082     "icon" => "webscaled",
6083     "title" => "Webscaled",
6084     "rule" => array(
6085     "Swarm" => ""
6086     ),
6087     "uri" => "http://webscaled.com/"
6088     ),
6089     "websearchau" => array(
6090     "icon" => "websearchau",
6091     "title" => "WebSearch.COM.AU",
6092     "rule" => array(
6093     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6094     ),
6095     "uri" => "http://WebSearch.com.au/"
6096     ),
6097     "websearchbench" => array(
6098     "icon" => "robot",
6099     "title" => "WebSearchBench",
6100     "rule" => array(
6101     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6102     ),
6103     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6104     ),
6105     "websense" => array(
6106     "icon" => "websense",
6107     "title" => "Websense",
6108     "rule" => array(
6109     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6110     ),
6111     "uri" => ""
6112     ),
6113     "websiteshadow" => array(
6114     "icon" => "websiteshadow",
6115     "title" => "Websiteshadow",
6116     "rule" => array(
6117     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6118     ),
6119     "uri" => "http://websiteshadow.com"
6120     ),
6121     "websiteworth" => array(
6122     "icon" => "robot",
6123     "title" => "WebsiteWorth",
6124     "rule" => array(
6125     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6126     ),
6127     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6128     ),
6129     "websquash" => array(
6130     "icon" => "websquash",
6131     "title" => "Websquash",
6132     "rule" => array(
6133     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6134     ),
6135     "uri" => ""
6136     ),
6137     "webstripper" => array(
6138     "icon" => "robot",
6139     "title" => "WebStripper",
6140     "rule" => array(
6141     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6142     ),
6143     "uri" => ""
6144     ),
6145     "webzip" => array(
6146     "icon" => "webzip",
6147     "title" => "WebZIP",
6148     "rule" => array(
6149     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6150     ),
6151     "uri" => ""
6152     ),
6153     "wep" => array(
6154     "icon" => "robot",
6155     "title" => "WEP Search",
6156     "rule" => array(
6157     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6158     ),
6159     "uri" => ""
6160     ),
6161     "westwind" => array(
6162     "icon" => "robot",
6163     "title" => "West Wind Internet Protocols",
6164     "rule" => array(
6165     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6166     ),
6167     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6168     ),
6169     "wget" => array(
6170     "icon" => "wget",
6171     "title" => "Wget",
6172     "rule" => array(
6173     "Wget[ /]([0-9.]{1,10})" => "\\1"
6174     ),
6175     "uri" => ""
6176     ),
6177     "whizbang" => array(
6178     "icon" => "whizbang",
6179     "title" => "WhizBang",
6180     "rule" => array(
6181     "WhizBang" => ""
6182     ),
6183     "uri" => "http://www.whizbang.com/crawler/"
6184     ),
6185     "whois" => array(
6186     "icon" => "whois",
6187     "title" => "Who.is",
6188     "rule" => array(
6189     "Who.is Bot" => ""
6190     ),
6191     "uri" => "http://www.who.is/"
6192     ),
6193     "wikiwix" => array(
6194     "icon" => "wikiwix",
6195     "title" => "Wikiwix",
6196     "rule" => array(
6197     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6198     ),
6199     "uri" => "http://www.wikiwix.com/"
6200     ),
6201     "wingflyer" => array(
6202     "icon" => "robot",
6203     "title" => "WingFlyer",
6204     "rule" => array(
6205     "^WebFetch" => ""
6206     ),
6207     "uri" => "http://www.wingflyer.com/"
6208     ),
6209     "wininet" => array(
6210     "icon" => "robot",
6211     "title" => "WinInet",
6212     "rule" => array(
6213     "TeamSoft WinInet Component" => ""
6214     ),
6215     "uri" => "http://www.winsoft.sk/wininet.htm"
6216     ),
6217     "winhttp" => array(
6218     "icon" => "robot",
6219     "title" => "WinHTTP",
6220     "rule" => array(
6221     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6222     ),
6223     "uri" => ""
6224     ),
6225     "wire" => array(
6226     "icon" => "robot",
6227     "title" => "WIRE",
6228     "rule" => array(
6229     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6230     ),
6231     "uri" => ""
6232     ),
6233     "wmp" => array(
6234     "icon" => "robot",
6235     "title" => "WMP",
6236     "rule" => array(
6237     "^WMP" => ""
6238     ),
6239     "uri" => ""
6240     ),
6241     "woozweb" => array(
6242     "icon" => "woozweb",
6243     "title" => "Woozweb",
6244     "rule" => array(
6245     "woozweb" => ""
6246     ),
6247     "uri" => "http://www.woozweb.com/"
6248     ),
6249     "wordchamp" => array(
6250     "icon" => "robot",
6251     "title" => "WordChamp",
6252     "rule" => array(
6253     "^WordChampBot" => ""
6254     ),
6255     "uri" => "http://www.wordchamp.com/"
6256     ),
6257     "wordpress" => array(
6258     "icon" => "wordpress",
6259     "title" => "WordPress",
6260     "rule" => array(
6261     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6262     ),
6263     "uri" => ""
6264     ),
6265     "worio" => array(
6266     "icon" => "worio",
6267     "title" => "Worio",
6268     "rule" => array(
6269     "woriobot" => ""
6270     ),
6271     "uri" => "http://worio.com/"
6272     ),
6273     "worldlight" => array(
6274     "icon" => "worldlight",
6275     "title" => "WorldLight",
6276     "rule" => array(
6277     "^WorldLight" => ""
6278     ),
6279     "uri" => ""
6280     ),
6281     "worqmada" => array(
6282     "icon" => "robot",
6283     "title" => "WorQmada",
6284     "rule" => array(
6285     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6286     ),
6287     "uri" => ""
6288     ),
6289     "wotbox" => array(
6290     "icon" => "wotbox",
6291     "title" => "Wotbox",
6292     "rule" => array(
6293     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6294     ),
6295     "uri" => ""
6296     ),
6297     "wp" => array(
6298     "icon" => "wp",
6299     "title" => "Wirtualna Polska",
6300     "rule" => array(
6301     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6302     ),
6303     "uri" => "http://wp.pl"
6304     ),
6305     "wsb" => array(
6306     "icon" => "robot",
6307     "title" => "WebSearchBench",
6308     "rule" => array(
6309     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6310     "WSB " => ""
6311     ),
6312     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6313     ),
6314     "wume" => array(
6315     "icon" => "robot",
6316     "title" => "WUME Lab's",
6317     "rule" => array(
6318     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6319     ),
6320     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6321     ),
6322     "wusage" => array(
6323     "icon" => "wusage",
6324     "title" => "Wusage",
6325     "rule" => array(
6326     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6327     ),
6328     "uri" => "http://www.boutell.com/wusage/"
6329     ),
6330     "wwgrapevine" => array(
6331     "icon" => "wwgrapevine",
6332     "title" => "WWgrapevine",
6333     "rule" => array(
6334     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6335     ),
6336     "uri" => ""
6337     ),
6338     "wws" => array(
6339     "icon" => "robot",
6340     "title" => "WWSBOT",
6341     "rule" => array(
6342     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6343     ),
6344     "uri" => "http://www.analyzer.nu"
6345     ),
6346     "www4mail" => array(
6347     "icon" => "robot",
6348 matthys 209 "title" => "WWW4mail",
6349 joku 63 "rule" => array(
6350     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6351     ),
6352     "uri" => "http://www.www4mail.org/"
6353     ),
6354     "wwwc" => array(
6355     "icon" => "wwwc",
6356     "title" => "WWWC",
6357     "rule" => array(
6358     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6359     ),
6360     "uri" => ""
6361     ),
6362     "wwwd" => array(
6363     "icon" => "robot",
6364     "title" => "WWWD",
6365     "rule" => array(
6366     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6367     ),
6368     "uri" => ""
6369     ),
6370     "wwweasel" => array(
6371     "icon" => "wwweasel",
6372     "title" => "WWWeasel",
6373     "rule" => array(
6374     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6375     ),
6376     "uri" => ""
6377     ),
6378     "wwwfi" => array(
6379     "icon" => "wwwfi",
6380     "title" => "www.fi",
6381     "rule" => array(
6382     "www\.fi crawler" => ""
6383     ),
6384     "uri" => "http://www.fi/"
6385     ),
6386     "wwwmechanize" => array(
6387     "icon" => "robot",
6388     "title" => "WWW-Mechanize",
6389     "rule" => array(
6390     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6391     ),
6392     "uri" => ""
6393     ),
6394     "wwwoffle" => array(
6395     "icon" => "robot",
6396     "title" => "WWWoffle",
6397     "rule" => array(
6398     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6399     ),
6400     "uri" => ""
6401     ),
6402     "wwwster" => array(
6403     "icon" => "robot",
6404     "title" => "WWWster",
6405     "rule" => array(
6406     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6407     ),
6408     "uri" => ""
6409     ),
6410     "wysigot" => array(
6411     "icon" => "wysigot",
6412     "title" => "Wysigot",
6413     "rule" => array(
6414     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6415     ),
6416     "uri" => ""
6417     ),
6418     "xaldon" => array(
6419     "icon" => "xaldon",
6420     "title" => "Xaldon",
6421     "rule" => array(
6422     "Xaldon WebSpider" => ""
6423     ),
6424     "uri" => "http://www.xaldon.de/"
6425     ),
6426     "xenu" => array( // Detection entry for Xenu Link Sleuth
6427     "icon" => "xenu",
6428     "title" => "Xenu Link Sleuth",
6429     "rule" => array( // pattern => version reference (backreference into the pattern's capture groups)
6430     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6431     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional "&#039;s"; the version is group 2 (was \1)
6432     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6433     ),
6434     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6435     ),
6436     "xerka" => array(
6437     "icon" => "xerka",
6438     "title" => "Xerka",
6439     "rule" => array(
6440     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6441     ),
6442     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6443     ),
6444     "xirq" => array(
6445     "icon" => "robot",
6446     "title" => "XIRQ",
6447     "rule" => array(
6448     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6449     ),
6450     "uri" => "http://www.xirq.com"
6451     ),
6452     "xmlslurp" => array(
6453     "icon" => "robot",
6454     "title" => "XMLSlurp",
6455     "rule" => array(
6456     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6457     ),
6458     "uri" => ""
6459     ),
6460     "xml-sitemaps" => array(
6461     "icon" => "xml-sitemaps",
6462     "title" => "XML-Sitemaps",
6463     "rule" => array(
6464     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6465     ),
6466     "uri" => ""
6467     ),
6468     "xmlrpc" => array(
6469     "icon" => "robot",
6470     "title" => "Trackback",
6471     "rule" => array(
6472     "XMLRPC" => ""
6473     ),
6474     "uri" => ""
6475     ),
6476 matthys 294 "xovi" => array(
6477     "icon" => "xovi",
6478     "title" => "Xovi",
6479     "rule" => array(
6480     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6481     ),
6482     "uri" => "http://www.xovibot.net"
6483     ),
6484 joku 63 "yacy" => array(
6485     "icon" => "yacy",
6486     "title" => "Yacy",
6487     "rule" => array(
6488     "yacy\.net" => ""
6489     ),
6490     "uri" => ""
6491     ),
6492     "yahoo" => array(
6493     "icon" => "yahoo",
6494     "title" => "Yahoo",
6495     "rule" => array(
6496     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6497     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6498     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6499     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6500     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6501     "Y!OASIS/TEST" => "",
6502     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6503     "Y!J; for robot study" => "",
6504     "Yahoo Japan; for robot study" => ""
6505     ),
6506     "uri" => "http://www.yahoo.com"
6507     ),
6508     "yahoo-feed" => array(
6509     "icon" => "yahoo",
6510     "title" => "Yahoo Feedseeker",
6511     "rule" => array(
6512     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6513     ),
6514     "uri" => "http://www.yahoo.com"
6515     ),
6516     "yandex" => array(
6517     "icon" => "yandex",
6518     "title" => "Yandex",
6519     "rule" => array(
6520     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6521     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6522     ),
6523     "uri" => "http://yandex.com/bots"
6524     ),
6525     "yanga" => array(
6526     "icon" => "yanga",
6527     "title" => "Yanga",
6528     "rule" => array (
6529     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6530     ),
6531     "uri" => "http://www.yanga.co.uk/"
6532     ),
6533     "yap" => array(
6534     "icon" => "yap",
6535     "title" => "Yap",
6536     "rule" => array(
6537     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6538     ),
6539     "uri" => "http://www.yapinc.com/"
6540     ),
6541     "yarienavoir" => array(
6542     "icon" => "robot",
6543     "title" => "Yarienavoir",
6544     "rule" => array(
6545     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6546     ),
6547     "uri" => "http://www.yarienavoir.net/"
6548     ),
6549     "yell" => array(
6550     "icon" => "yell",
6551     "title" => "Yell",
6552     "rule" => array(
6553     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6554     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6555     ),
6556     "uri" => ""
6557     ),
6558     "youdao" => array(
6559     "icon" => "youdao",
6560     "title" => "Youdao",
6561     "rule" => array(
6562     "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6563     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6564     ),
6565     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6566     ),
6567     "yoogli" => array(
6568     "icon" => "yoogli",
6569     "title" => "Yoogli",
6570     "rule" => array(
6571     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6572     ),
6573     "uri" => "http://www.yoogli.com"
6574     ),
6575     "yotta" => array(
6576     "icon" => "robot",
6577     "title" => "Yotta",
6578     "rule" => array(
6579     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6580     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6581     ),
6582     "uri" => "http://www.yottacars.com"
6583     ),
6584     "yoono" => array(
6585     "icon" => "yoono",
6586     "title" => "Yoono",
6587     "rule" => array(
6588     "Yoono" => ""
6589     ),
6590     "uri" => "http://www.yoono.com/"
6591     ),
6592     "yowedo" => array(
6593     "icon" => "robot",
6594     "title" => "Yowedo",
6595     "rule" => array(
6596     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6597     ),
6598     "uri" => "http://yowedo.com/en/partners.html"
6599     ),
6600     "yuntis" => array(
6601     "icon" => "robot",
6602 matthys 209 "title" => "Yuntis",
6603 joku 63 "rule" => array(
6604     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6605     ),
6606     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6607     ),
6608     "zao" => array(
6609     "icon" => "robot",
6610     "title" => "Zao",
6611     "rule" => array(
6612     "Zao[ /]([0-9.]{1,10})" => "\\1",
6613     "Zao-crawler" => ""
6614     ),
6615     "uri" => ""
6616     ),
6617     "zealbot" => array(
6618     "icon" => "zeal",
6619     "title" => "ZealBot",
6620     "rule" => array(
6621     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6622     ),
6623     "uri" => ""
6624     ),
6625     "zearchit" => array(
6626     "icon" => "zearchit",
6627     "title" => "Zearchit",
6628     "rule" => array(
6629     "Zearchit" => ""
6630     ),
6631     "uri" => "http://www.zearchit.de/"
6632     ),
6633     "zebz" => array(
6634     "icon" => "robot",
6635     "title" => "ze.bz",
6636     "rule" => array(
6637     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6638     ),
6639     "uri" => "http://www.ze.bz/"
6640     ),
6641     "zedzo" => array(
6642     "icon" => "robot",
6643     "title" => "Zedzo",
6644     "rule" => array(
6645     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6646     ),
6647     "uri" => "http://www.zedzo.com/"
6648     ),
6649     "zerx" => array(
6650     "icon" => "zerx",
6651     "title" => "Zerx",
6652     "rule" => array(
6653     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6654     ),
6655     "uri" => "http://www.zerx.com/"
6656     ),
6657     "zeus" => array(
6658     "icon" => "zeus",
6659     "title" => "Zeus",
6660     "rule" => array(
6661     "Zeus" => ""
6662     ),
6663     "uri" => "http://www.zeus.com"
6664     ),
6665     "zippp" => array(
6666     "icon" => "robot",
6667     "title" => "Zippp",
6668     "rule" => array(
6669     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6670     ),
6671     "uri" => ""
6672     ),
6673     "zippy" => array(
6674     "icon" => "robot",
6675     "title" => "Zippy",
6676     "rule" => array(
6677     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6678     ),
6679     "uri" => "http://www.zippyfinder.com"
6680     ),
6681     "zoeky" => array(
6682     "icon" => "robot",
6683     "title" => "Zoeky",
6684     "rule" => array(
6685     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6686     ),
6687     "uri" => ""
6688     ),
6689     "zoom" => array(
6690     "icon" => "zoom",
6691 matthys 209 "title" => "ZoomSpider",
6692 joku 63 "rule" => array(
6693     "^ZoomSpider" => ""
6694     ),
6695     "uri" => "http://www.wrensoft.com/"
6696     ),
6697     "zspider" => array(
6698     "icon" => "robot",
6699 matthys 209 "title" => "Zspider",
6700 joku 63 "rule" => array(
6701     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6702     ),
6703     "uri" => "http://feedback.redkolibri.com/"
6704     ),
6705 matthys 281 "zumbot" => array(
6706     "icon" => "robot",
6707     "title" => "ZUM Search",
6708     "rule" => array(
6709     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6710     ),
6711     "uri" => "http://help.zum.com/inquiry"
6712     ),
6713 joku 63 "zyborg" => array(
6714     "icon" => "zyborg",
6715     "title" => "WiseNutBot",
6716     "rule" => array(
6717     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6718     ),
6719     "uri" => ""
6720     ),
6721     // Catch-all rules for the originals; they have to stay in this order.
6722     "blogbot" => array(
6723     "icon" => "blogbot",
6724     "title" => "BlogBot",
6725     "rule" => array(
6726     "Blog[ \-]?Bot" => ""
6727     ),
6728     "uri" => "http://www.blogbot.com/"
6729     ),
6730     "centrum" => array(
6731     "icon" => "centrum",
6732     "title" => "Centrum",
6733     "rule" => array(
6734     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6735     "^Centrum-checker" => ""
6736     ),
6737     "uri" => ""
6738     ),
6739     "httpclient" => array(
6740     "icon" => "robot",
6741     "title" => "HTTPClient",
6742     "rule" => array(
6743     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6744     "HTTP[ \-]?Client" => ""
6745     ),
6746     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6747     ),
6748     "incywincy" => array(
6749     "icon" => "robot",
6750     "title" => "IncyWincy",
6751     "rule" => array(
6752     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6753     "^IncyWincy" => ""
6754     ),
6755     "uri" => ""
6756     ),
6757     "java" => array(
6758     "icon" => "java",
6759     "title" => "Java",
6760     "rule" => array(
6761     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6762     ),
6763     "uri" => ""
6764     ),
6765     "libfetch" => array(
6766     "icon" => "robot",
6767     "title" => "Libfetch",
6768     "rule" => array(
6769     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6770     ),
6771     "uri" => "http://www.freebsd.org/"
6772     ),
6773     "libwww" => array(
6774     "icon" => "libwww",
6775 matthys 209 "title" => "LibWWW",
6776 joku 63 "rule" => array(
6777     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6778     "^libww(w|w-perl|w-FM)" => "",
6779     "MyApp.*libww(w|w-perl|w-FM)" => ""
6780     ),
6781     "uri" => ""
6782     ),
6783     "litefinder" => array(
6784     "icon" => "litefinder",
6785     "title" => "LiteFinder",
6786     "rule" => array(
6787     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6788     ),
6789     "uri" => "http://www.litefinder.net/about.html"
6790     ),
6791     "nutchorg" => array(
6792     "icon" => "nutchorg",
6793     "title" => "Nutch",
6794     "rule" => array(
6795     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6796     "Nutch" => ""
6797     ),
6798     "uri" => "http://lucene.apache.org/nutch/"
6799     ),
6800     "pythonurl" => array(
6801     "icon" => "pythonurl",
6802     "title" => "Python-url",
6803     "rule" => array(
6804     "Python[ \-]?urllib" => ""
6805     ),
6806     "uri" => ""
6807     ),
6808     // Robots known to be SPAM BOTS
6809     "SPAM" => array(
6810     "icon" => "robot",
6811     "title" => "SPAM",
6812     "rule" => array(
6813     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
6814     "^PHOTO CHECK" => "",
6815     "^FOTOCHECKER" => "",
6816     "^IPTC CHECK" => "",
6817     "^DataCha0s" => "",
6818     "^Mac Finder" => "",
6819     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
6820     "^Missouri College Browse" => "",
6821     "Email[ \-]?Siphon" => "",
6822     "atSpider" => "",
6823     "autoemailspider" => "",
6824     "^Demo Bot" => "",
6825     "^Program Shareware" => "",
6826     "^Snapbot" => "",
6827     "^snap.com" => "",
6828     "^Guestbook Auto Submitter" => "",
6829     "panscient.com" => "",
6830     ),
6831     "uri" => ""
6832     ),
6833     // Things we don't know yet
6834     "robot" => array(
6835     "icon" => "robot",
6836     "title" => "Robot",
6837     "rule" => array(
6838     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
6839     )
6840     )
6841     );
6842 joku 261 ?>

Properties

Name Value
svn:keywords Id