ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 397
Committed: Thu Oct 28 09:02:36 2021 UTC (3 years, 1 month ago) by matthys
File size: 159469 byte(s)
Log Message:
Updated DuckDuckGo Bot

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 joku 394 * Copyright (C) 2001-2021, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192.comAgent" => ""
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array(
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www.ackerm.com" => ""
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293     "^NutchEC2Test" => ""
294     ),
295     "uri" => "http://www.amazon.com/"
296     ),
297     "amidalla" => array(
298     "icon" => "amidalla",
299     "title" => "Amidalla",
300     "rule" => array(
301     "^amibot" => ""
302     ),
303     "uri" => ""
304     ),
305     "amfibi" => array(
306     "icon" => "amfibi",
307     "title" => "Amfibi",
308     "rule" => array(
309     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
310     "Amfibibot" => ""
311     ),
312     "uri" => ""
313     ),
314     "amphetadesk" => array(
315     "icon" => "robot",
316     "title" => "AmphetaDesk",
317     "rule" => array(
318     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
319     ),
320     "uri" => ""
321     ),
322     "amphetameme" => array(
323     "icon" => "robot",
324     "title" => "Amphetameme",
325     "rule" => array(
326     "amphetameme[ \-]?crawler" => ""
327     ),
328     "uri" => ""
329     ),
330     "annomille" => array(
331     "icon" => "robot",
332     "title" => "AnnoMille",
333     "rule" => array(
334     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
335     ),
336     "uri" => "http://www.annomille.it"
337     ),
338     "anonymouse" => array(
339     "icon" => "anonymouse",
340     "title" => "Anonymouse.org",
341     "rule" => array(
342     "http://Anonymouse.org" => ""
343     ),
344     "uri" => "http://anonymouse.org"
345     ),
346     "ansearch" => array(
347     "icon" => "robot",
348     "title" => "Ansearch",
349     "rule" => array(
350     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
351     ),
352     "uri" => ""
353     ),
354     "answerchase" => array(
355     "icon" => "answerchase",
356     "title" => "AnswerChase",
357     "rule" => array(
358     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
359     ),
360     "uri" => "http://www.answerchase.com/"
361     ),
362     "antibot" => array(
363     "icon" => "robot",
364 matthys 205 "title" => "Antibot",
365 joku 63 "rule" => array(
366     "antibot-V([0-9.]{1,10})" => "\\1"
367     ),
368     "uri" => ""
369     ),
370     "aonde" => array(
371     "icon" => "aonde",
372     "title" => "Aonde",
373     "rule" => array(
374     "^AONDE-Spider" => ""
375     ),
376     "uri" => ""
377     ),
378     "aonline" => array(
379     "icon" => "robot",
380     "title" => "A-Online.at",
381     "rule" => array(
382     "^A-Online Search" => ""
383     ),
384     "uri" => "http://www.a-online.at/"
385     ),
386     "aol" => array(
387     "icon" => "aol",
388     "title" => "AOLserver",
389     "rule" => array(
390     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
391     "^AOLserver" => ""
392     ),
393     "uri" => ""
394     ),
395     "apachebench" => array(
396     "icon" => "robot",
397     "title" => "ApacheBench",
398     "rule" => array(
399     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
400     ),
401     "uri" => ""
402     ),
403     "apassion4jazz" => array(
404     "icon" => "robot",
405     "title" => "Passion 4 Jazz",
406     "rule" => array(
407     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
408     ),
409     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
410     ),
411     "apexoo" => array(
412     "icon" => "robot",
413     "title" => "Apexoo",
414     "rule" => array(
415     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
416     ),
417     "uri" => "http://www.apexoo.com/"
418     ),
419     "apnoti" => array(
420     "icon" => "apnoti",
421 matthys 205 "title" => "Apnoti",
422 joku 63 "rule" => array(
423     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
424     ),
425     "uri" => "http://www.apnoti.com/"
426     ),
427     "aport" => array(
428     "icon" => "aport",
429     "title" => "Aport",
430     "rule" => array(
431     "^Aport" => ""
432     ),
433     "uri" => ""
434     ),
435     "appie" => array(
436     "icon" => "walhello",
437     "title" => "Walhello",
438     "rule" => array(
439     "appie[ /]([0-9.]{1,10})" => "\\1"
440     ),
441     "uri" => ""
442     ),
443 matthys 389 "apple" => array(
444     "icon" => "apple",
445     "title" => "Apple",
446     "rule" => array(
447     "Applebot[ /]([0-9.]{1,10})" => "\\1"
448     ),
449     "uri" => "http://www.apple.com/go/applebot"
450     ),
451    
452 joku 63 "arachmo" => array(
453     "icon" => "arachmo",
454     "title" => "Arachmo",
455     "rule" => array(
456     "compatible; Arachmo" => ""
457     ),
458     "uri" => ""
459     ),
460     "arexera" => array(
461     "icon" => "arexera",
462     "title" => "Arexera",
463     "rule" => array(
464     "^X-Crawler" => "",
465     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
466     ),
467     "uri" => "http://www.arexera.de/"
468     ),
469     "arianna" => array(
470     "icon" => "arianna",
471     "title" => "Arianna",
472     "rule" => array(
473     "^www.arianna.it" => ""
474     ),
475     "uri" => "http://www.arianna.it/"
476     ),
477     "artface" => array(
478     "icon" => "robot",
479     "title" => "Artface",
480     "rule" => array(
481     "^ArtfaceBot" => ""
482     ),
483     "uri" => ""
484     ),
485     "artviper" => array(
486     "icon" => "artviper",
487     "title" => "artViper",
488     "rule" => array(
489     "artViper" => ""
490     ),
491     "uri" => "http://www.artviper.net/"
492     ),
493     "asinfo" => array(
494     "icon" => "robot",
495     "title" => "Any Search Info",
496     "rule" => array(
497     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
498     ),
499     "uri" => "http://search-info.com/"
500     ),
501     "ask" => array(
502     "icon" => "askjeeves",
503     "title" => "Ask Jeeves",
504     "rule" => array(
505     "Ask[ \-]?Jeeves" => "",
506     "teomaagent" => ""
507     ),
508     "uri" => ""
509     ),
510     "askaboutoil" => array(
511     "icon" => "robot",
512     "title" => "AskAboutOil", // was "ASPseek", which belongs to the separate "aspseek" entry
513     "rule" => array(
514     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
515     ),
516     "uri" => "http://askaboutoil.com/"
517     ),
518     "asked" => array(
519     "icon" => "robot",
520 matthys 205 "title" => "AskEd!",
521 joku 63 "rule" => array(
522     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
523     ),
524     "uri" => "http://asked.jp"
525     ),
526     "aspseek" => array(
527     "icon" => "robot",
528     "title" => "ASPseek",
529     "rule" => array(
530     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
531     ),
532     "uri" => ""
533     ),
534     "atlocal" => array(
535     "icon" => "robot",
536     "title" => "At Local",
537     "rule" => array(
538     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
539     ),
540     "uri" => "http://www.atlocal.com/"
541     ),
542     "atomz" => array(
543     "icon" => "atomz",
544     "title" => "Atomz",
545     "rule" => array(
546     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
547     ),
548     "uri" => ""
549     ),
550 matthys 345 "avira" => array(
551     "icon" => "avira",
552     "title" => "Avira SafeSearch",
553     "rule" => array(
554     "^SafeSearch microdata crawler" => ""
555     ),
556     "uri" => "https://safesearch.avira.com"
557     ),
558 joku 63 "axel" => array(
559     "icon" => "robot",
560     "title" => "Axel",
561     "rule" => array(
562     "^axel" => ""
563     ),
564     "uri" => ""
565     ),
566     "axmo" => array(
567     "icon" => "axmo",
568     "title" => "Axmo",
569     "rule" => array(
570     "AxmoRobot" => ""
571     ),
572     "uri" => ""
573     ),
574     "answerbus" => array(
575     "icon" => "answerbus",
576     "title" => "AnswerBus",
577     "rule" => array(
578     "answerbus" => ""
579     ),
580     "uri" => ""
581     ),
582     "automapit" => array(
583     "icon" => "robot",
584     "title" => "AutoMapIt",
585     "rule" => array(
586     "AutoMapIt[ /](Bot)?" => ""
587     ),
588     "uri" => "http://www.automapit.com/bot.html"
589     ),
590     "augurnfind" => array(
591     "icon" => "robot",
592     "title" => "Augurnfind",
593     "rule" => array(
594     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
595     ),
596     "uri" => ""
597     ),
598     "awasu" => array(
599     "icon" => "awasu",
600     "title" => "Awasu",
601     "rule" => array(
602     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
603     ),
604     "uri" => ""
605     ),
606     "axxus" => array(
607     "icon" => "axxus",
608     "title" => "axxus.de",
609     "rule" => array(
610     "whoiam" => ""
611     ),
612     "uri" => "http://www.axxus.de/"
613     ),
614     "ayell" => array(
615     "icon" => "ayell",
616     "title" => "Ayell",
617     "rule" => array(
618     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
619     ),
620     "uri" => "http://eurobot.ayell.eu"
621     ),
622     "babaloo" => array(
623     "icon" => "babaloo",
624     "title" => "Babaloo",
625     "rule" => array(
626     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
627     ),
628     "uri" => "http://www.babaloo.si"
629     ),
630     "babe" => array(
631     "icon" => "robot",
632     "title" => "ba.be",
633     "rule" => array(
634     "BACS http://www.ba.be" => ""
635     ),
636     "uri" => "http://www.ba.be/"
637     ),
638     "baidu" => array(
639     "icon" => "baidu",
640     "title" => "Baidu",
641     "rule" => array(
642     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
643     "Baiduspider" => ""
644     ),
645     "uri" => "http://www.baidu.com/search/spider.html"
646     ),
647     "bananatree" => array(
648     "icon" => "robot",
649     "title" => "BananaTree",
650     "rule" => array(
651     "www\.thebananatree\.org" => ""
652     ),
653     "uri" => "http://www.thebananatree.org/"
654     ),
655     "bdcindexer" => array(
656     "icon" => "robot",
657     "title" => "bdcindexer",
658     "rule" => array(
659     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
660     ),
661     "uri" => "http://www.business.com/"
662     ),
663     "bdfetch" => array(
664     "icon" => "robot",
665     "title" => "BDFetch",
666     "rule" => array(
667     "^BDFetch" => ""
668     ),
669     "uri" => ""
670     ),
671     "bdncentral" => array(
672     "icon" => "robot",
673     "title" => "Bdncentral",
674     "rule" => array(
675     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
676     ),
677     "uri" => "http://www.bdncentral.com/robot.html"
678     ),
679     "beammachine" => array(
680     "icon" => "robot",
681     "title" => "BeamMachine",
682     "rule" => array(
683     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
684     ),
685     "uri" => "http://www.beammachine.net/"
686     ),
687     "become" => array(
688     "icon" => "become",
689     "title" => "Become",
690     "rule" => array(
691     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
692     "(BecomeBot|Exabot)@exava\.com\)$" => ""
693     ),
694     "uri" => "http://www.become.com/"
695     ),
696     "beebware" => array(
697     "icon" => "robot",
698     "title" => "Beebware",
699     "rule" => array(
700     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the version digits are the only capture group; "\\2" referenced a group that does not exist
701     ),
702     "uri" => ""
703     ),
704     "bigbrother" => array(
705     "icon" => "robot",
706     "title" => "Big Brother",
707     "rule" => array(
708     "^Big Brother" => ""
709     ),
710     "uri" => "http://pauillac.inria.fr/~fpottier/"
711     ),
712     "bigclique" => array(
713     "icon" => "robot",
714     "title" => "BigClique",
715     "rule" => array(
716     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
717     ),
718     "uri" => "http://www.bigclique.com"
719     ),
720     "biglotron" => array(
721     "icon" => "robot",
722     "title" => "Biglotron",
723     "rule" => array(
724     "^BIGLOTRON" => ""
725     ),
726     "uri" => "http://www.bigclique.com"
727     ),
728     "bigsearch" => array(
729     "icon" => "bigsearch",
730     "title" => "Bigsearch",
731     "rule" => array(
732     "Bigsearch.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1"
733     ),
734     "uri" => ""
735     ),
736     "bilbo" => array(
737     "icon" => "robot",
738     "title" => "Bilbo",
739     "rule" => array(
740     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
741     ),
742     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
743     ),
744     "bilgi" => array(
745     "icon" => "bilgi",
746     "title" => "Bilgi",
747     "rule" => array(
748     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version digits are group 2
749     ),
750     "uri" => "http://www.bilgi.com/"
751     ),
752     "bitacle" => array(
753     "icon" => "bitacle",
754     "title" => "Bitacle",
755     "rule" => array(
756     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
757     ),
758     "uri" => "http://bitacle.org/"
759     ),
760     "bitbeamer" => array(
761     "icon" => "bitbeamer",
762     "title" => "BitBeamer",
763     "rule" => array(
764     "BitBeamer/([0-9.]{1,10})" => "\\1"
765     ),
766     "uri" => ""
767     ),
768     "biz360" => array(
769     "icon" => "biz360",
770     "title" => "Biz360",
771     "rule" => array(
772     "^Biz360 spider" => ""
773     ),
774     "uri" => ""
775     ),
776     "backlinktest" => array(
777     "icon" => "backlinktest",
778     "title" => "BacklinkCrawler",
779     "rule" => array(
780     "BacklinkCrawler" => ""
781     ),
782     "uri" => "http://www.backlinktest.com/crawler.html"
783     ),
784     "blaizbee" => array(
785     "icon" => "blaiz-bee",
786     "title" => "Blaiz-Bee",
787     "rule" => array(
788     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // the pattern captures the version, so reference it instead of discarding it with ""
789     ),
790     "uri" => ""
791     ),
792     "blogbeat" => array(
793     "icon" => "robot",
794     "title" => "BlogBeat",
795     "rule" => array(
796     "BlogBeat/?([0-9.]{1,10})" => "\\1",
797     ),
798     "uri" => "http://www.blogbeat.nl"
799     ),
800     "blogbotde" => array(
801     "icon" => "robot",
802     "title" => "blogbot.de",
803     "rule" => array(
804     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
805     ),
806     "uri" => "http://blogbot.de/"
807     ),
808     "blogcensus" => array(
809     "icon" => "blogcensus",
810     "title" => "Blogcensus",
811     "rule" => array(
812     "^Blogcensus" => "",
813     ),
814     "uri" => "http://blogcensus.de/bot/"
815     ),
816     "blogdex" => array(
817     "icon" => "robot",
818     "title" => "Blogdex",
819     "rule" => array(
820     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
821     ),
822     "uri" => ""
823     ),
824     "blogg" => array(
825     "icon" => "blogg",
826     "title" => "Blogg",
827     "rule" => array(
828     "^blogg\.de" => ""
829     ),
830     "uri" => ""
831     ),
832     "blogland" => array(
833     "icon" => "robot",
834     "title" => "BlogLand",
835     "rule" => array(
836     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
837     ),
838     "uri" => ""
839     ),
840     "bloglines" => array(
841     "icon" => "bloglines",
842     "title" => "Bloglines",
843     "rule" => array(
844     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
845     "Bloglines" => ""
846     ),
847     "uri" => ""
848     ),
849     "blogmap" => array(
850     "icon" => "robot",
851     "title" => "Blogmap",
852     "rule" => array(
853     "blogmap" => ""
854     ),
855     "uri" => ""
856     ),
857     "blogosphere" => array(
858     "icon" => "robot",
859     "title" => "Blogosphere",
860     "rule" => array(
861     "Blogosphere" => ""
862     ),
863     "uri" => ""
864     ),
865     "blogpeople" => array(
866     "icon" => "robot",
867     "title" => "BlogPeople",
868     "rule" => array(
869     "BlogPeople" => ""
870     ),
871     "uri" => ""
872     ),
873     "blogpulse" => array(
874     "icon" => "blogpulse",
875     "title" => "Blogpulse",
876     "rule" => array(
877     "Blogpulse" => ""
878     ),
879     "uri" => ""
880     ),
881     "blogranking" => array(
882     "icon" => "blogranking",
883     "title" => "BlogRanking",
884     "rule" => array(
885     "^BlogRanking(/RSS checker)?" => ""
886     ),
887     "uri" => ""
888     ),
889     "blogs" => array(
890     "icon" => "blogs",
891     "title" => "Blo.gs",
892     "rule" => array(
893     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
894     "blo\.gs" => ""
895     ),
896     "uri" => ""
897     ),
898     "blogshares" => array(
899     "icon" => "blogshares",
900     "title" => "BlogShares",
901     "rule" => array(
902     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
903     "(^| |\()Blogshares(\.com| |\))" => ""
904     ),
905     "uri" => ""
906     ),
907     "blogslife" => array(
908     "icon" => "robot",
909     "title" => "BlogsLife",
910     "rule" => array(
911     "Blogslive" => ""
912     ),
913     "uri" => ""
914     ),
915     "blogsnow" => array(
916     "icon" => "blogsnow",
917     "title" => "BlogsNow",
918     "rule" => array(
919     "blogsnowbot" => "",
920     "BlogsNow" => ""
921     ),
922     "uri" => ""
923     ),
924     "blogstreet" => array(
925     "icon" => "blogstreet",
926     "title" => "BlogStreet",
927     "rule" => array(
928     "^BlogStreetBot" => ""
929     ),
930     "uri" => ""
931     ),
932     "blogsurf" => array(
933     "icon" => "robot",
934     "title" => "BlogSurf",
935     "rule" => array(
936     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
937     ),
938     "uri" => ""
939     ),
940     "blogtick" => array(
941     "icon" => "robot",
942     "title" => "BlogTick",
943     "rule" => array(
944     "BlogTickServer" => ""
945     ),
946     "uri" => ""
947     ),
948     "blogwatcher" => array(
949     "icon" => "blogwatcher",
950     "title" => "Blogwatcher",
951     "rule" => array(
952     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
953     ),
954     "uri" => ""
955     ),
956     "blogwise" => array(
957     "icon" => "blogwise",
958     "title" => "Blogwise",
959     "rule" => array(
960     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
961     ),
962     "uri" => ""
963     ),
964     "boardreader" => array(
965     "icon" => "boardreader",
966     "title" => "BoardReader",
967     "rule" => array(
968     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
969     ),
970     "uri" => "http://www.boardreader.com"
971     ),
972     "bobby" => array(
973     "icon" => "bobby",
974     "title" => "Bobby",
975     "rule" => array(
976     "bobby[ /]([0-9.]{1,10})" => "\\1"
977     ),
978     "uri" => ""
979     ),
980     "boitho" => array(
981     "icon" => "robot",
982     "title" => "Boitho",
983     "rule" => array(
984     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
985     ),
986     "uri" => ""
987     ),
988     "booch" => array(
989     "icon" => "robot",
990     "title" => "Booch",
991     "rule" => array(
992     "^booch[_ /]([0-9.]{1,10})" => "\\1"
993     ),
994     "uri" => ""
995     ),
996     "book" => array(
997     "icon" => "book",
998     "title" => "Bookmark",
999     "rule" => array(
1000     "http://www\.bookmark\.ne\.jp" => ""
1001     ),
1002     "uri" => ""
1003     ),
1004     "bookdog" => array(
1005     "icon" => "bookdog",
1006     "title" => "Bookdog",
1007     "rule" => array(
1008     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1009     ),
1010     "uri" => ""
1011     ),
1012     "bordermanager" => array(
1013     "icon" => "bordermanager",
1014     "title" => "Border Manager",
1015     "rule" => array(
1016     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1017     ),
1018     "uri" => ""
1019     ),
1020     "botonparade" => array(
1021     "icon" => "botonparade",
1022     "title" => "Bot on Parade",
1023     "rule" => array(
1024     "BotOnParade" => ""
1025     ),
1026     "uri" => "http://www.bots-on-para.de/bot.html"
1027     ),
1028     "botje" => array(
1029     "icon" => "botje",
1030     "title" => "Botje",
1031     "rule" => array(
1032     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1033     ),
1034     "uri" => "http://www.botje.com/"
1035     ),
1036     "bottomfeeder" => array(
1037     "icon" => "bottomfeeder",
1038     "title" => "BottomFeeder",
1039     "rule" => array(
1040     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1041     ),
1042     "uri" => ""
1043     ),
1044     "browseremulator" => array(
1045     "icon" => "browseremulator",
1046     "title" => "BrowserEmulator",
1047     "rule" => array(
1048     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1049     ),
1050     "uri" => "http://www.dejavu.org/emulator.htm"
1051     ),
1052     "browsershots" => array(
1053     "icon" => "browsershots",
1054     "title" => "Browsershots",
1055     "rule" => array(
1056     "Browsershots URL Check" => ""
1057     ),
1058     "uri" => "http://browsershots.org"
1059     ),
1060     "browserspy" => array(
1061     "icon" => "robot",
1062     "title" => "BrowserSpy",
1063     "rule" => array(
1064     "BrowserSpy" => ""
1065     ),
1066     "uri" => ""
1067     ),
1068     "bruinbot" => array(
1069     "icon" => "robot",
1070     "title" => "BruinBot",
1071     "rule" => array(
1072     "BruinBot" => ""
1073     ),
1074     "uri" => ""
1075     ),
1076     "bruno" => array(
1077     "icon" => "robot",
1078     "title" => "Bruno",
1079     "rule" => array(
1080     "^Bruno" => ""
1081     ),
1082     "uri" => ""
1083     ),
1084     "btbot" => array(
1085     "icon" => "btbot",
1086     "title" => "BitTorrent",
1087     "rule" => array(
1088     "BTbot/([0-9.]{1,10})" => "\\1"
1089     ),
1090     "uri" => ""
1091     ),
1092 joku 380 "bubing" => array(
1093     "icon" => "robot",
1094     "title" => "BUbiNG",
1095     "rule" => array(
1096     "BUbiNG" => ""
1097     ),
1098     "uri" => "http://law.di.unimi.it/BUbiNG.html"
1099     ),
1100 joku 63 "builtwith" => array(
1101     "icon" => "builtwith",
1102     "title" => "BuiltWith",
1103     "rule" => array(
1104     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1105     ),
1106     "uri" => "http://builtwith.com/bot.html"
1107     ),
1108     "bulkfeeds" => array(
1109     "icon" => "robot",
1110     "title" => "Bulkfeeds",
1111     "rule" => array(
1112     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1113     ),
1114     "uri" => ""
1115     ),
1116     "burf" => array(
1117     "icon" => "burf",
1118     "title" => "Burf.com",
1119     "rule" => array(
1120     "^Norbert the Spider" => ""
1121     ),
1122     "uri" => "http://www.burf.com/"
1123     ),
1124     "butch" => array(
1125     "icon" => "robot",
1126     "title" => "Butch",
1127     "rule" => array(
1128     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1129     ),
1130     "uri" => ""
1131     ),
1132     "buzzlogic" => array(
1133     "icon" => "buzzlogic",
1134     "title" => "Buzzlogic",
1135     "rule" => array(
1136     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1137     ),
1138     "uri" => "http://www.buzzlogic.com"
1139     ),
1140     "catchbot" => array(
1141     "icon" => "catchbot",
1142     "title" => "CatchBot",
1143     "rule" => array(
1144     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1145     ),
1146     "uri" => "http://www.catchbot.com"
1147     ),
1148     "camdiscover" => array(
1149     "icon" => "robot",
1150     "title" => "Camdiscover",
1151     "rule" => array(
1152     "^Camcrawler" => ""
1153     ),
1154     "uri" => ""
1155     ),
1156     "cazoodle" => array(
1157     "icon" => "cazoodle",
1158     "title" => "Cazoodle",
1159     "rule" => array(
1160     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1161     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1162     ),
1163     "uri" => "http://www.cazoodle.com/cazoodlebot"
1164     ),
1165     "ccbot" => array(
1166     "icon" => "robot",
1167     "title" => "ccBot",
1168     "rule" => array(
1169     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1170     ),
1171     "uri" => "http://www.commoncrawl.org/bot.html"
1172     ),
1173     "ccgcrawl" => array(
1174     "icon" => "robot",
1175     "title" => "CCGCrawl",
1176     "rule" => array(
1177     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1178     ),
1179     "uri" => "http://www.myworkbase.com/bot.html"
1180     ),
1181     "cerberian" => array(
1182     "icon" => "robot",
1183     "title" => "Cerberian Drtrs",
1184     "rule" => array(
1185     "^Cerberian Drtrs" => ""
1186     ),
1187     "uri" => ""
1188     ),
1189     "cfnetwork" => array(
1190     "icon" => "robot",
1191     "title" => "CFNetwork", // display name for this entry's own agent
1192     "rule" => array(
1193     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1" // group 1 is the version number
1194     ),
1195     "uri" => "http://www.cfnetwork.be/"
1196     ),
1197     "charlotte" => array(
1198     "icon" => "charlotte",
1199     "title" => "Charlotte",
1200     "rule" => array(
1201     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1202     ),
1203     "uri" => ""
1204     ),
1205     "cirilizator" => array(
1206     "icon" => "cirilizator",
1207     "title" => "Cirilizator",
1208     "rule" => array(
1209     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1210     ),
1211     "uri" => ""
1212     ),
1213     "claria" => array(
1214     "icon" => "robot",
1215     "title" => "Claria",
1216     "rule" => array(
1217     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1218     "(Claria|Diamond)(Bot)" => ""
1219     ),
1220     "uri" => ""
1221     ),
1222     "claymont" => array(
1223     "icon" => "claymont",
1224     "title" => "Claymont",
1225     "rule" => array(
1226     "claymont\.com" => "",
1227     "OliverPerry" => ""
1228     ),
1229     "uri" => "http://www.claymont.com"
1230     ),
1231 joku 377 "clipinc" => array(
1232     "icon" => "clipinc",
1233     "title" => "ClipInc",
1234     "rule" => array(
1235     "ClipInc" => ""
1236     ),
1237     "uri" => "http://tobit.software"
1238     ),
1239 joku 63 "clush" => array(
1240     "icon" => "clush",
1241     "title" => "Clush",
1242     "rule" => array(
1243     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1244     ),
1245     "uri" => ""
1246     ),
1247     "cmsworldmap" => array(
1248     "icon" => "cmsworldmap",
1249     "title" => "CMS World Map",
1250     "rule" => array(
1251     "cmsworldmap" => ""
1252     ),
1253     "uri" => "http://www.cmsworldmap.com/"
1254     ),
1255     "cobion" => array(
1256     "icon" => "robot",
1257     "title" => "Cobion",
1258     "rule" => array(
1259     " (QXW03018|obot)\)" => ""
1260     ),
1261     "uri" => ""
1262     ),
1263     "coccoc" => array(
1264 matthys 287 "icon" => "coccoc",
1265 matthys 209 "title" => "Coccoc",
1266 joku 63 "rule" => array(
1267     "coccoc[ /]([0-9.]{1,10})" => "\\1"
1268     ),
1269 matthys 287 "uri" => "http://help.coccoc.com"
1270 joku 63 ),
1271     "coldfusion" => array(
1272     "icon" => "coldfusion",
1273     "title" => "ColdFusion",
1274     "rule" => array(
1275     "^coldfusion" => ""
1276     ),
1277     "uri" => ""
1278     ),
1279     "combine" => array(
1280     "icon" => "robot",
1281     "title" => "Combine",
1282     "rule" => array(
1283     "Combine[ /]([0-9.]{1,10})" => "\\1"
1284     ),
1285     "uri" => ""
1286     ),
1287     "combot" => array(
1288     "icon" => "robot",
1289     "title" => "comBot",
1290     "rule" => array(
1291     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1292     ),
1293     "uri" => ""
1294     ),
1295     "comet" => array(
1296     "icon" => "comet",
1297     "title" => "Comet",
1298     "rule" => array(
1299     "cometsearch@cometsystems" => ""
1300     ),
1301     "uri" => ""
1302     ),
1303     "commerobo" => array(
1304     "icon" => "robot",
1305     "title" => "Commerobo",
1306     "rule" => array(
1307     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1308     ),
1309     "uri" => ""
1310     ),
1311     "comrite" => array(
1312     "icon" => "robot",
1313     "title" => "ComRite",
1314     "rule" => array(
1315     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1316     ),
1317     "uri" => "http://www.comrite.com/"
1318     ),
1319     "convera" => array(
1320     "icon" => "convera",
1321     "title" => "Convera",
1322     "rule" => array(
1323     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1324     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1325     ),
1326     "uri" => ""
1327     ),
1328     "coolbot" => array(
1329     "icon" => "robot",
1330     "title" => "CoolBot",
1331     "rule" => array(
1332     "^CoolBot" => ""
1333     ),
1334     "uri" => ""
1335     ),
1336     "cosmix" => array(
1337     "icon" => "robot",
1338     "title" => "Cosmix",
1339     "rule" => array(
1340     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1341     ),
1342     "uri" => ""
1343     ),
1344     "cosmos" => array(
1345     "icon" => "robot",
1346     "title" => "Cosmos",
1347     "rule" => array(
1348     "^cosmos" => ""
1349     ),
1350     "uri" => ""
1351     ),
1352     "cosmoty" => array(
1353     "icon" => "robot",
1354     "title" => "Cosmoty",
1355     "rule" => array(
1356     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1357     ),
1358     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1359     ),
1360     "covario" => array(
1361     "icon" => "covario",
1362     "title" => "Covario",
1363     "rule" => array(
1364     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1365     ),
1366     "uri" => "http://www.covario.com/ids/"
1367     ),
1368     "creativecommons" => array(
1369     "icon" => "creativecommons",
1370     "title" => "Creative Commons",
1371     "rule" => array(
1372     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1373     ),
1374     "uri" => ""
1375     ),
1376     "cscrawler" => array(
1377     "icon" => "robot",
1378     "title" => "CsCrawler",
1379     "rule" => array(
1380     "CsCrawler" => ""
1381     ),
1382     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1383     ),
1384 joku 111 "jigsaw" => array(
1385     "icon" => "jigsaw",
1386     "title" => "Jigsaw",
1387     "rule" => array(
1388     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1389     ),
1390     "uri" => "http://jigsaw.w3.org/css-validator/"
1391     ),
1392 joku 63 "csscheck" => array(
1393     "icon" => "w3c",
1394     "title" => "W3C CSS Validator",
1395     "rule" => array(
1396     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1397     ),
1398     "uri" => "http://jigsaw.w3.org/css-validator/"
1399     ),
1400     "custo" => array(
1401     "icon" => "robot",
1402     "title" => "Custo",
1403     "rule" => array(
1404     "Custo[ /]([0-9.]{1,10})" => "\\1"
1405     ),
1406     "uri" => ""
1407     ),
1408     "cybernavi" => array(
1409     "icon" => "robot",
1410     "title" => "CyberNavi",
1411     "rule" => array(
1412     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1413     ),
1414     "uri" => ""
1415     ),
1416     "cyberpatrol" => array(
1417     "icon" => "cyberpatrol",
1418     "title" => "CyberPatrol",
1419     "rule" => array(
1420     "^CyberPatrol" => ""
1421     ),
1422     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1423     ),
1424     "cyberz" => array(
1425     "icon" => "cyberz",
1426     "title" => "Cyberz",
1427     "rule" => array(
1428     "Cyberz Communication Agent" => ""
1429     ),
1430     "uri" => ""
1431     ),
1432     "cydral" => array(
1433     "icon" => "robot",
1434     "title" => "Cydral",
1435     "rule" => array(
1436     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1437     ),
1438     "uri" => ""
1439     ),
1440     "cynthia" => array(
1441     "icon" => "cynthia",
1442     "title" => "Cynthia Says",
1443     "rule" => array(
1444     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1445     ),
1446     "uri" => ""
1447     ),
1448     "d4x" => array(
1449     "icon" => "d4x",
1450     "title" => "Downloader for X",
1451     "rule" => array(
1452     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1453     ),
1454     "uri" => ""
1455     ),
1456     "da" => array(
1457     "icon" => "da",
1458     "title" => "DA",
1459     "rule" => array(
1460     "^DA[ /]([0-9.]{1,10})" => "\\1"
1461     ),
1462     "uri" => ""
1463     ),
1464     "daum" => array(
1465     "icon" => "daum",
1466     "title" => "DAUM",
1467     "rule" => array(
1468     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1469 joku 379 "Daum[ /]([0-9.]{1,10})" => "\\1",
1470 joku 63 "DAUM Web Robot" => "",
1471 joku 339 "daum\.net" => "", // dot escaped so only the literal host name matches
1472 joku 63 "Daum Communications Corp" => "",
1473     "EDI[ /]([0-9.]{1,10})" => "\\1",
1474     "Edacious.*Intelligent Web Robot" => "",
1475     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1476     ),
1477     "uri" => "http://ws.daum.net/"
1478     ),
1479     "daypop" => array(
1480     "icon" => "robot",
1481     "title" => "Daypop",
1482     "rule" => array(
1483     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1484     ),
1485     "uri" => ""
1486     ),
1487     "delfi" => array(
1488     "icon" => "delfi",
1489     "title" => "Delfi",
1490     "rule" => array(
1491     "crawl at delfi dot lt" => ""
1492     ),
1493     "uri" => ""
1494     ),
1495     "depspid" => array(
1496     "icon" => "depspid",
1497     "title" => "DepSpid",
1498     "rule" => array(
1499     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1500     ),
1501     "uri" => ""
1502     ),
1503     "devonagent" => array(
1504     "icon" => "devonagent",
1505     "title" => "DEVONagent",
1506     "rule" => array(
1507     "DEVONtech" => ""
1508     ),
1509     "uri" => ""
1510     ),
1511     "diffbot" => array(
1512     "icon" => "diffbot",
1513     "title" => "Diffbot",
1514     "rule" => array(
1515     " Diffbot" => ""
1516     ),
1517     "uri" => "http://www.diffbot.com"
1518     ),
1519     "diribot" => array(
1520     "icon" => "diribot",
1521     "title" => "Diri",
1522     "rule" => array(
1523     "diribot" => ""
1524     ),
1525     "uri" => "http://www.diri.bg"
1526     ),
1527     "directhit" => array(
1528     "icon" => "robot",
1529     "title" => "Direct Hit",
1530     "rule" => array(
1531     "EZResult -- Internet Search Engine" => ""
1532     ),
1533     "uri" => "http://www.directhit.com"
1534     ),
1535     "disco" => array(
1536     "icon" => "disco",
1537 matthys 209 "title" => "Disco",
1538 joku 63 "rule" => array(
1539     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1540     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1541     "disco-crawl@discoveryengine\.com" => "" // dot escaped so it matches literally
1542     ),
1543     "uri" => "http://www.discoveryengine.com/"
1544     ),
1545     "discopump" => array(
1546     "icon" => "robot",
1547     "title" => "DISCo Pump",
1548     "rule" => array(
1549     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1550     ),
1551     "uri" => ""
1552     ),
1553     "dkimreputation" => array(
1554     "icon" => "dkimreputation",
1555     "title" => "DKIM Reputation",
1556     "rule" => array(
1557     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1558     ),
1559     "uri" => "http://www.dkim-reputation.org"
1560     ),
1561     "dnsdigger" => array(
1562     "icon" => "dnsdigger",
1563     "title" => "DNS-Digger",
1564     "rule" => array(
1565     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1566     ),
1567     "uri" => "http://www.dnsdigger.com"
1568     ),
1569     "dnsvalidation" => array(
1570     "icon" => "dnsvalidation",
1571     "title" => "DNS Validation",
1572     "rule" => array(
1573     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1574     ),
1575     "uri" => "http://www.dnsvalidation.com/"
1576     ),
1577     "doctorhtml" => array(
1578     "icon" => "robot",
1579     "title" => "DoctorHTML",
1580     "rule" => array(
1581     "Doctor[ \-]?HTML" => ""
1582     ),
1583     "uri" => ""
1584     ),
1585     "dolphin" => array(
1586     "icon" => "dolphin",
1587     "title" => "Dolphin",
1588     "rule" => array(
1589     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1590     ),
1591     "uri" => "http://telehouse.ru/crawler.html"
1592     ),
1593     "domaindatei" => array(
1594     "icon" => "robot",
1595     "title" => "Domaindatei",
1596     "rule" => array(
1597     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1598     ),
1599     "uri" => ""
1600     ),
1601     "dontbuylists" => array(
1602     "icon" => "dontbuylists",
1603     "title" => "Dontbuylists",
1604     "rule" => array(
1605     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1606     ),
1607     "uri" => "http://www.dontbuylists.com"
1608     ),
1609     "dotbot" => array(
1610     "icon" => "robot",
1611     "title" => "DotBot",
1612     "rule" => array(
1613     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1614     ),
1615     "uri" => "http://www.dotnetdotcom.org"
1616     ),
1617     "doweb" => array(
1618     "icon" => "doweb",
1619     "title" => "DoWeb",
1620     "rule" => array(
1621     "^www\.doweb\.co\.uk" => "" // dots escaped so only the literal host name matches
1622     ),
1623     "uri" => "http://www.doweb.co.uk/"
1624     ),
1625     "downforeveryoneorjustme" => array(
1626     "icon" => "downforeveryoneorjustme",
1627     "title" => "Down for everyone or just me",
1628     "rule" => array(
1629     "downforeveryoneorjustme" => ""
1630     ),
1631     "uri" => "http://www.downforeveryoneorjustme.com"
1632     ),
1633     "downloadninja" => array(
1634     "icon" => "robot",
1635     "title" => "Download Ninja",
1636     "rule" => array(
1637     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1638     ),
1639     "uri" => ""
1640     ),
1641     "drupal" => array(
1642     "icon" => "drupal",
1643     "title" => "Drupal",
1644     "rule" => array(
1645     "^Drupal" => ""
1646     ),
1647     "uri" => ""
1648     ),
1649     "dsns" => array(
1650     "icon" => "robot",
1651     "title" => "DSNS Scanner",
1652     "rule" => array(
1653     "^DSNS" => ""
1654     ),
1655     "uri" => ""
1656     ),
1657     "dtsagent" => array(
1658     "icon" => "robot",
1659     "title" => "DTS Agent",
1660     "rule" => array(
1661     "DTS Agent" => ""
1662     ),
1663     "uri" => ""
1664     ),
1665 matthys 342 "duckduckgo" => array(
1666     "icon" => "duckduckgo",
1667     "title" => "DuckDuckGo",
1668     "rule" => array(
1669 matthys 397 "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1",
1670     "DuckDuckBot(-Https)?[ /]([0-9.]{1,10})" => "\\2" // "-Https" optional so plain "DuckDuckBot/<version>" is detected too; group 2 is the version
1671 matthys 342 ),
1672     "uri" => "http://duckduckgo.com"
1673     ),
1674 joku 63 "earthcom" => array(
1675     "icon" => "earthcom",
1676     "title" => "Earthcom",
1677     "rule" => array(
1678     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1679     ),
1680     "uri" => ""
1681     ),
1682     "ebay" => array(
1683     "icon" => "ebay",
1684     "title" => "eBay",
1685     "rule" => array(
1686     "eBay Relevance Ad Crawler" => ""
1687     ),
1688     "uri" => ""
1689     ),
1690     "echo" => array(
1691     "icon" => "robot",
1692     "title" => "Echo.com",
1693     "rule" => array(
1694     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1695     ),
1696     "uri" => "http://www.echo.com/"
1697     ),
1698     "eert" => array(
1699     "icon" => "robot",
1700 matthys 209 "title" => "Eert",
1701 joku 63 "rule" => array(
1702     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1703     ),
1704     "uri" => "http://bot.eert.net"
1705     ),
1706     "eknip" => array(
1707     "icon" => "eknip",
1708     "title" => "E-Knip",
1709     "rule" => array(
1710     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1711     ),
1712     "uri" => ""
1713     ),
1714     "zoominfo" => array(
1715     "icon" => "zoominfo",
1716 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1717 joku 63 "rule" => array(
1718     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1719     ),
1720     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1721     ),
1722     "emeraldshield" => array(
1723     "icon" => "emeraldshield",
1724     "title" => "EmeraldShield",
1725     "rule" => array(
1726     "^EmeraldShield" => ""
1727     ),
1728     "uri" => ""
1729     ),
1730     "empas" => array(
1731     "icon" => "empas",
1732     "title" => "Empas",
1733     "rule" => array(
1734     "DigExt; empas\)$" => "",
1735     "^EMPAS[_\-]ROBOT" => ""
1736     ),
1737     "uri" => ""
1738     ),
1739     "entireweb" => array(
1740     "icon" => "entireweb",
1741     "title" => "Entireweb",
1742     "rule" => array(
1743     "Speedy[ ]?Spider" => ""
1744     ),
1745     "uri" => ""
1746     ),
1747     "envolk" => array(
1748     "icon" => "envolk",
1749     "title" => "Envolk",
1750     "rule" => array(
1751     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1752     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1753     ),
1754     "uri" => ""
1755     ),
1756     "esnet" => array(
1757     "icon" => "robot",
1758     "title" => "ES.NET",
1759     "rule" => array(
1760     "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped so it matches literally; group 1 is the version
1761     ),
1762     "uri" => ""
1763     ),
1764     "estyle" => array(
1765     "icon" => "estyle",
1766     "title" => "eStyle Search",
1767     "rule" => array(
1768     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1769     ),
1770     "uri" => ""
1771     ),
1772     "eurip" => array(
1773     "icon" => "robot",
1774     "title" => "Eurip",
1775     "rule" => array(
1776     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1777     ),
1778     "uri" => "http://www.eurip.com"
1779     ),
1780     "eurodirectory" => array(
1781     "icon" => "robot",
1782     "title" => "Euro Directory",
1783     "rule" => array(
1784     "www\.euro-directory\.com" => ""
1785     ),
1786     "uri" => "http://www.euro-directory.com/"
1787     ),
1788     "euroseek" => array(
1789     "icon" => "euroseek",
1790     "title" => "EuroSeek",
1791     "rule" => array(
1792     "Arachnoidea" => ""
1793     ),
1794     "uri" => ""
1795     ),
1796     "evaal" => array(
1797     "icon" => "evaal",
1798     "title" => "Evaal",
1799     "rule" => array(
1800     "^EvaalSE" => ""
1801     ),
1802     "uri" => "http://www.evaal.com/"
1803     ),
1804     "eventax" => array(
1805     "icon" => "eventax",
1806     "title" => "Eventax",
1807     "rule" => array(
1808     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1809     ),
1810     "uri" => "http://www.eventax.de/"
1811     ),
1812     "everbee" => array(
1813     "icon" => "everbee",
1814     "title" => "Everbee",
1815     "rule" => array(
1816     "EverbeeCrawler" => ""
1817     ),
1818     "uri" => ""
1819     ),
1820     "everest" => array(
1821     "icon" => "everest",
1822     "title" => "Everest",
1823     "rule" => array(
1824     "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // dot after "Inc" escaped so it matches literally
1825     ),
1826     "uri" => ""
1827     ),
1828     "exabot" => array(
1829     "icon" => "exabot",
1830     "title" => "ExaBot",
1831     "rule" => array(
1832     "^NG[ /]([0-9.]{1,10})" => "\\1",
1833     "Exabot/([0-9.]{1,10})" => "\\1",
1834     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1835     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1836     "ExaBot-Thumbnails" => ""
1837     ),
1838     "uri" => "http://www.exabot.com/go/robot"
1839     ),
1840     "exactseek" => array(
1841     "icon" => "exactseek",
1842     "title" => "ExactSeek",
1843     "rule" => array(
1844     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1845     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1846     ),
1847     "uri" => "http://www.exactseek.com/"
1848     ),
1849     "excite" => array(
1850     "icon" => "excite",
1851     "title" => "Excite",
1852     "rule" => array(
1853     "Architext[ \-]?Spider" => ""
1854     ),
1855     "uri" => ""
1856     ),
1857     "execrawl" => array(
1858     "icon" => "robot",
1859     "title" => "Execrawl",
1860     "rule" => array(
1861     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1862     "Execrawl" => ""
1863     ),
1864     "uri" => ""
1865     ),
1866     "expertmonitor" => array(
1867     "icon" => "robot",
1868     "title" => "ExpertMonitor",
1869     "rule" => array(
1870     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1871     ),
1872     "uri" => ""
1873     ),
1874     "explorerrss" => array(
1875     "icon" => "robot",
1876     "title" => "Explorer RSS",
1877     "rule" => array(
1878     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1879     ),
1880     "uri" => ""
1881     ),
1882     "ezooms" => array(
1883     "icon" => "robot",
1884     "title" => "Ezooms",
1885     "rule" => array(
1886     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1887     ),
1888     "uri" => ""
1889     ),
1890     "facebook" => array(
1891     "icon" => "facebook",
1892     "title" => "Facebook",
1893     "rule" => array(
1894     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1895     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1896     "^facebook" => ""
1897     ),
1898     "uri" => "http://www.facebook.com/"
1899     ),
1900     "fast" => array(
1901     "icon" => "fast",
1902     "title" => "Fast",
1903     "rule" => array(
1904     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1905     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1906     "^Fast Crawler" => "",
1907     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1908     ),
1909     "uri" => "http://www.alltheweb.com/"
1910     ),
1911     "fastbuzz" => array(
1912     "icon" => "fastbuzz",
1913     "title" => "Fastbuzz",
1914     "rule" => array(
1915     "^fastbuzz\.com" => ""
1916     ),
1917     "uri" => ""
1918     ),
1919     "favorg" => array(
1920     "icon" => "robot",
1921     "title" => "FavOrg",
1922     "rule" => array(
1923     "^FavOrg" => ""
1924     ),
1925     "uri" => ""
1926     ),
1927     "favorstar" => array(
1928     "icon" => "favorstar",
1929 matthys 209 "title" => "Favorstar",
1930 joku 63 "rule" => array(
1931     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1932     ),
1933     "uri" => "http://favorstar.com/bot.html"
1934     ),
1935     "faxo" => array(
1936     "icon" => "robot",
1937     "title" => "Faxo",
1938     "rule" => array(
1939     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1940     ),
1941     "uri" => "http://www.faxo.com/"
1942     ),
1943     "fdse" => array(
1944     "icon" => "robot",
1945     "title" => "FDSE Robot",
1946     "rule" => array(
1947     "FDSE[ \-]?robot" => ""
1948     ),
1949     "uri" => ""
1950     ),
1951     "feedback" => array(
1952     "icon" => "robot",
1953     "title" => "FeedBack",
1954     "rule" => array(
1955     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1956     ),
1957     "uri" => ""
1958     ),
1959     "feedburner" => array(
1960     "icon" => "feedburner",
1961     "title" => "FeedBurner",
1962     "rule" => array(
1963     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1964     ),
1965     "uri" => ""
1966     ),
1967     "feeddemon" => array(
1968     "icon" => "feeddemon",
1969     "title" => "FeedDemon",
1970     "rule" => array(
1971     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1972     ),
1973     "uri" => ""
1974     ),
1975     "feedfind" => array(
1976     "icon" => "feedfind",
1977     "title" => "FeedFind",
1978     "rule" => array(
1979     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1980     ),
1981     "uri" => ""
1982     ),
1983     "feedonfeeds" => array(
1984     "icon" => "robot",
1985     "title" => "Feed On Feeds",
1986     "rule" => array(
1987     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1988     ),
1989     "uri" => ""
1990     ),
1991     "feedparser" => array(
1992     "icon" => "robot",
1993     "title" => "Feedparser",
1994     "rule" => array(
1995     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1996     "FeedParser" => ""
1997     ),
1998     "uri" => ""
1999     ),
2000     "feedreader" => array(
2001     "icon" => "feedreader",
2002     "title" => "Feedreader",
2003     "rule" => array(
2004     "^Feedreader" => ""
2005     ),
2006     "uri" => ""
2007     ),
2008     "feedserver" => array(
2009     "icon" => "robot",
2010     "title" => "FeedServer",
2011     "rule" => array(
2012     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
2013     ),
2014     "uri" => ""
2015     ),
2016     "feedster" => array(
2017     "icon" => "feedster",
2018     "title" => "Feedster",
2019     "rule" => array(
2020     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2021     ),
2022     "uri" => ""
2023     ),
2024     "feedvalidator" => array(
2025     "icon" => "feedvalidator",
2026     "title" => "Feed Validator",
2027     "rule" => array(
2028     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2029     ),
2030     "uri" => ""
2031     ),
2032     "fdm" => array(
2033     "icon" => "robot",
2034     "title" => "Free Download Manager",
2035     "rule" => array(
2036     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2037     ),
2038     "uri" => ""
2039     ),
2040     "filangy" => array(
2041     "icon" => "robot",
2042     "title" => "Filangy",
2043     "rule" => array(
2044     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2045     ),
2046     "uri" => "http://www.filangy.com/"
2047     ),
2048     "findanisp" => array(
2049     "icon" => "robot",
2050     "title" => "FindAnISP",
2051     "rule" => array(
2052     "FindAnISP" => ""
2053     ),
2054     "uri" => "http://www.findanisp.com/"
2055     ),
2056     "findengines" => array(
2057     "icon" => "findengines",
2058     "title" => "FindEngines",
2059     "rule" => array(
2060     "FindEngines! Bot" => ""
2061     ),
2062     "uri" => ""
2063     ),
2064     "findexa" => array(
2065     "icon" => "findexa",
2066     "title" => "Findexa",
2067     "rule" => array(
2068     "Findexa Crawler" => ""
2069     ),
2070     "uri" => ""
2071     ),
2072     "findlinks" => array(
2073     "icon" => "findlinks",
2074     "title" => "FindLinks",
2075     "rule" => array(
2076     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2077     "^FindLinks" => ""
2078     ),
2079     "uri" => ""
2080     ),
2081     "findoor" => array(
2082     "icon" => "findoor",
2083 matthys 209 "title" => "Findoor",
2084 joku 63 "rule" => array(
2085     "^findoor(-Bot)?" => "" // the optional "-Bot" suffix is not a version, so no back-reference is used
2086     ),
2087     "uri" => ""
2088     ),
2089     "firefly" => array(
2090     "icon" => "firefly",
2091     "title" => "Firefly",
2092     "rule" => array(
2093     "Firefly" => ""
2094     ),
2095     "uri" => ""
2096     ),
2097     "flashget" => array(
2098     "icon" => "flashget",
2099     "title" => "FlashGet",
2100     "rule" => array(
2101     "^FlashGet" => ""
2102     ),
2103     "uri" => ""
2104     ),
2105     "flatland" => array(
2106     "icon" => "flatland",
2107     "title" => "Flatland",
2108     "rule" => array(
2109     "^flatlandbot" => ""
2110     ),
2111     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2112     ),
2113     "flickbot" => array(
2114     "icon" => "flickbot",
2115     "title" => "FlickBot",
2116     "rule" => array(
2117     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2118     ),
2119     "uri" => ""
2120     ),
2121     "flightdeckreports" => array(
2122     "icon" => "flightdeckreports",
2123     "title" => "Flight Deck Reports",
2124     "rule" => array(
2125     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2126     ),
2127     "uri" => "http://www.flightdeckreports.com/"
2128     ),
2129     "forex" => array(
2130     "icon" => "robot",
2131     "title" => "Forex",
2132     "rule" => array(
2133     "^Forex Trading Network Organization" => ""
2134     ),
2135     "uri" => "http://www.netforex.org/"
2136     ),
2137     "freshmeat" => array(
2138     "icon" => "freshmeat",
2139 matthys 209 "title" => "Freshmeat",
2140 joku 63 "rule" => array(
2141     "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2142     "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped so it matches literally
2143     ),
2144     "uri" => "http://www.freshmeat.net/"
2145     ),
2146     "friend" => array(
2147     "icon" => "friend",
2148     "title" => "Friend",
2149     "rule" => array(
2150     "www\.friend\.fr" => ""
2151     ),
2152     "uri" => "http://www.friend.fr/"
2153     ),
2154     "frontier" => array(
2155     "icon" => "frontier",
2156     "title" => "Frontier",
2157     "rule" => array(
2158     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2159     ),
2160     "uri" => ""
2161     ),
2162     "fyberspider" => array(
2163     "icon" => "robot",
2164     "title" => "FyberSpider",
2165     "rule" => array(
2166     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2167     ),
2168     "uri" => "http://www.fyberspider.com/"
2169     ),
2170     "gaisbot" => array(
2171     "icon" => "gais",
2172     "title" => "Gaisbot",
2173     "rule" => array(
2174     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2175     ),
2176     "uri" => ""
2177     ),
2178     "galaxy" => array(
2179     "icon" => "galaxy",
2180     "title" => "Galaxy",
2181     "rule" => array(
2182     "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2183     "www\.galaxy\.com" => "" // dots escaped so only the literal host name matches
2184     ),
2185     "uri" => "http://www.galaxy.com/"
2186     ),
2187     "gamespy" => array(
2188     "icon" => "gamespy",
2189     "title" => "GameSpy",
2190     "rule" => array(
2191     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2192     ),
2193     "uri" => ""
2194     ),
2195     "garlik" => array(
2196     "icon" => "garlik",
2197     "title" => "Garlik",
2198     "rule" => array(
2199     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2200     ),
2201     "uri" => "http://garlik.com/"
2202     ),
2203     "gdesktop" => array(
2204     "icon" => "gdesktop",
2205     "title" => "Google Desktop",
2206     "rule" => array(
2207     "compatible; Google Desktop" => ""
2208     ),
2209     "uri" => ""
2210     ),
2211     "genome" => array(
2212     "icon" => "robot",
2213     "title" => "Genome Machine",
2214     "rule" => array(
2215     "Genome[ \-]?Machine" => ""
2216     ),
2217     "uri" => ""
2218     ),
2219     "geohash" => array(
2220     "icon" => "geohash",
2221     "title" => "Geohash",
2222     "rule" => array(
2223     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2224     ),
2225     "uri" => "http://geohash.org/"
2226     ),
2227     "geona" => array(
2228     "icon" => "robot",
2229     "title" => "Geona",
2230     "rule" => array(
2231     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2232     ),
2233     "uri" => ""
2234     ),
2235     "geoblog" => array(
2236     "icon" => "robot",
2237     "title" => "The World as a Blog",
2238     "rule" => array(
2239     "The World as a Blog" => ""
2240     ),
2241     "uri" => ""
2242     ),
2243     "geourl" => array(
2244     "icon" => "geourl",
2245     "title" => "GeoUrl",
2246     "rule" => array(
2247     "geourl[ /]([0-9.]{1,10})" => "\\1",
2248     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2249     ),
2250     "uri" => ""
2251     ),
2252     "getnetwise" => array(
2253     "icon" => "robot",
2254     "title" => "GetNetWise",
2255     "rule" => array(
2256     " Crayon Crawler" => ""
2257     ),
2258     "uri" => ""
2259     ),
2260     "getright" => array(
2261     "icon" => "getright",
2262     "title" => "GetRight",
2263     "rule" => array(
2264     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2265     ),
2266     "uri" => ""
2267     ),
2268     "getsmart" => array(
2269     "icon" => "getsmart",
2270     "title" => "GetSmart",
2271     "rule" => array(
2272     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2273     ),
2274     "uri" => ""
2275     ),
2276     "gigabot" => array(
2277     "icon" => "gigablast",
2278     "title" => "Gigablast",
2279     "rule" => array(
2280     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2281     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2282 joku 336 "GigablastOpenSource" => ""
2283 joku 63 ),
2284     "uri" => ""
2285 matthys 328 ),
2286     "gimme" => array(
2287     "icon" => "gimme",
2288     "title" => "gimmeUSA",
2289     "rule" => array(
2290     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2291     ),
2292     "uri" => "http://gimme60.com"
2293 joku 63 ),
2294 matthys 328 "ginger" => array(
2295     "icon" => "ginger",
2296     "title" => "GingerCrawler",
2297     "rule" => array(
2298     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2299     ),
2300     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2301     ),
2302 joku 63 "girafabot" => array(
2303     "icon" => "girafa",
2304     "title" => "Girafa",
2305     "rule" => array(
2306     "Girafabot" => ""
2307     ),
2308     "uri" => ""
2309     ),
2310     "globalspec" => array(
2311     "icon" => "globalspec",
2312     "title" => "GlobalSpec",
2313     "rule" => array(
2314     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2315     ),
2316     "uri" => ""
2317     ),
2318     "glucose" => array(
2319     "icon" => "glucose",
2320     "title" => "Glucose",
2321     "rule" => array(
2322     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2323     ),
2324     "uri" => ""
2325     ),
2326     "gnomit" => array(
2327     "icon" => "gnomit",
2328     "title" => "Gnomit",
2329     "rule" => array(
2330     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2331     ),
2332     "uri" => "http://www.gnomit.com/",
2333     ),
2334     "goforit" => array(
2335     "icon" => "goforit",
2336     "title" => "GoForIt",
2337     "rule" => array(
2338     "^GoForIt\.com" => "",
2339     "^GOFORITBOT" => ""
2340     ),
2341     "uri" => ""
2342     ),
2343     "goguides" => array(
2344     "icon" => "robot",
2345     "title" => "GoGuides",
2346     "rule" => array(
2347     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2348     ),
2349     "uri" => "http://www.goguides.org/"
2350     ),
2351     // Needs to be before google for correct detection
2352     "mediapartners" => array(
2353     "icon" => "google",
2354     "title" => "Mediapartners",
2355     "rule" => array (
2356     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2357     "Mediapartners-Google" => ""
2358     ),
2359     "uri" => ""
2360     ),
2361     "google" => array(
2362     "icon" => "google",
2363     "title" => "Google",
2364     "rule" => array (
2365     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2366     "Googl(e|ebot)(-Image)?/" => "",
2367     "^gsa-crawler" => "",
2368     "Google Web Preview" => ""
2369     ),
2370     "uri" => "http://www.google.com/"
2371     ),
2372     "googlesitemaps" => array(
2373     "icon" => "google",
2374     "title" => "Google-Sitemaps",
2375     "rule" => array (
2376     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2377     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2378     "Googl(e|ebot)(-Sitemaps)?/" => ""
2379     ),
2380     "uri" => ""
2381     ),
2382     "googlemobile" => array(
2383     "icon" => "google",
2384     "title" => "Google-Mobile",
2385     "rule" => array (
2386     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2387     "Googl(e|ebot)(-Mobile)?/" => ""
2388     ),
2389     "uri" => ""
2390     ),
2391     "googleads" => array(
2392     "icon" => "google",
2393     "title" => "Google-AdsBot",
2394     "rule" => array (
2395     "^AdsBot-Google" => "",
2396     ),
2397     "uri" => ""
2398     ),
2399     "googlefeeds" => array(
2400     "icon" => "google",
2401     "title" => "Google-Feedfetcher",
2402     "rule" => array (
2403     "^Feedfetcher-Google" => "",
2404     ),
2405     "uri" => ""
2406     ),
2407     "googlverification" => array(
2408     "icon" => "google",
2409     "title" => "Google-Site-Verification",
2410     "rule" => array (
2411     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2412     ),
2413     "uri" => ""
2414     ),
2415 matthys 207 // Needs to be AFTER Google detection
2416     "goo" => array(
2417     "icon" => "goo",
2418     "title" => "Goo",
2419     "rule" => array (
2420     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2421     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2422     ),
2423     "uri" => ""
2424     ),
2425 joku 63 "goongee" => array(
2426     "icon" => "robot",
2427     "title" => "GoonGee",
2428     "rule" => array (
2429     "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1" // the pattern has a single capture group (the version), so reference group 1
2430     ),
2431     "uri" => "http://www.goongee.com/"
2432     ),
2433     "gpost" => array(
2434     "icon" => "gpost",
2435     "title" => "GPost",
2436     "rule" => array(
2437     "^GPostbot" => ""
2438     ),
2439     "uri" => ""
2440     ),
2441 matthys 309 "grapeshot" => array(
2442     "icon" => "grapeshot",
2443     "title" => "Grapeshot",
2444     "rule" => array(
2445     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2446     ),
2447     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2448     ),
2449 joku 63 "gregarius" => array(
2450     "icon" => "robot",
2451     "title" => "Gregarius",
2452     "rule" => array(
2453     "^Gregarius[/ ]([0-9.]{1,10})" => "\\1" // expose the captured version (group 1), as the other versioned rules in this table do
2454     ),
2455     "uri" => ""
2456     ),
2457     "grub" => array(
2458     "icon" => "grub",
2459     "title" => "Grub",
2460     "rule" => array(
2461     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2462     "grub crawler" => "",
2463     "grub[/ ]([0-9.]{1,10})" => "\\1",
2464     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2465     ),
2466     "uri" => "http://www.grub.org/"
2467     ),
2468     "gulliver" => array(
2469     "icon" => "robot",
2470     "title" => "Gulliver",
2471     "rule" => array(
2472     "Gulliver" => ""
2473     ),
2474     "uri" => ""
2475     ),
2476     "guruji" => array(
2477     "icon" => "guruji",
2478     "title" => "Guruji",
2479     "rule" => array(
2480     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2481     ),
2482     "uri" => "http://www.guruji.com/"
2483     ),
2484     "gush" => array(
2485     "icon" => "robot",
2486     "title" => "Gush",
2487     "rule" => array(
2488     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2489     ),
2490     "uri" => ""
2491     ),
2492     "gziptester" => array(
2493     "icon" => "robot",
2494     "title" => "Gzip Tester",
2495     "rule" => array(
2496     "g(id)?zip[ \-]?test(er)?" => ""
2497     ),
2498     "uri" => ""
2499     ),
2500     "hanzoweb" => array(
2501     "icon" => "hanzoweb",
2502     "title" => "Hanzoweb",
2503     "rule" => array(
2504     "^Hanzoweb" => ""
2505     ),
2506     "uri" => ""
2507     ),
2508     "harbot" => array(
2509     "icon" => "harbot",
2510     "title" => "Harbot",
2511     "rule" => array(
2512     "^Harbot GateStation" => ""
2513     ),
2514     "uri" => ""
2515     ),
2516     "hatena" => array(
2517     "icon" => "hatena",
2518     "title" => "Hatena",
2519     "rule" => array(
2520     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2521     ),
2522     "uri" => ""
2523     ),
2524     "htmlparser" => array(
2525     "icon" => "htmlparser",
2526     "title" => "HTMLParser",
2527     "rule" => array(
2528     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2529     ),
2530     "uri" => "http://htmlparser.sourceforge.net/"
2531     ),
2532     "helix" => array(
2533     "icon" => "helix",
2534     "title" => "Helix", // separate crawler from the "heritrix" entry that follows
2535     "rule" => array(
2536     "^helix[ /]([0-9.]{1,10})" => "\\1"
2537     ),
2538     "uri" => "http://www.sitesearch.ca/helix/"
2539     ),
2540     "heritrix" => array(
2541     "icon" => "heritrix",
2542     "title" => "Heritrix",
2543     "rule" => array(
2544     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2545     "archive.org_bot" => "",
2546     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2547     ),
2548     "uri" => "http://archive.org"
2549     ),
2550     "hiddenmarket" => array(
2551     "icon" => "robot",
2552     "title" => "HiddenMarket",
2553     "rule" => array(
2554     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2555     ),
2556     "uri" => ""
2557     ),
2558     "honda" => array(
2559     "icon" => "robot",
2560     "title" => "Honda",
2561     "rule" => array(
2562     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2563     ),
2564     "uri" => "http://www.honda-search.com"
2565     ),
2566     "hoowwwer" => array(
2567     "icon" => "hoowwwer",
2568     "title" => "HooWWWer",
2569     "rule" => array(
2570     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2571     ),
2572     "uri" => ""
2573     ),
2574     "hotzonu" => array(
2575     "icon" => "hotzonu",
2576     "title" => "Hotzonu",
2577     "rule" => array(
2578     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2579     ),
2580     "uri" => ""
2581     ),
2582     "houxou" => array(
2583     "icon" => "robot",
2584     "title" => "Houxou",
2585     "rule" => array(
2586     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2587     "HouxouCrawler" => ""
2588     ),
2589     "uri" => ""
2590     ),
2591     "htdig" => array(
2592     "icon" => "htdig",
2593     "title" => "ht://Dig",
2594     "rule" => array(
2595     "htdig[ /]([0-9.]{1,10})" => "\\1",
2596     "htdig" => "" // version-less fallback: this pattern has no capture group to reference
2597     ),
2598     "uri" => ""
2599     ),
2600     "html2jpg" => array(
2601     "icon" => "html2jpg",
2602     "title" => "HTML2JPG",
2603     "rule" => array(
2604     "^HTML2JPG" => ""
2605     ),
2606     "uri" => ""
2607     ),
2608     "httperf" => array(
2609     "icon" => "robot",
2610     "title" => "HTTPerf",
2611     "rule" => array(
2612     "httperf[ /]([0-9.]{1,10})" => "\\1"
2613     ),
2614     "uri" => ""
2615     ),
2616     "httpunit" => array(
2617     "icon" => "httpunit",
2618     "title" => "HttpUnit",
2619     "rule" => array(
2620     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2621     ),
2622     "uri" => ""
2623     ),
2624     "httrack" => array(
2625     "icon" => "httrack",
2626     "title" => "HTTrack",
2627     "rule" => array(
2628     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2629     ),
2630     "uri" => ""
2631     ),
2632     "huaweisymantec" => array(
2633     "icon" => "huaweisymantec",
2634     "title" => "HuaweiSymantec",
2635     "rule" => array(
2636     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2637     ),
2638     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2639     ),
2640     "hungary" => array(
2641     "icon" => "hungary",
2642     "title" => "Hungary",
2643     "rule" => array(
2644     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2645     ),
2646     "uri" => ""
2647     ),
2648 joku 261 "i18n" => array(
2649     "icon" => "w3c",
2650     "title" => "W3C I18n Checker",
2651     "rule" => array(
2652     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2653 joku 169 ),
2654 joku 261 "uri" => "http://validator.w3.org/services"
2655     ),
2656 joku 63 "iakke" => array(
2657     "icon" => "iakke",
2658 matthys 209 "title" => "Iakké",
2659 joku 63 "rule" => array(
2660     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2661     ),
2662     "uri" => "http://fr.iakke.com/"
2663     ),
2664     "iask" => array(
2665     "icon" => "iask",
2666     "title" => "IAsk",
2667     "rule" => array(
2668     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2669     "^iaskspider" => ""
2670     ),
2671     "uri" => "http://iask.com"
2672     ),
2673     "icc" => array(
2674     "icon" => "icc",
2675     "title" => "ICC-Crawler",
2676     "rule" => array(
2677     "^ICC-Crawler" => ""
2678     ),
2679     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2680     ),
2681     "icerocket" => array(
2682     "icon" => "icerocket",
2683     "title" => "Icerocket",
2684     "rule" => array(
2685     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2686     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2687     ),
2688     "uri" => ""
2689     ),
2690     "icjobs" => array(
2691     "icon" => "icjobs",
2692     "title" => "iCjobs",
2693     "rule" => array(
2694     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2695     ),
2696     "uri" => "http://www.icjobs.de/"
2697     ),
2698     "icra" => array(
2699     "icon" => "icra",
2700     "title" => "ICRA",
2701     "rule" => array(
2702     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2703     ),
2704     "uri" => "http://www.icra.org"
2705     ),
2706     "iknow" => array(
2707     "icon" => "robot",
2708     "title" => "I know",
2709     "rule" => array(
2710     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2711     ),
2712     "uri" => ""
2713     ),
2714     "ilial" => array(
2715     "icon" => "robot",
2716     "title" => "Ilial",
2717     "rule" => array(
2718     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2719     ),
2720     "uri" => ""
2721     ),
2722     "ilocal" => array(
2723     "icon" => "ilocal",
2724     "title" => "ilocal",
2725     "rule" => array(
2726     "^ilocal" => "",
2727     ),
2728     "uri" => "http://www.ilocal.nl"
2729     ),
2730     "ilse" => array(
2731     "icon" => "ilse",
2732     "title" => "Ilse",
2733     "rule" => array(
2734     "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2" // group 1 is the bot-name alternation; the version is group 2
2735     ),
2736     "uri" => "http://ilse.nl/"
2737     ),
2738     "iltrovatore" => array(
2739     "icon" => "iltrovatore",
2740     "title" => "IlTrovatore",
2741     "rule" => array(
2742     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2743     "Iltrovatore-Setaccio" => "",
2744     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2745     ),
2746     "uri" => ""
2747     ),
2748     "indylibrary" => array(
2749     "icon" => "robot",
2750     "title" => "Indy Library",
2751     "rule" => array(
2752     "Indy[ \-]?Library" => ""
2753     ),
2754     "uri" => ""
2755     ),
2756     "inela" => array(
2757     "icon" => "robot",
2758     "title" => "Inela",
2759     "rule" => array(
2760     "InelaBot[ /]([0-9.]{1,10})" => "\\1" // expose the captured version (group 1) instead of discarding it
2761     ),
2762     "uri" => "http://inelegant.org/bot"
2763     ),
2764     "ineturl" => array(
2765     "icon" => "robot",
2766     "title" => "InetURL",
2767     "rule" => array(
2768     "InetURL.?[ /]([0-9.]{1,10})" => "\\1" // expose the captured version (group 1) instead of discarding it
2769     ),
2770     "uri" => ""
2771     ),
2772     "infoart" => array(
2773     "icon" => "robot",
2774     "title" => "InfoArt",
2775     "rule" => array(
2776     "InfoArt crawler" => ""
2777     ),
2778     "uri" => ""
2779     ),
2780     "infomine" => array(
2781     "icon" => "infomine",
2782     "title" => "INFOMINE",
2783     "rule" => array(
2784     "^DataFountains/DMOZ" => "",
2785     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2786     ),
2787     "uri" => "http://infomine.ucr.edu/"
2788     ),
2789     "infoseek" => array(
2790     "icon" => "infoseek",
2791     "title" => "Infoseek",
2792     "rule" => array(
2793     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2794     "Infoseek" => ""
2795     ),
2796     "uri" => ""
2797     ),
2798     "inktomi" => array(
2799     "icon" => "inktomi",
2800     "title" => "Inktomi",
2801     "rule" => array(
2802     "slurp@inktomi\.com" => ""
2803     ),
2804     "uri" => ""
2805     ),
2806     "innerprise" => array(
2807     "icon" => "robot",
2808     "title" => "Innerprise",
2809     "rule" => array(
2810     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2811     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2812     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2813     ),
2814     "uri" => "http://www.innerprise.com/"
2815     ),
2816     "inria" => array(
2817     "icon" => "inria",
2818     "title" => "Inria",
2819     "rule" => array(
2820     "^xyro_" => ""
2821     ),
2822     "uri" => ""
2823     ),
2824     "insitor" => array(
2825     "icon" => "insitor",
2826     "title" => "Insitor",
2827     "rule" => array(
2828     "^Insitor(,|\.|naut)" => ""
2829     ),
2830     "uri" => "http://www.insitor.com/"
2831     ),
2832     "internetninja" => array(
2833     "icon" => "robot",
2834     "title" => "Internet Ninja",
2835     "rule" => array(
2836     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2837     ),
2838     "uri" => ""
2839     ),
2840     "internetseer" => array(
2841     "icon" => "internetseer",
2842     "title" => "InternetSeer",
2843     "rule" => array(
2844     "^InternetSeer\.com" => ""
2845     ),
2846     "uri" => ""
2847     ),
2848     "interseek" => array(
2849     "icon" => "interseek",
2850     "title" => "Interseek",
2851     "rule" => array(
2852     "Interseek.com" => ""
2853     ),
2854     "uri" => "http://www.interseek.com"
2855     ),
2856     "intravnews" => array(
2857     "icon" => "intravnews",
2858     "title" => "IntraVnews",
2859     "rule" => array(
2860     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2861     ),
2862     "uri" => "http://www.intravnews.com/"
2863     ),
2864     "ip2location" => array(
2865     "icon" => "ip2location",
2866     "title" => "IP2LocationBot",
2867     "rule" => array(
2868     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2869     ),
2870     "uri" => "http://www.ip2location.com"
2871     ),
2872     "ipworks" => array(
2873     "icon" => "ipworks",
2874     "title" => "IP*Works",
2875     "rule" => array(
2876     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2877     ),
2878     "uri" => "http://www.nsoftware.com/ipworks/"
2879     ),
2880     "irca" => array(
2881     "icon" => "robot",
2882     "title" => "Novell iChain Cool Solutions caching",
2883     "rule" => array(
2884 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2885     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2886 joku 63 ),
2887     "uri" => "http://www.icra.org"
2888     ),
2889     "irvine" => array(
2890     "icon" => "robot",
2891     "title" => "Irvine",
2892     "rule" => array(
2893     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2894     ),
2895     "uri" => ""
2896     ),
2897     "ips-agent" => array(
2898     "icon" => "robot",
2899 matthys 209 "title" => "IPS-agent",
2900 joku 63 "rule" => array(
2901     "ips-agent" => ""
2902     ),
2903     "uri" => ""
2904     ),
2905     "isara" => array(
2906     "icon" => "isara",
2907 matthys 209 "title" => "Isara",
2908 joku 63 "rule" => array(
2909     "Isara[ -]([0-9.]{1,10})" => "\\1"
2910     ),
2911     "uri" => "http://www.isara.org/"
2912     ),
2913     "isspider" => array(
2914     "icon" => "robot",
2915     "title" => "ISSpider",
2916     "rule" => array(
2917     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2918     ),
2919     "uri" => ""
2920     ),
2921     "it2media" => array(
2922     "icon" => "it2media",
2923     "title" => "IT2media",
2924     "rule" => array(
2925     "www.adressendeutschland.de" => ""
2926     ),
2927     "uri" => "http://www.adressendeutschland.de/"
2928     ),
2929     "ivia" => array(
2930     "icon" => "robot",
2931     "title" => "iVia",
2932     "rule" => array(
2933     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2934     ),
2935     "uri" => ""
2936     ),
2937     "jeteye" => array(
2938     "icon" => "jeteye",
2939     "title" => "Jeteye",
2940     "rule" => array(
2941     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2942     ),
2943     "uri" => ""
2944     ),
2945     "jobsde" => array(
2946     "icon" => "jobsde",
2947     "title" => "jobs.de",
2948     "rule" => array(
2949     "www\.jobs\.de" => "",
2950     "jobs.de-Robot" => ""
2951     ),
2952     "uri" => "http://www.jobs.de/"
2953     ),
2954     "jpluck" => array(
2955     "icon" => "robot",
2956     "title" => "Jpluck",
2957     "rule" => array(
2958     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2959     ),
2960     "uri" => ""
2961     ),
2962     "jxta" => array(
2963     "icon" => "robot",
2964     "title" => "Jxta",
2965     "rule" => array(
2966     "falcon[ /]([0-9.]{1,10})" => "\\1"
2967     ),
2968     "uri" => ""
2969     ),
2970     "jyte" => array(
2971     "icon" => "jyte",
2972     "title" => "Jyte",
2973     "rule" => array(
2974     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2975     ),
2976     "uri" => ""
2977     ),
2978     "jyxo" => array(
2979     "icon" => "jyxo",
2980     "title" => "Jyxo",
2981     "rule" => array(
2982     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
2983     ),
2984     "uri" => ""
2985     ),
2986     "kalooga" => array(
2987     "icon" => "kalooga",
2988     "title" => "Kalooga",
2989     "rule" => array(
2990     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
2991     "^kalooga" => "",
2992     "KaloogaBot" => ""
2993     ),
2994     "uri" => "http://www.kalooga.com"
2995     ),
2996     "keywen" => array(
2997     "icon" => "keywen",
2998     "title" => "Keywen",
2999     "rule" => array(
3000     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
3001     ),
3002     "uri" => ""
3003     ),
3004     "kilomonkey" => array(
3005     "icon" => "robot",
3006     "title" => "Kilomonkey",
3007     "rule" => array(
3008     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
3009     ),
3010     "uri" => "http://www.kilomonkey.com/notabot.txt"
3011     ),
3012     "kinja" => array(
3013     "icon" => "kinja",
3014     "title" => "Kinja",
3015     "rule" => array(
3016     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
3017     "^kinjabot" => ""
3018     ),
3019     "uri" => ""
3020     ),
3021     "kiwi" => array(
3022     "icon" => "robot",
3023     "title" => "KiwiStatus",
3024     "rule" => array(
3025     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3026     "KiwiStatus" => ""
3027     ),
3028     "uri" => "http://www.nzs.com/kiei-status/"
3029     ),
3030     "lachesis" => array(
3031     "icon" => "robot",
3032     "title" => "Lachesis",
3033     "rule" => array(
3034     "lachesis" => ""
3035     ),
3036     "uri" => ""
3037     ),
3038     "lanshan" => array(
3039     "icon" => "robot",
3040     "title" => "Lanshan", // NOTE(review): display name derived from the "lanshanbot" user agent - confirm the official name
3041     "rule" => array(
3042     "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
3043     ),
3044     "uri" => ""
3045     ),
3046     "lapozz" => array(
3047     "icon" => "lapozz",
3048     "title" => "Lapozz",
3049     "rule" => array(
3050     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3051     ),
3052     "uri" => ""
3053     ),
3054     "larbin" => array(
3055     "icon" => "robot",
3056     "title" => "Larbin",
3057     "rule" => array(
3058     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3059     ),
3060     "uri" => ""
3061     ),
3062     "laurion" => array(
3063     "icon" => "robot",
3064     "title" => "Laurion",
3065     "rule" => array(
3066     "^IPiumBot" => ""
3067     ),
3068     "uri" => "http://www.laurion.com/"
3069     ),
3070     "leechget" => array(
3071     "icon" => "leechget",
3072     "title" => "LeechGet",
3073     "rule" => array(
3074     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3075     ),
3076     "uri" => ""
3077     ),
3078     "linguaseek" => array(
3079     "icon" => "linguaseek",
3080     "title" => "Linguaseek",
3081     "rule" => array(
3082     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3083     ),
3084     "uri" => "http://www.linguaseek.com/"
3085     ),
3086     "linguee" => array(
3087     "icon" => "linguee",
3088     "title" => "Linguee",
3089     "rule" => array(
3090     "^Linguee Bot" => ""
3091     ),
3092     "uri" => "http://www.linguee.com/"
3093     ),
3094 matthys 355 "linkapedia" => array(
3095     "icon" => "linkapedia",
3096     "title" => "Linkapedia",
3097     "rule" => array(
3098     "^linkapedia" => ""
3099     ),
3100     "uri" => "http://www.linkapedia.com"
3101     ),
3102 matthys 346 "linkdex" => array(
3103     "icon" => "linkdex",
3104     "title" => "Linkdex",
3105     "rule" => array(
3106     "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3107     ),
3108     "uri" => "http://www.linkdex.com/bots/"
3109     ),
3110 matthys 366 "linkedin" => array(
3111     "icon" => "linkedin",
3112     "title" => "LinkedIn",
3113     "rule" => array(
3114     "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3115     ),
3116     "uri" => "http://www.linkedin.com"
3117     ),
3118 joku 63 "linkguard" => array(
3119     "icon" => "robot",
3120     "title" => "Linkguard",
3121     "rule" => array(
3122     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3123     ),
3124     "uri" => "http://www.linkguard.com/"
3125     ),
3126     "linklint" => array(
3127     "icon" => "linklint",
3128     "title" => "Linklint",
3129     "rule" => array(
3130     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3131     ),
3132     "uri" => "http://www.linklint.org/"
3133     ),
3134     "linkman" => array(
3135     "icon" => "linkman",
3136     "title" => "Linkman",
3137     "rule" => array(
3138     "\(compatible; Linkman\)" => ""
3139     ),
3140     "uri" => ""
3141     ),
3142     // Needs to be before linkcheck for correct detection
3143     "linkchecker" => array(
3144     "icon" => "w3c",
3145     "title" => "W3C Link Checker",
3146     "rule" => array(
3147     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3148     ),
3149     "uri" => "http://validator.w3.org/checklink"
3150     ),
3151     "linkcheck" => array(
3152     "icon" => "linkcheck",
3153     "title" => "Linkcheck",
3154     "rule" => array(
3155     "checklink[ /]([0-9.]{1,10})" => "\\1",
3156     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3157     "Adaxas Spider" => "",
3158     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3159     "NetMechanic V([0-9.]{1,10})" => "\\1",
3160     "^InfoLink" => "",
3161     "InternetLinkAgent" => "",
3162     "; SPENG\)" => "",
3163     "SharewarePlazaFileCheckBot" => "",
3164     "fileboost.net" => "",
3165     "^billbot" => ""
3166     ),
3167     "uri" => ""
3168     ),
3169     "linkru" => array(
3170     "icon" => "robot",
3171     "title" => "Link.RU",
3172     "rule" => array(
3173     "^Link.RU bot" => ""
3174     ),
3175     "uri" => ""
3176     ),
3177     "linkssql" => array(
3178     "icon" => "robot",
3179     "title" => "Links SQL",
3180     "rule" => array(
3181     "links sql" => ""
3182     ),
3183     "uri" => ""
3184     ),
3185     "linksweeper" => array(
3186     "icon" => "robot",
3187     "title" => "Link Sweeper",
3188     "rule" => array(
3189     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3190     ),
3191     "uri" => ""
3192     ),
3193     "linkwalker" => array(
3194     "icon" => "robot",
3195     "title" => "Link Walker",
3196     "rule" => array(
3197     "^LinkWalker" => ""
3198     ),
3199     "uri" => ""
3200     ),
3201     "lipperhey" => array(
3202     "icon" => "lipperhey",
3203     "title" => "Lipperhey",
3204     "rule" => array(
3205     "Lipperhey Spider" => ""
3206     ),
3207     "uri" => "http://www.lipperhey.com"
3208     ),
3209     "livedoor" => array(
3210     "icon" => "livedoor",
3211     "title" => "Livedoor",
3212     "rule" => array(
3213     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3214     ),
3215     "uri" => ""
3216     ),
3217     "livejournal" => array(
3218     "icon" => "livejournal",
3219     "title" => "Live Journal",
3220     "rule" => array(
3221     "^LiveJournal\.com" => ""
3222     ),
3223     "uri" => "http://www.livejournal.com"
3224     ),
3225     "ljpic" => array(
3226     "icon" => "ljpic",
3227     "title" => "ljpic",
3228     "rule" => array(
3229     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3230     ),
3231     "uri" => "http://www.ljpic.com"
3232     ),
3233     "lmspider" => array(
3234     "icon" => "robot",
3235     "title" => "Lmspider",
3236     "rule" => array(
3237     "^lmspider" => ""
3238     ),
3239     "uri" => ""
3240     ),
3241     "locators" => array(
3242     "icon" => "robot",
3243     "title" => "Locaters",
3244     "rule" => array(
3245     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3246     ),
3247     "uri" => ""
3248     ),
3249     "look" => array(
3250     "icon" => "look",
3251     "title" => "Look",
3252     "rule" => array(
3253     "www\.look\.com" => "",
3254     "Lookbot" => ""
3255     ),
3256     "uri" => ""
3257     ),
3258     "looksmart" => array(
3259     "icon" => "looksmart",
3260     "title" => "LookSmart",
3261     "rule" => array(
3262     "^Martini" => "",
3263     "^MantraAgent" => "",
3264     "FurlBot" => "",
3265     "looksmart-sv-fw" => ""
3266     ),
3267     "uri" => ""
3268     ),
3269     "loop" => array(
3270     "icon" => "loop",
3271     "title" => "LOOP",
3272     "rule" => array(
3273     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3274     ),
3275     "uri" => ""
3276     ),
3277     "lotkyll" => array(
3278     "icon" => "robot",
3279     "title" => "Lotkyll",
3280     "rule" => array(
3281     "Lotkyll" => ""
3282     ),
3283     "uri" => ""
3284     ),
3285 joku 335 "ltx71" => array(
3286     "icon" => "robot",
3287     "title" => "LTX71",
3288     "rule" => array(
3289     "ltx71" => ""
3290     ),
3291     "uri" => "http://ltx71.com/"
3292     ),
3293 joku 63 "lwp" => array(
3294     "icon" => "robot",
3295     "title" => "lwp",
3296     "rule" => array(
3297     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3298     ),
3299     "uri" => ""
3300     ),
3301     "lycos" => array(
3302     "icon" => "lycos",
3303     "title" => "Lycos",
3304     "rule" => array(
3305     "Lycos_Spider_" => ""
3306     ),
3307     "uri" => ""
3308     ),
3309     "magpierss" => array(
3310     "icon" => "rss",
3311     "title" => "MagpieRSS",
3312     "rule" => array(
3313     "MagpieRSS" => ""
3314     ),
3315     "uri" => "http://magpierss.sourceforge.net/"
3316     ),
3317     "mailru" => array(
3318     "icon" => "mailru",
3319 matthys 209 "title" => "Mail.Ru",
3320 joku 63 "rule" => array(
3321 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3322     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3323 joku 63 ),
3324 matthys 209 "uri" => "http://www.mail.ru/"
3325 joku 63 ),
3326     "mailsweeper" => array(
3327     "icon" => "robot",
3328     "title" => "Mail Sweeper",
3329     "rule" => array(
3330     "Mail[ \-]?Sweeper" => ""
3331     ),
3332     "uri" => ""
3333     ),
3334     "marvin" => array(
3335     "icon" => "robot",
3336     "title" => "Marvin",
3337     "rule" => array(
3338     "^Marvin" => ""
3339     ),
3340     "uri" => ""
3341     ),
3342     "matkurja" => array(
3343     "icon" => "matkurja",
3344     "title" => "Mat'Kurja",
3345     "rule" => array(
3346     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3347     ),
3348     "uri" => ""
3349     ),
3350     "mavicanet" => array(
3351     "icon" => "mavicanet",
3352     "title" => "Mavicanet",
3353     "rule" => array(
3354     "Mavicanet robot" => ""
3355     ),
3356     "uri" => ""
3357     ),
3358 matthys 292 "meanpath" => array(
3359     "icon" => "meanpath",
3360 matthys 290 "title" => "Meanpath",
3361 matthys 280 "rule" => array(
3362     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3363     ),
3364     "uri" => "http://www.meanpath.com/meanpathbot.html"
3365 matthys 275 ),
3366 matthys 280 "mediater" => array(
3367 joku 63 "icon" => "robot",
3368     "title" => "Mediater",
3369     "rule" => array (
3370     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3371 matthys 280 ),
3372     "uri" => ""
3373 joku 63 ),
3374 matthys 305 "memory" => array(
3375     "icon" => "memory",
3376     "title" => "internet Memory",
3377     "rule" => array (
3378     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3379     ),
3380     "uri" => "http://internetmemory.org/en/"
3381     ),
3382 joku 63 "mercator" => array(
3383     "icon" => "robot",
3384     "title" => "Mercator",
3385     "rule" => array(
3386     "Mercator" => ""
3387     ),
3388     "uri" => ""
3389     ),
3390     "metacarta" => array(
3391     "icon" => "robot",
3392     "title" => "Metacarta",
3393     "rule" => array(
3394     "^RRC \(crawler_admin@bigfoot.com\)" => "", // parentheses escaped so they match literally, as in the last rule below
3395     "^flunky" => "",
3396     "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
3397     ),
3398     "uri" => "http://www.metacarta.com"
3399     ),
3400     "metager" => array(
3401     "icon" => "metager",
3402     "title" => "MetaGer",
3403     "rule" => array(
3404     "MetaGer" => ""
3405     ),
3406     "uri" => ""
3407     ),
3408     "metamark" => array(
3409     "icon" => "robot",
3410     "title" => "Metamark",
3411     "rule" => array(
3412     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3413     ),
3414     "uri" => "http://metamark.net"
3415     ),
3416     "metamedic" => array(
3417     "icon" => "metamedic",
3418     "title" => "MetaMedic",
3419     "rule" => array(
3420     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3421     ),
3422     "uri" => ""
3423     ),
3424     "mirago" => array(
3425     "icon" => "mirago",
3426     "title" => "Mirago",
3427     "rule" => array(
3428     "Mirago" => ""
3429     ),
3430     "uri" => ""
3431     ),
3432     "misterwong" => array(
3433     "icon" => "misterwong",
3434     "title" => "Mister Wong",
3435     "rule" => array(
3436     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3437     ),
3438     "uri" => "http://www.mister-wong.de/"
3439     ),
3440     "miva" => array(
3441     "icon" => "miva",
3442     "title" => "Miva",
3443     "rule" => array(
3444     "AlgoFeedback@miva\.com" => ""
3445     ),
3446     "uri" => "http://www.miva.com/"
3447     ),
3448     "mj12" => array(
3449     "icon" => "mj12",
3450     "title" => "Majestic-12",
3451     "rule" => array(
3452     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3453     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3454     ),
3455     "uri" => "http://majestic12.co.uk/bot.php"
3456     ),
3457     "mlbot" => array(
3458     "icon" => "robot",
3459     "title" => "MLBot",
3460     "rule" => array(
3461     "^MLBot" => ""
3462     ),
3463     "uri" => "http://www.metadatalabs.com/mlbot"
3464     ),
3465     "mnogo" => array(
3466     "icon" => "mnogo",
3467     "title" => "mnoGoSearch",
3468     "rule" => array(
3469     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3470     ),
3471     "uri" => "http://www.mnogosearch.org/"
3472     ),
3473     "mobileok" => array(
3474     "icon" => "mobileok",
3475     "title" => "W3C mobileOK",
3476     "rule" => array(
3477     "^W3C-mobileOK" => ""
3478     ),
3479     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3480     ),
3481 matthys 296 "mojeek" => array(
3482     "icon" => "mojeek",
3483     "title" => "Mojeek",
3484 joku 63 "rule" => array(
3485     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3486     ),
3487 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3488 joku 63 ),
3489     "momspider" => array(
3490     "icon" => "robot",
3491     "title" => "MOM Spider",
3492     "rule" => array(
3493     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3494     ),
3495     "uri" => ""
3496     ),
3497     "moreover" => array(
3498     "icon" => "moreover",
3499     "title" => "Moreover",
3500     "rule" => array(
3501     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3502     ),
3503     "uri" => ""
3504     ),
3505     "movabletype" => array(
3506     "icon" => "movabletype",
3507     "title" => "Movable Type",
3508     "rule" => array(
3509     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3510     ),
3511     "uri" => ""
3512     ),
3513     "mozdex" => array(
3514     "icon" => "mozdex",
3515     "title" => "MozDex",
3516     "rule" => array(
3517     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3518     ),
3519     "uri" => ""
3520     ),
3521     "mqbot" => array(
3522     "icon" => "robot",
3523     "title" => "MQbot",
3524     "rule" => array(
3525     "MQbot" => ""
3526     ),
3527     "uri" => ""
3528     ),
3529     "msnbot" => array(
3530     "icon" => "bing",
3531 matthys 205 "title" => "Bing",
3532 joku 63 "rule" => array(
3533     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3534     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3535     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3536     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3537     ),
3538     "uri" => ""
3539     ),
3540     "msnbot-mobile" => array(
3541     "icon" => "msn",
3542     "title" => "MSN Mobile",
3543     "rule" => array(
3544     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3545     "MSNBOT_Mobile" => "",
3546     "MSMOBOT" => ""
3547     ),
3548     "uri" => ""
3549     ),
3550     "mslivebot" => array(
3551     "icon" => "livesearch",
3552     "title" => "MS Live Search",
3553     "rule" => array(
3554     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3555     ),
3556     "uri" => ""
3557     ),
3558     "msproxy" => array(
3559     "icon" => "robot",
3560     "title" => "MSProxy",
3561     "rule" => array(
3562     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3563     ),
3564     "uri" => ""
3565     ),
3566     "msrbot" => array(
3567     "icon" => "robot",
3568     "title" => "MSRBOT",
3569     "rule" => array(
3570     "^MSRBOT" => ""
3571     ),
3572     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3573     ),
3574     "mswebdav" => array(
3575     "icon" => "robot",
3576     "title" => "MS-WebDAV",
3577     "rule" => array(
3578     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3579     ),
3580     "uri" => ""
3581     ),
3582     "mticon" => array(
3583     "icon" => "robot",
3584     "title" => "MTIcon",
3585     "rule" => array(
3586     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3587     ),
3588     "uri" => ""
3589     ),
3590     "multipage-validator" => array(
3591     "icon" => "multipage-validator",
3592     "title" => "Multipage Validator",
3593     "rule" => array(
3594     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3595     ),
3596     "uri" => "http://www.validator.ca/"
3597     ),
3598     "myrss" => array(
3599     "icon" => "rss",
3600     "title" => "MyRSS",
3601     "rule" => array(
3602     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3603     ),
3604     "uri" => ""
3605     ),
3606     "multimap" => array(
3607     "icon" => "robot",
3608     "title" => "Multimap",
3609     "rule" => array(
3610     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3611     ),
3612     "uri" => ""
3613     ),
3614     "najdi" => array(
3615     "icon" => "najdi",
3616     "title" => "Najdi.si",
3617     "rule" => array(
3618     "Najdi.si" => ""
3619     ),
3620     "uri" => "http://www.najdi.si"
3621     ),
3622     "nameprotect" => array(
3623     "icon" => "nameprotect",
3624     "title" => "Name Protect",
3625     "rule" => array(
3626     "NPBot" => ""
3627     ),
3628     "uri" => ""
3629     ),
3630     "nationaldirectory" => array(
3631     "icon" => "robot",
3632     "title" => "National Directory",
3633     "rule" => array(
3634     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3635     ),
3636     "uri" => ""
3637     ),
3638     "natsumican" => array(
3639     "icon" => "robot",
3640     "title" => "Natsu Mican",
3641     "rule" => array(
3642     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3643     ),
3644     "uri" => ""
3645     ),
3646     "naverbot" => array(
3647     "icon" => "naverbot",
3648     "title" => "Naver",
3649     "rule" => array(
3650     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3651     "Naver(Bot)?" => "",
3652     "^nabot" => ""
3653     ),
3654     "uri" => ""
3655     ),
3656     "navisso" => array(
3657     "icon" => "navisso",
3658     "title" => "Navisso",
3659     "rule" => array(
3660     "Navisso(Bot)?" => ""
3661     ),
3662     "uri" => "http://www.navisso.com"
3663     ),
3664     "neofonie" => array(
3665     "icon" => "robot",
3666 matthys 205 "title" => "Neofonie",
3667 joku 63 "rule" => array(
3668     "www.neofonie.de" => ""
3669     ),
3670     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3671     ),
3672     "neomo" => array(
3673     "icon" => "robot",
3674     "title" => "Neomo",
3675     "rule" => array(
3676     "Francis[ /]([0-9.]{1,10})" => "\\1"
3677     ),
3678     "uri" => ""
3679     ),
3680     "nessus" => array(
3681     "icon" => "nessus",
3682     "title" => "Nessus",
3683     "rule" => array(
3684     "Nessus\)$" => ""
3685     ),
3686     "uri" => ""
3687     ),
3688 matthys 279 "nerdybot" => array(
3689 matthys 280 "icon" => "robot",
3690     "title" => "NerdyBot",
3691     "rule" => array(
3692     "NerdyBot" => ""
3693     ),
3694     "uri" => "http://nerdybot.com/"
3695 matthys 279 ),
3696 joku 63 "nerdbynature" => array(
3697     "icon" => "nerdbynature",
3698     "title" => "NerdByNature",
3699     "rule" => array(
3700     "NerdByNature.Bot" => ""
3701     ),
3702     "uri" => "http://www.nerdbynature.net/bot"
3703     ),
3704     "netants" => array(
3705     "icon" => "netants",
3706     "title" => "NetAnts",
3707     "rule" => array(
3708     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3709     ),
3710     "uri" => ""
3711     ),
3712     "netcraft" => array(
3713     "icon" => "netcraft",
3714     "title" => "Netcraft",
3715     "rule" => array(
3716     "netcraft" => ""
3717     ),
3718     "uri" => ""
3719     ),
3720     "netinfo" => array(
3721     "icon" => "netinfo",
3722     "title" => "Netinfo",
3723     "rule" => array(
3724     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3725     ),
3726     "uri" => "http://netinfo.bg/"
3727     ),
3728     "netluchs" => array(
3729     "icon" => "netluchs",
3730     "title" => "Netluchs",
3731     "rule" => array(
3732     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3733     ),
3734     "uri" => "http://www.netluchs.de/"
3735     ),
3736     "netmechanic" => array(
3737     "icon" => "netmechanic",
3738     "title" => "NetMechanic",
3739     "rule" => array(
3740     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3741     ),
3742     "uri" => ""
3743     ),
3744     "netnose" => array(
3745     "icon" => "netnose",
3746     "title" => "NetNose",
3747     "rule" => array(
3748     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3749     ),
3750     "uri" => ""
3751     ),
3752     "netoskop" => array(
3753     "icon" => "robot",
3754     "title" => "Netoskop",
3755     "rule" => array(
3756     "netoskop" => ""
3757     ),
3758     "uri" => ""
3759     ),
3760     "netpromoter" => array(
3761     "icon" => "netpromoter",
3762     "title" => "NetPromoter",
3763     "rule" => array(
3764     "NetPromoter Spider" => ""
3765     ),
3766     "uri" => "http://www.net-promoter.com/"
3767     ),
// Netprospector: matched by a user agent starting with "netprospector".
"netprospector" => array(
    "icon" => "robot",
    "title" => "Netprospector",
    "rule" => array(
        "^netprospector" => ""
    ),
    // No known homepage; the key is present so every entry has the same shape.
    "uri" => ""
),
3775     "netpumper" => array(
3776     "icon" => "robot",
3777     "title" => "Netpumper",
3778     "rule" => array(
3779     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3780     ),
3781     "uri" => ""
3782     ),
3783     "netscapeproxy" => array(
3784     "icon" => "netscape",
3785     "title" => "Netscape Proxy",
3786     "rule" => array(
3787     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3788     ),
3789     "uri" => ""
3790     ),
3791     "netspective" => array(
3792     "icon" => "robot",
3793     "title" => "NetSpective",
3794     "rule" => array(
3795     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3796     ),
3797     "uri" => ""
3798     ),
// Netvibes: matched by a user agent starting with "Netvibes".
"netvibes" => array(
    "icon" => "netvibes",
    "title" => "Netvibes",
    "rule" => array(
        // The pattern has no capture group, so there is no version to report.
        "^Netvibes" => ""
    ),
    "uri" => ""
),
3807     "newsfire" => array(
3808     "icon" => "newsfire",
3809     "title" => "NewsFire",
3810     "rule" => array(
3811     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3812     ),
3813     "uri" => ""
3814     ),
3815     "newsgator" => array(
3816     "icon" => "newsgator",
3817     "title" => "NewsGator",
3818     "rule" => array(
3819     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3820     ),
3821     "uri" => ""
3822     ),
3823     "newzcrawler" => array(
3824     "icon" => "newzcrawler",
3825     "title" => "NewzCrawler",
3826     "rule" => array(
3827     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3828     ),
3829     "uri" => ""
3830     ),
// Nextopia: matched by "NextopiaBOT" at the start of the user agent.
"nextopia" => array(
    // Generic icon: this entry must not reuse the NewzCrawler icon/title.
    "icon" => "robot",
    "title" => "Nextopia",
    "rule" => array(
        // Version is the digit run following a "v" or a space.
        "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
3839     "ngsearch" => array(
3840     "icon" => "ngsearch",
3841     "title" => "NG Search",
3842     "rule" => array(
3843     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3844     ),
3845     "uri" => ""
3846     ),
3847     "nimble" => array(
3848     "icon" => "robot",
3849     "title" => "Nimble",
3850     "rule" => array(
3851     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3852     ),
3853     "uri" => ""
3854     ),
3855     "nmap" => array(
3856     "icon" => "nmap",
3857     "title" => "Nmap",
3858     "rule" => array(
3859     "Nmap Scripting Engine" => ""
3860     ),
3861     "uri" => "http://nmap.org/book/nse.html"
3862     ),
3863     "nusearch" => array(
3864     "icon" => "robot",
3865     "title" => "NuSearch",
3866     "rule" => array(
3867     "^nuSearch" => ""
3868     ),
3869     "uri" => "http://www.nusearch.com/"
3870     ),
3871     "noago" => array(
3872     "icon" => "noago",
3873     "title" => "Noago",
3874     "rule" => array(
3875     "Noago Spider" => ""
3876     ),
3877     "uri" => "http://www.noago.com/"
3878     ),
3879     "noviforum" => array(
3880     "icon" => "noviforum",
3881     "title" => "Noviforum",
3882     "rule" => array(
3883     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3884     ),
3885     "uri" => ""
3886     ),
3887     "noxtrum" => array(
3888     "icon" => "noxtrum",
3889     "title" => "noXtrum",
3890     "rule" => array(
3891     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3892     ),
3893     "uri" => ""
3894     ),
3895     "noyona" => array(
3896     "icon" => "robot",
3897     "title" => "Noyona",
3898     "rule" => array(
3899     "noyona.([0-9._]{1,10})" => "\\1"
3900     ),
3901     "uri" => "http://noyona.com/"
3902     ),
3903     "nsauditor" => array(
3904     "icon" => "nsauditor",
3905     "title" => "Nsauditor",
3906     "rule" => array(
3907     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3908     ),
3909     "uri" => "http://www.nsauditor.com/"
3910     ),
3911     "obidosbot" => array(
3912     "icon" => "robot",
3913     "title" => "Bookwatch",
3914     "rule" => array(
3915     "obidos[ \-]?bot" => ""
3916     ),
3917     "uri" => ""
3918     ),
3919     "objectssearch" => array(
3920     "icon" => "robot",
3921     "title" => "Objects Search",
3922     "rule" => array(
3923     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3924     ),
3925     "uri" => ""
3926     ),
3927     "obot" => array(
3928 matthys 297 "icon" => "ibm",
3929     "title" => "IBM (ONLY) Crawler",
3930 joku 63 "rule" => array(
3931 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3932 joku 63 ),
3933 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3934     // Previously from "ONLY Solutions GmbH" – that is what the "O" stands for
3935 joku 63 ),
3936     "ocawa" => array(
3937     "icon" => "ocawa",
3938     "title" => "Ocawa",
3939     "rule" => array(
3940     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3941     "Ocawa" => ""
3942     ),
3943     "uri" => "http://www.ocawa.com/"
3944     ),
3945     "octora" => array(
3946     "icon" => "octora",
3947     "title" => "Octora",
3948     "rule" => array(
3949     "^Octora (Beta)?" => ""
3950     ),
3951     "uri" => "http://www.octora.com/"
3952     ),
3953     "offlineexplorer" => array(
3954     "icon" => "robot",
3955     "title" => "OfflineExplorer",
3956     "rule" => array(
3957     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3958     ),
3959     "uri" => ""
3960     ),
3961     "omea" => array(
3962     "icon" => "omea",
3963     "title" => "Omea Reader",
3964     "rule" => array(
3965     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3966     ),
3967     "uri" => ""
3968     ),
3969     "onet" => array(
3970     "icon" => "onet",
3971     "title" => "Onet",
3972     "rule" => array(
3973     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
3974     "Onet\.pl" => "",
3975     "inktomi.search.onet" => ""
3976     ),
3977     "uri" => "http://www.onet.pl"
3978     ),
3979     "online24" => array(
3980     "icon" => "robot",
3981 matthys 209 "title" => "Online24",
3982 joku 63 "rule" => array(
3983     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
3984     ),
3985     "uri" => "http://www.online24.de"
3986     ),
3987     "onlinewebcheck" => array(
3988     "icon" => "csehtmlvalidator",
3989     "title" => "CSE HTML Validator",
3990     "rule" => array(
3991     "onlinewebcheck" => ""
3992     ),
3993     "uri" => "http://www.onlinewebcheck.com"
3994     ),
3995     "onsearch" => array(
3996     "icon" => "onsearch",
3997 matthys 209 "title" => "OnSearch",
3998 joku 63 "rule" => array(
3999     "^onCHECK-Robot" => ""
4000     ),
4001     "uri" => "http://www.onsearch.de"
4002     ),
4003     "onto" => array(
4004     "icon" => "robot",
4005     "title" => "OntoSpider",
4006     "rule" => array(
4007     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
4008     ),
4009     "uri" => "http://ontospider.i-n.info/"
4010     ),
4011     "openacoon" => array(
4012     "icon" => "robot",
4013     "title" => "OpenAcoon",
4014     "rule" => array(
4015     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
4016     ),
4017     "uri" => "http://www.openacoon.de/"
4018     ),
4019     "openfind" => array(
4020     "icon" => "openfind",
4021     "title" => "Openfind",
4022     "rule" => array(
4023     "openbot[ /]([0-9.]{1,10})" => "\\1",
4024     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4025     ),
4026     "uri" => ""
4027     ),
4028     "opentagger" => array(
4029     "icon" => "robot",
4030     "title" => "OpenTagger",
4031     "rule" => array(
4032     "^OpenTaggerBot" => ""
4033     ),
4034     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4035     ),
4036     "opentext" => array(
4037     "icon" => "opentext",
4038     "title" => "OpenText",
4039     "rule" => array(
4040     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4041     ),
4042     "uri" => "http://www.opentext.net/"
4043     ),
4044     "openweb" => array(
4045     "icon" => "robot",
4046     "title" => "OpenWebSpider",
4047     "rule" => array(
4048     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4049     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4050     ),
4051     "uri" => "http://www.openwebspider.org"
4052     ),
4053     "openx" => array(
4054     "icon" => "openx",
4055     "title" => "OpenX Spider",
4056     "rule" => array(
4057     "OpenX" => ""
4058     ),
4059     "uri" => "http://www.openx.org"
4060     ),
4061     "orange" => array(
4062     "icon" => "orange",
4063     "title" => "Orange",
4064     "rule" => array(
4065 joku 338 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4066     "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4067 joku 63 ),
4068     "uri" => "http://orange.com/"
4069     ),
4070     "organica" => array(
4071     "icon" => "robot",
4072     "title" => "Organica",
4073     "rule" => array(
4074     "crawler@organica\.us" => ""
4075     ),
4076     "uri" => ""
4077     ),
4078     "outfox" => array(
4079     "icon" => "robot",
4080     "title" => "Outfox Melon",
4081     "rule" => array(
4082     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4083     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4084     ),
4085     "uri" => ""
4086     ),
4087     "overture" => array(
4088     "icon" => "overture",
4089     "title" => "Overture",
4090     "rule" => array(
4091     "Overture[ \-]?WebCrawler" => ""
4092     ),
4093     "uri" => ""
4094     ),
4095 joku 337 "owler" => array(
4096     "icon" => "robot",
4097     "title" => "Owler",
4098     "rule" => array(
4099     "Owler[ /]([0-9.]{1,10})" => "\\1",
4100     "Owler" => ""
4101     ),
4102     "uri" => ""
4103     ),
4104 joku 63 "page2rss" => array(
4105     "icon" => "page2rss",
4106     "title" => "Page2RSS",
4107     "rule" => array(
4108     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4109     ),
4110     "uri" => "http://page2rss.com"
4111     ),
4112     "pagebytes" => array(
4113     "icon" => "robot",
4114     "title" => "PageBites",
4115     "rule" => array(
4116     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4117     ),
4118     "uri" => ""
4119     ),
4120 matthys 282 "pagesinventory" => array(
4121     "icon" => "pagesinventory",
4122     "title" => "PagesInventory",
4123     "rule" => array(
4124     "^PagesInventory" => ""
4125     ),
4126     "uri" => "http://www.pagesinventory.com"
4127     ),
4128 joku 63 "pagesjaunes" => array(
4129     "icon" => "pagesjaunes",
4130     "title" => "Pages Jaunes",
4131     "rule" => array(
4132     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4133     ),
4134     "uri" => "http://www.pagesjaunes.fr/"
4135     ),
4136     "pagevalet" => array(
4137     "icon" => "wdg",
4138     "title" => "WDG Page Valet",
4139     "rule" => array(
4140     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4141     ),
4142     "uri" => "http://www.htmlhelp.com/tools/validator/"
4143     ),
4144     "panopeabot" => array(
4145     "icon" => "robot",
4146     "title" => "PanopeaBot",
4147     "rule" => array(
4148     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4149     ),
4150     "uri" => ""
4151     ),
4152     "parchmenthill" => array(
4153     "icon" => "robot",
4154     "title" => "Parchment Hill",
4155     "rule" => array(
4156     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4157     ),
4158     "uri" => "http://www.parchmenthill.com/search.htm"
4159     ),
// Panscient: the array key and icon keep the historical "pascient" spelling
// so existing references stay valid; only the displayed title is corrected.
"pascient" => array(
    "icon" => "pascient",
    "title" => "Panscient",
    "rule" => array(
        "panscient.com" => ""
    ),
    "uri" => "http://www.panscient.com/"
),
4168     "peerbot" => array(
4169     "icon" => "peerbot",
4170     "title" => "Peerbot",
4171     "rule" => array(
4172     "^PEERbot" => ""
4173     ),
4174     "uri" => ""
4175     ),
4176 matthys 389 "petalbot" => array(
4177     "icon" => "huawei",
4178     "title" => "PetalBot", // Huawei Search - also called Aspiegel
4179     "rule" => array(
4180     "PetalBot" => "",
4181     "AspiegelBot" => ""
4182     ),
4183     "uri" => "https://aspiegel.com/petalbot"
4184     ),
4185 joku 63 "php" => array(
4186     "icon" => "php",
4187     "title" => "PHP",
4188     "rule" => array(
4189     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4190     ),
4191     "uri" => ""
4192     ),
4193     "phpcrawl" => array(
4194     "icon" => "robot",
4195     "title" => "PHPCrawl",
4196     "rule" => array(
4197     "^PHPCrawl" => ""
4198     ),
4199     "uri" => "http://phpcrawl.cuab.de/"
4200     ),
4201     "phpdig" => array(
4202     "icon" => "robot",
4203     "title" => "PhpDig",
4204     "rule" => array(
4205     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4206     ),
4207     "uri" => "http://www.finbot.com/"
4208     ),
4209     "phpversiontracker" => array(
4210     "icon" => "phpversiontracker",
4211     "title" => "PHP version tracker",
4212     "rule" => array(
4213     "^PHP version tracker" => ""
4214     ),
4215     "uri" => "http://www.nexen.net/phpversion/bot.php"
4216     ),
// PictureOfInternet: matched at the start of the user agent.
"pictureofinternet" => array(
    "icon" => "robot",
    "title" => "PictureOfInternet",
    "rule" => array(
        // Report the captured version instead of discarding it.
        "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => ""
),
4225     "pingdom" => array(
4226     "icon" => "pingdom",
4227     "title" => "Pingdom",
4228     "rule" => array(
4229     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4230     "^Pingdom" => ""
4231     ),
4232     "uri" => "http://www.pingdom.com/"
4233     ),
4234     "pinseri" => array(
4235     "icon" => "pinseri",
4236     "title" => "Pinseri",
4237     "rule" => array(
4238     "www\.pinseri\.com/bloglist" => ""
4239     ),
4240     "uri" => ""
4241     ),
// Plagger feed aggregator.
"plagger" => array(
    "icon" => "plagger",
    "title" => "Plagger",
    "rule" => array(
        "Plagger[ /]([0-9.]{1,10})" => "\\1"
    ),
    // Host name spelled like the product ("plagger", not "plugger").
    "uri" => "http://www.plagger.org"
),
4250     "planet" => array(
4251     "icon" => "planet",
4252     "title" => "Planet",
4253     "rule" => array(
4254     "Planet[ /]([0-9.]{1,10})" => "\\1"
4255     ),
4256     "uri" => ""
4257     ),
4258     "plantynet" => array(
4259     "icon" => "robot",
4260     "title" => "PlantyNet",
4261     "rule" => array(
4262     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4263     ),
4264     "uri" => ""
4265     ),
4266     "pluck" => array(
4267     "icon" => "pluck",
4268     "title" => "Pluck",
4269     "rule" => array(
4270     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4271     ),
4272     "uri" => ""
4273     ),
4274     "plsearch" => array(
4275     "icon" => "plsearch",
4276     "title" => "PlanetSearch",
4277     "rule" => array(
4278     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4279     ),
4280     "uri" => ""
4281     ),
4282     "poe" => array(
4283     "icon" => "robot",
4284     "title" => "POE-Component",
4285     "rule" => array(
4286     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4287     ),
4288     "uri" => ""
4289     ),
4290     "pogodak" => array(
4291     "icon" => "pogodak",
4292     "title" => "Pogodak",
4293     "rule" => array(
4294     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4295     ),
4296     "uri" => ""
4297     ),
// Poodle predictor: accepts both the "Poodle" and "Pooodle" spellings.
"poodle" => array(
    "icon" => "robot",
    "title" => "Poodle predictor",
    "rule" => array(
        // Group 1 is the (oo|ooo) spelling variant; the version number is
        // group 2, so that is the one to report.
        "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2",
        // Fallback when no version follows the name.
        "P(oo|ooo)dle[ \-]?predictor" => ""
    ),
    "uri" => "http://www.gritechnologies.com/tools/spider.go"
),
4307     "pompos" => array(
4308     "icon" => "pompos",
4309     "title" => "Pompos",
4310     "rule" => array(
4311     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4312     ),
4313     "uri" => ""
4314     ),
4315     "popdex" => array(
4316     "icon" => "robot",
4317     "title" => "Popdexter",
4318     "rule" => array(
4319     "Popdexter" => ""
4320     ),
4321     "uri" => ""
4322     ),
4323     "postrank" => array(
4324     "icon" => "postrank",
4325     "title" => "PostRank",
4326     "rule" => array(
4327     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4328     ),
4329     "uri" => "http://www.postrank.com/"
4330     ),
4331     "powermarks" => array(
4332     "icon" => "robot",
4333     "title" => "Powermarks",
4334     "rule" => array(
4335     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4336     ),
4337     "uri" => ""
4338     ),
// Pinterest crawler.
"pinterest" => array(
    "icon" => "pinterest",
    // Title names this bot; "PROBE!" belongs to the separate "probe" entry.
    "title" => "Pinterest",
    "rule" => array(
        "Pinterest[ /]([0-9.]{1,10})" => "\\1"
    ),
    "uri" => "http://www.pinterest.com/"
),
4347 matthys 366 "probe" => array(
4348     "icon" => "robot",
4349     "title" => "PROBE!",
4350     "rule" => array(
4351     "^PROBE!" => ""
4352     ),
4353     "uri" => ""
4354     ),
4355 joku 63 "projecthoneypot" => array(
4356     "icon" => "projecthoneypot",
4357     "title" => "Project Honeypot",
4358     "rule" => array(
4359     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4360     "projecthoneypot" => ""
4361     ),
4362     "uri" => "http://www.projecthoneypot.org"
4363     ),
4364     "proxycache" => array(
4365     "icon" => "robot",
4366     "title" => "Proxy Cache",
4367     "rule" => array(
4368     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4369     ),
4370     "uri" => ""
4371     ),
4372     "proxyhunter" => array(
4373     "icon" => "robot",
4374     "title" => "ProxyHunter",
4375     "rule" => array(
4376     "ProxyHunter" => ""
4377     ),
4378     "uri" => ""
4379     ),
4380     "psbot" => array(
4381     "icon" => "picsearch",
4382     "title" => "PicSearch",
4383     "rule" => array(
4384     "^psbot" => ""
4385     ),
4386     "uri" => ""
4387     ),
4388     "pubsub" => array(
4389     "icon" => "pubsub",
4390     "title" => "PubSub",
4391     "rule" => array(
4392     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4393     "^PubSub\.com" => ""
4394     ),
4395     "uri" => ""
4396     ),
4397 joku 330 "pubarch" => array(
4398 joku 334 "icon" => "robot",
4399 joku 330 "title" => "PubArchive",
4400     "rule" => array(
4401     "publiclibraryarchive.org" => ""
4402     ),
4403     "uri" => ""
4404     ),
4405 joku 63 "pukiwiki" => array(
4406     "icon" => "pukiwiki",
4407     "title" => "PukiWiki",
4408     "rule" => array(
4409     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4410     ),
4411     "uri" => ""
4412     ),
4413     "pwebotxy" => array(
4414     "icon" => "pwebotxy",
4415     "title" => "PWeBot/X.Y",
4416     "rule" => array(
4417     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4418     ),
4419     "uri" => "http://www.programacionweb.net/robot.php"
4420     ),
4421     "pxys" => array(
4422     "icon" => "robot",
4423     "title" => "PXYS",
4424     "rule" => array(
4425     "^pxys" => ""
4426     ),
4427     "uri" => ""
4428     ),
// Qango: matched by "Qango.com" at the start of the user agent.
"qango" => array(
    "icon" => "qango",
    "title" => "Qango",
    "rule" => array(
        "^Qango.com" => ""
    ),
    // Host spelled like the name in the rule above ("qango", not "quango").
    "uri" => "http://www.qango.com/"
),
4437     "qihoo" => array(
4438     "icon" => "qihoo",
4439     "title" => "Qihoo",
4440     "rule" => array(
4441     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4442     ),
4443     "uri" => "http://www.qihoo.com/"
4444     ),
4445     "qseero" => array(
4446     "icon" => "robot",
4447     "title" => "Qseero",
4448     "rule" => array(
4449     "Qseero v([0-9.]{1,10})" => "\\1"
4450     ),
4451     "uri" => "http://www.q0.com/"
4452     ),
4453     "quantcast" => array(
4454     "icon" => "robot",
4455     "title" => "Quantcast",
4456     "rule" => array(
4457     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4458     ),
4459     "uri" => "http://www.quantcast.com/"
4460     ),
4461     "quepasa" => array(
4462     "icon" => "quepasa",
4463     "title" => "Quepasa",
4464     "rule" => array(
4465     "Quepasa[ \-]?Creep" => ""
4466     ),
4467     "uri" => ""
4468     ),
4469     "questfinder" => array(
4470     "icon" => "robot",
4471     "title" => "QuestFinder",
4472     "rule" => array(
4473     "www\.questfinder\.com" => ""
4474     ),
4475     "uri" => ""
4476     ),
4477 matthys 351 "qwantify" => array(
4478     "icon" => "qwantify",
4479     "title" => "Qwantify",
4480     "rule" => array(
4481     "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4482     ),
4483     "uri" => "https://www.qwant.com/"
4484     ),
4485 joku 63 "qweery" => array(
4486     "icon" => "robot",
4487     "title" => "Qweery",
4488     "rule" => array(
4489     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4490     ),
4491     "uri" => "http://qweerybot.qweery.nl"
4492     ),
// RacaiCrawler: version follows the name after a space or a dash.
"racaicrawler" => array(
    "icon" => "robot",
    "title" => "RacaiCrawler",
    "rule" => array(
        "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
    ),
    // No known homepage; the key is present so every entry has the same shape.
    "uri" => ""
),
4500     "radian6" => array(
4501     "icon" => "robot",
4502     "title" => "Radian6",
4503     "rule" => array(
4504     "www\.radian6\.com" => ""
4505     ),
4506     "uri" => "http://www.radian6.com"
4507     ),
// Radio.fx client.
"radiofx" => array(
    "icon" => "radiofx",
    "title" => "Radio.fx",
    "rule" => array(
        "Radio.fx" => ""
    ),
    // Fixed top-level domain typo ("softwarw" -> "software").
    "uri" => "https://de.tobit.software"
),
4516 joku 63 "rambler" => array(
4517     "icon" => "rambler",
4518     "title" => "Rambler",
4519     "rule" => array(
4520     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4521     ),
4522     "uri" => ""
4523     ),
// Ramiba: matched by "ramiba" or "ramiba-bot" at the start of the user agent.
"ramiba" => array(
    "icon" => "robot",
    "title" => "Ramiba",
    "rule" => array(
        // The only group is the optional "-bot" suffix, not a version,
        // so no version is reported.
        "^ramiba(-bot)?" => ""
    ),
    "uri" => ""
),
4532     "rankur" => array(
4533     "icon" => "rankur",
4534     "title" => "Rankur",
4535     "rule" => array(
4536     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4537     ),
4538     "uri" => "http://rankur.com/",
4539     ),
4540 joku 261 "red" => array(
4541     "icon" => "red",
4542     "title" => "RED",
4543     "rule" => array(
4544     "RED[ /]([0-9.]{1,10})" => "\\1"
4545     ),
4546     "uri" => "http://redbot.org/"
4547 joku 181 ),
4548 joku 63 "rediff" => array(
4549     "icon" => "rediff",
4550 matthys 209 "title" => "Rediff",
4551 joku 63 "rule" => array(
4552     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4553     ),
4554     "uri" => "http://www.rediff.com",
4555     ),
4556     "repia" => array(
4557     "icon" => "robot",
4558     "title" => "Repia",
4559     "rule" => array(
4560     "webmaster@repia\.com" => ""
4561     ),
4562     "uri" => ""
4563     ),
4564     "robotgenius" => array(
4565     "icon" => "robot",
4566     "title" => "Robot Genius",
4567     "rule" => array(
4568     "^robotgenius" => ""
4569     ),
4570     "uri" => "http://robotgenius.net",
4571     ),
4572     "robozilla" => array(
4573     "icon" => "robot",
4574     "title" => "Robozilla",
4575     "rule" => array(
4576     "Robozilla" => ""
4577     ),
4578     "uri" => ""
4579     ),
4580 matthys 302 "rogerbot" => array(
4581 matthys 306 "icon" => "moz",
4582     "title" => "Moz Rogerbot",
4583 matthys 302 "rule" => array(
4584     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4585     ),
4586     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4587     ),
4588 joku 63 "rojo" => array(
4589     "icon" => "rojo",
4590     "title" => "Rojo",
4591     "rule" => array(
4592     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4593     ),
4594     "uri" => ""
4595     ),
4596     "rss-atom" => array(
4597     "icon" => "rss",
4598     "title" => "RSS / Atom",
4599     "rule" => array(
4600     "^Apple-PubSub" => "",
4601     "^AppleSyndication" => ""
4602     ),
4603     "uri" => ""
4604     ),
4605     "rssbot" => array(
4606     "icon" => "rss",
4607 matthys 209 "title" => "RSS-bot",
4608 joku 63 "rule" => array(
4609     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4610     ),
4611     "uri" => ""
4612     ),
4613     "rssbandit" => array(
4614     "icon" => "rssbandit",
4615     "title" => "RssBandit",
4616     "rule" => array(
4617     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4618     ),
4619     "uri" => ""
4620     ),
4621     "rssimages" => array(
4622     "icon" => "rss",
4623 matthys 209 "title" => "RssImages",
4624 joku 63 "rule" => array(
4625     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4626     ),
4627     "uri" => ""
4628     ),
4629     "rssmicro" => array(
4630     "icon" => "rssmicro",
4631     "title" => "RSSMicro",
4632     "rule" => array(
4633     "RSSMicro\.com" => ""
4634     ),
4635     "uri" => "http://www.rssmicro.com"
4636     ),
4637     "rssowl" => array(
4638     "icon" => "rssowl",
4639     "title" => "RSSOwl",
4640     "rule" => array(
4641     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4642     ),
4643     "uri" => ""
4644     ),
4645     "rssreader" => array(
4646     "icon" => "rss",
4647     "title" => "RssReader",
4648     "rule" => array(
4649     "RssReader[ /]([0-9.]{1,10})" => "\\1" // report the captured version, like the sibling RSS reader rules
4650     ),
4651     "uri" => ""
4652     ),
4653     "rtgi" => array(
4654     "icon" => "rtgi",
4655 matthys 209 "title" => "Rtgi",
4656 joku 63 "rule" => array(
4657     "RTGI" => ""
4658     ),
4659     "uri" => "http://rtgi.fr/"
4660     ),
4661     "rufusbot" => array(
4662     "icon" => "robot",
4663     "title" => "RufusBot",
4664     "rule" => array(
4665     "RufusBot" => ""
4666     ),
4667     "uri" => ""
4668     ),
4669 matthys 304 "runet" => array(
4670     "icon" => "runet",
4671     "title" => "iTrack RuNet Crawler",
4672     "rule" => array(
4673     "Runet-Research-Crawler" => ""
4674     ),
4675     "uri" => "http://www.itrack.ru/research/cmsrate/"
4676     ),
4677 joku 63 "runnk" => array(
4678     "icon" => "robot",
4679     "title" => "Runnk",
4680     "rule" => array(
4681     "Runnk RSS finder" => ""
4682     ),
4683     "uri" => "http://www.runnk.com/il/law"
4684     ),
4685     "sagool" => array(
4686     "icon" => "robot",
4687     "title" => "Sagool",
4688     "rule" => array(
4689     "MaSagool" => ""
4690     ),
4691     "uri" => "http://sagool.jp/"
4692     ),
4693     "sanszbot" => array(
4694     "icon" => "robot",
4695     "title" => "Sansz",
4696     "rule" => array(
4697     "SanszBot" => ""
4698     ),
4699     "uri" => ""
4700     ),
4701     "saucereader" => array(
4702     "icon" => "saucereader",
4703     "title" => "Sauce Reader",
4704     "rule" => array(
4705     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4706     ),
4707     "uri" => ""
4708     ),
4709     "sbider" => array(
4710     "icon" => "sbider",
4711     "title" => "SBIder",
4712     "rule" => array(
4713     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4714     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4715     ),
4716     "uri" => ""
4717     ),
4718     "scirus" => array(
4719     "icon" => "robot",
4720     "title" => "Scirus",
4721     "rule" => array(
4722     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4723     ),
4724     "uri" => ""
4725     ),
4726     "scoutjet" => array(
4727     "icon" => "scoutjet",
4728     "title" => "ScoutJet",
4729     "rule" => array(
4730     "ScoutJet" => ""
4731     ),
4732     "uri" => "http://www.scoutjet.com/"
4733     ),
4734 joku 261 "scrapy" => array(
4735     "icon" => "scrapy",
4736     "title" => "Scrapy",
4737     "rule" => array(
4738     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4739     ),
4740     "uri" => "http://scrapy.org"
4741     ),
4742 joku 63 "scrubby" => array(
4743     "icon" => "scrubby",
4744     "title" => "Scrubby",
4745     "rule" => array(
4746     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4747     ),
4748     "uri" => ""
4749     ),
4750     "sdm" => array(
4751     "icon" => "sdm",
4752     "title" => "SUN Download Manager",
4753     "rule" => array(
4754     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4755     ),
4756     "uri" => ""
4757     ),
4758     "sealinks" => array(
4759     "icon" => "robot",
4760     "title" => "Sea Links",
4761     "rule" => array(
4762     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4763     ),
4764     "uri" => ""
4765     ),
4766     "search17" => array(
4767     "icon" => "robot",
4768     "title" => "Search 17",
4769     "rule" => array(
4770     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4771     ),
4772     "uri" => "http://www.search17.com/bot.php"
4773     ),
4774     "search2" => array(
4775     "icon" => "search2",
4776     "title" => "Search2.net",
4777     "rule" => array(
4778     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4779     ),
4780     "uri" => "http://search2.net/"
4781     ),
4782     "searchbot" => array(
4783     "icon" => "robot",
4784     "title" => "Searchbot",
4785     "rule" => array(
4786     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4787     ),
4788     "uri" => ""
4789     ),
4790     "searchch" => array(
4791     "icon" => "robot",
4792     "title" => "Search.ch",
4793     "rule" => array(
4794     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4795     ),
4796     "uri" => ""
4797     ),
4798     "searchengineworld" => array(
4799     "icon" => "robot",
4800     "title" => "SearchEngineWorld",
4801     "rule" => array(
4802     "searchengineworld" => ""
4803     ),
4804     "uri" => "http://www.searchengineworld.com/"
4805     ),
4806     "searchhippo" => array(
4807     "icon" => "searchhippo",
4808     "title" => "Searchhippo",
4809     "rule" => array(
4810     "searchhippo" => ""
4811     ),
4812     "uri" => "http://www.searchhippo.com/"
4813     ),
4814     "searchthruus" => array(
4815     "icon" => "robot",
4816     "title" => "SearchThruUs",
4817     "rule" => array(
4818     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4819     ),
4820     "uri" => ""
4821     ),
4822     "securecomputing" => array(
4823     "icon" => "robot",
4824     "title" => "Secure Computing",
4825     "rule" => array(
4826     "securecomputing" => ""
4827     ),
4828     "uri" => ""
4829     ),
4830     "seekport" => array(
4831     "icon" => "seekport",
4832     "title" => "Seekport",
4833     "rule" => array(
4834     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4835     ),
4836     "uri" => ""
4837     ),
4838     "semanticdiscovery" => array(
4839     "icon" => "robot",
4840     "title" => "Semantic Discovery",
4841     "rule" => array(
4842     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4843     ),
4844     "uri" => ""
4845     ),
4846 matthys 319 "semrush" => array(
4847     "icon" => "semrush",
4848     "title" => "SEMrush",
4849     "rule" => array(
4850     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4851     ),
4852     "uri" => "http://www.semrush.com/bot.html"
4853     ),
4854 joku 63 "sengine" => array(
4855     "icon" => "sengine",
4856     "title" => "Sengine",
4857     "rule" => array(
4858     "netEstate NE Crawler" => ""
4859     ),
4860     "uri" => "http://www.sengine.info/"
4861     ),
4862     "sensis" => array(
4863     "icon" => "sensis",
4864     "title" => "Sensis",
4865     "rule" => array(
4866     "^Sensis(.com.au)? Web Crawler" => ""
4867     ),
4868     "uri" => "http://sensis.com.au"
4869     ),
4870     "seokicks" => array(
4871     "icon" => "seokicks",
4872     "title" => "SEOkicks",
4873     "rule" => array(
4874     "SEOkicks-Robot" => ""
4875     ),
4876     "uri" => "http://www.seokicks.de/"
4877     ),
4878     "seoprofiler" => array(
4879     "icon" => "seoprofiler",
4880     "title" => "SEOprofiler",
4881     "rule" => array(
4882     "spbot[ /]([0-9.]{1,10})" => "\\1"
4883     ),
4884     "uri" => "http://www.seoprofiler.com/"
4885     ),
4886     "setooz" => array(
4887     "icon" => "setooz",
4888     "title" => "Setooz",
4889     "rule" => array(
4890     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4891     ),
4892     "uri" => "http://www.setooz.com/oozbot.html"
4893     ),
4894     "seznam" => array(
4895     "icon" => "seznam",
4896     "title" => "Seznam",
4897     "rule" => array(
4898     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4899     "Seznam" => ""
4900     ),
4901     "uri" => "http://www.seznam.cz"
4902     ),
4903     "sharpreader" => array(
4904     "icon" => "sharpreader",
4905     "title" => "SharpReader",
4906     "rule" => array(
4907     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4908     ),
4909     "uri" => ""
4910     ),
4911     "shelob" => array(
4912     "icon" => "shelob",
4913     "title" => "Shelob", // NOTE(review): was "Sherlock Spider", identical to the separate sherlockspider entry - confirm intended display name
4914     "rule" => array(
4915     "^Shelob" => ""
4916     ),
4917     "uri" => "http://www.gmx.net"
4918     ),
4919     "sherlockspider" => array(
4920     "icon" => "robot",
4921     "title" => "Sherlock Spider",
4922     "rule" => array(
4923     "sherlock_spider" => ""
4924     ),
4925     "uri" => ""
4926     ),
4927     "shim" => array(
4928     "icon" => "robot",
4929     "title" => "Shim Crawler",
4930     "rule" => array(
4931     "shim[ \-]crawler" => ""
4932     ),
4933     "uri" => ""
4934     ),
4935     "shopwiki" => array(
4936     "icon" => "shopwiki",
4937     "title" => "ShopWiki",
4938     "rule" => array(
4939     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4940     ),
4941     "uri" => ""
4942     ),
4943     "shoula" => array(
4944     "icon" => "robot",
4945     "title" => "Shoula",
4946     "rule" => array(
4947     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4948     ),
4949     "uri" => "http://www.shoula.com"
4950     ),
4951     "siege" => array(
4952     "icon" => "robot",
4953     "title" => "Siege",
4954     "rule" => array(
4955     "Siege[ /]([0-9.]{1,10})" => "\\1"
4956     ),
4957     "uri" => ""
4958     ),
4959     "siets" => array(
4960     "icon" => "robot",
4961     "title" => "Siets",
4962     "rule" => array(
4963     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4964     ),
4965     "uri" => ""
4966     ),
4967     "simpy" => array(
4968     "icon" => "simpy",
4969     "title" => "Simpy",
4970     "rule" => array(
4971     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4972     ),
4973     "uri" => ""
4974     ),
4975     "singingfish" => array(
4976     "icon" => "singingfish",
4977     "title" => "SingingFish",
4978     "rule" => array(
4979     "asterias[ /]([0-9.]{1,10})" => "\\1",
4980     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
4981     "asterias" => ""
4982     ),
4983     "uri" => ""
4984     ),
4985     "sirketce" => array(
4986     "icon" => "robot",
4987     "title" => "Sirketce",
4988     "rule" => array(
4989     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
4990     ),
4991     "uri" => "http://www.sirketce.com/bot.html"
4992     ),
4993     "sirobot" => array(
4994     "icon" => "robot",
4995     "title" => "SiroBot",
4996     "rule" => array(
4997     "sirobot" => ""
4998     ),
4999     "uri" => ""
5000     ),
5001     "sistrix" => array(
5002     "icon" => "sistrix",
5003     "title" => "SISTRIX",
5004     "rule" => array(
5005     "SISTRIX Crawler" => ""
5006     ),
5007     "uri" => "http://crawler.sistrix.net/"
5008     ),
5009     "sitebar" => array(
5010     "icon" => "sitebar",
5011     "title" => "SiteBar",
5012     "rule" => array(
5013     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
5014     ),
5015     "uri" => ""
5016     ),
5017     "sitebot" => array(
5018     "icon" => "sitebot",
5019     "title" => "SiteBot",
5020     "rule" => array(
5021     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
5022     ),
5023     "uri" => "http://www.sitebot.org/robot/"
5024     ),
5025 matthys 273 "siteexplorer" => array(
5026     "icon" => "siteexplorer",
5027     "title" => "SiteExplorer",
5028     "rule" => array(
5029     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5030     ),
5031     "uri" => "http://siteexplorer.info/"
5032     ),
5033 joku 63 "sitesell" => array(
5034     "icon" => "sitesell",
5035     "title" => "SiteSell",
5036     "rule" => array(
5037     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
5038     ),
5039     "uri" => ""
5040     ),
5041     "sitespider" => array(
5042     "icon" => "robot",
5043     "title" => "SiteSpider",
5044     "rule" => array(
5045     "^SiteSpider" => ""
5046     ),
5047     "uri" => ""
5048     ),
5049     "sitesucker" => array(
5050     "icon" => "sitesucker",
5051     "title" => "SiteSucker",
5052     "rule" => array(
5053     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5054     ),
5055     "uri" => "http://www.sitesucker.us/"
5056     ),
5057     "sitidi" => array(
5058     "icon" => "robot",
5059     "title" => "SitiDi",
5060     "rule" => array(
5061     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5062     ),
5063     "uri" => ""
5064     ),
5065 joku 329 "sixy" => array(
5066     "icon" => "robot",
5067     "title" => "Sixy.ch",
5068     "rule" => array(
5069     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5070     ),
5071     "uri" => "http://sixy.ch"
5072     ),
5073 joku 63 "skaffe" => array(
5074     "icon" => "robot",
5075     "title" => "Skaffe",
5076     "rule" => array(
5077     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5078     ),
5079     "uri" => "http://www.skaffe.com"
5080     ),
5081     "skizzle" => array(
5082     "icon" => "skizzle",
5083     "title" => "Skizzle",
5084     "rule" => array(
5085     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5086     ),
5087     "uri" => "http://www.skizzle.com"
5088     ),
5089     "slider" => array(
5090     "icon" => "robot",
5091     "title" => "Slider",
5092     "rule" => array(
5093     "^Slider[ /]([0-9.]{1,10})" => "\\1"
5094     ),
5095     "uri" => ""
5096     ),
5097     "slugch" => array(
5098     "icon" => "robot",
5099 matthys 209 "title" => "Slugch",
5100 joku 63 "rule" => array(
5101     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5102     ),
5103     "uri" => ""
5104     ),
5105     "smartware" => array(
5106     "icon" => "robot",
5107     "title" => "SmartWareSoft",
5108     "rule" => array(
5109     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5110     ),
5111     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5112     ),
5113     "snookit" => array(
5114     "icon" => "snookit",
5115     "title" => "Snookit",
5116     "rule" => array(
5117     "^snookit" => ""
5118     ),
5119     "uri" => "http://www.snookit.com/"
5120     ),
5121     "snoopy" => array(
5122     "icon" => "robot",
5123     "title" => "Snoopy",
5124     "rule" => array(
5125     "^Snoopy[^0-9]*([0-9.]{1,10})" => "\\1", // [^0-9]* instead of greedy .+ so the whole version is captured, not just its last character
5126     "sna-([0-9.]{1,10})" => "\\1"
5127     ),
5128     "uri" => "http://snoopy.sourceforge.net/"
5129     ),
5130     "snyke" => array(
5131     "icon" => "robot",
5132     "title" => "Snyke",
5133     "rule" => array(
5134     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5135     ),
5136     "uri" => "http://www.snyke.com"
5137     ),
5138     "socialradar" => array(
5139     "icon" => "socialradar",
5140     "title" => "Social Radar",
5141     "rule" => array(
5142     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5143     ),
5144     "uri" => "http://infegy.com/"
5145     ),
5146     "soegning" => array(
5147     "icon" => "soegning",
5148 matthys 209 "title" => "Søgning", // repaired mis-decoded UTF-8 (o with stroke)
5149 joku 63 "rule" => array(
5150     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5151     ),
5152     "uri" => ""
5153     ),
5154     "soft411" => array(
5155     "icon" => "soft411",
5156     "title" => "Soft411",
5157     "rule" => array(
5158     "SOFT411 Directory" => ""
5159     ),
5160     "uri" => ""
5161     ),
5162     "sogou" => array(
5163     "icon" => "sogou",
5164     "title" => "Sogou",
5165     "rule" => array(
5166     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5167     ),
5168     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5169     ),
5170     "sohu" => array(
5171     "icon" => "robot",
5172     "title" => "Sohu",
5173     "rule" => array(
5174     "sohu[ \-](agent|search)" => ""
5175     ),
5176     "uri" => ""
5177     ),
5178     "somewhere" => array(
5179     "icon" => "robot",
5180 matthys 209 "title" => "Somewhere.com",
5181 joku 63 "rule" => array(
5182     "Mozilla\@somewhere\.com" => "" // pattern has no capture group, so there is no version to back-reference
5183     ),
5184     "uri" => "http://www.somewhere.com/"
5185     ),
5186     "sopheus" => array(
5187     "icon" => "robot",
5188     "title" => "Sopheus",
5189     "rule" => array(
5190     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5191     ),
5192     "uri" => "http://www.thenetplanet.com"
5193     ),
5194     "soso" => array(
5195     "icon" => "soso",
5196     "title" => "Soso",
5197     "rule" => array(
5198     "^Soso(image)?spider" => ""
5199     ),
5200     "uri" => "http://help.soso.com/soso-image-spider.htm"
5201     ),
5202     "souppot" => array(
5203     "icon" => "robot",
5204     "title" => "SoupPot",
5205     "rule" => array(
5206     "SoupPotBot" => ""
5207     ),
5208     "uri" => ""
5209     ),
5210     "specificmedia" => array(
5211     "icon" => "specificmedia",
5212     "title" => "Specific Media",
5213     "rule" => array(
5214     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5215     ),
5216     "uri" => ""
5217     ),
5218     "sphider" => array(
5219     "icon" => "sphider",
5220     "title" => "Sphider",
5221     "rule" => array(
5222     "Sphider" => ""
5223     ),
5224     "uri" => "http://www.sphider.eu"
5225     ),
5226     "spinn3r" => array(
5227     "icon" => "robot",
5228     "title" => "Spinn3r",
5229     "rule" => array(
5230     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5231     ),
5232     "uri" => "http://spinn3r.com/robot"
5233     ),
5234     "sproose" => array(
5235     "icon" => "robot",
5236 matthys 209 "title" => "Sproose",
5237 joku 63 "rule" => array(
5238     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5239     ),
5240     "uri" => "http://www.sproose.com/bot.html"
5241     ),
5242     "spurlbot" => array(
5243     "icon" => "robot",
5244     "title" => "SpurlBot",
5245     "rule" => array(
5246     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5247     ),
5248     "uri" => ""
5249     ),
5250     "stardownloader" => array(
5251     "icon" => "stardownloader",
5252     "title" => "Star Downloader",
5253     "rule" => array(
5254     "^Star Downloader( Pro)?" => ""
5255     ),
5256     "uri" => ""
5257     ),
5258     "steeler" => array(
5259     "icon" => "robot",
5260     "title" => "Steeler",
5261     "rule" => array(
5262     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5263     ),
5264     "uri" => ""
5265     ),
5266     "strategicboard" => array(
5267     "icon" => "strategicboard",
5268     "title" => "Strategic Board",
5269     "rule" => array(
5270     "Strategic Board Bot" => ""
5271     ),
5272     "uri" => "http://www.strategicboard.com"
5273     ),
5274     "suchbaer" => array(
5275     "icon" => "robot",
5276 matthys 209 "title" => "Suchbaer.de",
5277 joku 63 "rule" => array(
5278     "^suchbaer\.de" => ""
5279     ),
5280     "uri" => "http://www.suchbaer.de/"
5281     ),
5282     "suchbot" => array(
5283     "icon" => "robot",
5284 matthys 209 "title" => "Suchbot",
5285 joku 63 "rule" => array(
5286     "^suchbot" => ""
5287     ),
5288     "uri" => ""
5289     ),
5290     "suchende" => array(
5291     "icon" => "suchende",
5292 matthys 209 "title" => "Suchen.de",
5293 joku 63 "rule" => array(
5294     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5295     "^gonzo/([0-9.]{1,10})" => "\\1"
5296     ),
5297     "uri" => "http://www.suchen.de/"
5298     ),
5299     "suchknecht" => array(
5300     "icon" => "robot",
5301     "title" => "Suchknecht",
5302     "rule" => array(
5303     "^Suchknecht.at-Robot" => ""
5304     ),
5305     "uri" => "http://www.suchknecht.at/"
5306     ),
5307     "suchpad" => array(
5308     "icon" => "robot",
5309 matthys 209 "title" => "Suchpad",
5310 joku 63 "rule" => array(
5311     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5312     ),
5313     "uri" => "http://www.suchpad.de"
5314     ),
5315     "sunrise" => array(
5316     "icon" => "sunrise",
5317     "title" => "Sunrise",
5318     "rule" => array(
5319     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5320     ),
5321     "uri" => ""
5322     ),
5323     "superbot" => array(
5324     "icon" => "superbot",
5325     "title" => "SuperBot",
5326     "rule" => array(
5327     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5328     ),
5329     "uri" => ""
5330     ),
5331     "surfcontrol" => array(
5332     "icon" => "robot",
5333     "title" => "SurfControl",
5334     "rule" => array(
5335     "SurfControl" => "",
5336     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5337     ),
5338     "uri" => ""
5339     ),
5340     "surfnet" => array(
5341     "icon" => "robot",
5342     "title" => "SURFnet",
5343     "rule" => array(
5344     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5345     ),
5346     "uri" => ""
5347     ),
5348     "surfsafely" => array(
5349     "icon" => "robot",
5350     "title" => "Surfsafely",
5351     "rule" => array(
5352     "Submission Spider at surfsafely.com" => ""
5353     ),
5354     "uri" => "http://www.surfsafely.com"
5355     ),
5356     "surphace" => array(
5357     "icon" => "spherescout",
5358     "title" => "Surphace",
5359     "rule" => array(
5360     "Sphere Scout[^0-9]*([0-9.]{1,10})" => "\\1", // Previously called Sphere Scout; [^0-9]* replaces greedy .+ which left only the last character for the capture
5361     "Surphace.+v([0-9.]{1,10})" => "\\1"
5362     ),
5363     "uri" => "http://www.surphace.com"
5364     ),
5365     "surveybot" => array(
5366     "icon" => "surveybot",
5367     "title" => "Whois Survey",
5368     "rule" => array(
5369     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5370     ),
5371     "uri" => ""
5372     ),
5373     "swoogle" => array(
5374     "icon" => "robot",
5375     "title" => "Swoogle",
5376     "rule" => array(
5377     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5378     ),
5379     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5380     ),
5381     "swse" => array(
5382     "icon" => "robot",
5383     "title" => "SWSE",
5384     "rule" => array(
5385     "sw\.deri\.org" => ""
5386     ),
5387     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5388     ),
5389     "swish-e" => array(
5390     "icon" => "swish-e",
5391     "title" => "Swish-e",
5392     "rule" => array(
5393     "^swish-e" => ""
5394     ),
5395     "uri" => "http://swish-e.org/"
5396     ),
5397     "sygol" => array(
5398     "icon" => "sygol",
5399     "title" => "Sygol",
5400     "rule" => array(
5401     "www.sygol.(com|net)" => ""
5402     ),
5403     "uri" => "http://www.sygol.com"
5404     ),
5405     "syllabs" => array(
5406     "icon" => "syllabs",
5407     "title" => "Syllabs",
5408     "rule" => array(
5409     "Focal[-]([0-9.]{1,10})" => "\\1"
5410     ),
5411     "uri" => "http://www.syllabs.com/crawler.html"
5412     ),
5413     "synapse" => array(
5414     "icon" => "robot",
5415     "title" => "Synapse",
5416     "rule" => array(
5417     " Synapse\)" => ""
5418     ),
5419     "uri" => "http://ws.apache.org/synapse/"
5420     ),
5421     "sync2it" => array(
5422     "icon" => "robot",
5423 matthys 209 "title" => "Sync2it",
5424 joku 63 "rule" => array(
5425     "^\!Susie" => ""
5426     ),
5427     "uri" => "http://www.sync2it.com/bms/susie.php"
5428     ),
5429     "syncit" => array(
5430     "icon" => "robot",
5431 matthys 209 "title" => "Syncit",
5432 joku 63 "rule" => array(
5433     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5434     ),
5435     "uri" => "http://www.syncit.com/"
5436     ),
5437     "syndic8" => array(
5438     "icon" => "syndic8",
5439     "title" => "Syndic8",
5440     "rule" => array(
5441     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5442     ),
5443     "uri" => "http://www.syndic8.com/"
5444     ),
5445     "syndicatie" => array(
5446     "icon" => "robot",
5447     "title" => "Syndicatie.nl",
5448     "rule" => array(
5449     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5450     "Syndicatie\.nl robot;" => ""
5451     ),
5452     "uri" => ""
5453     ),
5454     "synomia" => array(
5455     "icon" => "robot",
5456     "title" => "Synomia",
5457     "rule" => array(
5458     "^SynoBot" => ""
5459     ),
5460     "uri" => ""
5461     ),
5462     "synoo" => array(
5463     "icon" => "robot",
5464     "title" => "SynooBot",
5465     "rule" => array(
5466     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5467     ),
5468     "uri" => ""
5469     ),
5470     "szukacz" => array(
5471     "icon" => "szukacz",
5472     "title" => "Szukacz",
5473     "rule" => array(
5474     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5475     ),
5476     "uri" => ""
5477     ),
5478     "tagoo" => array(
5479     "icon" => "tagoobot",
5480     "title" => "Tagoo",
5481     "rule" => array(
5482     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5483     ),
5484     "uri" => "http://www.tagoo.ru"
5485     ),
5486     "tagword" => array(
5487     "icon" => "tagword",
5488     "title" => "Tagword",
5489     "rule" => array(
5490     "^Tagword" => ""
5491     ),
5492     "uri" => "http://tagword.com/dmoz_survey.php"
5493     ),
5494     "trailfire" => array(
5495     "icon" => "trailfire",
5496     "title" => "Trailfire",
5497     "rule" => array(
5498     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5499     ),
5500     "uri" => "http://trailfire.com"
5501     ),
5502     "tamu" => array(
5503     "icon" => "tamu",
5504     "title" => "Tamu Crawler",
5505     "rule" => array(
5506     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5507     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5508     ),
5509     "uri" => "http://irl.cs.tamu.edu/crawler/"
5510     ),
5511     "taptubot" => array(
5512     "icon" => "taptubot",
5513     "title" => "Taptu",
5514     "rule" => array(
5515     "taptubot" => ""
5516     ),
5517     "uri" => "http://www.taptu.com/corp/taptubot"
5518     ),
5519     "targetseek" => array(
5520     "icon" => "robot",
5521     "title" => "TargetSeek",
5522     "rule" => array(
5523     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5524     ),
5525     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5526     ),
5527     "taw" => array(
5528     "icon" => "taw",
5529     "title" => "TAW",
5530     "rule" => array(
5531     "TAW[ /]([0-9.]{1,10})" => "\\1"
5532     ),
5533     "uri" => "http://www.tawdis.net"
5534     ),
5535     "tcd" => array(
5536     "icon" => "tcd",
5537     "title" => "Trinity College Dublin",
5538     "rule" => array(
5539     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5540     ),
5541     "uri" => "http://www.tcd.ie"
5542     ),
5543     "technorati" => array(
5544     "icon" => "technorati",
5545     "title" => "Technorati",
5546     "rule" => array(
5547     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5548     ),
5549     "uri" => ""
5550     ),
5551     "teleport" => array(
5552     "icon" => "teleport",
5553     "title" => "Teleport",
5554     "rule" => array(
5555     "Teleport[ \-]?Pro" => ""
5556     ),
5557     "uri" => ""
5558     ),
5559     "terrar" => array(
5560     "icon" => "robot",
5561     "title" => "Terrar",
5562     "rule" => array(
5563     "^Fresh Search :: Terrar" => ""
5564     ),
5565     "uri" => ""
5566     ),
5567     "theophrastus" => array(
5568     "icon" => "robot",
5569     "title" => "Theophrastus",
5570     "rule" => array(
5571     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5572     ),
5573     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5574     ),
5575     "thumbnailscz" => array(
5576     "icon" => "robot",
5577 matthys 209 "title" => "Thumbnails.cz",
5578 joku 63 "rule" => array(
5579     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5580     ),
5581     "uri" => ""
5582     ),
5583     "thumbshot" => array(
5584     "icon" => "robot",
5585 matthys 209 "title" => "Thumbshots",
5586 joku 63 "rule" => array(
5587     "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2", // group 1 is the "Version: "/"v" prefix; the version number is group 2
5588     "^thumbshots-de" => ""
5589     ),
5590     "uri" => "http://www.thumbshots.de"
5591     ),
5592     "thunderstone" => array(
5593     "icon" => "thunderstone",
5594     "title" => "Thunderstone",
5595     "rule" => array(
5596     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5597     "search.thunderstone.com" => ""
5598     ),
5599     "uri" => "http://search.thunderstone.com/"
5600     ),
5601     "timbobot" => array(
5602     "icon" => "robot",
5603 matthys 209 "title" => "TimboBot",
5604 joku 63 "rule" => array(
5605     "timboBot" => ""
5606     ),
5607     "uri" => ""
5608     ),
5609     "topsy" => array(
5610     "icon" => "topsy",
5611     "title" => "Topsy",
5612     "rule" => array(
5613     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5614     ),
5615     "uri" => "http://labs.topsy.com/butterfly.html"
5616     ),
5617     "trayce" => array(
5618     "icon" => "robot",
5619 matthys 209 "title" => "Trayce",
5620 joku 63 "rule" => array(
5621     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5622     ),
5623     "uri" => ""
5624     ),
5625     "tricus" => array(
5626     "icon" => "robot",
5627     "title" => "Tricus",
5628     "rule" => array(
5629     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5630     ),
5631     "uri" => ""
5632     ),
5633     "topicblogs" => array(
5634     "icon" => "robot",
5635     "title" => "Topicblogs",
5636     "rule" => array(
5637     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5638     ),
5639     "uri" => ""
5640     ),
5641     "touche" => array(
5642     "icon" => "touche",
5643 matthys 209 "title" => "Touché", // repaired mis-decoded UTF-8 (e with acute accent)
5644 joku 63 "rule" => array(
5645     "^Touche" => ""
5646     ),
5647     "uri" => "http://touche.com.ve"
5648     ),
5649     "tuezilla" => array(
5650     "icon" => "robot",
5651 matthys 209 "title" => "TÜzilla", // repaired mis-decoded UTF-8 (U with diaeresis)
5652 joku 63 "rule" => array(
5653     "tuezilla.de" => ""
5654     ),
5655     "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
5656     ),
5657     "turnitin" => array(
5658     "icon" => "turnitin",
5659     "title" => "Turnitin",
5660     "rule" => array(
5661     "TurnitinBot[ /]([0-9.]{1,10})" => "\\1"
5662     ),
5663     "uri" => ""
5664     ),
5665     "tutorgig" => array(
5666     "icon" => "robot",
5667     "title" => "TutorGig",
5668     "rule" => array(
5669     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5670     ),
5671     "uri" => ""
5672     ),
5673     "twiceler" => array(
5674     "icon" => "cuill",
5675 matthys 209 "title" => "Cuill",
5676 joku 63 "rule" => array(
5677     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5678     "Twiceler" => ""
5679     ),
5680     "uri" => "http://www.cuill.com/twiceler/robot.html"
5681     ),
5682     "twingly" => array(
5683     "icon" => "twingly",
5684     "title" => "Twingly",
5685     "rule" => array(
5686     "Twingly Recon" => ""
5687     ),
5688     "uri" => "http://www.twingly.com/"
5689     ),
5690 matthys 320 "twitter" => array(
5691     "icon" => "twitter",
5692     "title" => "Twitter",
5693     "rule" => array(
5694     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5695     ),
5696     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5697     ),
5698 joku 63 "typepad" => array(
5699     "icon" => "typepad",
5700     "title" => "TypePad",
5701     "rule" => array(
5702     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5703     ),
5704     "uri" => ""
5705     ),
5706     "udmsearch" => array(
5707     "icon" => "robot",
5708     "title" => "UdmSearch",
5709     "rule" => array(
5710     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5711     ),
5712     "uri" => ""
5713     ),
5714     "ukwizz" => array(
5715     "icon" => "ukwizz",
5716     "title" => "UKWizz",
5717     "rule" => array(
5718     "^Mackster.*ukwizz" => ""
5719     ),
5720     "uri" => "http://www.ukwizz.com"
5721     ),
5722     "ultraseek" => array(
5723     "icon" => "robot",
5724     "title" => "Ultraseek",
5725     "rule" => array(
5726     "Ultraseek" => ""
5727     ),
5728     "uri" => ""
5729     ),
5730     "ultraspider" => array(
5731     "icon" => "robot",
5732     "title" => "UltraSpider",
5733     "rule" => array(
5734     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5735     ),
5736     "uri" => "http://www.search.ch"
5737     ),
5738     "umai" => array(
5739     "icon" => "robot",
5740 matthys 209 "title" => "Umai",
5741 joku 63 "rule" => array(
5742     "umai[/ ]([0-9.]{1,10})" => "\\1"
5743     ),
5744     "uri" => ""
5745     ),
5746     "unchaos" => array(
5747     "icon" => "robot",
5748     "title" => "Unchaos",
5749     "rule" => array(
5750     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5751     "unchaos" => ""
5752     ),
5753     "uri" => ""
5754     ),
5755     "unido" => array(
5756     "icon" => "robot",
5757 matthys 209 "title" => "UNIdo",
5758 joku 63 "rule" => array(
5759     "^unido-bot" => "" // pattern has no capture group, so there is no version to reference
5760     ),
5761     "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5762     ),
5763     "updated" => array(
5764     "icon" => "robot",
5765     "title" => "Updated",
5766     "rule" => array(
5767     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5768     ),
5769     "uri" => ""
5770     ),
5771     "uptimebot" => array(
5772     "icon" => "robot",
5773     "title" => "UptimeBot",
5774     "rule" => array(
5775     "^UptimeBot" => ""
5776     ),
5777     "uri" => "http://www.uptimebot.com/"
5778     ),
5779     "urifetch" => array(
5780     "icon" => "robot",
5781     "title" => "URI::Fetch",
5782     "rule" => array(
5783     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5784     ),
5785     "uri" => ""
5786     ),
5787     "urlbase" => array(
5788     "icon" => "robot",
5789     "title" => "URLBase",
5790     "rule" => array(
5791     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5792     ),
5793     "uri" => ""
5794     ),
5795     "urlblaze" => array(
5796     "icon" => "robot",
5797     "title" => "URLBlaze",
5798     "rule" => array(
5799     "^URLBlaze" => ""
5800     ),
5801     "uri" => ""
5802     ),
5803     "urlcontr" => array(
5804     "icon" => "robot",
5805     "title" => "MS URL Control",
5806     "rule" => array(
5807     "Microsoft URL[ \-]?Control" => ""
5808     ),
5809     "uri" => ""
5810     ),
5811     "urlgetfile" => array(
5812     "icon" => "robot",
5813     "title" => "URLGetFile",
5814     "rule" => array(
5815     "^URLGetFile" => ""
5816     ),
5817     "uri" => ""
5818     ),
5819     "urlscope" => array(
5820     "icon" => "robot",
5821     "title" => "UrlScope",
5822     "rule" => array(
5823     "UrlScope" => ""
5824     ),
5825     "uri" => ""
5826     ),
5827     "urltrends" => array(
5828     "icon" => "urltrends",
5829 matthys 209 "title" => "UrlTrends",
5830 joku 63 "rule" => array(
5831     "Snappy/([0-9.]{1,10})" => "\\1",
5832     ),
5833     "uri" => ""
5834     ),
5835     "usww" => array(
5836     "icon" => "usww",
5837 matthys 209 "title" => "USWW",
5838 joku 63 "rule" => array(
5839     "usww\.com" => "",
5840     "Mozilla/5\.0 URL-Spider" => ""
5841     ),
5842     "uri" => "http://www.usww.com/"
5843     ),
5844     "usyd" => array(
5845     "icon" => "robot",
5846     "title" => "USyd-NLP-Spider",
5847     "rule" => array(
5848     "^USyd-NLP-Spider" => ""
5849     ),
5850     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5851     ),
5852     "vagabondo" => array(
5853     "icon" => "wiseguys",
5854     "title" => "WiseGuys",
5855     "rule" => array(
5856     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5857     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5858     ),
5859     "uri" => ""
5860     ),
5861     "unicorn" => array(
5862     "icon" => "w3c",
5863     "title" => "W3C Unicorn",
5864     "rule" => array(
5865     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5866     ),
5867     "uri" => "http://validator.w3.org/unicorn/"
5868     ),
5869     "validator" => array(
5870     "icon" => "w3c",
5871     "title" => "W3C Validator",
5872     "rule" => array(
5873     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5874     ),
5875     "uri" => "http://validator.w3.org/"
5876     ),
5877     "validator.nu" => array(
5878     "icon" => "validatornu",
5879     "title" => "Validator.nu",
5880     "rule" => array(
5881     "^Validator.nu[ /]([0-9.]{1,10})" => "\\1", // group 1 is the version number
5882     "^Validator.nu/LV" => "" // no capture group in this pattern, so no version is referenced
5883     ),
5884     "uri" => "http://validator.nu/"
5885     ),
5886     "verity" => array(
5887     "icon" => "robot",
5888     "title" => "Verity",
5889     "rule" => array(
5890     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5891     "^vspider" => ""
5892     ),
5893     "uri" => "http://www.verity.com/"
5894     ),
5895     "versionsproject" => array(
5896     "icon" => "robot",
5897     "title" => "Versions-project",
5898     "rule" => array(
5899     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5900     ),
5901     "uri" => "http://www.versions-project.org/"
5902     ),
5903     "verticalmatch" => array(
5904     "icon" => "robot",
5905     "title" => "VerticalMatch",
5906     "rule" => array(
5907     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5908     ),
5909     "uri" => "http://www.VerticalMatch.com/"
5910     ),
5911     "verzamelgids" => array(
5912     "icon" => "robot",
5913     "title" => "Verzamelgids",
5914     "rule" => array(
5915     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5916     ),
5917     "uri" => "http://www.verzamelgids.nl/"
5918     ),
5919     "vestris" => array(
5920     "icon" => "vestris",
5921     "title" => "Vestris",
5922     "rule" => array(
5923     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5924     ),
5925     "uri" => "http://alkaline.vestris.com/"
5926     ),
5927     "vindex" => array(
5928     "icon" => "vindex",
5929     "title" => "Vindex",
5930     "rule" => array(
5931     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5932     ),
5933     "uri" => ""
5934     ),
5935     "visvo" => array(
5936     "icon" => "robot",
5937     "title" => "Visvo",
5938     "rule" => array(
5939     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5940     ),
5941     "uri" => "http://www.visvo.com"
5942     ),
5943     "voila" => array(
5944     "icon" => "voila",
5945     "title" => "Voila",
5946     "rule" => array(
5947     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5948     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5949     ),
5950     "uri" => ""
5951     ),
5952     "vonna" => array(
5953     "icon" => "robot",
5954     "title" => "Vonna",
5955     "rule" => array(
5956     "Vonna.com b o t" => ""
5957     ),
5958     "uri" => ""
5959     ),
5960     "vortex" => array(
5961     "icon" => "robot",
5962     "title" => "Vortex",
5963     "rule" => array(
5964     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5965     ),
5966     "uri" => "http://marty.anstey.ca/robots/vortex/"
5967     ),
5968     "w3sitesearch" => array(
5969     "icon" => "w3sitesearch",
5970     "title" => "W3SiteSearch",
5971     "rule" => array(
5972     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
5973     ),
5974     "uri" => "http://www.w3sitesearch.de"
5975     ),
5976     "wagger" => array(
5977     "icon" => "robot",
5978     "title" => "Wagger",
5979     "rule" => array(
5980     "^Waggr" => ""
5981     ),
5982     "uri" => "http://www.waggr.com/"
5983     ),
5984     "wanadoo" => array(
5985     "icon" => "robot",
5986     "title" => "Wanadoo",
5987     "rule" => array(
5988     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
5989     ),
5990     "uri" => "http://www.wanadoo.fr/"
5991     ),
5992     "wapalizer" => array(
5993     "icon" => "robot",
5994     "title" => "Wapalizer",
5995     "rule" => array(
5996     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
5997     ),
5998     "uri" => "http://www.wapdrive.com/"
5999     ),
6000     "watson" => array(
6001     "icon" => "addy",
6002     "title" => "Dr.Watson",
6003     "rule" => array(
6004     "Watson[ /]([0-9.]{1,10})" => "\\1",
6005     "watson\.addy\.com" => ""
6006     ),
6007     "uri" => ""
6008     ),
6009     "wavefire" => array(
6010     "icon" => "robot",
6011     "title" => "Wavefire",
6012     "rule" => array(
6013     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
6014     ),
6015     "uri" => ""
6016     ),
6017     "waypath" => array(
6018     "icon" => "waypath",
6019     "title" => "Waypath",
6020     "rule" => array(
6021     "Waypath[ \-]?Scout" => "",
6022     "Waypath (development )?crawler" => ""
6023     ),
6024     "uri" => ""
6025     ),
6026     "wauuu" => array(
6027     "icon" => "wauuu",
6028     "title" => "Wauuu",
6029     "rule" => array(
6030     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the version is the only capture group (group 1)
6031     ),
6032     "uri" => "http://www.wauuu.com"
6033     ),
6034     "wdg" => array(
6035     "icon" => "wdg",
6036     "title" => "WDG Validator",
6037     "rule" => array(
6038     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6039     ),
6040     "uri" => "http://www.htmlhelp.com/tools/validator/"
6041     ),
6042     "webagogo" => array(
6043     "icon" => "webagogo",
6044     "title" => "Webagogo",
6045     "rule" => array(
6046     "^Webagogo" => ""
6047     ),
6048     "uri" => "http://www.webagogo.be/"
6049     ),
6050     "webalta" => array(
6051     "icon" => "webalta",
6052     "title" => "WebAlta",
6053     "rule" => array(
6054     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6055     ),
6056     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6057     ),
6058     "webdigity" => array(
6059     "icon" => "robot",
6060     "title" => "Webdigity Whois Service",
6061     "rule" => array(
6062     "^webdigity whois service" => ""
6063     ),
6064     "uri" => "http://www.webdigity.com/ws"
6065     ),
6066     "webelixir" => array(
6067     "icon" => "webelixir",
6068     "title" => "Webelixir",
6069     "rule" => array(
6070     "^webelixir" => ""
6071     ),
6072     "uri" => "http://www.webelixir.net/"
6073     ),
6074     "webbotru" => array(
6075     "icon" => "robot",
6076     "title" => "Webbot.ru",
6077     "rule" => array(
6078     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6079     ),
6080     "uri" => "http://www.webbot.ru/bot.html"
6081     ),
6082     "webcapture" => array(
6083     "icon" => "robot",
6084     "title" => "WebCapture",
6085     "rule" => array(
6086     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6087     ),
6088     "uri" => ""
6089     ),
6090     "webcollage" => array(
6091     "icon" => "robot",
6092     "title" => "Webcollage",
6093     "rule" => array(
6094     "webcollage" => ""
6095     ),
6096     "uri" => ""
6097     ),
6098     "webcopier" => array(
6099     "icon" => "webcopier",
6100     "title" => "WebCopier",
6101     "rule" => array(
6102     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6103     ),
6104     "uri" => ""
6105     ),
6106     "webcorp" => array(
6107     "icon" => "webcorp",
6108     "title" => "WebCorp",
6109     "rule" => array(
6110     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6111     ),
6112     "uri" => "http://www.webcorp.org.uk/"
6113     ),
6114     "webcrawl" => array(
6115     "icon" => "robot",
6116     "title" => "WebCrawl",
6117     "rule" => array(
6118     "webcrawl\.net" => ""
6119     ),
6120     "uri" => ""
6121     ),
6122     "webdownloader" => array(
6123     "icon" => "robot",
6124     "title" => "Web Downloader",
6125     "rule" => array(
6126     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6127     ),
6128     "uri" => ""
6129     ),
6130     "webfetch" => array(
6131     "icon" => "robot",
6132 matthys 209 "title" => "WebFetch",
6133 joku 63 "rule" => array(
6134     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6135     ),
6136     "uri" => ""
6137     ),
6138     "webfind" => array(
6139     "icon" => "robot",
6140 matthys 209 "title" => "WebFind",
6141 joku 63 "rule" => array(
6142     "^WebFindBot" => ""
6143     ),
6144     "uri" => "http://www.web-find.com"
6145     ),
6146     "webglimpse" => array(
6147     "icon" => "robot",
6148     "title" => "Webglimpse",
6149     "rule" => array(
6150     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6151     ),
6152     "uri" => "http://webglimpse.net"
6153     ),
6154     "webgobbler" => array(
6155     "icon" => "robot",
6156     "title" => "webGobbler",
6157     "rule" => array(
6158     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6159     ),
6160     "uri" => ""
6161     ),
6162     "webimages" => array(
6163     "icon" => "webimages",
6164     "title" => "WebImages",
6165     "rule" => array(
6166     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6167     ),
6168     "uri" => "http://herbert.groot.jebbink.nl/"
6169     ),
6170     "weblight" => array(
6171     "icon" => "robot",
6172     "title" => "WebLight",
6173     "rule" => array(
6174     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6175     ),
6176     "uri" => "http://www.illumit.com/Products/weblight/"
6177     ),
6178     "weblinks" => array(
6179     "icon" => "robot",
6180     "title" => "WebLink's",
6181     "rule" => array(
6182     "^Weblink.s checker" => ""
6183     ),
6184     "uri" => ""
6185     ),
6186     "webmeasurement" => array(
6187     "icon" => "robot",
6188     "title" => "Webmeasurement",
6189     "rule" => array(
6190     "^webmeasurement-bot" => ""
6191     ),
6192     "uri" => "http://rvs.informatik.uni-leipzig.de"
6193     ),
6194     "webminer" => array(
6195     "icon" => "robot",
6196     "title" => "WebMiner",
6197     "rule" => array(
6198     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6199     ),
6200     "uri" => ""
6201     ),
6202     "webmin" => array(
6203     "icon" => "webmin",
6204     "title" => "Webmin",
6205     "rule" => array(
6206     "^webmin" => ""
6207     ),
6208     "uri" => ""
6209     ),
6210     "webmon" => array(
6211     "icon" => "webmon",
6212     "title" => "Webmon",
6213     "rule" => array(
6214     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6215     ),
6216     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6217     ),
6218     "webox" => array(
6219     "icon" => "robot",
6220     "title" => "WeBoX", // stray leading space removed from the title
6221     "rule" => array(
6222     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6223     ),
6224     "uri" => ""
6225     ),
6226     "webpatrol" => array(
6227     "icon" => "webpatrol",
6228     "title" => "WebPatrol",
6229     "rule" => array(
6230     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6231     ),
6232     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6233     ),
6234     "webpix" => array(
6235     "icon" => "webpix",
6236     "title" => "WebPix",
6237     "rule" => array(
6238     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6239     ),
6240     "uri" => ""
6241     ),
6242     "webrace" => array(
6243     "icon" => "robot",
6244     "title" => "WebRACE",
6245     "rule" => array(
6246     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6247     ),
6248     "uri" => ""
6249     ),
6250     "webreaper" => array(
6251     "icon" => "webreaper",
6252     "title" => "WebReaper",
6253     "rule" => array(
6254     "^WebReaper " => ""
6255     ),
6256     "uri" => "http://www.webreaper.net/"
6257     ),
6258     "webresult" => array(
6259     "icon" => "robot",
6260     "title" => "Webresult",
6261     "rule" => array(
6262     "Der webresult\.de Robot" => ""
6263     ),
6264     "uri" => ""
6265     ),
6266     "webring" => array(
6267     "icon" => "robot",
6268     "title" => "Webring Checker",
6269     "rule" => array(
6270     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6271     ),
6272     "uri" => ""
6273     ),
6274     "webripper" => array(
6275     "icon" => "webripper",
6276     "title" => "WebRipper",
6277     "rule" => array(
6278     "^WebRipper" => ""
6279     ),
6280     "uri" => "http://calluna-software.com"
6281     ),
6282     "webscaled" => array(
6283     "icon" => "webscaled",
6284     "title" => "Webscaled",
6285     "rule" => array(
6286     "Swarm" => ""
6287     ),
6288     "uri" => "http://webscaled.com/"
6289     ),
6290     "websearchau" => array(
6291     "icon" => "websearchau",
6292     "title" => "WebSearch.COM.AU",
6293     "rule" => array(
6294     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6295     ),
6296     "uri" => "http://WebSearch.com.au/"
6297     ),
6298     "websearchbench" => array(
6299     "icon" => "robot",
6300     "title" => "WebSearchBench",
6301     "rule" => array(
6302     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6303     ),
6304     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6305     ),
6306     "websense" => array(
6307     "icon" => "websense",
6308     "title" => "Websense",
6309     "rule" => array(
6310     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6311     ),
6312     "uri" => ""
6313     ),
6314     "websiteshadow" => array(
6315     "icon" => "websiteshadow",
6316     "title" => "Websiteshadow",
6317     "rule" => array(
6318     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6319     ),
6320     "uri" => "http://websiteshadow.com"
6321     ),
6322     "websiteworth" => array(
6323     "icon" => "robot",
6324     "title" => "WebsiteWorth",
6325     "rule" => array(
6326     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6327     ),
6328     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6329     ),
6330     "websquash" => array(
6331     "icon" => "websquash",
6332     "title" => "Websquash",
6333     "rule" => array(
6334     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6335     ),
6336     "uri" => ""
6337     ),
6338     "webstripper" => array(
6339     "icon" => "robot",
6340     "title" => "WebStripper",
6341     "rule" => array(
6342     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6343     ),
6344     "uri" => ""
6345     ),
6346     "webzip" => array(
6347     "icon" => "webzip",
6348     "title" => "WebZIP",
6349     "rule" => array(
6350     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6351     ),
6352     "uri" => ""
6353     ),
6354     "wep" => array(
6355     "icon" => "robot",
6356     "title" => "WEP Search",
6357     "rule" => array(
6358     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6359     ),
6360     "uri" => ""
6361     ),
6362     "westwind" => array(
6363     "icon" => "robot",
6364     "title" => "West Wind Internet Protocols",
6365     "rule" => array(
6366     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6367     ),
6368     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6369     ),
6370     "wget" => array(
6371     "icon" => "wget",
6372     "title" => "Wget",
6373     "rule" => array(
6374 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6375     "Wget" => ""
6376 joku 63 ),
6377     "uri" => ""
6378     ),
6379     "whizbang" => array(
6380     "icon" => "whizbang",
6381     "title" => "WhizBang",
6382     "rule" => array(
6383     "WhizBang" => ""
6384     ),
6385     "uri" => "http://www.whizbang.com/crawler/"
6386     ),
6387     "whois" => array(
6388     "icon" => "whois",
6389     "title" => "Who.is",
6390     "rule" => array(
6391     "Who.is Bot" => ""
6392     ),
6393     "uri" => "http://www.who.is/"
6394     ),
6395     "wikiwix" => array(
6396     "icon" => "wikiwix",
6397     "title" => "Wikiwix",
6398     "rule" => array(
6399     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6400     ),
6401     "uri" => "http://www.wikiwix.com/"
6402     ),
6403     "wingflyer" => array(
6404     "icon" => "robot",
6405     "title" => "WingFlyer",
6406     "rule" => array(
6407     "^WebFetch" => ""
6408     ),
6409     "uri" => "http://www.wingflyer.com/"
6410     ),
6411     "wininet" => array(
6412     "icon" => "robot",
6413     "title" => "WinInet",
6414     "rule" => array(
6415     "TeamSoft WinInet Component" => ""
6416     ),
6417     "uri" => "http://www.winsoft.sk/wininet.htm"
6418     ),
6419     "winhttp" => array(
6420     "icon" => "robot",
6421     "title" => "WinHTTP",
6422     "rule" => array(
6423     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6424     ),
6425     "uri" => ""
6426     ),
6427     "wire" => array(
6428     "icon" => "robot",
6429     "title" => "WIRE",
6430     "rule" => array(
6431     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6432     ),
6433     "uri" => ""
6434     ),
6435     "wmp" => array(
6436     "icon" => "robot",
6437     "title" => "WMP",
6438     "rule" => array(
6439     "^WMP" => ""
6440     ),
6441     "uri" => ""
6442     ),
6443     "woozweb" => array(
6444     "icon" => "woozweb",
6445     "title" => "Woozweb",
6446     "rule" => array(
6447     "woozweb" => ""
6448     ),
6449     "uri" => "http://www.woozweb.com/"
6450     ),
6451     "wordchamp" => array(
6452     "icon" => "robot",
6453     "title" => "WordChamp",
6454     "rule" => array(
6455     "^WordChampBot" => ""
6456     ),
6457     "uri" => "http://www.wordchamp.com/"
6458     ),
6459     "wordpress" => array(
6460     "icon" => "wordpress",
6461     "title" => "WordPress",
6462     "rule" => array(
6463     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6464     ),
6465     "uri" => ""
6466     ),
6467     "worio" => array(
6468     "icon" => "worio",
6469     "title" => "Worio",
6470     "rule" => array(
6471     "woriobot" => ""
6472     ),
6473     "uri" => "http://worio.com/"
6474     ),
6475     "worldlight" => array(
6476     "icon" => "worldlight",
6477     "title" => "WorldLight",
6478     "rule" => array(
6479     "^WorldLight" => ""
6480     ),
6481     "uri" => ""
6482     ),
6483     "worqmada" => array(
6484     "icon" => "robot",
6485     "title" => "WorQmada",
6486     "rule" => array(
6487     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6488     ),
6489     "uri" => ""
6490     ),
6491     "wotbox" => array(
6492     "icon" => "wotbox",
6493     "title" => "Wotbox",
6494     "rule" => array(
6495     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6496     ),
6497     "uri" => ""
6498     ),
6499     "wp" => array(
6500     "icon" => "wp",
6501     "title" => "Wirtualna Polska",
6502     "rule" => array(
6503     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6504     ),
6505     "uri" => "http://wp.pl"
6506     ),
6507     "wsb" => array(
6508     "icon" => "robot",
6509     "title" => "WebSearchBench",
6510     "rule" => array(
6511     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6512     "WSB " => ""
6513     ),
6514     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6515     ),
6516     "wume" => array(
6517     "icon" => "robot",
6518     "title" => "WUME Lab's",
6519     "rule" => array(
6520     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6521     ),
6522     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6523     ),
6524     "wusage" => array(
6525     "icon" => "wusage",
6526     "title" => "Wusage",
6527     "rule" => array(
6528     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6529     ),
6530     "uri" => "http://www.boutell.com/wusage/"
6531     ),
6532     "wwgrapevine" => array(
6533     "icon" => "wwgrapevine",
6534     "title" => "WWgrapevine",
6535     "rule" => array(
6536     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6537     ),
6538     "uri" => ""
6539     ),
6540     "wws" => array(
6541     "icon" => "robot",
6542     "title" => "WWSBOT",
6543     "rule" => array(
6544     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6545     ),
6546     "uri" => "http://www.analyzer.nu"
6547     ),
6548     "www4mail" => array(
6549     "icon" => "robot",
6550 matthys 209 "title" => "WWW4mail",
6551 joku 63 "rule" => array(
6552     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6553     ),
6554     "uri" => "http://www.www4mail.org/"
6555     ),
6556     "wwwc" => array(
6557     "icon" => "wwwc",
6558     "title" => "WWWC",
6559     "rule" => array(
6560     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6561     ),
6562     "uri" => ""
6563     ),
6564     "wwwd" => array(
6565     "icon" => "robot",
6566     "title" => "WWWD",
6567     "rule" => array(
6568     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6569     ),
6570     "uri" => ""
6571     ),
6572     "wwweasel" => array(
6573     "icon" => "wwweasel",
6574     "title" => "WWWeasel",
6575     "rule" => array(
6576     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6577     ),
6578     "uri" => ""
6579     ),
6580     "wwwfi" => array(
6581     "icon" => "wwwfi",
6582     "title" => "www.fi",
6583     "rule" => array(
6584     "www\.fi crawler" => ""
6585     ),
6586     "uri" => "http://www.fi/"
6587     ),
6588     "wwwmechanize" => array(
6589     "icon" => "robot",
6590     "title" => "WWW-Mechanize",
6591     "rule" => array(
6592     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6593     ),
6594     "uri" => ""
6595     ),
6596     "wwwoffle" => array(
6597     "icon" => "robot",
6598     "title" => "WWWoffle",
6599     "rule" => array(
6600     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6601     ),
6602     "uri" => ""
6603     ),
6604     "wwwster" => array(
6605     "icon" => "robot",
6606     "title" => "WWWster",
6607     "rule" => array(
6608     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6609     ),
6610     "uri" => ""
6611     ),
6612     "wysigot" => array(
6613     "icon" => "wysigot",
6614     "title" => "Wysigot",
6615     "rule" => array(
6616     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6617     ),
6618     "uri" => ""
6619     ),
6620     "xaldon" => array(
6621     "icon" => "xaldon",
6622     "title" => "Xaldon",
6623     "rule" => array(
6624     "Xaldon WebSpider" => ""
6625     ),
6626     "uri" => "http://www.xaldon.de/"
6627     ),
6628     "xenu" => array(
6629     "icon" => "xenu",
6630     "title" => "Xenu Link Sleuth",
6631     "rule" => array(
6632     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6633     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional possessive; the version is group 2
6634     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6635     ),
6636     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6637     ),
6638     "xerka" => array(
6639     "icon" => "xerka",
6640     "title" => "Xerka",
6641     "rule" => array(
6642     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6643     ),
6644     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6645     ),
6646     "xirq" => array(
6647     "icon" => "robot",
6648     "title" => "XIRQ",
6649     "rule" => array(
6650     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6651     ),
6652     "uri" => "http://www.xirq.com"
6653     ),
6654     "xmlslurp" => array(
6655     "icon" => "robot",
6656     "title" => "XMLSlurp",
6657     "rule" => array(
6658     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6659     ),
6660     "uri" => ""
6661     ),
6662     "xml-sitemaps" => array(
6663     "icon" => "xml-sitemaps",
6664     "title" => "XML-Sitemaps",
6665     "rule" => array(
6666     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6667     ),
6668     "uri" => ""
6669     ),
6670     "xmlrpc" => array(
6671     "icon" => "robot",
6672     "title" => "Trackback",
6673     "rule" => array(
6674     "XMLRPC" => ""
6675     ),
6676     "uri" => ""
6677     ),
6678 matthys 294 "xovi" => array(
6679     "icon" => "xovi",
6680     "title" => "Xovi",
6681     "rule" => array(
6682     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6683     ),
6684     "uri" => "http://www.xovibot.net"
6685     ),
6686 joku 63 "yacy" => array(
6687     "icon" => "yacy",
6688     "title" => "Yacy",
6689     "rule" => array(
6690     "yacy\.net" => ""
6691     ),
6692     "uri" => ""
6693     ),
6694     "yahoo" => array(
6695     "icon" => "yahoo",
6696     "title" => "Yahoo",
6697     "rule" => array(
6698     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6699     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6700     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6701     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6702     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6703     "Y!OASIS/TEST" => "",
6704     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6705     "Y!J; for robot study" => "",
6706     "Yahoo Japan; for robot study" => ""
6707     ),
6708     "uri" => "http://www.yahoo.com"
6709     ),
6710     "yahoo-feed" => array(
6711     "icon" => "yahoo",
6712     "title" => "Yahoo Feedseeker",
6713     "rule" => array(
6714     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6715     ),
6716     "uri" => "http://www.yahoo.com"
6717     ),
6718     "yandex" => array(
6719     "icon" => "yandex",
6720     "title" => "Yandex",
6721     "rule" => array(
6722     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6723     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6724     ),
6725     "uri" => "http://yandex.com/bots"
6726     ),
6727     "yanga" => array(
6728     "icon" => "yanga",
6729     "title" => "Yanga",
6730     "rule" => array (
6731     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6732     ),
6733     "uri" => "http://www.yanga.co.uk/"
6734     ),
6735     "yap" => array(
6736     "icon" => "yap",
6737     "title" => "Yap",
6738     "rule" => array(
6739     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6740     ),
6741     "uri" => "http://www.yapinc.com/"
6742     ),
6743     "yarienavoir" => array(
6744     "icon" => "robot",
6745     "title" => "Yarienavoir",
6746     "rule" => array(
6747     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6748     ),
6749     "uri" => "http://www.yarienavoir.net/"
6750     ),
6751     "yell" => array(
6752     "icon" => "yell",
6753     "title" => "Yell",
6754     "rule" => array(
6755     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6756     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6757     ),
6758     "uri" => ""
6759     ),
6760     "youdao" => array(
6761     "icon" => "youdao",
6762     "title" => "Youdao",
6763     "rule" => array(
6764     "YodaoBot(-(Image|Mobile)?)?[ /]([0-9.]{1,10})" => "\\3", // "-Image"/"-Mobile" suffix is optional so plain "YodaoBot/x.y" matches too; the version is group 3
6765     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6766     ),
6767     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6768     ),
6769     "yoogli" => array(
6770     "icon" => "yoogli",
6771     "title" => "Yoogli",
6772     "rule" => array(
6773     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6774     ),
6775     "uri" => "http://www.yoogli.com"
6776     ),
6777     "yotta" => array(
6778     "icon" => "robot",
6779     "title" => "Yotta",
6780     "rule" => array(
6781     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6782     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6783     ),
6784     "uri" => "http://www.yottacars.com"
6785     ),
6786     "yoono" => array(
6787     "icon" => "yoono",
6788     "title" => "Yoono",
6789     "rule" => array(
6790     "Yoono" => ""
6791     ),
6792     "uri" => "http://www.yoono.com/"
6793     ),
6794     "yowedo" => array(
6795     "icon" => "robot",
6796     "title" => "Yowedo",
6797     "rule" => array(
6798     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6799     ),
6800     "uri" => "http://yowedo.com/en/partners.html"
6801     ),
6802     "yuntis" => array(
6803     "icon" => "robot",
6804 matthys 209 "title" => "Yuntis",
6805 joku 63 "rule" => array(
6806     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6807     ),
6808     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6809     ),
6810     "zao" => array(
6811     "icon" => "robot",
6812     "title" => "Zao",
6813     "rule" => array(
6814     "Zao[ /]([0-9.]{1,10})" => "\\1",
6815     "Zao-crawler" => ""
6816     ),
6817     "uri" => ""
6818     ),
6819     "zealbot" => array(
6820     "icon" => "zeal",
6821     "title" => "ZealBot",
6822     "rule" => array(
6823     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6824     ),
6825     "uri" => ""
6826     ),
6827     "zearchit" => array(
6828     "icon" => "zearchit",
6829     "title" => "Zearchit",
6830     "rule" => array(
6831     "Zearchit" => ""
6832     ),
6833     "uri" => "http://www.zearchit.de/"
6834     ),
6835     "zebz" => array(
6836     "icon" => "robot",
6837     "title" => "ze.bz",
6838     "rule" => array(
6839     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6840     ),
6841     "uri" => "http://www.ze.bz/"
6842     ),
6843     "zedzo" => array(
6844     "icon" => "robot",
6845     "title" => "Zedzo",
6846     "rule" => array(
6847     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6848     ),
6849     "uri" => "http://www.zedzo.com/"
6850     ),
6851     "zerx" => array(
6852     "icon" => "zerx",
6853     "title" => "Zerx",
6854     "rule" => array(
6855     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6856     ),
6857     "uri" => "http://www.zerx.com/"
6858     ),
6859     "zeus" => array(
6860     "icon" => "zeus",
6861     "title" => "Zeus",
6862     "rule" => array(
6863     "Zeus" => ""
6864     ),
6865     "uri" => "http://www.zeus.com"
6866     ),
6867     "zippp" => array(
6868     "icon" => "robot",
6869     "title" => "Zippp",
6870     "rule" => array(
6871     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6872     ),
6873     "uri" => ""
6874     ),
6875     "zippy" => array(
6876     "icon" => "robot",
6877     "title" => "Zippy",
6878     "rule" => array(
6879     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6880     ),
6881     "uri" => "http://www.zippyfinder.com"
6882     ),
6883     "zoeky" => array(
6884     "icon" => "robot",
6885     "title" => "Zoeky",
6886     "rule" => array(
6887     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6888     ),
6889     "uri" => ""
6890     ),
6891     "zoom" => array(
6892     "icon" => "zoom",
6893 matthys 209 "title" => "ZoomSpider",
6894 joku 63 "rule" => array(
6895     "^ZoomSpider" => ""
6896     ),
6897     "uri" => "http://www.wrensoft.com/"
6898     ),
6899     "zspider" => array(
6900     "icon" => "robot",
6901 matthys 209 "title" => "Zspider",
6902 joku 63 "rule" => array(
6903     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6904     ),
6905     "uri" => "http://feedback.redkolibri.com/"
6906     ),
6907 matthys 281 "zumbot" => array(
6908     "icon" => "robot",
6909     "title" => "ZUM Search",
6910     "rule" => array(
6911     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6912     ),
6913     "uri" => "http://help.zum.com/inquiry"
6914     ),
6915 joku 63 "zyborg" => array(
6916     "icon" => "zyborg",
6917     "title" => "WiseNutBot",
6918     "rule" => array(
6919     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6920     ),
6921     "uri" => ""
6922     ),
6923     // Catch-all rules for the original entries; they have to stay in this order.
6924     "blogbot" => array(
6925     "icon" => "blogbot",
6926     "title" => "BlogBot",
6927     "rule" => array(
6928     "Blog[ \-]?Bot" => ""
6929     ),
6930     "uri" => "http://www.blogbot.com/"
6931     ),
6932     "centrum" => array(
6933     "icon" => "centrum",
6934     "title" => "Centrum",
6935     "rule" => array(
6936     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6937     "^Centrum-checker" => ""
6938     ),
6939     "uri" => ""
6940     ),
6941     "httpclient" => array(
6942     "icon" => "robot",
6943     "title" => "HTTPClient",
6944     "rule" => array(
6945     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6946     "HTTP[ \-]?Client" => ""
6947     ),
6948     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6949     ),
6950     "incywincy" => array(
6951     "icon" => "robot",
6952     "title" => "IncyWincy",
6953     "rule" => array(
6954     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6955     "^IncyWincy" => ""
6956     ),
6957     "uri" => ""
6958     ),
6959     "java" => array(
6960     "icon" => "java",
6961     "title" => "Java",
6962     "rule" => array(
6963     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6964     ),
6965     "uri" => ""
6966     ),
6967     "libfetch" => array(
6968     "icon" => "robot",
6969     "title" => "Libfetch",
6970     "rule" => array(
6971     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6972     ),
6973     "uri" => "http://www.freebsd.org/"
6974     ),
6975     "libwww" => array(
6976     "icon" => "libwww",
6977 matthys 209 "title" => "LibWWW",
6978 joku 63 "rule" => array(
6979     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
6980     "^libww(w|w-perl|w-FM)" => "",
6981     "MyApp.*libww(w|w-perl|w-FM)" => ""
6982     ),
6983     "uri" => ""
6984     ),
6985     "litefinder" => array(
6986     "icon" => "litefinder",
6987     "title" => "LiteFinder",
6988     "rule" => array(
6989     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
6990     ),
6991     "uri" => "http://www.litefinder.net/about.html"
6992     ),
6993     "nutchorg" => array(
6994     "icon" => "nutchorg",
6995     "title" => "Nutch",
6996     "rule" => array(
6997     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
6998     "Nutch" => ""
6999     ),
7000     "uri" => "http://lucene.apache.org/nutch/"
7001     ),
7002     "pythonurl" => array(
7003     "icon" => "pythonurl",
7004     "title" => "Python-url",
7005     "rule" => array(
7006     "Python[ \-]?urllib" => ""
7007     ),
7008     "uri" => ""
7009     ),
7010     // Robots known to be spam bots
7011     "SPAM" => array(
7012     "icon" => "robot",
7013     "title" => "SPAM",
7014     "rule" => array(
7015     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
7016     "^PHOTO CHECK" => "",
7017     "^FOTOCHECKER" => "",
7018     "^IPTC CHECK" => "",
7019     "^DataCha0s" => "",
7020     "^Mac Finder" => "",
7021     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
7022     "^Missouri College Browse" => "",
7023     "Email[ \-]?Siphon" => "",
7024     "atSpider" => "",
7025     "autoemailspider" => "",
7026     "^Demo Bot" => "",
7027     "^Program Shareware" => "",
7028     "^Snapbot" => "",
7029     "^snap.com" => "",
7030     "^Guestbook Auto Submitter" => "",
7031     "panscient.com" => "",
7032     ),
7033     "uri" => ""
7034     ),
7035     // Generic fallback for robots we don't know yet
7036     "robot" => array(
7037     "icon" => "robot",
7038     "title" => "Robot",
7039     "rule" => array(
7040     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7041     )
7042     )
7043     );
7044 joku 261 ?>

Properties

Name Value
svn:keywords Id