ViewVC Help
View File | Revision Log | Show Annotations | View Changeset | Root Listing
root/BBClone/trunk/lib/robot.php
Revision: 420
Committed: Tue Mar 7 15:12:21 2023 UTC (20 months, 3 weeks ago) by joku
File size: 160331 byte(s)
Log Message:

File Contents

# User Rev Content
1 joku 63 <?php
2     /* This file is part of BBClone (A PHP based Web Counter on Steroids)
3     *
4     * SVN FILE $Id$
5     *
6 joku 417 * Copyright (C) 2001-2023, the BBClone Team (see doc/authors.txt for details)
7 joku 63 *
8     * This program is free software: you can redistribute it and/or modify
9     * it under the terms of the GNU General Public License as published by
10     * the Free Software Foundation, either version 3 of the License, or
11     * (at your option) any later version.
12     *
13     * This program is distributed in the hope that it will be useful,
14     * but WITHOUT ANY WARRANTY; without even the implied warranty of
15     * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16     * GNU General Public License for more details.
17     *
18     * See doc/copying.txt for details
19     */
20    
21     /////////////////////
22     // Robot Detection //
23     /////////////////////
24    
25     $robot = array(
26     "1noon" => array(
27     "icon" => "1noon",
28     "title" => "1noon",
29     "rule" => array(
30     "1Noonbot[/ ]([0-9.]{1,10})" => "\\1",
31     "^Yeti$" => ""
32     ),
33     "uri" => ""
34     ),
35     "123people" => array(
36     "icon" => "123people",
37     "title" => "123people",
38     "rule" => array(
39     "123peoplebot[ /]([0-9.]{1,10})" => "\\1"
40     ),
41     "uri" => "http://www.123people.fr/"
42     ),
43     "123spider" => array(
44     "icon" => "robot",
45     "title" => "123Spider",
46     "rule" => array(
47     "123spider-Bot \(Version: ([0-9.]{1,10})" => "\\1"
48     ),
49     "uri" => "http://www.123spider.de/"
50     ),
51     "192com" => array(
52     "icon" => "robot",
53     "title" => "192.com",
54     "rule" => array(
55     "192\.comAgent" => "" // dot escaped so it only matches a literal "."
56     ),
57     "uri" => "http://www.192.com/"
58     ),
59 matthys 298 "200please" => array(
60     "icon" => "200please",
61     "title" => "200please Crawler",
62     "rule" => array(
63     "200PleaseBot[ /]([0-9.]{1,10})" => "\\1"
64     ),
65     "uri" => "http://www.200please.com/bot"
66     ),
67 joku 63 "2dehands" => array(
68     "icon" => "2dehands",
69     "title" => "2deHands",
70     "rule" => array(
71     "2dehands\.nl" => ""
72     ),
73     "uri" => ""
74     ),
75     "80legs" => array(
76     "icon" => "80legs",
77     "title" => "80legs",
78     "rule" => array(
79     "008[/ ]([0-9.]{1,10}).*80legs" => "\\1"
80     ),
81     "uri" => "http://www.80legs.com/"
82     ),
83     "a1sitemap" => array(
84     "icon" => "a1sitemap",
85     "title" => "A1 Sitemap",
86     "rule" => array(
87     "^A1 Sitemap Generator[ /]([0-9.]{1,10})" => "\\1",
88     "miggibot[ /]([0-9.]{1,10})" => "\\1"
89     ),
90     "uri" => "http://www.micro-sys.dk/products/sitemap-generator/"
91     ),
92     "a2b" => array(
93     "icon" => "a2b",
94     "title" => "A2B",
95     "rule" => array(
96     "www\.a2b\.cc" => ""
97     ),
98     "uri" => "http://www.a2b.cc"
99     ),
100     "abacho" => array(
101     "icon" => "robot",
102     "title" => "Abacho",
103     "rule" => array(
104     "^ABACHOBot" => ""
105     ),
106     "uri" => ""
107     ),
108     "abcdatos" => array(
109     "icon" => "abcdatos",
110     "title" => "ABCdatos",
111     "rule" => array(
112     "^ABCdatos BotLink[ /]([0-9.]{1,10})" => "\\1"
113     ),
114     "uri" => "http://www.abcdatos.com/"
115     ),
116     "abot" => array(
117     "icon" => "abot",
118     "title" => "aBot",
119     "rule" => array(
120     "^abot[ /]([0-9.]{1,10})" => "\\1"
121     ),
122     "uri" => ""
123     ),
124     "about" => array(
125     "icon" => "about",
126     "title" => "About",
127     "rule" => array(
128     "Libby[_/ ]([0-9.]{1,10})" => "\\1",
129     "About[_/ ]([0-9.]{1,10})libwww-perl" => "\\1"
130     ),
131     "uri" => ""
132     ),
133     "aboutus" => array(
134     "icon" => "aboutus",
135     "title" => "AboutUs",
136     "rule" => array(
137     "AboutUsBot" => ""
138     ),
139     "uri" => "http://www.aboutus.org/"
140     ),
141     "ackerm" => array(
142     "icon" => "robot",
143     "title" => "Ackerm",
144     "rule" => array(
145     "www\.ackerm\.com" => "" // dots escaped so they only match a literal "."
146     ),
147     "uri" => "http://www.ackerm.com/"
148     ),
149     "acoi" => array(
150     "icon" => "acoi",
151     "title" => "AcoiRobot",
152     "rule" => array(
153     "^AcoiRobot" => ""
154     ),
155     "uri" => "http://monetdb.cwi.nl/acoi/projects.html"
156     ),
157     "acoon" => array(
158     "icon" => "acoon",
159     "title" => "Acoon",
160     "rule" => array(
161     "Acoon[ \-]?Robot" => ""
162     ),
163     "uri" => ""
164     ),
165     "accoona" => array(
166     "icon" => "accoona",
167     "title" => "Accoona",
168     "rule" => array(
169     "Accoona-AI-Agent[/ ]([0-9.]{1,10})" => "\\1",
170     "^accoona" => ""
171     ),
172     "uri" => ""
173     ),
174     "acme" => array(
175     "icon" => "acme",
176     "title" => "Acme",
177     "rule" => array(
178     "^Acme\.Spider" => ""
179     ),
180     "uri" => "http://www.acme.com/java/software/Acme.Spider.html"
181     ),
182     "active" => array(
183     "icon" => "robot",
184     "title" => "ActiveBookmark",
185     "rule" => array(
186     "ActiveBookmark[/ ]([0-9.]{1,10})" => "\\1"
187     ),
188     "uri" => ""
189     ),
190     "admuncher" => array(
191     "icon" => "robot",
192     "title" => "Ad Muncher",
193     "rule" => array(
194     "Ad Muncher[/ v]*([0-9.]{1,10})" => "\\1"
195     ),
196     "uri" => ""
197     ),
198     "aesop" => array(
199     "icon" => "robot",
200     "title" => "Aesop",
201     "rule" => array(
202     "^AESOP_com_SpiderMan" => ""
203     ),
204     "uri" => "http://www.aesop.com"
205     ),
206     "agada" => array(
207     "icon" => "robot",
208     "title" => "Agada",
209     "rule" => array(
210     "^agadine[/ ]([0-9.]{1,10})" => "\\1"
211     ),
212     "uri" => ""
213     ),
214     "ahrefs" => array(
215     "icon" => "ahrefs",
216     "title" => "Ahrefs",
217     "rule" => array(
218     "AhrefsBot[ /]([0-9.]{1,10})" => "\\1"
219     ),
220     "uri" => "http://ahrefs.com/"
221     ),
222     "aibot" => array(
223     "icon" => "robot",
224     "title" => "Aibot",
225     "rule" => array(
226     "AIBOT[/ ]([0-9.]{1,10})" => "\\1"
227     ),
228     "uri" => ""
229     ),
230     "aihitbot" => array(
231     "icon" => "robot",
232     "title" => "aiHit",
233     "rule" => array(
234     "aiHitBot[/ ]([0-9.]{1,10})" => "\\1"
235     ),
236     "uri" => "http://www.aihit.com/"
237     ),
238     "aipbot" => array(
239     "icon" => "robot",
240     "title" => "Aipbot",
241     "rule" => array(
242     "aipbot[/ ]([0-9.]{1,10})" => "\\1"
243     ),
244     "uri" => ""
245     ),
246     "aleksika" => array(
247     "icon" => "aleksika",
248     "title" => "Aleksika",
249     "rule" => array(
250     "Aleksika Spider[/ ]([0-9.]{1,10})" => "\\1"
251     ),
252     "uri" => ""
253     ),
254     "alertsite" => array(
255     "icon" => "alertsite",
256     "title" => "AlertSite",
257     "rule" => array(
258     "ipd[ /]([0-9.]{1,10}).*Alertsite\.com" => "\\1"
259     ),
260     "uri" => "http://www.alertsite.com/index.html"
261     ),
262     "alexa" => array(
263     "icon" => "alexa",
264     "title" => "Alexa",
265     "rule" => array(
266     "^ia_archive" => ""
267     ),
268     "uri" => "http://www.alexa.com/"
269     ),
270     "almaden" => array(
271     "icon" => "almaden",
272     "title" => "IBM Crawler",
273     "rule" => array(
274     "www\.almaden\.ibm\.com/cs/crawler" => ""
275     ),
276     "uri" => "http://www.almaden.ibm.com/cs/crawler/"
277     ),
278     "altavista" => array(
279     "icon" => "altavista",
280     "title" => "Altavista",
281     "rule" => array(
282     "Scooter[ /\-]*[a-z]*([0-9.]{1,10})" => "\\1",
283     "AltaVista V([0-9.]{1,10})" => "\\1",
284     "AltaVista Intranet V([0-9.]{1,10})" => "\\1"
285     ),
286     "uri" => "http://www.altavista.com/"
287     ),
288     "amazon" => array(
289     "icon" => "amazon",
290     "title" => "Amazon",
291     "rule" => array(
292     "^(aranhabot|amzn_assoc)" => "",
293 matthys 401 "^NutchEC2Test" => "",
294     "Amazonbot[/ ]([0-9.]{1,10})" => "\\1"
295 joku 63 ),
296     "uri" => "http://www.amazon.com/"
297     ),
298     "amidalla" => array(
299     "icon" => "amidalla",
300     "title" => "Amidalla",
301     "rule" => array(
302     "^amibot" => ""
303     ),
304     "uri" => ""
305     ),
306     "amfibi" => array(
307     "icon" => "amfibi",
308     "title" => "Amfibi",
309     "rule" => array(
310     "Amfibibot[/ ]([0-9.]{1,10})" => "\\1",
311     "Amfibibot" => ""
312     ),
313     "uri" => ""
314     ),
315     "amphetadesk" => array(
316     "icon" => "robot",
317     "title" => "AmphetaDesk",
318     "rule" => array(
319     "AmphetaDesk[/ ]([0-9.]{1,10})" => "\\1"
320     ),
321     "uri" => ""
322     ),
323     "amphetameme" => array(
324     "icon" => "robot",
325     "title" => "Amphetameme",
326     "rule" => array(
327     "amphetameme[ \-]?crawler" => ""
328     ),
329     "uri" => ""
330     ),
331     "annomille" => array(
332     "icon" => "robot",
333     "title" => "AnnoMille",
334     "rule" => array(
335     "^AnnoMille( spider)?[/ ]([0-9.]{1,10})" => "\\2"
336     ),
337     "uri" => "http://www.annomille.it"
338     ),
339     "anonymouse" => array(
340     "icon" => "anonymouse",
341     "title" => "Anonymouse.org",
342     "rule" => array(
343     "http://Anonymouse\.org" => "" // dot escaped so it only matches a literal "."
344     ),
345     "uri" => "http://anonymouse.org"
346     ),
347     "ansearch" => array(
348     "icon" => "robot",
349     "title" => "Ansearch",
350     "rule" => array(
351     "AnsearchBot[/ ]([0-9.]{1,10})" => "\\1"
352     ),
353     "uri" => ""
354     ),
355     "answerchase" => array(
356     "icon" => "answerchase",
357     "title" => "AnswerChase",
358     "rule" => array(
359     "AnswerChase( PROve)?[/ ]([0-9.]{1,10})" => "\\2"
360     ),
361     "uri" => "http://www.answerchase.com/"
362     ),
363     "antibot" => array(
364     "icon" => "robot",
365 matthys 205 "title" => "Antibot",
366 joku 63 "rule" => array(
367     "antibot-V([0-9.]{1,10})" => "\\1"
368     ),
369     "uri" => ""
370     ),
371     "aonde" => array(
372     "icon" => "aonde",
373     "title" => "Aonde",
374     "rule" => array(
375     "^AONDE-Spider" => ""
376     ),
377     "uri" => ""
378     ),
379     "aonline" => array(
380     "icon" => "robot",
381     "title" => "A-Online.at",
382     "rule" => array(
383     "^A-Online Search" => ""
384     ),
385     "uri" => "http://www.a-online.at/"
386     ),
387     "aol" => array(
388     "icon" => "aol",
389     "title" => "AOLserver",
390     "rule" => array(
391     "^AOLserver-Tcl[/ ]([0-9.]{1,10})" => "\\1",
392     "^AOLserver" => ""
393     ),
394     "uri" => ""
395     ),
396     "apachebench" => array(
397     "icon" => "robot",
398     "title" => "ApacheBench",
399     "rule" => array(
400     "ApacheBench[ /]([0-9.]{1,10})" => "\\1"
401     ),
402     "uri" => ""
403     ),
404     "apassion4jazz" => array(
405     "icon" => "robot",
406     "title" => "Passion 4 Jazz",
407     "rule" => array(
408     "^BebopBot[ /]([0-9.]{1,10})" => "\\1"
409     ),
410     "uri" => "http://www.apassion4jazz.net/bebopbot.html"
411     ),
412     "apexoo" => array(
413     "icon" => "robot",
414     "title" => "Apexoo",
415     "rule" => array(
416     "^Apexoo Spider ([0-9.]{1,10})" => "\\1"
417     ),
418     "uri" => "http://www.apexoo.com/"
419     ),
420     "apnoti" => array(
421     "icon" => "apnoti",
422 matthys 205 "title" => "Apnoti",
423 joku 63 "rule" => array(
424     "apnoti.*Robot[ /]v([0-9.]{1,10})" => "\\1"
425     ),
426     "uri" => "http://www.apnoti.com/"
427     ),
428     "aport" => array(
429     "icon" => "aport",
430     "title" => "Aport",
431     "rule" => array(
432     "^Aport" => ""
433     ),
434     "uri" => ""
435     ),
436     "appie" => array(
437     "icon" => "walhello",
438     "title" => "Walhello",
439     "rule" => array(
440     "appie[ /]([0-9.]{1,10})" => "\\1"
441     ),
442     "uri" => ""
443     ),
444 matthys 389 "apple" => array(
445     "icon" => "apple",
446     "title" => "Apple",
447     "rule" => array(
448     "Applebot[ /]([0-9.]{1,10})" => "\\1"
449     ),
450     "uri" => "http://www.apple.com/go/applebot"
451     ),
452    
453 joku 63 "arachmo" => array(
454     "icon" => "arachmo",
455     "title" => "Arachmo",
456     "rule" => array(
457     "compatible; Arachmo" => ""
458     ),
459     "uri" => ""
460     ),
461     "arexera" => array(
462     "icon" => "arexera",
463     "title" => "Arexera",
464     "rule" => array(
465     "^X-Crawler" => "",
466     "^TECOMAC-Crawler[ /]([0-9.]{1,10})" => "\\1"
467     ),
468     "uri" => "http://www.arexera.de/"
469     ),
470     "arianna" => array(
471     "icon" => "arianna",
472     "title" => "Arianna",
473     "rule" => array(
474     "^www\.arianna\.it" => "" // dots escaped so they only match a literal "."
475     ),
476     "uri" => "http://www.arianna.it/"
477     ),
478     "artface" => array(
479     "icon" => "robot",
480     "title" => "Artface",
481     "rule" => array(
482     "^ArtfaceBot" => ""
483     ),
484     "uri" => ""
485     ),
486     "artviper" => array(
487     "icon" => "artviper",
488     "title" => "artViper",
489     "rule" => array(
490     "artViper" => ""
491     ),
492     "uri" => "http://www.artviper.net/"
493     ),
494     "asinfo" => array(
495     "icon" => "robot",
496     "title" => "Any Search Info",
497     "rule" => array(
498     "Sleek Spider[ /]([0-9.]{1,10})" => "\\1"
499     ),
500     "uri" => "http://search-info.com/"
501     ),
502     "ask" => array(
503     "icon" => "askjeeves",
504     "title" => "Ask Jeeves",
505     "rule" => array(
506     "Ask[ \-]?Jeeves" => "",
507     "teomaagent" => ""
508     ),
509     "uri" => ""
510     ),
511     "askaboutoil" => array(
512     "icon" => "robot",
513     "title" => "AskAboutOil", // display name of this crawler; "ASPseek" belongs to the separate "aspseek" entry
514     "rule" => array(
515     "^AskAboutOil[ /]([0-9.]{1,10})" => "\\1"
516     ),
517     "uri" => "http://askaboutoil.com/"
518     ),
519     "asked" => array(
520     "icon" => "robot",
521 matthys 205 "title" => "AskEd!",
522 joku 63 "rule" => array(
523     "^asked[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
524     ),
525     "uri" => "http://asked.jp"
526     ),
527     "aspseek" => array(
528     "icon" => "robot",
529     "title" => "ASPseek",
530     "rule" => array(
531     "^ASPseek[/ ]([0-9.]{1,10})" => "\\1"
532     ),
533     "uri" => ""
534     ),
535     "atlocal" => array(
536     "icon" => "robot",
537     "title" => "At Local",
538     "rule" => array(
539     "AtlocalBot[/ ]([0-9.]{1,10})" => "\\1"
540     ),
541     "uri" => "http://www.atlocal.com/"
542     ),
543     "atomz" => array(
544     "icon" => "atomz",
545     "title" => "Atomz",
546     "rule" => array(
547     "Atomz[/ ]([0-9.]{1,10})" => "\\1"
548     ),
549     "uri" => ""
550     ),
551 matthys 345 "avira" => array(
552     "icon" => "avira",
553     "title" => "Avira SafeSearch",
554     "rule" => array(
555     "^SafeSearch microdata crawler" => ""
556     ),
557     "uri" => "https://safesearch.avira.com"
558     ),
559 joku 63 "axel" => array(
560     "icon" => "robot",
561     "title" => "Axel",
562     "rule" => array(
563     "^axel" => ""
564     ),
565     "uri" => ""
566     ),
567     "axmo" => array(
568     "icon" => "axmo",
569     "title" => "Axmo",
570     "rule" => array(
571     "AxmoRobot" => ""
572     ),
573     "uri" => ""
574     ),
575     "answerbus" => array(
576     "icon" => "answerbus",
577     "title" => "AnswerBus",
578     "rule" => array(
579     "answerbus" => ""
580     ),
581     "uri" => ""
582     ),
583     "automapit" => array(
584     "icon" => "robot",
585     "title" => "AutoMapIt",
586     "rule" => array(
587     "AutoMapIt[ /](Bot)?" => ""
588     ),
589     "uri" => "http://www.automapit.com/bot.html"
590     ),
591     "augurnfind" => array(
592     "icon" => "robot",
593     "title" => "Augurnfind",
594     "rule" => array(
595     "augurnfind[/ ][v\-]*([0-9.]{1,10})" => "\\1"
596     ),
597     "uri" => ""
598     ),
599     "awasu" => array(
600     "icon" => "awasu",
601     "title" => "Awasu",
602     "rule" => array(
603     "Awasu[/ ]([0-9a-z.]{1,10})" => "\\1"
604     ),
605     "uri" => ""
606     ),
607     "axxus" => array(
608     "icon" => "axxus",
609     "title" => "axxus.de",
610     "rule" => array(
611     "whoiam" => ""
612     ),
613     "uri" => "http://www.axxus.de/"
614     ),
615     "ayell" => array(
616     "icon" => "ayell",
617     "title" => "Ayell",
618     "rule" => array(
619     "^Eurobot[ /]([0-9.]{1,10})" => "\\1"
620     ),
621     "uri" => "http://eurobot.ayell.eu"
622     ),
623     "babaloo" => array(
624     "icon" => "babaloo",
625     "title" => "Babaloo",
626     "rule" => array(
627     "BabalooSpider[ /]([0-9.]{1,10})" => "\\1"
628     ),
629     "uri" => "http://www.babaloo.si"
630     ),
631     "babe" => array(
632     "icon" => "robot",
633     "title" => "ba.be",
634     "rule" => array(
635     "BACS http://www\.ba\.be" => "" // dots escaped so they only match a literal "."
636     ),
637     "uri" => "http://www.ba.be/"
638     ),
639     "baidu" => array(
640     "icon" => "baidu",
641     "title" => "Baidu",
642     "rule" => array(
643     "Baiduspider[ /]([0-9.]{1,10})" => "\\1",
644     "Baiduspider" => ""
645     ),
646     "uri" => "http://www.baidu.com/search/spider.html"
647     ),
648     "bananatree" => array(
649     "icon" => "robot",
650     "title" => "BananaTree",
651     "rule" => array(
652     "www\.thebananatree\.org" => ""
653     ),
654     "uri" => "http://www.thebananatree.org/"
655     ),
656     "bdcindexer" => array(
657     "icon" => "robot",
658     "title" => "bdcindexer",
659     "rule" => array(
660     "bdcindexer_([0-9a-z.]{1,10})" => "\\1"
661     ),
662     "uri" => "http://www.business.com/"
663     ),
664     "bdfetch" => array(
665     "icon" => "robot",
666     "title" => "BDFetch",
667     "rule" => array(
668     "^BDFetch" => ""
669     ),
670     "uri" => ""
671     ),
672     "bdncentral" => array(
673     "icon" => "robot",
674     "title" => "Bdncentral",
675     "rule" => array(
676     "BDNcentral Crawler v([0-9.]{1,10})" => "\\1"
677     ),
678     "uri" => "http://www.bdncentral.com/robot.html"
679     ),
680     "beammachine" => array(
681     "icon" => "robot",
682     "title" => "BeamMachine",
683     "rule" => array(
684     "^BeamMachine[ /]([0-9.]{1,10})" => "\\1"
685     ),
686     "uri" => "http://www.beammachine.net/"
687     ),
688     "become" => array(
689     "icon" => "become",
690     "title" => "Become",
691     "rule" => array(
692     "Become(JP)?Bot[/ ]([0-9.]{1,10})" => "\\2",
693     "(BecomeBot|Exabot)@exava\.com\)$" => ""
694     ),
695     "uri" => "http://www.become.com/"
696     ),
697     "beebware" => array(
698     "icon" => "robot",
699     "title" => "Beebware",
700     "rule" => array(
701     "BeebwareDirectory[/ ]v?([0-9.]{1,10})" => "\\1" // the version is the pattern's only capture group
702     ),
703     "uri" => ""
704     ),
705     "bigbrother" => array(
706     "icon" => "robot",
707     "title" => "Big Brother",
708     "rule" => array(
709     "^Big Brother" => ""
710     ),
711     "uri" => "http://pauillac.inria.fr/~fpottier/"
712     ),
713     "bigclique" => array(
714     "icon" => "robot",
715     "title" => "BigClique",
716     "rule" => array(
717     "^BigCliqueBOT[/ ]([0-9.]{1,10})" => "\\1"
718     ),
719     "uri" => "http://www.bigclique.com"
720     ),
721     "biglotron" => array(
722     "icon" => "robot",
723     "title" => "Biglotron",
724     "rule" => array(
725     "^BIGLOTRON" => ""
726     ),
727     "uri" => "http://www.bigclique.com"
728     ),
729     "bigsearch" => array(
730     "icon" => "bigsearch",
731     "title" => "Bigsearch",
732     "rule" => array(
733     "Bigsearch\.ca[/ ]Nutch[- ]([0-9.]{1,10})" => "\\1" // dot escaped so it only matches a literal "."
734     ),
735     "uri" => ""
736     ),
737     "bilbo" => array(
738     "icon" => "robot",
739     "title" => "Bilbo",
740     "rule" => array(
741     "Bilbo[ /]([0-9.]{1,10})" => "\\1"
742     ),
743     "uri" => "http://home.broadpark.no/~tnilsen-1/Linux/Bilbo_-_Nessus_WEB/bilbo_-_nessus_web.html"
744     ),
745     "bilgi" => array(
746     "icon" => "bilgi",
747     "title" => "Bilgi",
748     "rule" => array(
749     "Bilgi(Beta)?Bot[ /]([0-9.]{1,10})" => "\\2" // group 1 is the optional "Beta" marker; the version is group 2
750     ),
751     "uri" => "http://www.bilgi.com/"
752     ),
753     "bitacle" => array(
754     "icon" => "bitacle",
755     "title" => "Bitacle",
756     "rule" => array(
757     "Bitacle (ro)?bot[ \(/V\:]+([0-9.]{1,10})" => "\\2",
758     ),
759     "uri" => "http://bitacle.org/"
760     ),
761     "bitbeamer" => array(
762     "icon" => "bitbeamer",
763     "title" => "BitBeamer",
764     "rule" => array(
765     "BitBeamer/([0-9.]{1,10})" => "\\1"
766     ),
767     "uri" => ""
768     ),
769     "biz360" => array(
770     "icon" => "biz360",
771     "title" => "Biz360",
772     "rule" => array(
773     "^Biz360 spider" => ""
774     ),
775     "uri" => ""
776     ),
777     "backlinktest" => array(
778     "icon" => "backlinktest",
779     "title" => "BacklinkCrawler",
780     "rule" => array(
781     "BacklinkCrawler" => ""
782     ),
783     "uri" => "http://www.backlinktest.com/crawler.html"
784     ),
785     "blaizbee" => array(
786     "icon" => "blaiz-bee",
787     "title" => "Blaiz-Bee",
788     "rule" => array(
789     "Blaiz-Bee[ /]([0-9.]{1,10})" => "\\1" // report the captured version instead of discarding it
790     ),
791     "uri" => ""
792     ),
793     "blogbeat" => array(
794     "icon" => "robot",
795     "title" => "BlogBeat",
796     "rule" => array(
797     "BlogBeat/?([0-9.]{1,10})" => "\\1",
798     ),
799     "uri" => "http://www.blogbeat.nl"
800     ),
801     "blogbotde" => array(
802     "icon" => "robot",
803     "title" => "blogbot.de",
804     "rule" => array(
805     "Naamah[ /]([0-9.a-z]{1,10})[ /]Blogbot" => "\\1",
806     ),
807     "uri" => "http://blogbot.de/"
808     ),
809     "blogcensus" => array(
810     "icon" => "blogcensus",
811     "title" => "Blogcensus",
812     "rule" => array(
813     "^Blogcensus" => "",
814     ),
815     "uri" => "http://blogcensus.de/bot/"
816     ),
817     "blogdex" => array(
818     "icon" => "robot",
819     "title" => "Blogdex",
820     "rule" => array(
821     "Blogdex[ /]([0-9.]{1,10})" => "\\1",
822     ),
823     "uri" => ""
824     ),
825     "blogg" => array(
826     "icon" => "blogg",
827     "title" => "Blogg",
828     "rule" => array(
829     "^blogg\.de" => ""
830     ),
831     "uri" => ""
832     ),
833     "blogland" => array(
834     "icon" => "robot",
835     "title" => "BlogLand",
836     "rule" => array(
837     "BlogLand[/ ]([0-9.]{1,10})" => "\\1"
838     ),
839     "uri" => ""
840     ),
841     "bloglines" => array(
842     "icon" => "bloglines",
843     "title" => "Bloglines",
844     "rule" => array(
845     "Bloglines[ /]([0-9.]{1,10})" => "\\1",
846     "Bloglines" => ""
847     ),
848     "uri" => ""
849     ),
850     "blogmap" => array(
851     "icon" => "robot",
852     "title" => "Blogmap",
853     "rule" => array(
854     "blogmap" => ""
855     ),
856     "uri" => ""
857     ),
858     "blogosphere" => array(
859     "icon" => "robot",
860     "title" => "Blogosphere",
861     "rule" => array(
862     "Blogosphere" => ""
863     ),
864     "uri" => ""
865     ),
866     "blogpeople" => array(
867     "icon" => "robot",
868     "title" => "BlogPeople",
869     "rule" => array(
870     "BlogPeople" => ""
871     ),
872     "uri" => ""
873     ),
874     "blogpulse" => array(
875     "icon" => "blogpulse",
876     "title" => "Blogpulse",
877     "rule" => array(
878     "Blogpulse" => ""
879     ),
880     "uri" => ""
881     ),
882     "blogranking" => array(
883     "icon" => "blogranking",
884     "title" => "BlogRanking",
885     "rule" => array(
886     "^BlogRanking(/RSS checker)?" => ""
887     ),
888     "uri" => ""
889     ),
890     "blogs" => array(
891     "icon" => "blogs",
892     "title" => "Blo.gs",
893     "rule" => array(
894     "blo\.gs[ /]([0-9.]{1,10})" => "\\1",
895     "blo\.gs" => ""
896     ),
897     "uri" => ""
898     ),
899     "blogshares" => array(
900     "icon" => "blogshares",
901     "title" => "BlogShares",
902     "rule" => array(
903     "BlogShares[ /]V?([0-9.]{1,10})" => "\\1",
904     "(^| |\()Blogshares(\.com| |\))" => ""
905     ),
906     "uri" => ""
907     ),
908     "blogslife" => array(
909     "icon" => "robot",
910     "title" => "BlogsLife",
911     "rule" => array(
912     "Blogslive" => ""
913     ),
914     "uri" => ""
915     ),
916     "blogsnow" => array(
917     "icon" => "blogsnow",
918     "title" => "BlogsNow",
919     "rule" => array(
920     "blogsnowbot" => "",
921     "BlogsNow" => ""
922     ),
923     "uri" => ""
924     ),
925     "blogstreet" => array(
926     "icon" => "blogstreet",
927     "title" => "BlogStreet",
928     "rule" => array(
929     "^BlogStreetBot" => ""
930     ),
931     "uri" => ""
932     ),
933     "blogsurf" => array(
934     "icon" => "robot",
935     "title" => "BlogSurf",
936     "rule" => array(
937     "nomadscafe_ra[/ ]([0-9.]{1,10})" => "\\1"
938     ),
939     "uri" => ""
940     ),
941     "blogtick" => array(
942     "icon" => "robot",
943     "title" => "BlogTick",
944     "rule" => array(
945     "BlogTickServer" => ""
946     ),
947     "uri" => ""
948     ),
949     "blogwatcher" => array(
950     "icon" => "blogwatcher",
951     "title" => "Blogwatcher",
952     "rule" => array(
953     "blogWatcher_Spider[/ ]([0-9.]{1,10})" => "\\1"
954     ),
955     "uri" => ""
956     ),
957     "blogwise" => array(
958     "icon" => "blogwise",
959     "title" => "Blogwise",
960     "rule" => array(
961     "Blogwise\.com(-MetaChecker)?[/ ]([0-9.]{1,10})" => "\\2"
962     ),
963     "uri" => ""
964     ),
965     "boardreader" => array(
966     "icon" => "boardreader",
967     "title" => "BoardReader",
968     "rule" => array(
969     "BoardReader[ \-](Image|Favicon)[ \-]Fetcher[ /]+([0-9.]{1,10})" => "\\2"
970     ),
971     "uri" => "http://www.boardreader.com"
972     ),
973     "bobby" => array(
974     "icon" => "bobby",
975     "title" => "Bobby",
976     "rule" => array(
977     "bobby[ /]([0-9.]{1,10})" => "\\1"
978     ),
979     "uri" => ""
980     ),
981     "boitho" => array(
982     "icon" => "robot",
983     "title" => "Boitho",
984     "rule" => array(
985     "Boitho\.com[ \-](dc|robot)?[/ ]([0-9.]{1,10})" => "\\2"
986     ),
987     "uri" => ""
988     ),
989     "booch" => array(
990     "icon" => "robot",
991     "title" => "Booch",
992     "rule" => array(
993     "^booch[_ /]([0-9.]{1,10})" => "\\1"
994     ),
995     "uri" => ""
996     ),
997     "book" => array(
998     "icon" => "book",
999     "title" => "Bookmark",
1000     "rule" => array(
1001     "http://www\.bookmark\.ne\.jp" => ""
1002     ),
1003     "uri" => ""
1004     ),
1005     "bookdog" => array(
1006     "icon" => "bookdog",
1007     "title" => "Bookdog",
1008     "rule" => array(
1009     "^Bookdog[ /]([0-9.]{1,10})" => "\\1"
1010     ),
1011     "uri" => ""
1012     ),
1013     "bordermanager" => array(
1014     "icon" => "bordermanager",
1015     "title" => "Border Manager",
1016     "rule" => array(
1017     "BorderManager[ /]([0-9.]{1,10})" => "\\1"
1018     ),
1019     "uri" => ""
1020     ),
1021     "botonparade" => array(
1022     "icon" => "botonparade",
1023     "title" => "Bot on Parade",
1024     "rule" => array(
1025     "BotOnParade" => ""
1026     ),
1027     "uri" => "http://www.bots-on-para.de/bot.html"
1028     ),
1029     "botje" => array(
1030     "icon" => "botje",
1031     "title" => "Botje",
1032     "rule" => array(
1033     "Plukkie[ /]([0-9.]{1,10})" => "\\1"
1034     ),
1035     "uri" => "http://www.botje.com/"
1036     ),
1037     "bottomfeeder" => array(
1038     "icon" => "bottomfeeder",
1039     "title" => "BottomFeeder",
1040     "rule" => array(
1041     "BottomFeeder[ /]([0-9.]{1,10})" => "\\1"
1042     ),
1043     "uri" => ""
1044     ),
1045     "browseremulator" => array(
1046     "icon" => "browseremulator",
1047     "title" => "BrowserEmulator",
1048     "rule" => array(
1049     "BrowserEmulator[ /]([0-9.]{1,10})" => "\\1"
1050     ),
1051     "uri" => "http://www.dejavu.org/emulator.htm"
1052     ),
1053     "browsershots" => array(
1054     "icon" => "browsershots",
1055     "title" => "Browsershots",
1056     "rule" => array(
1057     "Browsershots URL Check" => ""
1058     ),
1059     "uri" => "http://browsershots.org"
1060     ),
1061     "browserspy" => array(
1062     "icon" => "robot",
1063     "title" => "BrowserSpy",
1064     "rule" => array(
1065     "BrowserSpy" => ""
1066     ),
1067     "uri" => ""
1068     ),
1069     "bruinbot" => array(
1070     "icon" => "robot",
1071     "title" => "BruinBot",
1072     "rule" => array(
1073     "BruinBot" => ""
1074     ),
1075     "uri" => ""
1076     ),
1077     "bruno" => array(
1078     "icon" => "robot",
1079     "title" => "Bruno",
1080     "rule" => array(
1081     "^Bruno" => ""
1082     ),
1083     "uri" => ""
1084     ),
1085     "btbot" => array(
1086     "icon" => "btbot",
1087     "title" => "BitTorrent",
1088     "rule" => array(
1089     "BTbot/([0-9.]{1,10})" => "\\1"
1090     ),
1091     "uri" => ""
1092     ),
1093 joku 380 "bubing" => array(
1094     "icon" => "robot",
1095     "title" => "BUbiNG",
1096     "rule" => array(
1097     "BUbiNG" => ""
1098     ),
1099     "uri" => "http://law.di.unimi.it/BUbiNG.html"
1100     ),
1101 joku 63 "builtwith" => array(
1102     "icon" => "builtwith",
1103     "title" => "BuiltWith",
1104     "rule" => array(
1105     "BuiltWith[/ ]([0-9.]{1,10})" => "\\1"
1106     ),
1107     "uri" => "http://builtwith.com/bot.html"
1108     ),
1109     "bulkfeeds" => array(
1110     "icon" => "robot",
1111     "title" => "Bulkfeeds",
1112     "rule" => array(
1113     "Bulkfeeds[/ ]([a-z0-9.]{1,10})" => "\\1"
1114     ),
1115     "uri" => ""
1116     ),
1117     "burf" => array(
1118     "icon" => "burf",
1119     "title" => "Burf.com",
1120     "rule" => array(
1121     "^Norbert the Spider" => ""
1122     ),
1123     "uri" => "http://www.burf.com/"
1124     ),
1125     "butch" => array(
1126     "icon" => "robot",
1127     "title" => "Butch",
1128     "rule" => array(
1129     "Butch(__| )?([a-z0-9.]{1,10})" => "\\2"
1130     ),
1131     "uri" => ""
1132     ),
1133     "buzzlogic" => array(
1134     "icon" => "buzzlogic",
1135     "title" => "Buzzlogic",
1136     "rule" => array(
1137     "BuzzBot[ /]([0-9.]{1,10})" => "\\1"
1138     ),
1139     "uri" => "http://www.buzzlogic.com"
1140     ),
1141     "catchbot" => array(
1142     "icon" => "catchbot",
1143     "title" => "CatchBot",
1144     "rule" => array(
1145     "^CatchBot[/ ]([0-9.]{1,10})" => "\\1"
1146     ),
1147     "uri" => "http://www.catchbot.com"
1148     ),
1149     "camdiscover" => array(
1150     "icon" => "robot",
1151     "title" => "Camdiscover",
1152     "rule" => array(
1153     "^Camcrawler" => ""
1154     ),
1155     "uri" => ""
1156     ),
1157     "cazoodle" => array(
1158     "icon" => "cazoodle",
1159     "title" => "Cazoodle",
1160     "rule" => array(
1161     "^CazoodleBot/(Nutch|CazoodleBot)[/ \-]([0-9.]{1,10})" => "\\2",
1162     "^CazoodleBot[/ ]([a-z0-9.]{1,10})" => "\\1"
1163     ),
1164     "uri" => "http://www.cazoodle.com/cazoodlebot"
1165     ),
1166     "ccbot" => array(
1167     "icon" => "robot",
1168     "title" => "ccBot",
1169     "rule" => array(
1170     "CCBot[/ ]([0-9.]{1,10})" => "\\1"
1171     ),
1172     "uri" => "http://www.commoncrawl.org/bot.html"
1173     ),
1174     "ccgcrawl" => array(
1175     "icon" => "robot",
1176     "title" => "CCGCrawl",
1177     "rule" => array(
1178     "CCGCrawl[/ ]([0-9.]{1,10})" => "\\1"
1179     ),
1180     "uri" => "http://www.myworkbase.com/bot.html"
1181     ),
1182     "cerberian" => array(
1183     "icon" => "robot",
1184     "title" => "Cerberian Drtrs",
1185     "rule" => array(
1186     "^Cerberian Drtrs" => ""
1187     ),
1188     "uri" => ""
1189     ),
1190     "cfnetwork" => array(
1191     "icon" => "robot",
1192     "title" => "CFNetwork", // label for agents matching ^CFNetwork; must not reuse the "cerberian" title
1193     "rule" => array(
1194     "^CFNetwork[/ ]([0-9.]{1,10})" => "\\1"
1195     ),
1196     "uri" => "http://www.cfnetwork.be/"
1197     ),
1198     "charlotte" => array(
1199     "icon" => "charlotte",
1200     "title" => "Charlotte",
1201     "rule" => array(
1202     "Charlotte[/ ]([0-9a-z.]{1,10})" => "\\1"
1203     ),
1204     "uri" => ""
1205     ),
1206     "cirilizator" => array(
1207     "icon" => "cirilizator",
1208     "title" => "Cirilizator",
1209     "rule" => array(
1210     "Cirilizator[/ ]([0-9.]{1,10})" => "\\1"
1211     ),
1212     "uri" => ""
1213     ),
1214     "claria" => array(
1215     "icon" => "robot",
1216     "title" => "Claria",
1217     "rule" => array(
1218     "(Claria|Diamond)(Bot)?[ /]([0-9.]{1,10})" => "\\3",
1219     "(Claria|Diamond)(Bot)" => ""
1220     ),
1221     "uri" => ""
1222     ),
1223     "claymont" => array(
1224     "icon" => "claymont",
1225     "title" => "Claymont",
1226     "rule" => array(
1227     "claymont\.com" => "",
1228     "OliverPerry" => ""
1229     ),
1230     "uri" => "http://www.claymont.com"
1231     ),
1232 joku 377 "clipinc" => array(
1233     "icon" => "clipinc",
1234     "title" => "ClipInc",
1235     "rule" => array(
1236     "ClipInc" => ""
1237     ),
1238     "uri" => "http://tobit.software"
1239     ),
1240 joku 63 "clush" => array(
1241     "icon" => "clush",
1242     "title" => "Clush",
1243     "rule" => array(
1244     "Clus(tered-Search-|h)Bot[ /]([0-9.]{1,10})" => "\\2"
1245     ),
1246     "uri" => ""
1247     ),
1248     "cmsworldmap" => array(
1249     "icon" => "cmsworldmap",
1250     "title" => "CMS World Map",
1251     "rule" => array(
1252     "cmsworldmap" => ""
1253     ),
1254     "uri" => "http://www.cmsworldmap.com/"
1255     ),
1256     "cobion" => array(
1257     "icon" => "robot",
1258     "title" => "Cobion",
1259     "rule" => array(
1260     " (QXW03018|obot)\)" => ""
1261     ),
1262     "uri" => ""
1263     ),
1264     "coccoc" => array(
1265 matthys 287 "icon" => "coccoc",
1266 matthys 209 "title" => "Coccoc",
1267 joku 63 "rule" => array(
1268 matthys 400 "coccoc[ /]([0-9.]{1,10})" => "\\1",
1269     "coccocbot-web[ /]([0-9.]{1,10})" => "\\1"
1270 joku 63 ),
1271 matthys 287 "uri" => "http://help.coccoc.com"
1272 joku 63 ),
1273     "coldfusion" => array(
1274     "icon" => "coldfusion",
1275     "title" => "ColdFusion",
1276     "rule" => array(
1277     "^coldfusion" => ""
1278     ),
1279     "uri" => ""
1280     ),
1281     "combine" => array(
1282     "icon" => "robot",
1283     "title" => "Combine",
1284     "rule" => array(
1285     "Combine[ /]([0-9.]{1,10})" => "\\1"
1286     ),
1287     "uri" => ""
1288     ),
1289     "combot" => array(
1290     "icon" => "robot",
1291     "title" => "comBot",
1292     "rule" => array(
1293     "^comBot[ /]([0-9.]{1,10})" => "\\1"
1294     ),
1295     "uri" => ""
1296     ),
1297     "comet" => array(
1298     "icon" => "comet",
1299     "title" => "Comet",
1300     "rule" => array(
1301     "cometsearch@cometsystems" => ""
1302     ),
1303     "uri" => ""
1304     ),
1305     "commerobo" => array(
1306     "icon" => "robot",
1307     "title" => "Commerobo",
1308     "rule" => array(
1309     "Commerobo[/ ]([0-9.]{1,10})" => "\\1"
1310     ),
1311     "uri" => ""
1312     ),
1313     "comrite" => array(
1314     "icon" => "robot",
1315     "title" => "ComRite",
1316     "rule" => array(
1317     "Comrite[/ ]([0-9.]{1,10})" => "\\1"
1318     ),
1319     "uri" => "http://www.comrite.com/"
1320     ),
1321     "convera" => array(
1322     "icon" => "convera",
1323     "title" => "Convera",
1324     "rule" => array(
1325     "Convera(MultiMedia)?Crawler[/ ]([0-9.]{1,10})" => "\\2",
1326     "Convera Internet Spider V([0-9.]{1,10})" => "\\1"
1327     ),
1328     "uri" => ""
1329     ),
1330     "coolbot" => array(
1331     "icon" => "robot",
1332     "title" => "CoolBot",
1333     "rule" => array(
1334     "^CoolBot" => ""
1335     ),
1336     "uri" => ""
1337     ),
1338     "cosmix" => array(
1339     "icon" => "robot",
1340     "title" => "Cosmix",
1341     "rule" => array(
1342     "^(voyager|cfetch|CosmixCrawler|carleson)[/ ]([0-9.]{1,10})" => "\\2",
1343     ),
1344     "uri" => ""
1345     ),
1346     "cosmos" => array(
1347     "icon" => "robot",
1348     "title" => "Cosmos",
1349     "rule" => array(
1350     "^cosmos" => ""
1351     ),
1352     "uri" => ""
1353     ),
1354     "cosmoty" => array(
1355     "icon" => "robot",
1356     "title" => "Cosmoty",
1357     "rule" => array(
1358     "^beautybot[/ ]([0-9.]{1,10})" => "\\1"
1359     ),
1360     "uri" => "http://www.uchoose.de/crawler/beautybot/"
1361     ),
1362     "covario" => array(
1363     "icon" => "covario",
1364     "title" => "Covario",
1365     "rule" => array(
1366     "Covario-IDS[/ ]([0-9.]{1,10})" => "\\1"
1367     ),
1368     "uri" => "http://www.covario.com/ids/"
1369     ),
1370     "creativecommons" => array(
1371     "icon" => "creativecommons",
1372     "title" => "Creative Commons",
1373     "rule" => array(
1374     "CreativeCommons[/ ]([0-9.]{1,6}(-dev)?)" => "\\1"
1375     ),
1376     "uri" => ""
1377     ),
1378     "cscrawler" => array(
1379     "icon" => "robot",
1380     "title" => "CsCrawler",
1381     "rule" => array(
1382     "CsCrawler" => ""
1383     ),
1384     "uri" => "http://www.kde.cs.uni-kassel.de/lehre/ss2005/googlespam/crawler.html"
1385     ),
1386 joku 111 "jigsaw" => array(
1387     "icon" => "jigsaw",
1388     "title" => "Jigsaw",
1389     "rule" => array(
1390     "Jigsaw[ /]([0-9.]{1,10})" => "\\1"
1391     ),
1392     "uri" => "http://jigsaw.w3.org/css-validator/"
1393     ),
1394 joku 63 "csscheck" => array(
1395     "icon" => "w3c",
1396     "title" => "W3C CSS Validator",
1397     "rule" => array(
1398     "CSS(Check|_Validator).+[ /]([0-9.]{1,10})" => "\\2"
1399     ),
1400     "uri" => "http://jigsaw.w3.org/css-validator/"
1401     ),
1402     "custo" => array(
1403     "icon" => "robot",
1404     "title" => "Custo",
1405     "rule" => array(
1406     "Custo[ /]([0-9.]{1,10})" => "\\1"
1407     ),
1408     "uri" => ""
1409     ),
1410     "cybernavi" => array(
1411     "icon" => "robot",
1412     "title" => "CyberNavi",
1413     "rule" => array(
1414     "CyberNavi_WebGet[ /]([0-9.]{1,10})" => "\\1"
1415     ),
1416     "uri" => ""
1417     ),
1418     "cyberpatrol" => array(
1419     "icon" => "cyberpatrol",
1420     "title" => "CyberPatrol",
1421     "rule" => array(
1422     "^CyberPatrol" => ""
1423     ),
1424     "uri" => "http://www.cyberpatrol.com/cyberpatrolcrawler.asp"
1425     ),
1426     "cyberz" => array(
1427     "icon" => "cyberz",
1428     "title" => "Cyberz",
1429     "rule" => array(
1430     "Cyberz Communication Agent" => ""
1431     ),
1432     "uri" => ""
1433     ),
1434     "cydral" => array(
1435     "icon" => "robot",
1436     "title" => "Cydral",
1437     "rule" => array(
1438     "CydralSpider[ /]([0-9.]{1,10})" => "\\1"
1439     ),
1440     "uri" => ""
1441     ),
1442     "cynthia" => array(
1443     "icon" => "cynthia",
1444     "title" => "Cynthia Says",
1445     "rule" => array(
1446     "Cynthia[ /]([0-9.]{1,10})" => "\\1"
1447     ),
1448     "uri" => ""
1449     ),
1450     "d4x" => array(
1451     "icon" => "d4x",
1452     "title" => "Downloader for X",
1453     "rule" => array(
1454     "Downloader for X[ /]([0-9.]{1,10})" => "\\1"
1455     ),
1456     "uri" => ""
1457     ),
1458     "da" => array(
1459     "icon" => "da",
1460     "title" => "DA",
1461     "rule" => array(
1462     "^DA[ /]([0-9.]{1,10})" => "\\1"
1463     ),
1464     "uri" => ""
1465     ),
1466     "daum" => array(
1467     "icon" => "daum",
1468     "title" => "DAUM",
1469     "rule" => array(
1470     "DAUMOA[ /]([0-9.]{1,10})" => "\\1",
1471 joku 379 "Daum[ /]([0-9.]{1,10})" => "\\1",
1472 joku 63 "DAUM Web Robot" => "",
1473 joku 339 "daum\.net" => "", // dot escaped so only the literal domain matches
1474 joku 63 "Daum Communications Corp" => "",
1475     "EDI[ /]([0-9.]{1,10})" => "\\1",
1476     "Edacious.*Intelligent Web Robot" => "",
1477     "RaBot[/ ]([0-9.]{1,10}) Agent" => "\\1"
1478     ),
1479     "uri" => "http://ws.daum.net/"
1480     ),
1481     "daypop" => array(
1482     "icon" => "robot",
1483     "title" => "Daypop",
1484     "rule" => array(
1485     "daypopbot[/ ]([0-9.]{1,10})" => "\\1"
1486     ),
1487     "uri" => ""
1488     ),
1489     "delfi" => array(
1490     "icon" => "delfi",
1491     "title" => "Delfi",
1492     "rule" => array(
1493     "crawl at delfi dot lt" => ""
1494     ),
1495     "uri" => ""
1496     ),
1497     "depspid" => array(
1498     "icon" => "depspid",
1499     "title" => "DepSpid",
1500     "rule" => array(
1501     "DepSpid[/ ]([0-9.]{1,10})" => "\\1"
1502     ),
1503     "uri" => ""
1504     ),
1505     "devonagent" => array(
1506     "icon" => "devonagent",
1507     "title" => "DEVONagent",
1508     "rule" => array(
1509     "DEVONtech" => ""
1510     ),
1511     "uri" => ""
1512     ),
1513     "diffbot" => array(
1514     "icon" => "diffbot",
1515     "title" => "Diffbot",
1516     "rule" => array(
1517     " Diffbot" => ""
1518     ),
1519     "uri" => "http://www.diffbot.com"
1520     ),
1521     "diribot" => array(
1522     "icon" => "diribot",
1523     "title" => "Diri",
1524     "rule" => array(
1525     "diribot" => ""
1526     ),
1527     "uri" => "http://www.diri.bg"
1528     ),
1529     "directhit" => array(
1530     "icon" => "robot",
1531     "title" => "Direct Hit",
1532     "rule" => array(
1533     "EZResult -- Internet Search Engine" => ""
1534     ),
1535     "uri" => "http://www.directhit.com"
1536     ),
1537     "disco" => array(
1538     "icon" => "disco",
1539 matthys 209 "title" => "Disco",
1540 joku 63 "rule" => array(
1541     "disco/Nutch[/ -]([0-9.]{1,10})" => "\\1",
1542     "discobot[/ -]([0-9.]{1,10})" => "\\1",
1543     "disco-crawl@discoveryengine\.com" => "" // dot escaped so only the literal contact address matches
1544     ),
1545     "uri" => "http://www.discoveryengine.com/"
1546     ),
1547     "discopump" => array(
1548     "icon" => "robot",
1549     "title" => "DISCo Pump",
1550     "rule" => array(
1551     "DISCo Pump[/ ]([0-9.]{1,10})" => "\\1"
1552     ),
1553     "uri" => ""
1554     ),
1555     "dkimreputation" => array(
1556     "icon" => "dkimreputation",
1557     "title" => "DKIM Reputation",
1558     "rule" => array(
1559     "DKIMRepBot[ /]([0-9.]{1,10})" => "\\1"
1560     ),
1561     "uri" => "http://www.dkim-reputation.org"
1562     ),
1563     "dnsdigger" => array(
1564     "icon" => "dnsdigger",
1565     "title" => "DNS-Digger",
1566     "rule" => array(
1567     "DNS-Digger-Explorer[ /]([0-9.]{1,10})" => "\\1"
1568     ),
1569     "uri" => "http://www.dnsdigger.com"
1570     ),
1571     "dnsvalidation" => array(
1572     "icon" => "dnsvalidation",
1573     "title" => "DNS Validation",
1574     "rule" => array(
1575     "DNSValidation[ /]([0-9.]{1,10})" => "\\1"
1576     ),
1577     "uri" => "http://www.dnsvalidation.com/"
1578     ),
1579     "doctorhtml" => array(
1580     "icon" => "robot",
1581     "title" => "DoctorHTML",
1582     "rule" => array(
1583     "Doctor[ \-]?HTML" => ""
1584     ),
1585     "uri" => ""
1586     ),
1587     "dolphin" => array(
1588     "icon" => "dolphin",
1589     "title" => "Dolphin",
1590     "rule" => array(
1591     "Dolphin[ /]([0-9.]{1,10})" => "\\1"
1592     ),
1593     "uri" => "http://telehouse.ru/crawler.html"
1594     ),
1595     "domaindatei" => array(
1596     "icon" => "robot",
1597     "title" => "Domaindatei",
1598     "rule" => array(
1599     "DomaindateiSpider[ /]([0-9.]{1,10})" => "\\1"
1600     ),
1601     "uri" => ""
1602     ),
1603     "dontbuylists" => array(
1604     "icon" => "dontbuylists",
1605     "title" => "Dontbuylists",
1606     "rule" => array(
1607     "DBLBot[ /]([0-9.]{1,10})" => "\\1"
1608     ),
1609     "uri" => "http://www.dontbuylists.com"
1610     ),
1611     "dotbot" => array(
1612     "icon" => "robot",
1613     "title" => "DotBot",
1614     "rule" => array(
1615     "DotBot[ /]([0-9.]{1,10})" => "\\1"
1616     ),
1617     "uri" => "http://www.dotnetdotcom.org"
1618     ),
1619     "doweb" => array(
1620     "icon" => "doweb",
1621     "title" => "DoWeb",
1622     "rule" => array(
1623     "^www\.doweb\.co\.uk" => "" // dots escaped so only the literal host name matches
1624     ),
1625     "uri" => "http://www.doweb.co.uk/"
1626     ),
1627     "downforeveryoneorjustme" => array(
1628     "icon" => "downforeveryoneorjustme",
1629     "title" => "Down for everyone or just me",
1630     "rule" => array(
1631     "downforeveryoneorjustme" => ""
1632     ),
1633     "uri" => "http://www.downforeveryoneorjustme.com"
1634     ),
1635     "downloadninja" => array(
1636     "icon" => "robot",
1637     "title" => "Download Ninja",
1638     "rule" => array(
1639     "Download Ninja[ /]([0-9.]{1,10})" => "\\1"
1640     ),
1641     "uri" => ""
1642     ),
1643     "drupal" => array(
1644     "icon" => "drupal",
1645     "title" => "Drupal",
1646     "rule" => array(
1647     "^Drupal" => ""
1648     ),
1649     "uri" => ""
1650     ),
1651     "dsns" => array(
1652     "icon" => "robot",
1653     "title" => "DSNS Scanner",
1654     "rule" => array(
1655     "^DSNS" => ""
1656     ),
1657     "uri" => ""
1658     ),
1659     "dtsagent" => array(
1660     "icon" => "robot",
1661     "title" => "DTS Agent",
1662     "rule" => array(
1663     "DTS Agent" => ""
1664     ),
1665     "uri" => ""
1666     ),
1667 matthys 342 "duckduckgo" => array(
1668     "icon" => "duckduckgo",
1669     "title" => "DuckDuckGo",
1670     "rule" => array(
1671 matthys 397 "DuckDuckGo-Favicons-Bot[ /]([0-9.]{1,10})" => "\\1",
1672     "DuckDuckBot-Https[ /]([0-9.]{1,10})" => "\\1"
1673 matthys 342 ),
1674     "uri" => "http://duckduckgo.com"
1675     ),
1676 joku 63 "earthcom" => array(
1677     "icon" => "earthcom",
1678     "title" => "Earthcom",
1679     "rule" => array(
1680     "EARTHCOM\.info[/ ]([0-9a-z.]{1,10})" => "\\1"
1681     ),
1682     "uri" => ""
1683     ),
1684     "ebay" => array(
1685     "icon" => "ebay",
1686     "title" => "eBay",
1687     "rule" => array(
1688     "eBay Relevance Ad Crawler" => ""
1689     ),
1690     "uri" => ""
1691     ),
1692     "echo" => array(
1693     "icon" => "robot",
1694     "title" => "Echo.com",
1695     "rule" => array(
1696     "_TrueRobot[/ ]([0-9.]{1,10})" => "\\1"
1697     ),
1698     "uri" => "http://www.echo.com/"
1699     ),
1700     "eert" => array(
1701     "icon" => "robot",
1702 matthys 209 "title" => "Eert",
1703 joku 63 "rule" => array(
1704     "eert spdr[/ ]([0-9.]{1,10})" => "\\1"
1705     ),
1706     "uri" => "http://bot.eert.net"
1707     ),
1708     "eknip" => array(
1709     "icon" => "eknip",
1710     "title" => "E-Knip",
1711     "rule" => array(
1712     "eknip[ /]([0-9a-z.]{1,10})" => "\\1"
1713     ),
1714     "uri" => ""
1715     ),
1716     "zoominfo" => array(
1717     "icon" => "zoominfo",
1718 matthys 209 "title" => "ZoomInfo", // Previously called Eliyon
1719 joku 63 "rule" => array(
1720     "NextGenSearchBot[/ ]([0-9.]{1,10})" => "\\1"
1721     ),
1722     "uri" => "http://www.zoominfo.com/business/nextgensearchbot.html"
1723     ),
1724     "emeraldshield" => array(
1725     "icon" => "emeraldshield",
1726     "title" => "EmeraldShield",
1727     "rule" => array(
1728     "^EmeraldShield" => ""
1729     ),
1730     "uri" => ""
1731     ),
1732     "empas" => array(
1733     "icon" => "empas",
1734     "title" => "Empas",
1735     "rule" => array(
1736     "DigExt; empas\)$" => "",
1737     "^EMPAS[_\-]ROBOT" => ""
1738     ),
1739     "uri" => ""
1740     ),
1741 matthys 409 "entfer" => array(
1742     "icon" => "entfer",
1743     "title" => "Entfer",
1744     "rule" => array(
1745     "EntferBot[ /]([0-9.]{1,10})" => "\\1"
1746     ),
1747     "uri" => "https://entfer.com"
1748     ),
1749 joku 63 "entireweb" => array(
1750     "icon" => "entireweb",
1751     "title" => "Entireweb",
1752     "rule" => array(
1753     "Speedy[ ]?Spider" => ""
1754     ),
1755     "uri" => ""
1756     ),
1757     "envolk" => array(
1758     "icon" => "envolk",
1759     "title" => "Envolk",
1760     "rule" => array(
1761     "envolk\[ITS\]spider[/ ]([0-9.]{1,10})" => "\\1",
1762     "envolk[/ ]([0-9.]{1,10})" => "\\1"
1763     ),
1764     "uri" => ""
1765     ),
1766     "esnet" => array(
1767     "icon" => "robot",
1768     "title" => "ES.NET",
1769     "rule" => array(
1770     "ES\.NET Crawler[ /]([0-9.]{1,10})" => "\\1" // dot escaped so only the literal "ES.NET" matches
1771     ),
1772     "uri" => ""
1773     ),
1774     "estyle" => array(
1775     "icon" => "estyle",
1776     "title" => "eStyle Search",
1777     "rule" => array(
1778     "eStyleSearch[ /]([0-9.]{1,10})" => "\\1"
1779     ),
1780     "uri" => ""
1781     ),
1782     "eurip" => array(
1783     "icon" => "robot",
1784     "title" => "Eurip",
1785     "rule" => array(
1786     "EuripBot[ /]([0-9.]{1,10})" => "\\1"
1787     ),
1788     "uri" => "http://www.eurip.com"
1789     ),
1790     "eurodirectory" => array(
1791     "icon" => "robot",
1792     "title" => "Euro Directory",
1793     "rule" => array(
1794     "www\.euro-directory\.com" => ""
1795     ),
1796     "uri" => "http://www.euro-directory.com/"
1797     ),
1798     "euroseek" => array(
1799     "icon" => "euroseek",
1800     "title" => "EuroSeek",
1801     "rule" => array(
1802     "Arachnoidea" => ""
1803     ),
1804     "uri" => ""
1805     ),
1806     "evaal" => array(
1807     "icon" => "evaal",
1808     "title" => "Evaal",
1809     "rule" => array(
1810     "^EvaalSE" => ""
1811     ),
1812     "uri" => "http://www.evaal.com/"
1813     ),
1814     "eventax" => array(
1815     "icon" => "eventax",
1816     "title" => "Eventax",
1817     "rule" => array(
1818     "^eventax[ /]([0-9.]{1,10})" => "\\1"
1819     ),
1820     "uri" => "http://www.eventax.de/"
1821     ),
1822     "everbee" => array(
1823     "icon" => "everbee",
1824     "title" => "Everbee",
1825     "rule" => array(
1826     "EverbeeCrawler" => ""
1827     ),
1828     "uri" => ""
1829     ),
1830     "everest" => array(
1831     "icon" => "everest",
1832     "title" => "Everest",
1833     "rule" => array(
1834     "Everest-Vulcan Inc\.[ /]([0-9.]{1,10})" => "\\1" // dot after "Inc" escaped so it matches literally
1835     ),
1836     "uri" => ""
1837     ),
1838     "exabot" => array(
1839     "icon" => "exabot",
1840     "title" => "ExaBot",
1841     "rule" => array(
1842     "^NG[ /]([0-9.]{1,10})" => "\\1",
1843     "Exabot/([0-9.]{1,10})" => "\\1",
1844     "ExaBotTest/([0-9.]{1,10})" => "\\1",
1845     "ExaBot-(Test|Images)/([0-9.]{1,10})" => "\\2",
1846     "ExaBot-Thumbnails" => ""
1847     ),
1848     "uri" => "http://www.exabot.com/go/robot"
1849     ),
1850     "exactseek" => array(
1851     "icon" => "exactseek",
1852     "title" => "ExactSeek",
1853     "rule" => array(
1854     "^exactseek[ \-]?(pagereaper|crawler)[ \-]?([0-9.]{1,10})" => "\\2",
1855     "ExactSeek[ \.\-]?(Crawler|com)" => ""
1856     ),
1857     "uri" => "http://www.exactseek.com/"
1858     ),
1859     "excite" => array(
1860     "icon" => "excite",
1861     "title" => "Excite",
1862     "rule" => array(
1863     "Architext[ \-]?Spider" => ""
1864     ),
1865     "uri" => ""
1866     ),
1867     "execrawl" => array(
1868     "icon" => "robot",
1869     "title" => "Execrawl",
1870     "rule" => array(
1871     "Execrawl[ /]([0-9.]{1,10})" => "\\1",
1872     "Execrawl" => ""
1873     ),
1874     "uri" => ""
1875     ),
1876     "expertmonitor" => array(
1877     "icon" => "robot",
1878     "title" => "ExpertMonitor",
1879     "rule" => array(
1880     "^NetMonitor[ /]([0-9.]{1,10})" => "\\1"
1881     ),
1882     "uri" => ""
1883     ),
1884     "explorerrss" => array(
1885     "icon" => "robot",
1886     "title" => "Explorer RSS",
1887     "rule" => array(
1888     "^Windows-RSS-Platform[ /]([0-9.]{1,10})" => "\\1"
1889     ),
1890     "uri" => ""
1891     ),
1892     "ezooms" => array(
1893     "icon" => "robot",
1894     "title" => "Ezooms",
1895     "rule" => array(
1896     "ezooms[/ ]([0-9a-z.\-]{1,10})" => "\\1"
1897     ),
1898     "uri" => ""
1899     ),
1900     "facebook" => array(
1901     "icon" => "facebook",
1902     "title" => "Facebook",
1903     "rule" => array(
1904     "FacebookFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
1905     "facebookexternalhit/([0-9.]{1,10})" => "\\1",
1906     "^facebook" => ""
1907     ),
1908     "uri" => "http://www.facebook.com/"
1909     ),
1910     "fast" => array(
1911     "icon" => "fast",
1912     "title" => "Fast",
1913     "rule" => array(
1914     "^FAST( Enterprise |-Web| MetaWeb )?Crawler[ /]([0-9.]{1,10})" => "\\2",
1915     "^FAST( Enterprise |-Web| MetaWeb | PartnerSite )?Crawler" => "",
1916     "^Fast Crawler" => "",
1917     "^libwww-perl[ /]([0-9.]{1,10}) FP[ /]([0-9.]{1,10})" => "\\2"
1918     ),
1919     "uri" => "http://www.alltheweb.com/"
1920     ),
1921     "fastbuzz" => array(
1922     "icon" => "fastbuzz",
1923     "title" => "Fastbuzz",
1924     "rule" => array(
1925     "^fastbuzz\.com" => ""
1926     ),
1927     "uri" => ""
1928     ),
1929     "favorg" => array(
1930     "icon" => "robot",
1931     "title" => "FavOrg",
1932     "rule" => array(
1933     "^FavOrg" => ""
1934     ),
1935     "uri" => ""
1936     ),
1937     "favorstar" => array(
1938     "icon" => "favorstar",
1939 matthys 209 "title" => "Favorstar",
1940 joku 63 "rule" => array(
1941     "favorstarbot[ /]([0-9.]{1,10})" => "\\1"
1942     ),
1943     "uri" => "http://favorstar.com/bot.html"
1944     ),
1945     "faxo" => array(
1946     "icon" => "robot",
1947     "title" => "Faxo",
1948     "rule" => array(
1949     "^Faxobot[ /]([0-9.]{1,10})" => "\\1"
1950     ),
1951     "uri" => "http://www.faxo.com/"
1952     ),
1953     "fdse" => array(
1954     "icon" => "robot",
1955     "title" => "FDSE Robot",
1956     "rule" => array(
1957     "FDSE[ \-]?robot" => ""
1958     ),
1959     "uri" => ""
1960     ),
1961     "feedback" => array(
1962     "icon" => "robot",
1963     "title" => "FeedBack",
1964     "rule" => array(
1965     "FeedBack[/ ]([0-9.]{1,10})" => "\\1"
1966     ),
1967     "uri" => ""
1968     ),
1969     "feedburner" => array(
1970     "icon" => "feedburner",
1971     "title" => "FeedBurner",
1972     "rule" => array(
1973     "^FeedBurner[/ ]([0-9.]{1,10})" => "\\1"
1974     ),
1975     "uri" => ""
1976     ),
1977     "feeddemon" => array(
1978     "icon" => "feeddemon",
1979     "title" => "FeedDemon",
1980     "rule" => array(
1981     "FeedDemon[/ ]([0-9.]{1,10})" => "\\1"
1982     ),
1983     "uri" => ""
1984     ),
1985     "feedfind" => array(
1986     "icon" => "feedfind",
1987     "title" => "FeedFind",
1988     "rule" => array(
1989     "Feed::Find[ /]([0-9.]{1,10})" => "\\1"
1990     ),
1991     "uri" => ""
1992     ),
1993     "feedonfeeds" => array(
1994     "icon" => "robot",
1995     "title" => "Feed On Feeds",
1996     "rule" => array(
1997     "FeedOnFeeds[/ ]([0-9.]{1,10})" => "\\1"
1998     ),
1999     "uri" => ""
2000     ),
2001     "feedparser" => array(
2002     "icon" => "robot",
2003     "title" => "Feedparser",
2004     "rule" => array(
2005     "UniversalFeedParser[/ ]([0-9a-z.\-]{1,10})" => "\\1",
2006     "FeedParser" => ""
2007     ),
2008     "uri" => ""
2009     ),
2010     "feedreader" => array(
2011     "icon" => "feedreader",
2012     "title" => "Feedreader",
2013     "rule" => array(
2014     "^Feedreader" => ""
2015     ),
2016     "uri" => ""
2017     ),
2018     "feedserver" => array(
2019     "icon" => "robot",
2020     "title" => "FeedServer",
2021     "rule" => array(
2022     "FeedServer[/ ]([0-9.]{1,10})" => "\\1"
2023     ),
2024     "uri" => ""
2025     ),
2026     "feedster" => array(
2027     "icon" => "feedster",
2028     "title" => "Feedster",
2029     "rule" => array(
2030     "Feedster Crawler[/ ]([0-9.]{1,10})" => "\\1"
2031     ),
2032     "uri" => ""
2033     ),
2034     "feedvalidator" => array(
2035     "icon" => "feedvalidator",
2036     "title" => "Feed Validator",
2037     "rule" => array(
2038     "^FeedValidator[/ ]([0-9.]{1,10})" => "\\1"
2039     ),
2040     "uri" => ""
2041     ),
2042     "fdm" => array(
2043     "icon" => "robot",
2044     "title" => "Free Download Manager",
2045     "rule" => array(
2046     "^FDM[/ ]([0-9a-z.]{1,10})" => "\\1"
2047     ),
2048     "uri" => ""
2049     ),
2050     "filangy" => array(
2051     "icon" => "robot",
2052     "title" => "Filangy",
2053     "rule" => array(
2054     "Filangy[/ ]([0-9.]{1,10})" => "\\1"
2055     ),
2056     "uri" => "http://www.filangy.com/"
2057     ),
2058     "findanisp" => array(
2059     "icon" => "robot",
2060     "title" => "FindAnISP",
2061     "rule" => array(
2062     "FindAnISP" => ""
2063     ),
2064     "uri" => "http://www.findanisp.com/"
2065     ),
2066     "findengines" => array(
2067     "icon" => "findengines",
2068     "title" => "FindEngines",
2069     "rule" => array(
2070     "FindEngines! Bot" => ""
2071     ),
2072     "uri" => ""
2073     ),
2074     "findexa" => array(
2075     "icon" => "findexa",
2076     "title" => "Findexa",
2077     "rule" => array(
2078     "Findexa Crawler" => ""
2079     ),
2080     "uri" => ""
2081     ),
2082     "findlinks" => array(
2083     "icon" => "findlinks",
2084     "title" => "FindLinks",
2085     "rule" => array(
2086     "findlinks[ /]([0-9.]{1,10})" => "\\1",
2087     "^FindLinks" => ""
2088     ),
2089     "uri" => ""
2090     ),
2091     "findoor" => array(
2092     "icon" => "findoor",
2093 matthys 209 "title" => "Findoor",
2094 joku 63 "rule" => array(
2095     "^findoor(-Bot)?" => "" // group 1 is the optional "-Bot" suffix, not a version, so no backreference
2096     ),
2097     "uri" => ""
2098     ),
2099     "firefly" => array(
2100     "icon" => "firefly",
2101     "title" => "Firefly",
2102     "rule" => array(
2103     "Firefly" => ""
2104     ),
2105     "uri" => ""
2106     ),
2107     "flashget" => array(
2108     "icon" => "flashget",
2109     "title" => "FlashGet",
2110     "rule" => array(
2111     "^FlashGet" => ""
2112     ),
2113     "uri" => ""
2114     ),
2115     "flatland" => array(
2116     "icon" => "flatland",
2117     "title" => "Flatland",
2118     "rule" => array(
2119     "^flatlandbot" => ""
2120     ),
2121     "uri" => "http://www.flatlandindustries.com/flatlandbot"
2122     ),
2123     "flickbot" => array(
2124     "icon" => "flickbot",
2125     "title" => "FlickBot",
2126     "rule" => array(
2127     "FlickBot[ /]([0-9.]{1,10})" => "\\1"
2128     ),
2129     "uri" => ""
2130     ),
2131     "flightdeckreports" => array(
2132     "icon" => "flightdeckreports",
2133     "title" => "Flight Deck Reports",
2134     "rule" => array(
2135     "FlightDeckReportsBot[ /]([0-9.]{1,10})" => "\\1"
2136     ),
2137     "uri" => "http://www.flightdeckreports.com/"
2138     ),
2139     "forex" => array(
2140     "icon" => "robot",
2141     "title" => "Forex",
2142     "rule" => array(
2143     "^Forex Trading Network Organization" => ""
2144     ),
2145     "uri" => "http://www.netforex.org/"
2146     ),
2147     "freshmeat" => array(
2148     "icon" => "freshmeat",
2149 matthys 209 "title" => "Freshmeat",
2150 joku 63 "rule" => array(
2151     "fmII URL validator[ /]([0-9.]{1,10})" => "\\1",
2152     "freshmeat\.net URL validator[ /]([0-9.]{1,10})" => "\\1" // dot escaped so only the literal domain matches
2153     ),
2154     "uri" => "http://www.freshmeat.net/"
2155     ),
2156     "friend" => array(
2157     "icon" => "friend",
2158     "title" => "Friend",
2159     "rule" => array(
2160     "www\.friend\.fr" => ""
2161     ),
2162     "uri" => "http://www.friend.fr/"
2163     ),
2164     "frontier" => array(
2165     "icon" => "frontier",
2166     "title" => "Frontier",
2167     "rule" => array(
2168     "Frontier[ /]([0-9.]{1,10})" => "\\1"
2169     ),
2170     "uri" => ""
2171     ),
2172     "fyberspider" => array(
2173     "icon" => "robot",
2174     "title" => "FyberSpider",
2175     "rule" => array(
2176     "FyberSpider[ /]([0-9.]{1,10})" => "\\1"
2177     ),
2178     "uri" => "http://www.fyberspider.com/"
2179     ),
2180     "gaisbot" => array(
2181     "icon" => "gais",
2182     "title" => "Gaisbot",
2183     "rule" => array(
2184     "Gaisbot[ /]([0-9.]{1,10})" => "\\1"
2185     ),
2186     "uri" => ""
2187     ),
2188     "galaxy" => array(
2189     "icon" => "galaxy",
2190     "title" => "Galaxy",
2191     "rule" => array(
2192     "GalaxyBot[ /]([0-9.]{1,10})" => "\\1",
2193     "www\.galaxy\.com" => "" // dots escaped so only the literal host name matches
2194     ),
2195     "uri" => "http://www.galaxy.com/"
2196     ),
2197     "gamespy" => array(
2198     "icon" => "gamespy",
2199     "title" => "GameSpy",
2200     "rule" => array(
2201     "GameSpyHTTP[ /]([0-9.]{1,10})" => "\\1"
2202     ),
2203     "uri" => ""
2204     ),
2205     "garlik" => array(
2206     "icon" => "garlik",
2207     "title" => "Garlik",
2208     "rule" => array(
2209     "GarlikCrawler[ /]([0-9.]{1,10})" => "\\1"
2210     ),
2211     "uri" => "http://garlik.com/"
2212     ),
2213     "gdesktop" => array(
2214     "icon" => "gdesktop",
2215     "title" => "Google Desktop",
2216     "rule" => array(
2217     "compatible; Google Desktop" => ""
2218     ),
2219     "uri" => ""
2220     ),
2221     "genome" => array(
2222     "icon" => "robot",
2223     "title" => "Genome Machine",
2224     "rule" => array(
2225     "Genome[ \-]?Machine" => ""
2226     ),
2227     "uri" => ""
2228     ),
2229     "geohash" => array(
2230     "icon" => "geohash",
2231     "title" => "Geohash",
2232     "rule" => array(
2233     "GeoHasher(/Nutch)[ /-]([0-9.]{1,10})" => "\\2"
2234     ),
2235     "uri" => "http://geohash.org/"
2236     ),
2237     "geona" => array(
2238     "icon" => "robot",
2239     "title" => "Geona",
2240     "rule" => array(
2241     "GeonaBot[ /]([0-9.]{1,10})" => "\\1"
2242     ),
2243     "uri" => ""
2244     ),
2245     "geoblog" => array(
2246     "icon" => "robot",
2247     "title" => "The World as a Blog",
2248     "rule" => array(
2249     "The World as a Blog" => ""
2250     ),
2251     "uri" => ""
2252     ),
2253     "geourl" => array(
2254     "icon" => "geourl",
2255     "title" => "GeoUrl",
2256     "rule" => array(
2257     "geourl[ /]([0-9.]{1,10})" => "\\1",
2258     "^GeoURLBot[ /]([0-9.]{1,10})" => "\\1",
2259     ),
2260     "uri" => ""
2261     ),
2262     "getnetwise" => array(
2263     "icon" => "robot",
2264     "title" => "GetNetWise",
2265     "rule" => array(
2266     " Crayon Crawler" => ""
2267     ),
2268     "uri" => ""
2269     ),
2270     "getright" => array(
2271     "icon" => "getright",
2272     "title" => "GetRight",
2273     "rule" => array(
2274     "GetRight[ /]([0-9.]{1,10})" => "\\1"
2275     ),
2276     "uri" => ""
2277     ),
2278     "getsmart" => array(
2279     "icon" => "getsmart",
2280     "title" => "GetSmart",
2281     "rule" => array(
2282     "GetSmart[ /]([0-9.]{1,10})" => "\\1"
2283     ),
2284     "uri" => ""
2285     ),
2286     "gigabot" => array(
2287     "icon" => "gigablast",
2288     "title" => "Gigablast",
2289     "rule" => array(
2290     "(Gigabot|Sitesearch)[/ ]([0-9.]{1,10})" => "\\2",
2291     "GigabotSiteSearch[/ ]([0-9.]{1,10})" => "\\1",
2292 joku 336 "GigablastOpenSource" => ""
2293 joku 63 ),
2294     "uri" => ""
2295 matthys 328 ),
2296     "gimme" => array(
2297     "icon" => "gimme",
2298     "title" => "gimmeUSA",
2299     "rule" => array(
2300     "Gimme60bot[ /]([0-9.]{1,10})" => "\\1"
2301     ),
2302     "uri" => "http://gimme60.com"
2303 joku 63 ),
2304 matthys 328 "ginger" => array(
2305     "icon" => "ginger",
2306     "title" => "GingerCrawler",
2307     "rule" => array(
2308     "GingerCrawler[ /]([0-9.]{1,10})" => "\\1"
2309     ),
2310     "uri" => "http://www.gingersoftware.com/crawler_agent.htm"
2311     ),
2312 joku 63 "girafabot" => array(
2313     "icon" => "girafa",
2314     "title" => "Girafa",
2315     "rule" => array(
2316     "Girafabot" => ""
2317     ),
2318     "uri" => ""
2319     ),
2320     "globalspec" => array(
2321     "icon" => "globalspec",
2322     "title" => "GlobalSpec",
2323     "rule" => array(
2324     "Ocelli[ /]([0-9.]{1,10})" => "\\1"
2325     ),
2326     "uri" => ""
2327     ),
2328     "glucose" => array(
2329     "icon" => "glucose",
2330     "title" => "Glucose",
2331     "rule" => array(
2332     "glucose[ /]([0-9a-z.\-]{1,10})" => "\\1"
2333     ),
2334     "uri" => ""
2335     ),
2336     "gnomit" => array(
2337     "icon" => "gnomit",
2338     "title" => "Gnomit",
2339     "rule" => array(
2340     "gnomit[ /]([0-9.]{1,10})" => "\\1"
2341     ),
2342     "uri" => "http://www.gnomit.com/",
2343     ),
2344     "goforit" => array(
2345     "icon" => "goforit",
2346     "title" => "GoForIt",
2347     "rule" => array(
2348     "^GoForIt\.com" => "",
2349     "^GOFORITBOT" => ""
2350     ),
2351     "uri" => ""
2352     ),
2353     "goguides" => array(
2354     "icon" => "robot",
2355     "title" => "GoGuides",
2356     "rule" => array(
2357     "^GoGuidesBot[ /]([0-9.]{1,10})" => "\\1"
2358     ),
2359     "uri" => "http://www.goguides.org/"
2360     ),
2361     // Needs to be before google for correct detection
2362     "mediapartners" => array(
2363     "icon" => "google",
2364     "title" => "Mediapartners",
2365     "rule" => array (
2366     "Mediapartners-Google[ /]([0-9.]{1,10})" => "\\1",
2367     "Mediapartners-Google" => ""
2368     ),
2369     "uri" => ""
2370     ),
2371     "google" => array(
2372     "icon" => "google",
2373     "title" => "Google",
2374     "rule" => array (
2375     "Googl(e|ebot)(-Image)?/([0-9.]{1,10})" => "\\3",
2376     "Googl(e|ebot)(-Image)?/" => "",
2377     "^gsa-crawler" => "",
2378     "Google Web Preview" => ""
2379     ),
2380     "uri" => "http://www.google.com/"
2381     ),
2382     "googlesitemaps" => array(
2383     "icon" => "google",
2384     "title" => "Google-Sitemaps",
2385     "rule" => array (
2386     "Googl(e|ebot)(-Sitemaps)?/([0-9.]{1,10})" => "\\3",
2387     "GSiteCrawler[ /v]*([0-9.a-z]{1,10})" => "\\1",
2388     "Googl(e|ebot)(-Sitemaps)?/" => ""
2389     ),
2390     "uri" => ""
2391     ),
2392     "googlemobile" => array(
2393     "icon" => "google",
2394     "title" => "Google-Mobile",
2395     "rule" => array (
2396     "Googl(e|ebot)(-Mobile)?/([0-9.]{1,10})" => "\\3",
2397     "Googl(e|ebot)(-Mobile)?/" => ""
2398     ),
2399     "uri" => ""
2400     ),
2401     "googleads" => array(
2402     "icon" => "google",
2403     "title" => "Google-AdsBot",
2404     "rule" => array (
2405     "^AdsBot-Google" => "",
2406     ),
2407     "uri" => ""
2408     ),
2409     "googlefeeds" => array(
2410     "icon" => "google",
2411     "title" => "Google-Feedfetcher",
2412     "rule" => array (
2413     "^Feedfetcher-Google" => "",
2414     ),
2415     "uri" => ""
2416     ),
2417     "googlverification" => array(
2418     "icon" => "google",
2419     "title" => "Google-Site-Verification",
2420     "rule" => array (
2421     "Google-Site-Verification[ /]([0-9.]{1,10})" => "\\1"
2422     ),
2423     "uri" => ""
2424     ),
2425 matthys 207 // Needs to be AFTER Google detection
2426     "goo" => array(
2427     "icon" => "goo",
2428     "title" => "Goo",
2429     "rule" => array (
2430     "(gazz|ichiro|mog(et|imogi))[ /]([0-9.]{1,10})" => "\\3",
2431     "DoCoMo[ /]([0-9.]{1,10})" => "\\1"
2432     ),
2433     "uri" => ""
2434     ),
// GoonGee: matched by user agents that start with "Big Fish".
"goongee" => array(
  "icon" => "robot",
  "title" => "GoonGee",
  "rule" => array (
    // The pattern has exactly one capture group (the version digits; the
    // optional leading "v" sits outside the group), so the replacement has
    // to be \1. The previous \2 pointed at a group that does not exist and
    // therefore always yielded an empty version.
    "^Big Fish[ /]v?([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.goongee.com/"
),
2443     "gpost" => array(
2444     "icon" => "gpost",
2445     "title" => "GPost",
2446     "rule" => array(
2447     "^GPostbot" => ""
2448     ),
2449     "uri" => ""
2450     ),
2451 matthys 309 "grapeshot" => array(
2452     "icon" => "grapeshot",
2453     "title" => "Grapeshot",
2454     "rule" => array(
2455     "GrapeshotCrawler[/ ]([0-9.]{1,10})" => "\\1"
2456     ),
2457     "uri" => "http://www.grapeshot.co.uk/crawler.php"
2458     ),
// Gregarius: matched by user agents that start with "Gregarius"
// followed by a version number.
"gregarius" => array(
  "icon" => "robot",
  "title" => "Gregarius",
  "rule" => array(
    // The version is captured in group 1; hand it through as \1 like the
    // other versioned entries in this table instead of discarding it.
    "^Gregarius[/ ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
2467     "grub" => array(
2468     "icon" => "grub",
2469     "title" => "Grub",
2470     "rule" => array(
2471     "grub[ \-]?client[ /\-]{1,5}([0-9.]{1,10})" => "\\1",
2472     "grub crawler" => "",
2473     "grub[/ ]([0-9.]{1,10})" => "\\1",
2474     "^GrubNG([0-9. ]{1,10})?" => "\\1"
2475     ),
2476     "uri" => "http://www.grub.org/"
2477     ),
2478     "gulliver" => array(
2479     "icon" => "robot",
2480     "title" => "Gulliver",
2481     "rule" => array(
2482     "Gulliver" => ""
2483     ),
2484     "uri" => ""
2485     ),
2486     "guruji" => array(
2487     "icon" => "guruji",
2488     "title" => "Guruji",
2489     "rule" => array(
2490     "GurujiBot[/ ]([0-9.]{1,10})" => "\\1"
2491     ),
2492     "uri" => "http://www.guruji.com/"
2493     ),
2494     "gush" => array(
2495     "icon" => "robot",
2496     "title" => "Gush",
2497     "rule" => array(
2498     "^Gush[/ ]([0-9.]{1,10})" => "\\1"
2499     ),
2500     "uri" => ""
2501     ),
2502     "gziptester" => array(
2503     "icon" => "robot",
2504     "title" => "Gzip Tester",
2505     "rule" => array(
2506     "g(id)?zip[ \-]?test(er)?" => ""
2507     ),
2508     "uri" => ""
2509     ),
2510     "hanzoweb" => array(
2511     "icon" => "hanzoweb",
2512     "title" => "Hanzoweb",
2513     "rule" => array(
2514     "^Hanzoweb" => ""
2515     ),
2516     "uri" => ""
2517     ),
2518     "harbot" => array(
2519     "icon" => "harbot",
2520     "title" => "Harbot",
2521     "rule" => array(
2522     "^Harbot GateStation" => ""
2523     ),
2524     "uri" => ""
2525     ),
2526     "hatena" => array(
2527     "icon" => "hatena",
2528     "title" => "Hatena",
2529     "rule" => array(
2530     "Hatena (Antenna|Bookmark|Pagetitle Agent)[ /]([0-9.]{1,10})" => "\\2"
2531     ),
2532     "uri" => ""
2533     ),
2534     "htmlparser" => array(
2535     "icon" => "htmlparser",
2536     "title" => "HTMLParser",
2537     "rule" => array(
2538     "HTMLParser[ /]([0-9.]{1,10})" => "\\1"
2539     ),
2540     "uri" => "http://htmlparser.sourceforge.net/"
2541     ),
// Helix: matched by user agents that start with "helix" followed by a
// version number.
"helix" => array(
  "icon" => "helix",
  // Was "Heritrix", which is the title of the separate "heritrix" entry;
  // key, icon, rule and uri of this entry all refer to Helix.
  "title" => "Helix",
  "rule" => array(
    "^helix[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.sitesearch.ca/helix/"
),
2550     "heritrix" => array(
2551     "icon" => "heritrix",
2552     "title" => "Heritrix",
2553     "rule" => array(
2554     "heritrix[ /]([0-9.]{1,10})" => "\\1",
2555     "archive.org_bot" => "",
2556     "InternetArchive[ /]([0-9.a-z]{1,10})" => "\\1"
2557     ),
2558     "uri" => "http://archive.org"
2559     ),
2560     "hiddenmarket" => array(
2561     "icon" => "robot",
2562     "title" => "HiddenMarket",
2563     "rule" => array(
2564     "HiddenMarket[ /\-]([0-9.]{1,10})" => "\\1"
2565     ),
2566     "uri" => ""
2567     ),
2568     "honda" => array(
2569     "icon" => "robot",
2570     "title" => "Honda",
2571     "rule" => array(
2572     "Honda-Search[ /]([0-9.]{1,10})" => "\\1"
2573     ),
2574     "uri" => "http://www.honda-search.com"
2575     ),
2576     "hoowwwer" => array(
2577     "icon" => "hoowwwer",
2578     "title" => "HooWWWer",
2579     "rule" => array(
2580     "HooWWWer[ /]([0-9.]{1,10})" => "\\1"
2581     ),
2582     "uri" => ""
2583     ),
2584     "hotzonu" => array(
2585     "icon" => "hotzonu",
2586     "title" => "Hotzonu",
2587     "rule" => array(
2588     "Hotzonu[ /]([0-9.]{1,10})" => "\\1"
2589     ),
2590     "uri" => ""
2591     ),
2592     "houxou" => array(
2593     "icon" => "robot",
2594     "title" => "Houxou",
2595     "rule" => array(
2596     "HouxouCrawler[ /]Nutch.([0-9.]{1,10})" => "\\1",
2597     "HouxouCrawler" => ""
2598     ),
2599     "uri" => ""
2600     ),
// ht://Dig: the first rule extracts a version when one follows the name,
// the second is a version-less fallback.
"htdig" => array(
  "icon" => "htdig",
  "title" => "ht://Dig",
  "rule" => array(
    "htdig[ /]([0-9.]{1,10})" => "\\1",
    // The fallback pattern has no capture group, so there is nothing for
    // \1 to refer to; use an empty replacement as the other version-less
    // rules in this table do.
    "htdig" => ""
  ),
  "uri" => ""
),
2610     "html2jpg" => array(
2611     "icon" => "html2jpg",
2612     "title" => "HTML2JPG",
2613     "rule" => array(
2614     "^HTML2JPG" => ""
2615     ),
2616     "uri" => ""
2617     ),
2618     "httperf" => array(
2619     "icon" => "robot",
2620     "title" => "HTTPerf",
2621     "rule" => array(
2622     "httperf[ /]([0-9.]{1,10})" => "\\1"
2623     ),
2624     "uri" => ""
2625     ),
2626     "httpunit" => array(
2627     "icon" => "httpunit",
2628     "title" => "HttpUnit",
2629     "rule" => array(
2630     "httpunit[ /]([0-9.]{1,10})" => "\\1"
2631     ),
2632     "uri" => ""
2633     ),
2634     "httrack" => array(
2635     "icon" => "httrack",
2636     "title" => "HTTrack",
2637     "rule" => array(
2638     "HTTrack[ /]([0-9.]{1,10})" => "\\1"
2639     ),
2640     "uri" => ""
2641     ),
2642     "huaweisymantec" => array(
2643     "icon" => "huaweisymantec",
2644     "title" => "HuaweiSymantec",
2645     "rule" => array(
2646     "HuaweiSymantecSpider[ /]([0-9.]{1,10})" => "\\1"
2647     ),
2648     "uri" => "http://www.huaweisymantec.com/en/IRL/spider/"
2649     ),
2650     "hungary" => array(
2651     "icon" => "hungary",
2652     "title" => "Hungary",
2653     "rule" => array(
2654     "HuRob[ /]([0-9.]{1,10})" => "\\1"
2655     ),
2656     "uri" => ""
2657     ),
2658 joku 261 "i18n" => array(
2659     "icon" => "w3c",
2660     "title" => "W3C I18n Checker",
2661     "rule" => array(
2662     "^W3C_I18n-Checker[ /]([0-9.]{1,10})" => "\\1"
2663 joku 169 ),
2664 joku 261 "uri" => "http://validator.w3.org/services"
2665     ),
2666 joku 63 "iakke" => array(
2667     "icon" => "iakke",
2668 matthys 209 "title" => "Iakké",
2669 joku 63 "rule" => array(
2670     "^iakke_bot[ /]v([0-9.]{1,10})" => "\\1"
2671     ),
2672     "uri" => "http://fr.iakke.com/"
2673     ),
2674     "iask" => array(
2675     "icon" => "iask",
2676     "title" => "IAsk",
2677     "rule" => array(
2678     "iaskspider[ /]([0-9.]{1,10})" => "\\1",
2679     "^iaskspider" => ""
2680     ),
2681     "uri" => "http://iask.com"
2682     ),
2683     "icc" => array(
2684     "icon" => "icc",
2685     "title" => "ICC-Crawler",
2686     "rule" => array(
2687     "^ICC-Crawler" => ""
2688     ),
2689     "uri" => "http://kc.nict.go.jp/icc/crawl.html"
2690     ),
2691     "icerocket" => array(
2692     "icon" => "icerocket",
2693     "title" => "Icerocket",
2694     "rule" => array(
2695     "BlogzIce[ /]([0-9.]{1,10})" => "\\1",
2696     "BlogSearch[ /]([0-9.]{1,10})" => "\\1"
2697     ),
2698     "uri" => ""
2699     ),
2700     "icjobs" => array(
2701     "icon" => "icjobs",
2702     "title" => "iCjobs",
2703     "rule" => array(
2704     "iCjobs[ /]([0-9.]{1,10})" => "\\1"
2705     ),
2706     "uri" => "http://www.icjobs.de/"
2707     ),
2708     "icra" => array(
2709     "icon" => "icra",
2710     "title" => "ICRA",
2711     "rule" => array(
2712     "^ICRA_Semantic_spider[ /]([0-9.]{1,10})" => "\\1"
2713     ),
2714     "uri" => "http://www.icra.org"
2715     ),
2716     "iknow" => array(
2717     "icon" => "robot",
2718     "title" => "I know",
2719     "rule" => array(
2720     "Comaneci_bot[ /]([0-9.]{1,10})" => "\\1"
2721     ),
2722     "uri" => ""
2723     ),
2724     "ilial" => array(
2725     "icon" => "robot",
2726     "title" => "Ilial",
2727     "rule" => array(
2728     "ilial[ /]Nutch[ \-]([0-9.]{1,10})" => "\\1"
2729     ),
2730     "uri" => ""
2731     ),
2732     "ilocal" => array(
2733     "icon" => "ilocal",
2734     "title" => "ilocal",
2735     "rule" => array(
2736     "^ilocal" => "",
2737     ),
2738     "uri" => "http://www.ilocal.nl"
2739     ),
// Ilse: matched by the agent names INGRID, IlseRobot and IlseBot followed
// by a version number.
"ilse" => array(
  "icon" => "ilse",
  "title" => "Ilse",
  "rule" => array(
    // Group 1 is the name alternation (NGRID|lseRobot|lseBot); the version
    // digits are group 2, so the replacement must be \2. With \1 the
    // reported "version" was a fragment of the bot name.
    "I(NGRID|lseRobot|lseBot)[ /]([0-9.]{1,10})" => "\\2"
  ),
  "uri" => "http://ilse.nl/"
),
2748     "iltrovatore" => array(
2749     "icon" => "iltrovatore",
2750     "title" => "IlTrovatore",
2751     "rule" => array(
2752     "iltrovatore-setaccio[ /]([0-9.]{1,10})" => "\\1",
2753     "Iltrovatore-Setaccio" => "",
2754     "iltrovatore[ /]([0-9.]{1,10})" => "\\1"
2755     ),
2756     "uri" => ""
2757     ),
2758     "indylibrary" => array(
2759     "icon" => "robot",
2760     "title" => "Indy Library",
2761     "rule" => array(
2762     "Indy[ \-]?Library" => ""
2763     ),
2764     "uri" => ""
2765     ),
// Inela: matched by "InelaBot" followed by a version number.
"inela" => array(
  "icon" => "robot",
  "title" => "Inela",
  "rule" => array(
    // The version is captured in group 1; hand it through as \1 like the
    // other versioned entries in this table instead of discarding it.
    "InelaBot[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://inelegant.org/bot"
),
// InetURL: matched by "InetURL", one optional extra character, a
// separator and a version number.
"ineturl" => array(
  "icon" => "robot",
  "title" => "InetURL",
  "rule" => array(
    // The version is captured in group 1; hand it through as \1 like the
    // other versioned entries in this table instead of discarding it.
    "InetURL.?[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
2782     "infoart" => array(
2783     "icon" => "robot",
2784     "title" => "InfoArt",
2785     "rule" => array(
2786     "InfoArt crawler" => ""
2787     ),
2788     "uri" => ""
2789     ),
2790     "infomine" => array(
2791     "icon" => "infomine",
2792     "title" => "INFOMINE",
2793     "rule" => array(
2794     "^DataFountains/DMOZ" => "",
2795     "^INFOMINE[ /]([0-9.]{1,10})" => "\\1"
2796     ),
2797     "uri" => "http://infomine.ucr.edu/"
2798     ),
2799     "infoseek" => array(
2800     "icon" => "infoseek",
2801     "title" => "Infoseek",
2802     "rule" => array(
2803     "SideWinder[ /]?([0-9a-z.]{1,10})" => "\\1",
2804     "Infoseek" => ""
2805     ),
2806     "uri" => ""
2807     ),
2808     "inktomi" => array(
2809     "icon" => "inktomi",
2810     "title" => "Inktomi",
2811     "rule" => array(
2812     "slurp@inktomi\.com" => ""
2813     ),
2814     "uri" => ""
2815     ),
2816     "innerprise" => array(
2817     "icon" => "robot",
2818     "title" => "Innerprise",
2819     "rule" => array(
2820     "^InnerpriseBot[ /]([0-9.]{1,10})" => "\\1",
2821     "URL[ _]Spider[ _]Pro[ /]([0-9.+]{1,10})" => "\\1",
2822     "^ES[ .]NET[ _]Crawler[ /]([0-9.]{1,10})" => "\\1"
2823     ),
2824     "uri" => "http://www.innerprise.com/"
2825     ),
2826     "inria" => array(
2827     "icon" => "inria",
2828     "title" => "Inria",
2829     "rule" => array(
2830     "^xyro_" => ""
2831     ),
2832     "uri" => ""
2833     ),
2834     "insitor" => array(
2835     "icon" => "insitor",
2836     "title" => "Insitor",
2837     "rule" => array(
2838     "^Insitor(,|\.|naut)" => ""
2839     ),
2840     "uri" => "http://www.insitor.com/"
2841     ),
2842     "internetninja" => array(
2843     "icon" => "robot",
2844     "title" => "Internet Ninja",
2845     "rule" => array(
2846     "^Internet Ninja[ /]([0-9.]{1,10})" => "\\1"
2847     ),
2848     "uri" => ""
2849     ),
2850     "internetseer" => array(
2851     "icon" => "internetseer",
2852     "title" => "InternetSeer",
2853     "rule" => array(
2854     "^InternetSeer\.com" => ""
2855     ),
2856     "uri" => ""
2857     ),
2858     "interseek" => array(
2859     "icon" => "interseek",
2860     "title" => "Interseek",
2861     "rule" => array(
2862     "Interseek.com" => ""
2863     ),
2864     "uri" => "http://www.interseek.com"
2865     ),
2866     "intravnews" => array(
2867     "icon" => "intravnews",
2868     "title" => "IntraVnews",
2869     "rule" => array(
2870     "IntraVnews[ /]([0-9.]{1,10})" => "\\1"
2871     ),
2872     "uri" => "http://www.intravnews.com/"
2873     ),
2874 matthys 403 "ionos" => array(
2875     "icon" => "ionos",
2876     "title" => "IONOS",
2877     "rule" => array(
2878     "IonCrawl" => ""
2879     ),
2880     "uri" => "https://www.ionos.de/terms-gtc/faq-crawler-en/"
2881     ),
2882 joku 63 "ip2location" => array(
2883     "icon" => "ip2location",
2884     "title" => "IP2LocationBot",
2885     "rule" => array(
2886     "^IP2(Map|Location)Bot[ /]([0-9.]{1,10})" => "\\2"
2887     ),
2888     "uri" => "http://www.ip2location.com"
2889     ),
2890     "ipworks" => array(
2891     "icon" => "ipworks",
2892     "title" => "IP*Works",
2893     "rule" => array(
2894     "^IP\*Works\! V([0-9.]{1,10})" => "\\1"
2895     ),
2896     "uri" => "http://www.nsoftware.com/ipworks/"
2897     ),
2898     "irca" => array(
2899     "icon" => "robot",
2900     "title" => "Novell iChain Cool Solutions caching",
2901     "rule" => array(
2902 matthys 209 "^ICRA_(label_generator|Semantic_spider)[ /]([0-9.]{1,10})" => "\\2",
2903     "^Mozilla[/ ]([0-9.]{1,10})[/ ]\(compatible[ ;]*ICS" => "\\1"
2904 joku 63 ),
2905     "uri" => "http://www.icra.org"
2906     ),
2907     "irvine" => array(
2908     "icon" => "robot",
2909     "title" => "Irvine",
2910     "rule" => array(
2911     "Irvine[ /]([0-9.]{1,10})" => "\\1"
2912     ),
2913     "uri" => ""
2914     ),
2915     "ips-agent" => array(
2916     "icon" => "robot",
2917 matthys 209 "title" => "IPS-agent",
2918 joku 63 "rule" => array(
2919     "ips-agent" => ""
2920     ),
2921     "uri" => ""
2922     ),
2923     "isara" => array(
2924     "icon" => "isara",
2925 matthys 209 "title" => "Isara",
2926 joku 63 "rule" => array(
2927     "Isara[ -]([0-9.]{1,10})" => "\\1"
2928     ),
2929     "uri" => "http://www.isara.org/"
2930     ),
2931     "isspider" => array(
2932     "icon" => "robot",
2933     "title" => "ISSpider",
2934     "rule" => array(
2935     "ISSpider[ /\-]([0-9.]{1,10})" => "\\1"
2936     ),
2937     "uri" => ""
2938     ),
2939     "it2media" => array(
2940     "icon" => "it2media",
2941     "title" => "IT2media",
2942     "rule" => array(
2943     "www.adressendeutschland.de" => ""
2944     ),
2945     "uri" => "http://www.adressendeutschland.de/"
2946     ),
2947     "ivia" => array(
2948     "icon" => "robot",
2949     "title" => "iVia",
2950     "rule" => array(
2951     "iVia Site Checker.?[ /]([0-9.]{1,10})" => "\\1"
2952     ),
2953     "uri" => ""
2954     ),
2955     "jeteye" => array(
2956     "icon" => "jeteye",
2957     "title" => "Jeteye",
2958     "rule" => array(
2959     "Jetbot[ /]([0-9.]{1,10})" => "\\1"
2960     ),
2961     "uri" => ""
2962     ),
2963     "jobsde" => array(
2964     "icon" => "jobsde",
2965     "title" => "jobs.de",
2966     "rule" => array(
2967     "www\.jobs\.de" => "",
2968     "jobs.de-Robot" => ""
2969     ),
2970     "uri" => "http://www.jobs.de/"
2971     ),
2972     "jpluck" => array(
2973     "icon" => "robot",
2974     "title" => "Jpluck",
2975     "rule" => array(
2976     "JPluck[ /]([0-9a-z.]{1,10})" => "\\1"
2977     ),
2978     "uri" => ""
2979     ),
2980     "jxta" => array(
2981     "icon" => "robot",
2982     "title" => "Jxta",
2983     "rule" => array(
2984     "falcon[ /]([0-9.]{1,10})" => "\\1"
2985     ),
2986     "uri" => ""
2987     ),
2988     "jyte" => array(
2989     "icon" => "jyte",
2990     "title" => "Jyte",
2991     "rule" => array(
2992     "jyte_fetcher[ /]([0-9.]{1,10})" => "\\1"
2993     ),
2994     "uri" => ""
2995     ),
2996     "jyxo" => array(
2997     "icon" => "jyxo",
2998     "title" => "Jyxo",
2999     "rule" => array(
3000     "Jyxobot[ /]([0-9.]{1,10})" => "\\1"
3001     ),
3002     "uri" => ""
3003     ),
3004     "kalooga" => array(
3005     "icon" => "kalooga",
3006     "title" => "Kalooga",
3007     "rule" => array(
3008     "kalooga[ /-]([0-9.]{1,10})" => "\\1",
3009     "^kalooga" => "",
3010     "KaloogaBot" => ""
3011     ),
3012     "uri" => "http://www.kalooga.com"
3013     ),
3014     "keywen" => array(
3015     "icon" => "keywen",
3016     "title" => "Keywen",
3017     "rule" => array(
3018     "EasyDL[ /]([0-9.]{1,10})" => "\\1"
3019     ),
3020     "uri" => ""
3021     ),
3022     "kilomonkey" => array(
3023     "icon" => "robot",
3024     "title" => "Kilomonkey",
3025     "rule" => array(
3026     "kmky-not-a-bot[ /]([0-9.]{1,10})" => "\\1"
3027     ),
3028     "uri" => "http://www.kilomonkey.com/notabot.txt"
3029     ),
3030     "kinja" => array(
3031     "icon" => "kinja",
3032     "title" => "Kinja",
3033     "rule" => array(
3034     "kinjabot[ /]([0-9.]{1,10})" => "\\1",
3035     "^kinjabot" => ""
3036     ),
3037     "uri" => ""
3038     ),
3039     "kiwi" => array(
3040     "icon" => "robot",
3041     "title" => "KiwiStatus",
3042     "rule" => array(
3043     "KiwiStatus[ /]([0-9.]{1,10})" => "\\1",
3044     "KiwiStatus" => ""
3045     ),
3046     "uri" => "http://www.nzs.com/kiei-status/"
3047     ),
3048     "lachesis" => array(
3049     "icon" => "robot",
3050     "title" => "Lachesis",
3051     "rule" => array(
3052     "lachesis" => ""
3053     ),
3054     "uri" => ""
3055     ),
// Lanshan: matched by "lanshanbot" followed by a version number.
"lanshan" => array(
  "icon" => "robot",
  // Was "Lachesis", duplicated from the preceding "lachesis" entry; the
  // key and the rule of this entry both refer to lanshan.
  "title" => "Lanshan",
  "rule" => array(
    "lanshanbot[/ ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
3064     "lapozz" => array(
3065     "icon" => "lapozz",
3066     "title" => "Lapozz",
3067     "rule" => array(
3068     "LapozzBot[/ ]?([0-9.]{1,10})" => "\\1"
3069     ),
3070     "uri" => ""
3071     ),
3072     "larbin" => array(
3073     "icon" => "robot",
3074     "title" => "Larbin",
3075     "rule" => array(
3076     "larbin[_/ ]?([0-9.]{1,10})" => "\\1"
3077     ),
3078     "uri" => ""
3079     ),
3080     "laurion" => array(
3081     "icon" => "robot",
3082     "title" => "Laurion",
3083     "rule" => array(
3084     "^IPiumBot" => ""
3085     ),
3086     "uri" => "http://www.laurion.com/"
3087     ),
3088     "leechget" => array(
3089     "icon" => "leechget",
3090     "title" => "LeechGet",
3091     "rule" => array(
3092     "^LeechGet[ /]([0-9.]{1,10})" => "\\1"
3093     ),
3094     "uri" => ""
3095     ),
3096     "linguaseek" => array(
3097     "icon" => "linguaseek",
3098     "title" => "Linguaseek",
3099     "rule" => array(
3100     "^LinguaBot[ /]v([0-9.]{1,10})" => "\\1"
3101     ),
3102     "uri" => "http://www.linguaseek.com/"
3103     ),
3104     "linguee" => array(
3105     "icon" => "linguee",
3106     "title" => "Linguee",
3107     "rule" => array(
3108     "^Linguee Bot" => ""
3109     ),
3110     "uri" => "http://www.linguee.com/"
3111     ),
3112 matthys 355 "linkapedia" => array(
3113     "icon" => "linkapedia",
3114     "title" => "Linkapedia",
3115     "rule" => array(
3116     "^linkapedia" => ""
3117     ),
3118     "uri" => "http://www.linkapedia.com"
3119     ),
3120 matthys 346 "linkdex" => array(
3121     "icon" => "linkdex",
3122     "title" => "Linkdex",
3123     "rule" => array(
3124     "linkdexbot[ /]([0-9.]{1,10})" => "\\1"
3125     ),
3126     "uri" => "http://www.linkdex.com/bots/"
3127     ),
3128 matthys 366 "linkedin" => array(
3129     "icon" => "linkedin",
3130     "title" => "LinkedIn",
3131     "rule" => array(
3132     "LinkedInBot[ /]([0-9.]{1,10})" => "\\1"
3133     ),
3134     "uri" => "http://www.linkedin.com"
3135     ),
3136 joku 63 "linkguard" => array(
3137     "icon" => "robot",
3138     "title" => "Linkguard",
3139     "rule" => array(
3140     "Linkguard Online[ /]([0-9.]{1,10})" => "\\1"
3141     ),
3142     "uri" => "http://www.linkguard.com/"
3143     ),
3144     "linklint" => array(
3145     "icon" => "linklint",
3146     "title" => "Linklint",
3147     "rule" => array(
3148     "^Linklint[-\-a-z /]*([0-9.]{1,10})" => "\\1"
3149     ),
3150     "uri" => "http://www.linklint.org/"
3151     ),
3152     "linkman" => array(
3153     "icon" => "linkman",
3154     "title" => "Linkman",
3155     "rule" => array(
3156     "\(compatible; Linkman\)" => ""
3157     ),
3158     "uri" => ""
3159     ),
3160     // Needs to be before linkcheck for correct detection
3161     "linkchecker" => array(
3162     "icon" => "w3c",
3163     "title" => "W3C Link Checker",
3164     "rule" => array(
3165     "^W3C-checklink[ /]([0-9.]{1,10})" => "\\1"
3166     ),
3167     "uri" => "http://validator.w3.org/checklink"
3168     ),
3169     "linkcheck" => array(
3170     "icon" => "linkcheck",
3171     "title" => "Linkcheck",
3172     "rule" => array(
3173     "checklink[ /]([0-9.]{1,10})" => "\\1",
3174     "Link[ \-]?(Chec(k|ker)|Val(et|idator))" => "",
3175     "Adaxas Spider" => "",
3176     "Agent-SharewarePlazaFileCheckBot[ /]([0-9.]{1,10})" => "\\1",
3177     "NetMechanic V([0-9.]{1,10})" => "\\1",
3178     "^InfoLink" => "",
3179     "InternetLinkAgent" => "",
3180     "; SPENG\)" => "",
3181     "SharewarePlazaFileCheckBot" => "",
3182     "fileboost.net" => "",
3183     "^billbot" => ""
3184     ),
3185     "uri" => ""
3186     ),
3187     "linkru" => array(
3188     "icon" => "robot",
3189     "title" => "Link.RU",
3190     "rule" => array(
3191     "^Link.RU bot" => ""
3192     ),
3193     "uri" => ""
3194     ),
3195     "linkssql" => array(
3196     "icon" => "robot",
3197     "title" => "Links SQL",
3198     "rule" => array(
3199     "links sql" => ""
3200     ),
3201     "uri" => ""
3202     ),
3203     "linksweeper" => array(
3204     "icon" => "robot",
3205     "title" => "Link Sweeper",
3206     "rule" => array(
3207     "LinkSweeper[ /]([0-9.]{1,10})" => "\\1"
3208     ),
3209     "uri" => ""
3210     ),
3211     "linkwalker" => array(
3212     "icon" => "robot",
3213     "title" => "Link Walker",
3214     "rule" => array(
3215     "^LinkWalker" => ""
3216     ),
3217     "uri" => ""
3218     ),
3219     "lipperhey" => array(
3220     "icon" => "lipperhey",
3221     "title" => "Lipperhey",
3222     "rule" => array(
3223     "Lipperhey Spider" => ""
3224     ),
3225     "uri" => "http://www.lipperhey.com"
3226     ),
3227     "livedoor" => array(
3228     "icon" => "livedoor",
3229     "title" => "Livedoor",
3230     "rule" => array(
3231     "^Livedoor( SF( - California Crawl)?|Checkers)[ /]" => ""
3232     ),
3233     "uri" => ""
3234     ),
3235     "livejournal" => array(
3236     "icon" => "livejournal",
3237     "title" => "Live Journal",
3238     "rule" => array(
3239     "^LiveJournal\.com" => ""
3240     ),
3241     "uri" => "http://www.livejournal.com"
3242     ),
3243     "ljpic" => array(
3244     "icon" => "ljpic",
3245     "title" => "ljpic",
3246     "rule" => array(
3247     "LjSEEK Picture-Bot[ /]+([0-9.]{1,10})" => "\\1"
3248     ),
3249     "uri" => "http://www.ljpic.com"
3250     ),
3251     "lmspider" => array(
3252     "icon" => "robot",
3253     "title" => "Lmspider",
3254     "rule" => array(
3255     "^lmspider" => ""
3256     ),
3257     "uri" => ""
3258     ),
3259     "locators" => array(
3260     "icon" => "robot",
3261     "title" => "Locaters",
3262     "rule" => array(
3263     "^FiNDoBot[/ ]([0-9a-z.]{1,10})" => "\\1"
3264     ),
3265     "uri" => ""
3266     ),
3267     "look" => array(
3268     "icon" => "look",
3269     "title" => "Look",
3270     "rule" => array(
3271     "www\.look\.com" => "",
3272     "Lookbot" => ""
3273     ),
3274     "uri" => ""
3275     ),
3276     "looksmart" => array(
3277     "icon" => "looksmart",
3278     "title" => "LookSmart",
3279     "rule" => array(
3280     "^Martini" => "",
3281     "^MantraAgent" => "",
3282     "FurlBot" => "",
3283     "looksmart-sv-fw" => ""
3284     ),
3285     "uri" => ""
3286     ),
3287     "loop" => array(
3288     "icon" => "loop",
3289     "title" => "LOOP",
3290     "rule" => array(
3291     "NetResearchServer[ /]([0-9.]{1,10})" => "\\1"
3292     ),
3293     "uri" => ""
3294     ),
3295     "lotkyll" => array(
3296     "icon" => "robot",
3297     "title" => "Lotkyll",
3298     "rule" => array(
3299     "Lotkyll" => ""
3300     ),
3301     "uri" => ""
3302     ),
3303 joku 335 "ltx71" => array(
3304     "icon" => "robot",
3305     "title" => "LTX71",
3306     "rule" => array(
3307     "ltx71" => ""
3308     ),
3309     "uri" => "http://ltx71.com/"
3310     ),
3311 joku 63 "lwp" => array(
3312     "icon" => "robot",
3313     "title" => "lwp",
3314     "rule" => array(
3315     "lwp(-trivial|::simple)[ /]([0-9.]{1,10})" => "\\2"
3316     ),
3317     "uri" => ""
3318     ),
3319     "lycos" => array(
3320     "icon" => "lycos",
3321     "title" => "Lycos",
3322     "rule" => array(
3323     "Lycos_Spider_" => ""
3324     ),
3325     "uri" => ""
3326     ),
3327     "magpierss" => array(
3328     "icon" => "rss",
3329     "title" => "MagpieRSS",
3330     "rule" => array(
3331     "MagpieRSS" => ""
3332     ),
3333     "uri" => "http://magpierss.sourceforge.net/"
3334     ),
3335     "mailru" => array(
3336     "icon" => "mailru",
3337 matthys 209 "title" => "Mail.Ru",
3338 joku 63 "rule" => array(
3339 matthys 195 "^Mail.Ru[ /]([0-9.]{1,10})" => "\\1",
3340     "Mail.RU_Bot[ /]([0-9.]{1,10})" => "\\1"
3341 joku 63 ),
3342 matthys 209 "uri" => "http://www.mail.ru/"
3343 joku 63 ),
3344     "mailsweeper" => array(
3345     "icon" => "robot",
3346     "title" => "Mail Sweeper",
3347     "rule" => array(
3348     "Mail[ \-]?Sweeper" => ""
3349     ),
3350     "uri" => ""
3351     ),
3352     "marvin" => array(
3353     "icon" => "robot",
3354     "title" => "Marvin",
3355     "rule" => array(
3356     "^Marvin" => ""
3357     ),
3358     "uri" => ""
3359     ),
3360     "matkurja" => array(
3361     "icon" => "matkurja",
3362     "title" => "Mat'Kurja",
3363     "rule" => array(
3364     "Mosad[ /]([0-9.]{1,10})" => "\\1"
3365     ),
3366     "uri" => ""
3367     ),
3368     "mavicanet" => array(
3369     "icon" => "mavicanet",
3370     "title" => "Mavicanet",
3371     "rule" => array(
3372     "Mavicanet robot" => ""
3373     ),
3374     "uri" => ""
3375     ),
3376 matthys 292 "meanpath" => array(
3377     "icon" => "meanpath",
3378 matthys 290 "title" => "Meanpath",
3379 matthys 280 "rule" => array(
3380     "meanpathbot[ /]([0-9.]{1,10})" => "\\1"
3381     ),
3382     "uri" => "http://www.meanpath.com/meanpathbot.html"
3383 matthys 275 ),
3384 matthys 280 "mediater" => array(
3385 joku 63 "icon" => "robot",
3386     "title" => "Mediater",
3387     "rule" => array (
3388     "^libwww[ /]([0-9.]{1,10})" => "\\1"
3389 matthys 280 ),
3390     "uri" => ""
3391 joku 63 ),
3392 matthys 305 "memory" => array(
3393     "icon" => "memory",
3394     "title" => "internet Memory",
3395     "rule" => array (
3396     "memoryBot[ /]([0-9.]{1,10})" => "\\1"
3397     ),
3398     "uri" => "http://internetmemory.org/en/"
3399     ),
3400 joku 63 "mercator" => array(
3401     "icon" => "robot",
3402     "title" => "Mercator",
3403     "rule" => array(
3404     "Mercator" => ""
3405     ),
3406     "uri" => ""
3407     ),
// Metacarta: matched by three version-less agent signatures.
"metacarta" => array(
  "icon" => "robot",
  "title" => "Metacarta",
  "rule" => array(
    // The parentheses are literal characters of the agent string and must
    // be escaped. Unescaped they formed a capture group, so the pattern
    // only matched "RRC crawler_admin@..." without parentheses and never
    // the parenthesised form. The third rule below already escapes them
    // the same way.
    "^RRC \(crawler_admin@bigfoot.com\)" => "",
    "^flunky" => "",
    "^Mozilla.*\(samualt9@bigfoot.com\)$" => ""
  ),
  "uri" => "http://www.metacarta.com"
),
3418     "metager" => array(
3419     "icon" => "metager",
3420     "title" => "MetaGer",
3421     "rule" => array(
3422     "MetaGer" => ""
3423     ),
3424     "uri" => ""
3425     ),
3426     "metamark" => array(
3427     "icon" => "robot",
3428     "title" => "Metamark",
3429     "rule" => array(
3430     "^XRL[ /]([0-9.a-z]{1,10})" => "\\1"
3431     ),
3432     "uri" => "http://metamark.net"
3433     ),
3434     "metamedic" => array(
3435     "icon" => "metamedic",
3436     "title" => "MetaMedic",
3437     "rule" => array(
3438     "MediBot[ /]([0-9.]{1,10})" => "\\1"
3439     ),
3440     "uri" => ""
3441     ),
3442     "mirago" => array(
3443     "icon" => "mirago",
3444     "title" => "Mirago",
3445     "rule" => array(
3446     "Mirago" => ""
3447     ),
3448     "uri" => ""
3449     ),
3450     "misterwong" => array(
3451     "icon" => "misterwong",
3452     "title" => "Mister Wong",
3453     "rule" => array(
3454     "Mister Wong-Bot[ /]([0-9.]{1,10})" => "\\1"
3455     ),
3456     "uri" => "http://www.mister-wong.de/"
3457     ),
3458     "miva" => array(
3459     "icon" => "miva",
3460     "title" => "Miva",
3461     "rule" => array(
3462     "AlgoFeedback@miva\.com" => ""
3463     ),
3464     "uri" => "http://www.miva.com/"
3465     ),
3466     "mj12" => array(
3467     "icon" => "mj12",
3468     "title" => "Majestic-12",
3469     "rule" => array(
3470     "Mj12bot[ /]v?([0-9.]{1,10})" => "\\1",
3471     "MJ12bot \(mini\)[ /]([0-9.]{1,10})" => "\\1"
3472     ),
3473     "uri" => "http://majestic12.co.uk/bot.php"
3474     ),
3475     "mlbot" => array(
3476     "icon" => "robot",
3477     "title" => "MLBot",
3478     "rule" => array(
3479     "^MLBot" => ""
3480     ),
3481     "uri" => "http://www.metadatalabs.com/mlbot"
3482     ),
3483     "mnogo" => array(
3484     "icon" => "mnogo",
3485     "title" => "mnoGoSearch",
3486     "rule" => array(
3487     "Mnogosearch[ /\-]([0-9.]{1,10})" => "\\1"
3488     ),
3489     "uri" => "http://www.mnogosearch.org/"
3490     ),
3491     "mobileok" => array(
3492     "icon" => "mobileok",
3493     "title" => "W3C mobileOK",
3494     "rule" => array(
3495     "^W3C-mobileOK" => ""
3496     ),
3497     "uri" => "http://www.w3.org/2006/07/mobileok-ddc"
3498     ),
3499 matthys 296 "mojeek" => array(
3500     "icon" => "mojeek",
3501     "title" => "Mojeek",
3502 joku 63 "rule" => array(
3503     "MojeekBot[ /]([0-9.]{1,10})" => "\\1"
3504     ),
3505 matthys 284 "uri" => "https://www.mojeek.com/bot.html"
3506 joku 63 ),
3507     "momspider" => array(
3508     "icon" => "robot",
3509     "title" => "MOM Spider",
3510     "rule" => array(
3511     "MOMspider[ /]([0-9.]{1,10})" => "\\1"
3512     ),
3513     "uri" => ""
3514     ),
3515     "moreover" => array(
3516     "icon" => "moreover",
3517     "title" => "Moreover",
3518     "rule" => array(
3519     "^Moreoverbot[ /]([0-9.]{1,10})" => "\\1"
3520     ),
3521     "uri" => ""
3522     ),
3523     "movabletype" => array(
3524     "icon" => "movabletype",
3525     "title" => "Movable Type",
3526     "rule" => array(
3527     "MovableType[ /]([0-9.]{1,10})" => "\\1"
3528     ),
3529     "uri" => ""
3530     ),
3531     "mozdex" => array(
3532     "icon" => "mozdex",
3533     "title" => "MozDex",
3534     "rule" => array(
3535     "mozDex[ /]([0-9.]{1,6}(-dev)?)" => "\\1"
3536     ),
3537     "uri" => ""
3538     ),
3539     "mqbot" => array(
3540     "icon" => "robot",
3541     "title" => "MQbot",
3542     "rule" => array(
3543     "MQbot" => ""
3544     ),
3545     "uri" => ""
3546     ),
3547     "msnbot" => array(
3548     "icon" => "bing",
3549 matthys 205 "title" => "Bing",
3550 joku 63 "rule" => array(
3551     "MSN(BOT|PTC)[ /]([0-9.]{1,10})" => "\\2",
3552     "MS Search ([0-9.]{1,10}) Robot" => "\\1",
3553     "MSNBOT-(MEDIA|PRODUCTS|NewsBlogs)[ /]([0-9.]{1,10})" => "\\2",
3554     "bingbot[ /]([0-9.]{1,10})" => "\\1"
3555     ),
3556     "uri" => ""
3557     ),
3558     "msnbot-mobile" => array(
3559     "icon" => "msn",
3560     "title" => "MSN Mobile",
3561     "rule" => array(
3562     "MSNBOT-(MOBILE|)[ /]([0-9.]{1,10})" => "\\2",
3563     "MSNBOT_Mobile" => "",
3564     "MSMOBOT" => ""
3565     ),
3566     "uri" => ""
3567     ),
3568     "mslivebot" => array(
3569     "icon" => "livesearch",
3570     "title" => "MS Live Search",
3571     "rule" => array(
3572     "MSNBOT-(Academic)[ /]([0-9.]{1,10})" => "\\2"
3573     ),
3574     "uri" => ""
3575     ),
3576     "msproxy" => array(
3577     "icon" => "robot",
3578     "title" => "MSProxy",
3579     "rule" => array(
3580     "MSProxy[ /]([0-9.]{1,10})" => "\\1"
3581     ),
3582     "uri" => ""
3583     ),
3584     "msrbot" => array(
3585     "icon" => "robot",
3586     "title" => "MSRBOT",
3587     "rule" => array(
3588     "^MSRBOT" => ""
3589     ),
3590     "uri" => "http://research.microsoft.com/research/sv/msrbot/"
3591     ),
3592     "mswebdav" => array(
3593     "icon" => "robot",
3594     "title" => "MS-WebDAV",
3595     "rule" => array(
3596     "Microsoft[ \-]?WebDAV[ \-]?MiniRedir" => ""
3597     ),
3598     "uri" => ""
3599     ),
3600     "mticon" => array(
3601     "icon" => "robot",
3602     "title" => "MTIcon",
3603     "rule" => array(
3604     "MTIcon[/ ]([0-9.]{1,10})" => "\\1"
3605     ),
3606     "uri" => ""
3607     ),
3608     "multipage-validator" => array(
3609     "icon" => "multipage-validator",
3610     "title" => "Multipage Validator",
3611     "rule" => array(
3612     "^W3C_Multipage_Validator[ /]([0-9.]{1,10})" => "\\1"
3613     ),
3614     "uri" => "http://www.validator.ca/"
3615     ),
3616     "myrss" => array(
3617     "icon" => "rss",
3618     "title" => "MyRSS",
3619     "rule" => array(
3620     "MyRSS.jp[/ ]([0-9.]{1,10})" => "\\1"
3621     ),
3622     "uri" => ""
3623     ),
3624     "multimap" => array(
3625     "icon" => "robot",
3626     "title" => "Multimap",
3627     "rule" => array(
3628     "Multimap Geotag Blog Parser[/ ]([0-9.]{1,10})" => "\\1"
3629     ),
3630     "uri" => ""
3631     ),
3632     "najdi" => array(
3633     "icon" => "najdi",
3634     "title" => "Najdi.si",
3635     "rule" => array(
3636     "Najdi.si" => ""
3637     ),
3638     "uri" => "http://www.najdi.si"
3639     ),
3640     "nameprotect" => array(
3641     "icon" => "nameprotect",
3642     "title" => "Name Protect",
3643     "rule" => array(
3644     "NPBot" => ""
3645     ),
3646     "uri" => ""
3647     ),
3648     "nationaldirectory" => array(
3649     "icon" => "robot",
3650     "title" => "National Directory",
3651     "rule" => array(
3652     "NationalDirectory-WebSpider[ /]([0-9.]{1,10})" => "\\1"
3653     ),
3654     "uri" => ""
3655     ),
3656     "natsumican" => array(
3657     "icon" => "robot",
3658     "title" => "Natsu Mican",
3659     "rule" => array(
3660     "NATSU[ \-]MICAN[/ ]([0-9a-z.]{1,10})" => "\\1"
3661     ),
3662     "uri" => ""
3663     ),
3664     "naverbot" => array(
3665     "icon" => "naverbot",
3666     "title" => "Naver",
3667     "rule" => array(
3668     "NaverBot([_\-]dloader)?[/ \-]([0-9.]{1,10})" => "\\2",
3669     "Naver(Bot)?" => "",
3670     "^nabot" => ""
3671     ),
3672     "uri" => ""
3673     ),
3674     "navisso" => array(
3675     "icon" => "navisso",
3676     "title" => "Navisso",
3677     "rule" => array(
3678     "Navisso(Bot)?" => ""
3679     ),
3680     "uri" => "http://www.navisso.com"
3681     ),
3682 matthys 402 "neevabot" => array(
3683 matthys 410 "icon" => "neeva",
3684 matthys 402 "title" => "Neeva",
3685     "rule" => array(
3686     "Neevabot[ /]([0-9.]{1,10})" => "\\1"
3687     ),
3688     "uri" => "https://neeva.com/neevabot"
3689     ),
3690 joku 63 "neofonie" => array(
3691     "icon" => "robot",
3692 matthys 205 "title" => "Neofonie",
3693 joku 63 "rule" => array(
3694     "www.neofonie.de" => ""
3695     ),
3696     "uri" => "http://www.neofonie.de/loesungen/search/robot.html"
3697     ),
3698     "neomo" => array(
3699     "icon" => "robot",
3700     "title" => "Neomo",
3701     "rule" => array(
3702     "Francis[ /]([0-9.]{1,10})" => "\\1"
3703     ),
3704     "uri" => ""
3705     ),
3706     "nessus" => array(
3707     "icon" => "nessus",
3708     "title" => "Nessus",
3709     "rule" => array(
3710     "Nessus\)$" => ""
3711     ),
3712     "uri" => ""
3713     ),
3714 matthys 279 "nerdybot" => array(
3715 matthys 280 "icon" => "robot",
3716     "title" => "NerdyBot",
3717     "rule" => array(
3718     "NerdyBot" => ""
3719     ),
3720     "uri" => "http://nerdybot.com/"
3721 matthys 279 ),
3722 joku 63 "nerdbynature" => array(
3723     "icon" => "nerdbynature",
3724     "title" => "NerdByNature",
3725     "rule" => array(
3726     "NerdByNature.Bot" => ""
3727     ),
3728     "uri" => "http://www.nerdbynature.net/bot"
3729     ),
3730     "netants" => array(
3731     "icon" => "netants",
3732     "title" => "NetAnts",
3733     "rule" => array(
3734     "NetAnts[ /]([0-9.]{1,10})" => "\\1"
3735     ),
3736     "uri" => ""
3737     ),
3738     "netcraft" => array(
3739     "icon" => "netcraft",
3740     "title" => "Netcraft",
3741     "rule" => array(
3742     "netcraft" => ""
3743     ),
3744     "uri" => ""
3745     ),
3746     "netinfo" => array(
3747     "icon" => "netinfo",
3748     "title" => "Netinfo",
3749     "rule" => array(
3750     "^NetinfoBot[ /]([0-9.]{1,10})" => "\\1"
3751     ),
3752     "uri" => "http://netinfo.bg/"
3753     ),
3754     "netluchs" => array(
3755     "icon" => "netluchs",
3756     "title" => "Netluchs",
3757     "rule" => array(
3758     "Netluchs[ /]([0-9.a-z]{1,10})" => "\\1"
3759     ),
3760     "uri" => "http://www.netluchs.de/"
3761     ),
3762     "netmechanic" => array(
3763     "icon" => "netmechanic",
3764     "title" => "NetMechanic",
3765     "rule" => array(
3766     "NetMechanic[ /V]{1,5}([0-9.]{1,10})" => "\\1"
3767     ),
3768     "uri" => ""
3769     ),
3770     "netnose" => array(
3771     "icon" => "netnose",
3772     "title" => "NetNose",
3773     "rule" => array(
3774     "NetNose[ \-]Crawler[/ ]([0-9.]{1,10})" => "\\1"
3775     ),
3776     "uri" => ""
3777     ),
3778     "netoskop" => array(
3779     "icon" => "robot",
3780     "title" => "Netoskop",
3781     "rule" => array(
3782     "netoskop" => ""
3783     ),
3784     "uri" => ""
3785     ),
3786     "netpromoter" => array(
3787     "icon" => "netpromoter",
3788     "title" => "NetPromoter",
3789     "rule" => array(
3790     "NetPromoter Spider" => ""
3791     ),
3792     "uri" => "http://www.net-promoter.com/"
3793     ),
// Netprospector: agent strings beginning with "netprospector".
"netprospector" => array(
  "icon" => "robot",
  "title" => "Netprospector",
  "rule" => array(
    "^netprospector" => ""
  ),
  // Every other entry defines "uri" (empty when unknown); keep the shape
  // uniform so readers of this key never hit an undefined index.
  "uri" => ""
),
3801     "netpumper" => array(
3802     "icon" => "robot",
3803     "title" => "Netpumper",
3804     "rule" => array(
3805     "^NetPumper[/ ]([0-9.]{1,10})" => "\\1"
3806     ),
3807     "uri" => ""
3808     ),
3809     "netscapeproxy" => array(
3810     "icon" => "netscape",
3811     "title" => "Netscape Proxy",
3812     "rule" => array(
3813     "Netscape-Proxy[/ ]([0-9.]{1,10})" => "\\1"
3814     ),
3815     "uri" => ""
3816     ),
3817     "netspective" => array(
3818     "icon" => "robot",
3819     "title" => "NetSpective",
3820     "rule" => array(
3821     "^WebFilter Robot ([0-9.]{1,10})" => "\\1"
3822     ),
3823     "uri" => ""
3824     ),
// Netvibes: agent strings beginning with "Netvibes".
"netvibes" => array(
  "icon" => "netvibes",
  // Stray leading space removed from the title.
  "title" => "Netvibes",
  "rule" => array(
    // The pattern has no capture group, so there is nothing for "\\1" to
    // refer to; use the empty template like other version-less rules.
    "^Netvibes" => ""
  ),
  "uri" => ""
),
3833     "newsfire" => array(
3834     "icon" => "newsfire",
3835     "title" => "NewsFire",
3836     "rule" => array(
3837     "NewsFire[/ ]([0-9.]{1,10})" => "\\1"
3838     ),
3839     "uri" => ""
3840     ),
3841     "newsgator" => array(
3842     "icon" => "newsgator",
3843     "title" => "NewsGator",
3844     "rule" => array(
3845     "NewsGato(r|rOnline)[/ ]([0-9.]{1,10})" => "\\2"
3846     ),
3847     "uri" => ""
3848     ),
3849     "newzcrawler" => array(
3850     "icon" => "newzcrawler",
3851     "title" => "NewzCrawler",
3852     "rule" => array(
3853     "NewzCrawler[/ ]([0-9.]{1,10})" => "\\1"
3854     ),
3855     "uri" => ""
3856     ),
// Nextopia: agent strings beginning with "NextopiaBOT"; the trailing
// numeric group is captured as "\\1".
"nextopia" => array(
  // Icon and title had been copied from the preceding "newzcrawler" entry,
  // which mislabelled this bot. "robot" is the generic icon used by entries
  // without a dedicated one.
  "icon" => "robot",
  "title" => "Nextopia",
  "rule" => array(
    "^NextopiaBOT.*[v ]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
3865     "ngsearch" => array(
3866     "icon" => "ngsearch",
3867     "title" => "NG Search",
3868     "rule" => array(
3869     "NG-Search[/ ]([0-9.]{1,10})" => "\\1"
3870     ),
3871     "uri" => ""
3872     ),
3873     "nimble" => array(
3874     "icon" => "robot",
3875     "title" => "Nimble",
3876     "rule" => array(
3877     "NimbleCrawler[/ ]([0-9.]{1,10})" => "\\1"
3878     ),
3879     "uri" => ""
3880     ),
3881     "nmap" => array(
3882     "icon" => "nmap",
3883     "title" => "Nmap",
3884     "rule" => array(
3885     "Nmap Scripting Engine" => ""
3886     ),
3887     "uri" => "http://nmap.org/book/nse.html"
3888     ),
3889     "nusearch" => array(
3890     "icon" => "robot",
3891     "title" => "NuSearch",
3892     "rule" => array(
3893     "^nuSearch" => ""
3894     ),
3895     "uri" => "http://www.nusearch.com/"
3896     ),
3897     "noago" => array(
3898     "icon" => "noago",
3899     "title" => "Noago",
3900     "rule" => array(
3901     "Noago Spider" => ""
3902     ),
3903     "uri" => "http://www.noago.com/"
3904     ),
3905     "noviforum" => array(
3906     "icon" => "noviforum",
3907     "title" => "Noviforum",
3908     "rule" => array(
3909     "TridentSpider[/ ]?([0-9.]{1,10})" => "\\1"
3910     ),
3911     "uri" => ""
3912     ),
3913     "noxtrum" => array(
3914     "icon" => "noxtrum",
3915     "title" => "noXtrum",
3916     "rule" => array(
3917     "noxtrumbot[/ ]?([0-9.]{1,10})" => "\\1"
3918     ),
3919     "uri" => ""
3920     ),
3921     "noyona" => array(
3922     "icon" => "robot",
3923     "title" => "Noyona",
3924     "rule" => array(
3925     "noyona.([0-9._]{1,10})" => "\\1"
3926     ),
3927     "uri" => "http://noyona.com/"
3928     ),
3929     "nsauditor" => array(
3930     "icon" => "nsauditor",
3931     "title" => "Nsauditor",
3932     "rule" => array(
3933     "Nsauditor[ /]([0-9.]{1,10})" => "\\1"
3934     ),
3935     "uri" => "http://www.nsauditor.com/"
3936     ),
3937     "obidosbot" => array(
3938     "icon" => "robot",
3939     "title" => "Bookwatch",
3940     "rule" => array(
3941     "obidos[ \-]?bot" => ""
3942     ),
3943     "uri" => ""
3944     ),
3945     "objectssearch" => array(
3946     "icon" => "robot",
3947     "title" => "Objects Search",
3948     "rule" => array(
3949     "ObjectsSearch[ /]([0-9.]{1,10})" => "\\1"
3950     ),
3951     "uri" => ""
3952     ),
3953     "obot" => array(
3954 matthys 297 "icon" => "ibm",
3955     "title" => "IBM (ONLY) Crawler",
3956 joku 63 "rule" => array(
3957 matthys 297 "oBot[ /]([0-9.]{1,10})" => "\\1"
3958 joku 63 ),
3959 matthys 297 "uri" => "http://filterdb.iss.net/crawler/"
3960     // Previous from "ONLY Solutions GmbH" – that is what the O stands for
3961 joku 63 ),
3962     "ocawa" => array(
3963     "icon" => "ocawa",
3964     "title" => "Ocawa",
3965     "rule" => array(
3966     "Ocawa[ /]([A-Z.a-z][0-9.]{1,10})" => "\\1",
3967     "Ocawa" => ""
3968     ),
3969     "uri" => "http://www.ocawa.com/"
3970     ),
3971     "octora" => array(
3972     "icon" => "octora",
3973     "title" => "Octora",
3974     "rule" => array(
3975     "^Octora (Beta)?" => ""
3976     ),
3977     "uri" => "http://www.octora.com/"
3978     ),
3979     "offlineexplorer" => array(
3980     "icon" => "robot",
3981     "title" => "OfflineExplorer",
3982     "rule" => array(
3983     "^Offline Explorer[ /]([0-9.]{1,10})" => "\\1"
3984     ),
3985     "uri" => ""
3986     ),
3987     "omea" => array(
3988     "icon" => "omea",
3989     "title" => "Omea Reader",
3990     "rule" => array(
3991     "Omea Reader[ /]([0-9.]{1,10})" => "\\1"
3992     ),
3993     "uri" => ""
3994     ),
3995     "onet" => array(
3996     "icon" => "onet",
3997     "title" => "Onet",
3998     "rule" => array(
3999     "OnetSzukaj[ /]([0-9.]{1,10})" => "\\1",
4000     "Onet\.pl" => "",
4001     "inktomi.search.onet" => ""
4002     ),
4003     "uri" => "http://www.onet.pl"
4004     ),
4005     "online24" => array(
4006     "icon" => "robot",
4007 matthys 209 "title" => "Online24",
4008 joku 63 "rule" => array(
4009     "^Online24-Bot .* ([0-9.]{1,10})" => "\\1"
4010     ),
4011     "uri" => "http://www.online24.de"
4012     ),
4013     "onlinewebcheck" => array(
4014     "icon" => "csehtmlvalidator",
4015     "title" => "CSE HTML Validator",
4016     "rule" => array(
4017     "onlinewebcheck" => ""
4018     ),
4019     "uri" => "http://www.onlinewebcheck.com"
4020     ),
4021     "onsearch" => array(
4022     "icon" => "onsearch",
4023 matthys 209 "title" => "OnSearch",
4024 joku 63 "rule" => array(
4025     "^onCHECK-Robot" => ""
4026     ),
4027     "uri" => "http://www.onsearch.de"
4028     ),
4029     "onto" => array(
4030     "icon" => "robot",
4031     "title" => "OntoSpider",
4032     "rule" => array(
4033     "^OntoSpider[ /]([0-9.]{1,10})" => "\\1"
4034     ),
4035     "uri" => "http://ontospider.i-n.info/"
4036     ),
4037     "openacoon" => array(
4038     "icon" => "robot",
4039     "title" => "OpenAcoon",
4040     "rule" => array(
4041     "^OpenAcoon v([0-9.]{1,10})" => "\\1"
4042     ),
4043     "uri" => "http://www.openacoon.de/"
4044     ),
4045     "openfind" => array(
4046     "icon" => "openfind",
4047     "title" => "Openfind",
4048     "rule" => array(
4049     "openbot[ /]([0-9.]{1,10})" => "\\1",
4050     "Openfind Robot[ /]([0-9.A-Z]{1,10})" => "\\1"
4051     ),
4052     "uri" => ""
4053     ),
4054     "opentagger" => array(
4055     "icon" => "robot",
4056     "title" => "OpenTagger",
4057     "rule" => array(
4058     "^OpenTaggerBot" => ""
4059     ),
4060     "uri" => "http://www.opentagger.com/opentaggerbot.htm"
4061     ),
4062     "opentext" => array(
4063     "icon" => "opentext",
4064     "title" => "OpenText",
4065     "rule" => array(
4066     "^OpenTextSiteCrawler[ /]([0-9.]{1,10})" => "\\1"
4067     ),
4068     "uri" => "http://www.opentext.net/"
4069     ),
4070     "openweb" => array(
4071     "icon" => "robot",
4072     "title" => "OpenWebSpider",
4073     "rule" => array(
4074     "^OpenWebSpider[ /]([0-9.]{1,10})" => "\\1",
4075     "^OpenWebSpider v([0-9.A-Z]{1,10})" => "\\1"
4076     ),
4077     "uri" => "http://www.openwebspider.org"
4078     ),
4079     "openx" => array(
4080     "icon" => "openx",
4081     "title" => "OpenX Spider",
4082     "rule" => array(
4083     "OpenX" => ""
4084     ),
4085     "uri" => "http://www.openx.org"
4086     ),
4087     "orange" => array(
4088     "icon" => "orange",
4089     "title" => "Orange",
4090     "rule" => array(
4091 joku 338 "OrangeBot-Mobile[ /]([0-9.]{1,10})" => "\\1",
4092     "OrangeBot[ /]([0-9.]{1,10})" => "\\1"
4093 joku 63 ),
4094     "uri" => "http://orange.com/"
4095     ),
4096     "organica" => array(
4097     "icon" => "robot",
4098     "title" => "Organica",
4099     "rule" => array(
4100     "crawler@organica\.us" => ""
4101     ),
4102     "uri" => ""
4103     ),
4104     "outfox" => array(
4105     "icon" => "robot",
4106     "title" => "Outfox Melon",
4107     "rule" => array(
4108     "OutfoxMelonBot[ /]([0-9.]{1,10})" => "\\1",
4109     "OutfoxBot[ /]([0-9.]{1,10})" => "\\1"
4110     ),
4111     "uri" => ""
4112     ),
4113     "overture" => array(
4114     "icon" => "overture",
4115     "title" => "Overture",
4116     "rule" => array(
4117     "Overture[ \-]?WebCrawler" => ""
4118     ),
4119     "uri" => ""
4120     ),
4121 joku 337 "owler" => array(
4122     "icon" => "robot",
4123     "title" => "Owler",
4124     "rule" => array(
4125     "Owler[ /]([0-9.]{1,10})" => "\\1",
4126     "Owler" => ""
4127     ),
4128     "uri" => ""
4129     ),
4130 joku 63 "page2rss" => array(
4131     "icon" => "page2rss",
4132     "title" => "Page2RSS",
4133     "rule" => array(
4134     "Page2RSS[ /]([0-9.]{1,10})" => "\\1"
4135     ),
4136     "uri" => "http://page2rss.com"
4137     ),
4138     "pagebytes" => array(
4139     "icon" => "robot",
4140     "title" => "PageBites",
4141     "rule" => array(
4142     "^PageBitesHyperBot[ /]([0-9.]{1,10})" => "\\1"
4143     ),
4144     "uri" => ""
4145     ),
4146 matthys 282 "pagesinventory" => array(
4147     "icon" => "pagesinventory",
4148     "title" => "PagesInventory",
4149     "rule" => array(
4150     "^PagesInventory" => ""
4151     ),
4152     "uri" => "http://www.pagesinventory.com"
4153     ),
4154 joku 63 "pagesjaunes" => array(
4155     "icon" => "pagesjaunes",
4156     "title" => "Pages Jaunes",
4157     "rule" => array(
4158     "PJBot[ /]([0-9.]{1,10})" => "\\1"
4159     ),
4160     "uri" => "http://www.pagesjaunes.fr/"
4161     ),
4162     "pagevalet" => array(
4163     "icon" => "wdg",
4164     "title" => "WDG Page Valet",
4165     "rule" => array(
4166     "^Page Valet[ /]([0-9.]{1,10})" => "\\1"
4167     ),
4168     "uri" => "http://www.htmlhelp.com/tools/validator/"
4169     ),
4170     "panopeabot" => array(
4171     "icon" => "robot",
4172     "title" => "PanopeaBot",
4173     "rule" => array(
4174     "PanopeaBot[/ ]([0-9.]{1,10})" => "\\1"
4175     ),
4176     "uri" => ""
4177     ),
4178     "parchmenthill" => array(
4179     "icon" => "robot",
4180     "title" => "Parchment Hill",
4181     "rule" => array(
4182     "ParchBot[ /]([0-9.]{1,10})" => "\\1"
4183     ),
4184     "uri" => "http://www.parchmenthill.com/search.htm"
4185     ),
// Panscient crawler, identified by "panscient.com" in the agent string.
// The array key and icon name keep their historical spelling ("pascient")
// because other code or stored data may refer to them.
"pascient" => array(
  "icon" => "pascient",
  // Title spelling corrected to match the rule and the URI.
  "title" => "Panscient",
  "rule" => array(
    "panscient.com" => ""
  ),
  "uri" => "http://www.panscient.com/"
),
4194     "peerbot" => array(
4195     "icon" => "peerbot",
4196     "title" => "Peerbot",
4197     "rule" => array(
4198     "^PEERbot" => ""
4199     ),
4200     "uri" => ""
4201     ),
4202 matthys 389 "petalbot" => array(
4203     "icon" => "huawei",
4204     "title" => "PetalBot", // Huawei Search - also called Aspiegel
4205     "rule" => array(
4206     "PetalBot" => "",
4207     "AspiegelBot" => ""
4208     ),
4209     "uri" => "https://aspiegel.com/petalbot"
4210     ),
4211 joku 63 "php" => array(
4212     "icon" => "php",
4213     "title" => "PHP",
4214     "rule" => array(
4215     "^PHP[ /]([0-9.]{1,10})" => "\\1"
4216     ),
4217     "uri" => ""
4218     ),
4219     "phpcrawl" => array(
4220     "icon" => "robot",
4221     "title" => "PHPCrawl",
4222     "rule" => array(
4223     "^PHPCrawl" => ""
4224     ),
4225     "uri" => "http://phpcrawl.cuab.de/"
4226     ),
4227     "phpdig" => array(
4228     "icon" => "robot",
4229     "title" => "PhpDig",
4230     "rule" => array(
4231     "^PhpDig[ /]([0-9.]{1,10})" => "\\1"
4232     ),
4233     "uri" => "http://www.finbot.com/"
4234     ),
4235     "phpversiontracker" => array(
4236     "icon" => "phpversiontracker",
4237     "title" => "PHP version tracker",
4238     "rule" => array(
4239     "^PHP version tracker" => ""
4240     ),
4241     "uri" => "http://www.nexen.net/phpversion/bot.php"
4242     ),
// PictureOfInternet: agent strings beginning with "PictureOfInternet"
// followed by a numeric group.
"pictureofinternet" => array(
  "icon" => "robot",
  "title" => "PictureOfInternet",
  "rule" => array(
    // The pattern captures the numeric group, so emit it via "\\1" like
    // every other capturing rule instead of discarding it.
    "^PictureOfInternet[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4251     "pingdom" => array(
4252     "icon" => "pingdom",
4253     "title" => "Pingdom",
4254     "rule" => array(
4255     "^Pingdom GIGRIB v([0-9.]{1,10})" => "\\1",
4256     "^Pingdom" => ""
4257     ),
4258     "uri" => "http://www.pingdom.com/"
4259     ),
4260     "pinseri" => array(
4261     "icon" => "pinseri",
4262     "title" => "Pinseri",
4263     "rule" => array(
4264     "www\.pinseri\.com/bloglist" => ""
4265     ),
4266     "uri" => ""
4267     ),
// Plagger feed aggregator: "Plagger" followed by a numeric group.
"plagger" => array(
  "icon" => "plagger",
  "title" => "Plagger",
  "rule" => array(
    "Plagger[ /]([0-9.]{1,10})" => "\\1"
  ),
  // Host name corrected from "plugger.org" to the project's own name.
  // NOTE(review): confirm the site is still reachable at this address.
  "uri" => "http://plagger.org/"
),
4276     "planet" => array(
4277     "icon" => "planet",
4278     "title" => "Planet",
4279     "rule" => array(
4280     "Planet[ /]([0-9.]{1,10})" => "\\1"
4281     ),
4282     "uri" => ""
4283     ),
4284     "plantynet" => array(
4285     "icon" => "robot",
4286     "title" => "PlantyNet",
4287     "rule" => array(
4288     "PlantyNet_WebRobot[_ /]V?([0-9.]{1,10})" => "\\1"
4289     ),
4290     "uri" => ""
4291     ),
4292     "pluck" => array(
4293     "icon" => "pluck",
4294     "title" => "Pluck",
4295     "rule" => array(
4296     "PluckFeedCrawler[ /]([0-9.]{1,10})" => "\\1"
4297     ),
4298     "uri" => ""
4299     ),
4300     "plsearch" => array(
4301     "icon" => "plsearch",
4302     "title" => "PlanetSearch",
4303     "rule" => array(
4304     "fido[ /]([0-9.]{1,10}) Harvest" => "\\1"
4305     ),
4306     "uri" => ""
4307     ),
4308     "poe" => array(
4309     "icon" => "robot",
4310     "title" => "POE-Component",
4311     "rule" => array(
4312     "^POE-Component-Client-HTTP[/ ]([0-9.]{1,10})" => "\\1"
4313     ),
4314     "uri" => ""
4315     ),
4316     "pogodak" => array(
4317     "icon" => "pogodak",
4318     "title" => "Pogodak",
4319     "rule" => array(
4320     "Pogodak\.hr[/ ]?([0-9.]{1,10})" => "\\1"
4321     ),
4322     "uri" => ""
4323     ),
// Poodle predictor: accepts both the "Poodle" and "Pooodle" spellings.
"poodle" => array(
  "icon" => "robot",
  "title" => "Poodle predictor",
  "rule" => array(
    // Group 1 is the (oo|ooo) spelling alternation; the numeric group is
    // group 2, so the template must be "\\2" (cf. the "newsgator" entry).
    "P(oo|ooo)dle[ \-]?predictor[ \-]?([0-9.]{1,10})" => "\\2",
    "P(oo|ooo)dle[ \-]?predictor" => ""
  ),
  "uri" => "http://www.gritechnologies.com/tools/spider.go"
),
4333     "pompos" => array(
4334     "icon" => "pompos",
4335     "title" => "Pompos",
4336     "rule" => array(
4337     "Pompos[ /]([0-9.]{1,10})" => "\\1"
4338     ),
4339     "uri" => ""
4340     ),
4341     "popdex" => array(
4342     "icon" => "robot",
4343     "title" => "Popdexter",
4344     "rule" => array(
4345     "Popdexter" => ""
4346     ),
4347     "uri" => ""
4348     ),
4349     "postrank" => array(
4350     "icon" => "postrank",
4351     "title" => "PostRank",
4352     "rule" => array(
4353     "^PostRank[ /]+([0-9.]{1,10})" => "\\1"
4354     ),
4355     "uri" => "http://www.postrank.com/"
4356     ),
4357     "powermarks" => array(
4358     "icon" => "robot",
4359     "title" => "Powermarks",
4360     "rule" => array(
4361     "Powermarks[ /]([0-9.]{1,10})" => "\\1"
4362     ),
4363     "uri" => ""
4364     ),
// Pinterest crawler: "Pinterest" followed by a numeric group.
"pinterest" => array(
  "icon" => "pinterest",
  // Title was left as "PROBE!" from the neighbouring "probe" entry.
  "title" => "Pinterest",
  "rule" => array(
    "Pinterest[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.pinterest.com/"
),
4373 matthys 366 "probe" => array(
4374     "icon" => "robot",
4375     "title" => "PROBE!",
4376     "rule" => array(
4377     "^PROBE!" => ""
4378     ),
4379     "uri" => ""
4380     ),
4381 joku 63 "projecthoneypot" => array(
4382     "icon" => "projecthoneypot",
4383     "title" => "Project Honeypot",
4384     "rule" => array(
4385     "^PHPot Verispider[ /v]+([0-9.]{1,10})" => "\\1",
4386     "projecthoneypot" => ""
4387     ),
4388     "uri" => "http://www.projecthoneypot.org"
4389     ),
4390     "proxycache" => array(
4391     "icon" => "robot",
4392     "title" => "Proxy Cache",
4393     "rule" => array(
4394     "^Mozilla/[0-9.]{1,10} \(compatible\;\)$" => ""
4395     ),
4396     "uri" => ""
4397     ),
4398     "proxyhunter" => array(
4399     "icon" => "robot",
4400     "title" => "ProxyHunter",
4401     "rule" => array(
4402     "ProxyHunter" => ""
4403     ),
4404     "uri" => ""
4405     ),
4406     "psbot" => array(
4407     "icon" => "picsearch",
4408     "title" => "PicSearch",
4409     "rule" => array(
4410     "^psbot" => ""
4411     ),
4412     "uri" => ""
4413     ),
4414     "pubsub" => array(
4415     "icon" => "pubsub",
4416     "title" => "PubSub",
4417     "rule" => array(
4418     "^PubSub-RSS-Reader[ /]([0-9.]{1,10})" => "\\1",
4419     "^PubSub\.com" => ""
4420     ),
4421     "uri" => ""
4422     ),
4423 joku 330 "pubarch" => array(
4424 joku 334 "icon" => "robot",
4425 joku 330 "title" => "PubArchive",
4426     "rule" => array(
4427     "publiclibraryarchive.org" => ""
4428     ),
4429     "uri" => ""
4430     ),
4431 joku 63 "pukiwiki" => array(
4432     "icon" => "pukiwiki",
4433     "title" => "PukiWiki",
4434     "rule" => array(
4435     "PukiWiki[ /]([0-9.]{1,10})" => "\\1"
4436     ),
4437     "uri" => ""
4438     ),
4439     "pwebotxy" => array(
4440     "icon" => "pwebotxy",
4441     "title" => "PWeBot/X.Y",
4442     "rule" => array(
4443     "^PWeBot[ /]([0-9.]{1,10})" => "\\1"
4444     ),
4445     "uri" => "http://www.programacionweb.net/robot.php"
4446     ),
4447     "pxys" => array(
4448     "icon" => "robot",
4449     "title" => "PXYS",
4450     "rule" => array(
4451     "^pxys" => ""
4452     ),
4453     "uri" => ""
4454     ),
4455     "qango" => array(
4456     "icon" => "qango",
4457     "title" => "Qango",
4458     "rule" => array(
4459     "^Qango.com" => ""
4460     ),
4461     "uri" => "http://www.quango.com/"
4462     ),
4463     "qihoo" => array(
4464     "icon" => "qihoo",
4465     "title" => "Qihoo",
4466     "rule" => array(
4467     "QihooBot[ /]([0-9.]{1,10})" => "\\1"
4468     ),
4469     "uri" => "http://www.qihoo.com/"
4470     ),
4471     "qseero" => array(
4472     "icon" => "robot",
4473     "title" => "Qseero",
4474     "rule" => array(
4475     "Qseero v([0-9.]{1,10})" => "\\1"
4476     ),
4477     "uri" => "http://www.q0.com/"
4478     ),
4479     "quantcast" => array(
4480     "icon" => "robot",
4481     "title" => "Quantcast",
4482     "rule" => array(
4483     "Quantcastbot[ /]([0-9.]{1,10})" => "\\1"
4484     ),
4485     "uri" => "http://www.quantcast.com/"
4486     ),
4487     "quepasa" => array(
4488     "icon" => "quepasa",
4489     "title" => "Quepasa",
4490     "rule" => array(
4491     "Quepasa[ \-]?Creep" => ""
4492     ),
4493     "uri" => ""
4494     ),
4495     "questfinder" => array(
4496     "icon" => "robot",
4497     "title" => "QuestFinder",
4498     "rule" => array(
4499     "www\.questfinder\.com" => ""
4500     ),
4501     "uri" => ""
4502     ),
4503 matthys 351 "qwantify" => array(
4504     "icon" => "qwantify",
4505     "title" => "Qwantify",
4506     "rule" => array(
4507     "Qwantify[ /]([0-9.]{1,10})" => "\\1"
4508     ),
4509     "uri" => "https://www.qwant.com/"
4510     ),
4511 joku 63 "qweery" => array(
4512     "icon" => "robot",
4513     "title" => "Qweery",
4514     "rule" => array(
4515     "^QweeryBot[ /]([0-9.]{1,10})" => "\\1"
4516     ),
4517     "uri" => "http://qweerybot.qweery.nl"
4518     ),
// RacaiCrawler: "RacaiCrawler" followed by a space or dash and a numeric
// group.
"racaicrawler" => array(
  "icon" => "robot",
  "title" => "RacaiCrawler",
  "rule" => array(
    "RacaiCrawler[ -]([0-9.]{1,10})" => "\\1"
  ),
  // Every other entry defines "uri" (empty when unknown); keep the shape
  // uniform so readers of this key never hit an undefined index.
  "uri" => ""
),
4526     "radian6" => array(
4527     "icon" => "robot",
4528     "title" => "Radian6",
4529     "rule" => array(
4530     "www\.radian6\.com" => ""
4531     ),
4532     "uri" => "http://www.radian6.com"
4533     ),
// Radio.fx client, identified by "Radio.fx" in the agent string.
"radiofx" => array(
  "icon" => "radiofx",
  "title" => "Radio.fx",
  "rule" => array(
    "Radio.fx" => ""
  ),
  // Typo fixed: the host ended in "softwarw".
  "uri" => "https://de.tobit.software"
),
4542 joku 63 "rambler" => array(
4543     "icon" => "rambler",
4544     "title" => "Rambler",
4545     "rule" => array(
4546     "StackRambler[ /]([0-9.]{1,10})" => "\\1"
4547     ),
4548     "uri" => ""
4549     ),
// Ramiba: agent strings beginning with "ramiba", optionally "ramiba-bot".
"ramiba" => array(
  "icon" => "robot",
  "title" => "Ramiba",
  "rule" => array(
    // The only group is the optional "-bot" suffix, not a version number,
    // so the template is empty rather than "\\1".
    "^ramiba(-bot)?" => ""
  ),
  "uri" => ""
),
4558     "rankur" => array(
4559     "icon" => "rankur",
4560     "title" => "Rankur",
4561     "rule" => array(
4562     "^RankurBot/Rankur([0-9.]{1,10})" => "\\1"
4563     ),
4564     "uri" => "http://rankur.com/",
4565     ),
4566 joku 261 "red" => array(
4567     "icon" => "red",
4568     "title" => "RED",
4569     "rule" => array(
4570     "RED[ /]([0-9.]{1,10})" => "\\1"
4571     ),
4572     "uri" => "http://redbot.org/"
4573 joku 181 ),
4574 joku 63 "rediff" => array(
4575     "icon" => "rediff",
4576 matthys 209 "title" => "Rediff",
4577 joku 63 "rule" => array(
4578     "^RedBot/redbot[ /\-]([0-9.]{1,10})" => "\\1"
4579     ),
4580     "uri" => "http://www.rediff.com",
4581     ),
4582     "repia" => array(
4583     "icon" => "robot",
4584     "title" => "Repia",
4585     "rule" => array(
4586     "webmaster@repia\.com" => ""
4587     ),
4588     "uri" => ""
4589     ),
4590     "robotgenius" => array(
4591     "icon" => "robot",
4592     "title" => "Robot Genius",
4593     "rule" => array(
4594     "^robotgenius" => ""
4595     ),
4596     "uri" => "http://robotgenius.net",
4597     ),
4598     "robozilla" => array(
4599     "icon" => "robot",
4600     "title" => "Robozilla",
4601     "rule" => array(
4602     "Robozilla" => ""
4603     ),
4604     "uri" => ""
4605     ),
4606 matthys 302 "rogerbot" => array(
4607 matthys 306 "icon" => "moz",
4608     "title" => "Moz Rogerbot",
4609 matthys 302 "rule" => array(
4610     "rogerbot[ /]([0-9.]{1,10})" => "\\1"
4611     ),
4612     "uri" => "http://moz.com/help/guides/moz-procedures/who-is-rogerbot"
4613     ),
4614 joku 63 "rojo" => array(
4615     "icon" => "rojo",
4616     "title" => "Rojo",
4617     "rule" => array(
4618     "Rojo[ /]([0-9.]{1,10})" => "\\1"
4619     ),
4620     "uri" => ""
4621     ),
4622     "rss-atom" => array(
4623     "icon" => "rss",
4624     "title" => "RSS / Atom",
4625     "rule" => array(
4626     "^Apple-PubSub" => "",
4627     "^AppleSyndication" => ""
4628     ),
4629     "uri" => ""
4630     ),
4631     "rssbot" => array(
4632     "icon" => "rss",
4633 matthys 209 "title" => "RSS-bot",
4634 joku 63 "rule" => array(
4635     "rss-bot[ /]([0-9.]{1,10})" => "\\1"
4636     ),
4637     "uri" => ""
4638     ),
4639     "rssbandit" => array(
4640     "icon" => "rssbandit",
4641     "title" => "RssBandit",
4642     "rule" => array(
4643     "RssBandit[ /]([0-9.]{1,10})" => "\\1"
4644     ),
4645     "uri" => ""
4646     ),
4647     "rssimages" => array(
4648     "icon" => "rss",
4649 matthys 209 "title" => "RssImages",
4650 joku 63 "rule" => array(
4651     "rssImagesBot[ /]([0-9.]{1,10})" => "\\1"
4652     ),
4653     "uri" => ""
4654     ),
4655     "rssmicro" => array(
4656     "icon" => "rssmicro",
4657     "title" => "RSSMicro",
4658     "rule" => array(
4659     "RSSMicro\.com" => ""
4660     ),
4661     "uri" => "http://www.rssmicro.com"
4662     ),
4663     "rssowl" => array(
4664     "icon" => "rssowl",
4665     "title" => "RSSOwl",
4666     "rule" => array(
4667     "RSSOwl[ /]([0-9a-z.]{1,10})" => "\\1"
4668     ),
4669     "uri" => ""
4670     ),
// RssReader feed reader: matches "RssReader" followed by a space or slash
// and a dotted version number.
"rssreader" => array(
  "icon" => "rss",
  "title" => "RssReader",
  "rule" => array(
    // The pattern captures the version in group 1, so expose it via "\\1"
    // like the sibling feed-reader entries (RssBandit, RSSOwl, ...) do;
    // previously the captured version was discarded by an empty replacement.
    "RssReader[ /]([0-9.]{1,10})" => "\\1"
  ),
  "uri" => ""
),
4679     "rtgi" => array(
4680     "icon" => "rtgi",
4681 matthys 209 "title" => "Rtgi",
4682 joku 63 "rule" => array(
4683     "RTGI" => ""
4684     ),
4685     "uri" => "http://rtgi.fr/"
4686     ),
4687     "rufusbot" => array(
4688     "icon" => "robot",
4689     "title" => "RufusBot",
4690     "rule" => array(
4691     "RufusBot" => ""
4692     ),
4693     "uri" => ""
4694     ),
4695 matthys 304 "runet" => array(
4696     "icon" => "runet",
4697     "title" => "iTrack RuNet Crawler",
4698     "rule" => array(
4699     "Runet-Research-Crawler" => ""
4700     ),
4701     "uri" => "http://www.itrack.ru/research/cmsrate/"
4702     ),
4703 joku 63 "runnk" => array(
4704     "icon" => "robot",
4705     "title" => "Runnk",
4706     "rule" => array(
4707     "Runnk RSS finder" => ""
4708     ),
4709     "uri" => "http://www.runnk.com/il/law"
4710     ),
4711     "sagool" => array(
4712     "icon" => "robot",
4713     "title" => "Sagool",
4714     "rule" => array(
4715     "MaSagool" => ""
4716     ),
4717     "uri" => "http://sagool.jp/"
4718     ),
4719     "sanszbot" => array(
4720     "icon" => "robot",
4721     "title" => "Sansz",
4722     "rule" => array(
4723     "SanszBot" => ""
4724     ),
4725     "uri" => ""
4726     ),
4727     "saucereader" => array(
4728     "icon" => "saucereader",
4729     "title" => "Sauce Reader",
4730     "rule" => array(
4731     "Sauce[ ]?Reader[ /]([0-9.]{1,10})" => "\\1"
4732     ),
4733     "uri" => ""
4734     ),
4735     "sbider" => array(
4736     "icon" => "sbider",
4737     "title" => "SBIder",
4738     "rule" => array(
4739     "SBIder[/ ]([0-9.]{1,10})" => "\\1",
4740     "SBIder[/ ]SBIder.([0-9.]{1,10})" => "\\1"
4741     ),
4742     "uri" => ""
4743     ),
4744     "scirus" => array(
4745     "icon" => "robot",
4746     "title" => "Scirus",
4747     "rule" => array(
4748     "FAST-WebCrawler/[0-9a-z.]{1,10}/Scirus" => ""
4749     ),
4750     "uri" => ""
4751     ),
4752     "scoutjet" => array(
4753     "icon" => "scoutjet",
4754     "title" => "ScoutJet",
4755     "rule" => array(
4756     "ScoutJet" => ""
4757     ),
4758     "uri" => "http://www.scoutjet.com/"
4759     ),
4760 joku 261 "scrapy" => array(
4761     "icon" => "scrapy",
4762     "title" => "Scrapy",
4763     "rule" => array(
4764     "Scrapy[ /]([0-9.]{1,10})" => "\\1"
4765     ),
4766     "uri" => "http://scrapy.org"
4767     ),
4768 joku 63 "scrubby" => array(
4769     "icon" => "scrubby",
4770     "title" => "Scrubby",
4771     "rule" => array(
4772     "Scrubby[ /]([0-9.]{1,10})" => "\\1"
4773     ),
4774     "uri" => ""
4775     ),
4776     "sdm" => array(
4777     "icon" => "sdm",
4778     "title" => "SUN Download Manager",
4779     "rule" => array(
4780     "Sun Download Manager[/ ]([0-9.]{1,10})" => "\\1"
4781     ),
4782     "uri" => ""
4783     ),
4784     "sealinks" => array(
4785     "icon" => "robot",
4786     "title" => "Sea Links",
4787     "rule" => array(
4788     "SEA-Links( HTML-Scanner Pingoo\!)?[ /]([0-9.]{1,10})" => "\\2"
4789     ),
4790     "uri" => ""
4791     ),
4792     "search17" => array(
4793     "icon" => "robot",
4794     "title" => "Search 17",
4795     "rule" => array(
4796     "Search17Bot[ /]([0-9.]{1,10})" => "\\1"
4797     ),
4798     "uri" => "http://www.search17.com/bot.php"
4799     ),
4800     "search2" => array(
4801     "icon" => "search2",
4802     "title" => "Search2.net",
4803     "rule" => array(
4804     "^S2Bot[ /]([0-9.]{1,10})" => "\\1"
4805     ),
4806     "uri" => "http://search2.net/"
4807     ),
4808     "searchbot" => array(
4809     "icon" => "robot",
4810     "title" => "Searchbot",
4811     "rule" => array(
4812     "Searchbot[ /]([0-9.]{1,10})" => "\\1"
4813     ),
4814     "uri" => ""
4815     ),
4816     "searchch" => array(
4817     "icon" => "robot",
4818     "title" => "Search.ch",
4819     "rule" => array(
4820     "search\.ch[ /]?V?([0-9.]{1,10})" => "\\1"
4821     ),
4822     "uri" => ""
4823     ),
4824     "searchengineworld" => array(
4825     "icon" => "robot",
4826     "title" => "SearchEngineWorld",
4827     "rule" => array(
4828     "searchengineworld" => ""
4829     ),
4830     "uri" => "http://www.searchengineworld.com/"
4831     ),
4832     "searchhippo" => array(
4833     "icon" => "searchhippo",
4834     "title" => "Searchhippo",
4835     "rule" => array(
4836     "searchhippo" => ""
4837     ),
4838     "uri" => "http://www.searchhippo.com/"
4839     ),
4840     "searchthruus" => array(
4841     "icon" => "robot",
4842     "title" => "SearchThruUs",
4843     "rule" => array(
4844     "www\.unitek-systems\.co\.uk[ /]([0-9.]{1,10})" => "\\1"
4845     ),
4846     "uri" => ""
4847     ),
4848     "securecomputing" => array(
4849     "icon" => "robot",
4850     "title" => "Secure Computing",
4851     "rule" => array(
4852     "securecomputing" => ""
4853     ),
4854     "uri" => ""
4855     ),
4856     "seekport" => array(
4857     "icon" => "seekport",
4858     "title" => "Seekport",
4859     "rule" => array(
4860     "Seekbot[ /]([0-9.]{1,10})" => "\\1"
4861     ),
4862     "uri" => ""
4863     ),
4864     "semanticdiscovery" => array(
4865     "icon" => "robot",
4866     "title" => "Semantic Discovery",
4867     "rule" => array(
4868     "semanticdiscovery[ /]([0-9.]{1,10})" => "\\1"
4869     ),
4870     "uri" => ""
4871     ),
4872 matthys 319 "semrush" => array(
4873     "icon" => "semrush",
4874     "title" => "SEMrush",
4875     "rule" => array(
4876     "SemrushBot[ /]([0-9.]{1,10})" => "\\1"
4877     ),
4878     "uri" => "http://www.semrush.com/bot.html"
4879     ),
4880 joku 63 "sengine" => array(
4881     "icon" => "sengine",
4882     "title" => "Sengine",
4883     "rule" => array(
4884     "netEstate NE Crawler" => ""
4885     ),
4886     "uri" => "http://www.sengine.info/"
4887     ),
4888     "sensis" => array(
4889     "icon" => "sensis",
4890     "title" => "Sensis",
4891     "rule" => array(
4892     "^Sensis(.com.au)? Web Crawler" => ""
4893     ),
4894     "uri" => "http://sensis.com.au"
4895     ),
4896     "seokicks" => array(
4897     "icon" => "seokicks",
4898     "title" => "SEOkicks",
4899     "rule" => array(
4900     "SEOkicks-Robot" => ""
4901     ),
4902     "uri" => "http://www.seokicks.de/"
4903     ),
4904     "seoprofiler" => array(
4905     "icon" => "seoprofiler",
4906     "title" => "SEOprofiler",
4907     "rule" => array(
4908     "spbot[ /]([0-9.]{1,10})" => "\\1"
4909     ),
4910     "uri" => "http://www.seoprofiler.com/"
4911     ),
4912     "setooz" => array(
4913     "icon" => "setooz",
4914     "title" => "Setooz",
4915     "rule" => array(
4916     "OOZBOT[ /]([0-9.]{1,10})" => "\\1"
4917     ),
4918     "uri" => "http://www.setooz.com/oozbot.html"
4919     ),
4920     "seznam" => array(
4921     "icon" => "seznam",
4922     "title" => "Seznam",
4923     "rule" => array(
4924     "SeznamBot[ /]([0-9.]{1,10})" => "\\1",
4925     "Seznam" => ""
4926     ),
4927     "uri" => "http://www.seznam.cz"
4928     ),
4929     "sharpreader" => array(
4930     "icon" => "sharpreader",
4931     "title" => "SharpReader",
4932     "rule" => array(
4933     "SharpReader[ /]([0-9.]{1,10})" => "\\1"
4934     ),
4935     "uri" => ""
4936     ),
// Shelob crawler: matches user agents that start with "Shelob".
// No version is extracted (empty replacement).
"shelob" => array(
  "icon" => "shelob",
  // Title corrected: it previously read "Sherlock Spider", duplicating the
  // title of the separate "sherlockspider" entry that follows.
  "title" => "Shelob",
  "rule" => array(
    "^Shelob" => ""
  ),
  "uri" => "http://www.gmx.net"
),
4945     "sherlockspider" => array(
4946     "icon" => "robot",
4947     "title" => "Sherlock Spider",
4948     "rule" => array(
4949     "sherlock_spider" => ""
4950     ),
4951     "uri" => ""
4952     ),
4953     "shim" => array(
4954     "icon" => "robot",
4955     "title" => "Shim Crawler",
4956     "rule" => array(
4957     "shim[ \-]crawler" => ""
4958     ),
4959     "uri" => ""
4960     ),
4961     "shopwiki" => array(
4962     "icon" => "shopwiki",
4963     "title" => "ShopWiki",
4964     "rule" => array(
4965     "^ShopWiki[ /]([0-9.]{1,10})" => "\\1"
4966     ),
4967     "uri" => ""
4968     ),
4969     "shoula" => array(
4970     "icon" => "robot",
4971     "title" => "Shoula",
4972     "rule" => array(
4973     "^Shoula.com Crawler ([0-9.]{1,10})" => "\\1"
4974     ),
4975     "uri" => "http://www.shoula.com"
4976     ),
4977     "siege" => array(
4978     "icon" => "robot",
4979     "title" => "Siege",
4980     "rule" => array(
4981     "Siege[ /]([0-9.]{1,10})" => "\\1"
4982     ),
4983     "uri" => ""
4984     ),
4985     "siets" => array(
4986     "icon" => "robot",
4987     "title" => "Siets",
4988     "rule" => array(
4989     "SietsCrawler[ /]([0-9.]{1,10})" => "\\1"
4990     ),
4991     "uri" => ""
4992     ),
4993     "simpy" => array(
4994     "icon" => "simpy",
4995     "title" => "Simpy",
4996     "rule" => array(
4997     "^(argus|simpy)[ /]([0-9.]{1,10})" => "\\2",
4998     ),
4999     "uri" => ""
5000     ),
5001     "singingfish" => array(
5002     "icon" => "singingfish",
5003     "title" => "SingingFish",
5004     "rule" => array(
5005     "asterias[ /]([0-9.]{1,10})" => "\\1",
5006     "Asterias Crawler v([0-9.]{1,10})" => "\\1",
5007     "asterias" => ""
5008     ),
5009     "uri" => ""
5010     ),
5011     "sirketce" => array(
5012     "icon" => "robot",
5013     "title" => "Sirketce",
5014     "rule" => array(
5015     "Sirketcebot[ /v]+([0-9.]{1,10})" => "\\1"
5016     ),
5017     "uri" => "http://www.sirketce.com/bot.html"
5018     ),
5019     "sirobot" => array(
5020     "icon" => "robot",
5021     "title" => "SiroBot",
5022     "rule" => array(
5023     "sirobot" => ""
5024     ),
5025     "uri" => ""
5026     ),
5027     "sistrix" => array(
5028     "icon" => "sistrix",
5029     "title" => "SISTRIX",
5030     "rule" => array(
5031     "SISTRIX Crawler" => ""
5032     ),
5033     "uri" => "http://crawler.sistrix.net/"
5034     ),
5035     "sitebar" => array(
5036     "icon" => "sitebar",
5037     "title" => "SiteBar",
5038     "rule" => array(
5039     "SiteBar[ /]([0-9.]{1,10})" => "\\1"
5040     ),
5041     "uri" => ""
5042     ),
5043     "sitebot" => array(
5044     "icon" => "sitebot",
5045     "title" => "SiteBot",
5046     "rule" => array(
5047     "SiteBot[ /]([0-9.]{1,10})" => "\\1"
5048     ),
5049     "uri" => "http://www.sitebot.org/robot/"
5050     ),
5051 matthys 273 "siteexplorer" => array(
5052     "icon" => "siteexplorer",
5053     "title" => "SiteExplorer",
5054     "rule" => array(
5055     "SiteExplorer[ /]([0-9a-z.]{1,10})" => "\\1"
5056     ),
5057     "uri" => "http://siteexplorer.info/"
5058     ),
5059 joku 63 "sitesell" => array(
5060     "icon" => "sitesell",
5061     "title" => "SiteSell",
5062     "rule" => array(
5063     "SBIder[/ ]([0-9a-z.\-]{1,10})" => "\\1"
5064     ),
5065     "uri" => ""
5066     ),
5067     "sitespider" => array(
5068     "icon" => "robot",
5069     "title" => "SiteSpider",
5070     "rule" => array(
5071     "^SiteSpider" => ""
5072     ),
5073     "uri" => ""
5074     ),
5075     "sitesucker" => array(
5076     "icon" => "sitesucker",
5077     "title" => "SiteSucker",
5078     "rule" => array(
5079     "Sitesucker[ /]([0-9.]{1,10})" => "\\1"
5080     ),
5081     "uri" => "http://www.sitesucker.us/"
5082     ),
5083     "sitidi" => array(
5084     "icon" => "robot",
5085     "title" => "SitiDi",
5086     "rule" => array(
5087     "SitiDiBot[ /]([0-9.]{1,10})" => "\\1"
5088     ),
5089     "uri" => ""
5090     ),
5091 joku 329 "sixy" => array(
5092     "icon" => "robot",
5093     "title" => "Sixy.ch",
5094     "rule" => array(
5095     "sixy.ch[ /]([0-9a-z.]{1,10})" => "\\1"
5096     ),
5097     "uri" => "http://sixy.ch"
5098     ),
5099 joku 63 "skaffe" => array(
5100     "icon" => "robot",
5101     "title" => "Skaffe",
5102     "rule" => array(
5103     "Skampy[ /]([0-9.\-]{1,10})" => "\\1"
5104     ),
5105     "uri" => "http://www.skaffe.com"
5106     ),
5107     "skizzle" => array(
5108     "icon" => "skizzle",
5109     "title" => "Skizzle",
5110     "rule" => array(
5111     "SKIZZLE! Distributed Internet Spider[ /v]+([0-9a-z.\-]{1,10})" => "\\1"
5112     ),
5113     "uri" => "http://www.skizzle.com"
5114     ),
5115     "slider" => array(
5116     "icon" => "robot",
5117     "title" => "Slider",
5118     "rule" => array(
5119     "^Slider[ /]([0-9.]{1,10})" => "\\1"
5120     ),
5121     "uri" => ""
5122     ),
5123     "slugch" => array(
5124     "icon" => "robot",
5125 matthys 209 "title" => "Slugch",
5126 joku 63 "rule" => array(
5127     "^slug\.ch crawl ([0-9a-z.\-]{1,10})" => "\\1"
5128     ),
5129     "uri" => ""
5130     ),
5131     "smartware" => array(
5132     "icon" => "robot",
5133     "title" => "SmartWareSoft",
5134     "rule" => array(
5135     "^SWSBot-Images[ /]([0-9.]{1,10})" => "\\1"
5136     ),
5137     "uri" => "http://www.smartwaresoft.com/swsbot12.html"
5138     ),
5139     "snookit" => array(
5140     "icon" => "snookit",
5141     "title" => "Snookit",
5142     "rule" => array(
5143     "^snookit" => ""
5144     ),
5145     "uri" => "http://www.snookit.com/"
5146     ),
// Snoopy (PHP HTTP client class): matched either by a user agent starting
// with "Snoopy" or by the "sna-<version>" token.
"snoopy" => array(
  "icon" => "robot",
  "title" => "Snoopy",
  "rule" => array(
    // ".+?" is lazy on purpose: a greedy ".+" swallows all but the last
    // digit/dot, so e.g. "Snoopy v1.2.3" would yield "3" instead of "1.2.3".
    // The set of matching user agents is unchanged; only the capture differs.
    // NOTE(review): assumes the matcher uses PCRE (preg_*) - confirm.
    "^Snoopy.+?([0-9.]{1,10})" => "\\1",
    "sna-([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://snoopy.sourceforge.net/"
),
5156     "snyke" => array(
5157     "icon" => "robot",
5158     "title" => "Snyke",
5159     "rule" => array(
5160     "^SnykeBot[ /]([0-9.]{1,10})" => "\\1"
5161     ),
5162     "uri" => "http://www.snyke.com"
5163     ),
5164     "socialradar" => array(
5165     "icon" => "socialradar",
5166     "title" => "Social Radar",
5167     "rule" => array(
5168     "Socialradarbot[ /]([0-9.]{1,10})" => "\\1"
5169     ),
5170     "uri" => "http://infegy.com/"
5171     ),
5172     "soegning" => array(
5173     "icon" => "soegning",
5174 matthys 209 "title" => "Søgning",
5175 joku 63 "rule" => array(
5176     "soegning\.dk[/ ]spider[ /]([0-9.]{1,10})" => "\\1"
5177     ),
5178     "uri" => ""
5179     ),
5180     "soft411" => array(
5181     "icon" => "soft411",
5182     "title" => "Soft411",
5183     "rule" => array(
5184     "SOFT411 Directory" => ""
5185     ),
5186     "uri" => ""
5187     ),
5188     "sogou" => array(
5189     "icon" => "sogou",
5190     "title" => "Sogou",
5191     "rule" => array(
5192     "Sogou web spider[ /]([0-9.]{1,10})" => "\\1"
5193     ),
5194     "uri" => "http://www.sogou.com/docs/help/webmasters.htm#07"
5195     ),
5196     "sohu" => array(
5197     "icon" => "robot",
5198     "title" => "Sohu",
5199     "rule" => array(
5200     "sohu[ \-](agent|search)" => ""
5201     ),
5202     "uri" => ""
5203     ),
// Somewhere.com: matched by the literal address "Mozilla@somewhere.com"
// inside the user agent.
"somewhere" => array(
  "icon" => "robot",
  "title" => "Somewhere.com",
  "rule" => array(
    // The pattern has no capture group, so the former "\\1" back-reference
    // referred to nothing; use the empty replacement like the other
    // version-less rules in this table.
    "Mozilla\@somewhere\.com" => ""
  ),
  "uri" => "http://www.somewhere.com/"
),
5212     "sopheus" => array(
5213     "icon" => "robot",
5214     "title" => "Sopheus",
5215     "rule" => array(
5216     "Sopheus Project[ /]([0-9.]{1,10})" => "\\1"
5217     ),
5218     "uri" => "http://www.thenetplanet.com"
5219     ),
5220     "soso" => array(
5221     "icon" => "soso",
5222     "title" => "Soso",
5223     "rule" => array(
5224     "^Soso(image)?spider" => ""
5225     ),
5226     "uri" => "http://help.soso.com/soso-image-spider.htm"
5227     ),
5228     "souppot" => array(
5229     "icon" => "robot",
5230     "title" => "SoupPot",
5231     "rule" => array(
5232     "SoupPotBot" => ""
5233     ),
5234     "uri" => ""
5235     ),
5236     "specificmedia" => array(
5237     "icon" => "specificmedia",
5238     "title" => "Specific Media",
5239     "rule" => array(
5240     "^SMBot[ /]([0-9.]{1,10})" => "\\1"
5241     ),
5242     "uri" => ""
5243     ),
5244     "sphider" => array(
5245     "icon" => "sphider",
5246     "title" => "Sphider",
5247     "rule" => array(
5248     "Sphider" => ""
5249     ),
5250     "uri" => "http://www.sphider.eu"
5251     ),
5252     "spinn3r" => array(
5253     "icon" => "robot",
5254     "title" => "Spinn3r",
5255     "rule" => array(
5256     "Spinn3r[ /]([0-9.]{1,10})" => "\\1"
5257     ),
5258     "uri" => "http://spinn3r.com/robot"
5259     ),
5260     "sproose" => array(
5261     "icon" => "robot",
5262 matthys 209 "title" => "Sproose",
5263 joku 63 "rule" => array(
5264     "^sproose[ /]([0-9a-z.]{1,10})" => "\\1"
5265     ),
5266     "uri" => "http://www.sproose.com/bot.html"
5267     ),
5268     "spurlbot" => array(
5269     "icon" => "robot",
5270     "title" => "SpurlBot",
5271     "rule" => array(
5272     "SpurlBot[/ ]([0-9.]{1,10})" => "\\1"
5273     ),
5274     "uri" => ""
5275     ),
5276     "stardownloader" => array(
5277     "icon" => "stardownloader",
5278     "title" => "Star Downloader",
5279     "rule" => array(
5280     "^Star Downloader( Pro)?" => ""
5281     ),
5282     "uri" => ""
5283     ),
5284     "steeler" => array(
5285     "icon" => "robot",
5286     "title" => "Steeler",
5287     "rule" => array(
5288     "Steeler[ /]([0-9.]{1,10})" => "\\1"
5289     ),
5290     "uri" => ""
5291     ),
5292     "strategicboard" => array(
5293     "icon" => "strategicboard",
5294     "title" => "Strategic Board",
5295     "rule" => array(
5296     "Strategic Board Bot" => ""
5297     ),
5298     "uri" => "http://www.strategicboard.com"
5299     ),
5300     "suchbaer" => array(
5301     "icon" => "robot",
5302 matthys 209 "title" => "Suchbaer.de",
5303 joku 63 "rule" => array(
5304     "^suchbaer\.de" => ""
5305     ),
5306     "uri" => "http://www.suchbaer.de/"
5307     ),
5308     "suchbot" => array(
5309     "icon" => "robot",
5310 matthys 209 "title" => "Suchbot",
5311 joku 63 "rule" => array(
5312     "^suchbot" => ""
5313     ),
5314     "uri" => ""
5315     ),
5316     "suchende" => array(
5317     "icon" => "suchende",
5318 matthys 209 "title" => "Suchen.de",
5319 joku 63 "rule" => array(
5320     "^gonzo([0-9]{1,2}).*www.suchen.de" => "\\1",
5321     "^gonzo/([0-9.]{1,10})" => "\\1"
5322     ),
5323     "uri" => "http://www.suchen.de/"
5324     ),
5325     "suchknecht" => array(
5326     "icon" => "robot",
5327     "title" => "Suchknecht",
5328     "rule" => array(
5329     "^Suchknecht.at-Robot" => ""
5330     ),
5331     "uri" => "http://www.suchknecht.at/"
5332     ),
5333     "suchpad" => array(
5334     "icon" => "robot",
5335 matthys 209 "title" => "Suchpad",
5336 joku 63 "rule" => array(
5337     "^suchpadbot[ /]([0-9.]{1,10})" => "\\1"
5338     ),
5339     "uri" => "http://www.suchpad.de"
5340     ),
5341     "sunrise" => array(
5342     "icon" => "sunrise",
5343     "title" => "Sunrise",
5344     "rule" => array(
5345     "^Sunrise[ /]([0-9a-z.]{1,10})" => "\\1"
5346     ),
5347     "uri" => ""
5348     ),
5349     "superbot" => array(
5350     "icon" => "superbot",
5351     "title" => "SuperBot",
5352     "rule" => array(
5353     "SuperBot[ /]([0-9.]{1,10})" => "\\1"
5354     ),
5355     "uri" => ""
5356     ),
5357     "surfcontrol" => array(
5358     "icon" => "robot",
5359     "title" => "SurfControl",
5360     "rule" => array(
5361     "SurfControl" => "",
5362     "ScSpider[ /]([0-9.]{1,10})" => "\\1"
5363     ),
5364     "uri" => ""
5365     ),
5366     "surfnet" => array(
5367     "icon" => "robot",
5368     "title" => "SURFnet",
5369     "rule" => array(
5370     "AVSearch[ \-]([0-9.]{1,10})" => "\\1"
5371     ),
5372     "uri" => ""
5373     ),
5374     "surfsafely" => array(
5375     "icon" => "robot",
5376     "title" => "Surfsafely",
5377     "rule" => array(
5378     "Submission Spider at surfsafely.com" => ""
5379     ),
5380     "uri" => "http://www.surfsafely.com"
5381     ),
// Surphace crawler, previously called Sphere Scout; both names are matched
// and the icon still uses the old "spherescout" name.
"surphace" => array(
  "icon" => "spherescout",
  "title" => "Surphace",
  "rule" => array(
    // Previously called Sphere Scout. ".+?" is lazy on purpose: a greedy
    // ".+" runs to the end of the user agent and backtracks only until the
    // last digit/dot, so the capture would be a single trailing character
    // rather than the version that follows the name.
    // NOTE(review): assumes the matcher uses PCRE (preg_*) - confirm.
    "Sphere Scout.+?([0-9.]{1,10})" => "\\1",
    "Surphace.+v([0-9.]{1,10})" => "\\1"
  ),
  "uri" => "http://www.surphace.com"
),
5391     "surveybot" => array(
5392     "icon" => "surveybot",
5393     "title" => "Whois Survey",
5394     "rule" => array(
5395     "SurveyBot[ /]([0-9.]{1,10})" => "\\1"
5396     ),
5397     "uri" => ""
5398     ),
5399     "swoogle" => array(
5400     "icon" => "robot",
5401     "title" => "Swoogle",
5402     "rule" => array(
5403     "^Swooglebot[ /]([0-9.]{1,10})" => "\\1"
5404     ),
5405     "uri" => "http://swoogle.umbc.edu/swooglebot.htm"
5406     ),
5407     "swse" => array(
5408     "icon" => "robot",
5409     "title" => "SWSE",
5410     "rule" => array(
5411     "sw\.deri\.org" => ""
5412     ),
5413     "uri" => "http://sw.deri.org/2006/04/multicrawler/robots.html"
5414     ),
5415     "swish-e" => array(
5416     "icon" => "swish-e",
5417     "title" => "Swish-e",
5418     "rule" => array(
5419     "^swish-e" => ""
5420     ),
5421     "uri" => "http://swish-e.org/"
5422     ),
5423     "sygol" => array(
5424     "icon" => "sygol",
5425     "title" => "Sygol",
5426     "rule" => array(
5427     "www.sygol.(com|net)" => ""
5428     ),
5429     "uri" => "http://www.sygol.com"
5430     ),
5431     "syllabs" => array(
5432     "icon" => "syllabs",
5433     "title" => "Syllabs",
5434     "rule" => array(
5435     "Focal[-]([0-9.]{1,10})" => "\\1"
5436     ),
5437     "uri" => "http://www.syllabs.com/crawler.html"
5438     ),
5439     "synapse" => array(
5440     "icon" => "robot",
5441     "title" => "Synapse",
5442     "rule" => array(
5443     " Synapse\)" => ""
5444     ),
5445     "uri" => "http://ws.apache.org/synapse/"
5446     ),
5447     "sync2it" => array(
5448     "icon" => "robot",
5449 matthys 209 "title" => "Sync2it",
5450 joku 63 "rule" => array(
5451     "^\!Susie" => ""
5452     ),
5453     "uri" => "http://www.sync2it.com/bms/susie.php"
5454     ),
5455     "syncit" => array(
5456     "icon" => "robot",
5457 matthys 209 "title" => "Syncit",
5458 joku 63 "rule" => array(
5459     "^SyncIT[ /]([0-9.]{1,10})" => "\\1"
5460     ),
5461     "uri" => "http://www.syncit.com/"
5462     ),
5463     "syndic8" => array(
5464     "icon" => "syndic8",
5465     "title" => "Syndic8",
5466     "rule" => array(
5467     "Syndic8[ /]([0-9.]{1,10})" => "\\1"
5468     ),
5469     "uri" => "http://www.syndic8.com/"
5470     ),
5471     "syndicatie" => array(
5472     "icon" => "robot",
5473     "title" => "Syndicatie.nl",
5474     "rule" => array(
5475     "Syndicatie\.nl robot v ([0-9.]{1,10})" => "\\1",
5476     "Syndicatie\.nl robot;" => ""
5477     ),
5478     "uri" => ""
5479     ),
5480     "synomia" => array(
5481     "icon" => "robot",
5482     "title" => "Synomia",
5483     "rule" => array(
5484     "^SynoBot" => ""
5485     ),
5486     "uri" => ""
5487     ),
5488     "synoo" => array(
5489     "icon" => "robot",
5490     "title" => "SynooBot",
5491     "rule" => array(
5492     "SynooBot[ /]([0-9.]{1,10})" => "\\1",
5493     ),
5494     "uri" => ""
5495     ),
5496     "szukacz" => array(
5497     "icon" => "szukacz",
5498     "title" => "Szukacz",
5499     "rule" => array(
5500     "Szukacz[ /]([0-9.]{1,10})" => "\\1"
5501     ),
5502     "uri" => ""
5503     ),
5504     "tagoo" => array(
5505     "icon" => "tagoobot",
5506     "title" => "Tagoo",
5507     "rule" => array(
5508     "Tagoobot[ /]([0-9.]{1,10})" => "\\1"
5509     ),
5510     "uri" => "http://www.tagoo.ru"
5511     ),
5512     "tagword" => array(
5513     "icon" => "tagword",
5514     "title" => "Tagword",
5515     "rule" => array(
5516     "^Tagword" => ""
5517     ),
5518     "uri" => "http://tagword.com/dmoz_survey.php"
5519     ),
5520     "trailfire" => array(
5521     "icon" => "trailfire",
5522     "title" => "Trailfire",
5523     "rule" => array(
5524     "^Trailfire-bot[ /]([0-9.]{1,10})" => "\\1"
5525     ),
5526     "uri" => "http://trailfire.com"
5527     ),
5528     "tamu" => array(
5529     "icon" => "tamu",
5530     "title" => "Tamu Crawler",
5531     "rule" => array(
5532     "IRLbot[ /]([0-9.]{1,10})" => "\\1",
5533     "TAMU_CS_IRL_CRAWLER[ /]([0-9.]{1,10})" => "\\1"
5534     ),
5535     "uri" => "http://irl.cs.tamu.edu/crawler/"
5536     ),
5537     "taptubot" => array(
5538     "icon" => "taptubot",
5539     "title" => "Taptu",
5540     "rule" => array(
5541     "taptubot" => ""
5542     ),
5543     "uri" => "http://www.taptu.com/corp/taptubot"
5544     ),
5545     "targetseek" => array(
5546     "icon" => "robot",
5547     "title" => "TargetSeek",
5548     "rule" => array(
5549     "TargetSeek[ /]([0-9.]{1,10})" => "\\1"
5550     ),
5551     "uri" => "http://www.targetgroups.net/TargetSeek.html"
5552     ),
5553     "taw" => array(
5554     "icon" => "taw",
5555     "title" => "TAW",
5556     "rule" => array(
5557     "TAW[ /]([0-9.]{1,10})" => "\\1"
5558     ),
5559     "uri" => "http://www.tawdis.net"
5560     ),
5561     "tcd" => array(
5562     "icon" => "tcd",
5563     "title" => "Trinity College Dublin",
5564     "rule" => array(
5565     "^TCDBOT/Nutch-([0-9.]{1,10})" => "\\1"
5566     ),
5567     "uri" => "http://www.tcd.ie"
5568     ),
5569     "technorati" => array(
5570     "icon" => "technorati",
5571     "title" => "Technorati",
5572     "rule" => array(
5573     "Technoratibot[ /]([0-9.]{1,10})" => "\\1"
5574     ),
5575     "uri" => ""
5576     ),
5577     "teleport" => array(
5578     "icon" => "teleport",
5579     "title" => "Teleport",
5580     "rule" => array(
5581     "Teleport[ \-]?Pro" => ""
5582     ),
5583     "uri" => ""
5584     ),
5585     "terrar" => array(
5586     "icon" => "robot",
5587     "title" => "Terrar",
5588     "rule" => array(
5589     "^Fresh Search :: Terrar" => ""
5590     ),
5591     "uri" => ""
5592     ),
5593     "theophrastus" => array(
5594     "icon" => "robot",
5595     "title" => "Theophrastus",
5596     "rule" => array(
5597     "Theophrastus[ /]([0-9.]{1,10})" => "\\1"
5598     ),
5599     "uri" => "http://users.cs.cf.ac.uk/N.A.Smith/theophrastus.php"
5600     ),
5601     "thumbnailscz" => array(
5602     "icon" => "robot",
5603 matthys 209 "title" => "Thumbnails.cz",
5604 joku 63 "rule" => array(
5605     "^thumbnail\.cz robot[ /]([0-9.]{1,10})" => "\\1"
5606     ),
5607     "uri" => ""
5608     ),
// Thumbshots.de thumbnail robot: matches user agents starting with
// "thumbshots", with or without a version number.
"thumbshot" => array(
  "icon" => "robot",
  "title" => "Thumbshots",
  "rule" => array(
    // Group 1 is only the "Version: " / "v" prefix; the version number is
    // group 2, so the replacement must be "\\2" (it used to be "\\1", which
    // emitted the prefix text instead of the number).
    "^thumbshots.*(Version: |v)([0-9.]{2,10})e" => "\\2",
    "^thumbshots-de" => ""
  ),
  "uri" => "http://www.thumbshots.de"
),
5618     "thunderstone" => array(
5619     "icon" => "thunderstone",
5620     "title" => "Thunderstone",
5621     "rule" => array(
5622     "T-H-U-N-D-E-R-S-T-O-N-E" => "",
5623     "search.thunderstone.com" => ""
5624     ),
5625     "uri" => "http://search.thunderstone.com/"
5626     ),
5627     "timbobot" => array(
5628     "icon" => "robot",
5629 matthys 209 "title" => "TimboBot",
5630 joku 63 "rule" => array(
5631     "timboBot" => ""
5632     ),
5633     "uri" => ""
5634     ),
5635     "topsy" => array(
5636     "icon" => "topsy",
5637     "title" => "Topsy",
5638     "rule" => array(
5639     "Butterfly[ /]([0-9.]{1,10})" => "\\1"
5640     ),
5641     "uri" => "http://labs.topsy.com/butterfly.html"
5642     ),
5643     "trayce" => array(
5644     "icon" => "robot",
5645 matthys 209 "title" => "Trayce",
5646 joku 63 "rule" => array(
5647     "traycebot[ /]([0-9a-z.\-]{1,10})" => "\\1"
5648     ),
5649     "uri" => ""
5650     ),
5651     "tricus" => array(
5652     "icon" => "robot",
5653     "title" => "Tricus",
5654     "rule" => array(
5655     "B_l_i_t_z_B_O_T_@_t_r_i_c_u_s_\._c_o_m" => ""
5656     ),
5657     "uri" => ""
5658     ),
5659     "topicblogs" => array(
5660     "icon" => "robot",
5661     "title" => "Topicblogs",
5662     "rule" => array(
5663     "topicblogs[ /]([0-9.]{1,10})" => "\\1"
5664     ),
5665     "uri" => ""
5666     ),
5667     "touche" => array(
5668     "icon" => "touche",
5669 matthys 209 "title" => "Touché",
5670 joku 63 "rule" => array(
5671     "^Touche" => ""
5672     ),
5673     "uri" => "http://touche.com.ve"
5674     ),
// TUezilla: matched by "tuezilla.de" anywhere in the user agent.
// No version is extracted (empty replacement).
"tuezilla" => array(
  "icon" => "robot",
  // Title repaired: the stored text was a double-encoded UTF-8 "U umlaut"
  // (mojibake). Other titles in this file hold correct UTF-8 characters.
  "title" => "TÜzilla",
  "rule" => array(
    "tuezilla.de" => ""
  ),
  "uri" => "http://tuezilla.de/t_st-odp-entries-agent.html"
),
5683     "turnitin" => array(
5684     "icon" => "turnitin",
5685     "title" => "Turnitin",
5686     "rule" => array(
5687 matthys 408 "TurnitinBot[ /]([0-9.]{1,10})" => "\\1",
5688     "^Turnitin" => ""
5689 joku 63 ),
5690     "uri" => ""
5691     ),
5692     "tutorgig" => array(
5693     "icon" => "robot",
5694     "title" => "TutorGig",
5695     "rule" => array(
5696     "TutorGig(Bot)?[ /]([0-9.]{1,10})" => "\\2"
5697     ),
5698     "uri" => ""
5699     ),
5700     "twiceler" => array(
5701     "icon" => "cuill",
5702 matthys 209 "title" => "Cuill",
5703 joku 63 "rule" => array(
5704     "Twiceler[ /-]([0-9.]{1,10})" => "\\1",
5705     "Twiceler" => ""
5706     ),
5707     "uri" => "http://www.cuill.com/twiceler/robot.html"
5708     ),
5709     "twingly" => array(
5710     "icon" => "twingly",
5711     "title" => "Twingly",
5712     "rule" => array(
5713     "Twingly Recon" => ""
5714     ),
5715     "uri" => "http://www.twingly.com/"
5716     ),
5717 matthys 320 "twitter" => array(
5718     "icon" => "twitter",
5719     "title" => "Twitter",
5720     "rule" => array(
5721     "Twitterbot[ /-]([0-9.]{1,10})" => "\\1"
5722     ),
5723     "uri" => "https://dev.twitter.com/cards/getting-started#crawling"
5724     ),
5725 joku 63 "typepad" => array(
5726     "icon" => "typepad",
5727     "title" => "TypePad",
5728     "rule" => array(
5729     "TypePad/([0-9a-z.]{1,10})" => "\\1"
5730     ),
5731     "uri" => ""
5732     ),
5733     "udmsearch" => array(
5734     "icon" => "robot",
5735     "title" => "UdmSearch",
5736     "rule" => array(
5737     "UdmSearch[/ ]([0-9.]{1,10})" => "\\1"
5738     ),
5739     "uri" => ""
5740     ),
5741     "ukwizz" => array(
5742     "icon" => "ukwizz",
5743     "title" => "UKWizz",
5744     "rule" => array(
5745     "^Mackster.*ukwizz" => ""
5746     ),
5747     "uri" => "http://www.ukwizz.com"
5748     ),
5749     "ultraseek" => array(
5750     "icon" => "robot",
5751     "title" => "Ultraseek",
5752     "rule" => array(
5753     "Ultraseek" => ""
5754     ),
5755     "uri" => ""
5756     ),
5757     "ultraspider" => array(
5758     "icon" => "robot",
5759     "title" => "UltraSpider",
5760     "rule" => array(
5761     "UltraSpider3000[/ ]([0-9.]{1,10})" => "\\1"
5762     ),
5763     "uri" => "http://www.search.ch"
5764     ),
5765     "umai" => array(
5766     "icon" => "robot",
5767 matthys 209 "title" => "Umai",
5768 joku 63 "rule" => array(
5769     "umai[/ ]([0-9.]{1,10})" => "\\1"
5770     ),
5771     "uri" => ""
5772     ),
5773     "unchaos" => array(
5774     "icon" => "robot",
5775     "title" => "Unchaos",
5776     "rule" => array(
5777     "unchaos_crawler[_ /]([0-9.]{1,10})" => "\\1",
5778     "unchaos" => ""
5779     ),
5780     "uri" => ""
5781     ),
5782     "unido" => array( // robot signature entry; "rule" maps a user-agent regex to a version backreference ("" = none captured)
5783     "icon" => "robot",
5784 matthys 209 "title" => "UNIdo",
5785 joku 63 "rule" => array(
5786     "^unido-bot" => "" // pattern has no capture group, so "\\1" referenced a group that never exists
5787     ),
5788     "uri" => "http://mobicom.cs.uni-dortmund.de/bot.html"
5789     ),
5790     "updated" => array(
5791     "icon" => "robot",
5792     "title" => "Updated",
5793     "rule" => array(
5794     "updated[ /]([0-9a-z.]{1,10})" => "\\1"
5795     ),
5796     "uri" => ""
5797     ),
5798     "uptimebot" => array(
5799     "icon" => "robot",
5800     "title" => "UptimeBot",
5801     "rule" => array(
5802     "^UptimeBot" => ""
5803     ),
5804     "uri" => "http://www.uptimebot.com/"
5805     ),
5806     "urifetch" => array(
5807     "icon" => "robot",
5808     "title" => "URI::Fetch",
5809     "rule" => array(
5810     "^URI::Fetch[ /]([0-9.]{1,10})" => "\\1"
5811     ),
5812     "uri" => ""
5813     ),
5814     "urlbase" => array(
5815     "icon" => "robot",
5816     "title" => "URLBase",
5817     "rule" => array(
5818     "URLBase[ /]([0-9.]{1,10})" => "\\1"
5819     ),
5820     "uri" => ""
5821     ),
5822     "urlblaze" => array(
5823     "icon" => "robot",
5824     "title" => "URLBlaze",
5825     "rule" => array(
5826     "^URLBlaze" => ""
5827     ),
5828     "uri" => ""
5829     ),
5830     "urlcontr" => array(
5831     "icon" => "robot",
5832     "title" => "MS URL Control",
5833     "rule" => array(
5834     "Microsoft URL[ \-]?Control" => ""
5835     ),
5836     "uri" => ""
5837     ),
5838     "urlgetfile" => array(
5839     "icon" => "robot",
5840     "title" => "URLGetFile",
5841     "rule" => array(
5842     "^URLGetFile" => ""
5843     ),
5844     "uri" => ""
5845     ),
5846     "urlscope" => array(
5847     "icon" => "robot",
5848     "title" => "UrlScope",
5849     "rule" => array(
5850     "UrlScope" => ""
5851     ),
5852     "uri" => ""
5853     ),
5854     "urltrends" => array(
5855     "icon" => "urltrends",
5856 matthys 209 "title" => "UrlTrends",
5857 joku 63 "rule" => array(
5858     "Snappy/([0-9.]{1,10})" => "\\1",
5859     ),
5860     "uri" => ""
5861     ),
5862     "usww" => array(
5863     "icon" => "usww",
5864 matthys 209 "title" => "USWW",
5865 joku 63 "rule" => array(
5866     "usww\.com" => "",
5867     "Mozilla/5\.0 URL-Spider" => ""
5868     ),
5869     "uri" => "http://www.usww.com/"
5870     ),
5871     "usyd" => array(
5872     "icon" => "robot",
5873     "title" => "USyd-NLP-Spider",
5874     "rule" => array(
5875     "^USyd-NLP-Spider" => ""
5876     ),
5877     "uri" => "http://www.it.usyd.edu.au/~vinci/bot.html"
5878     ),
5879     "vagabondo" => array(
5880     "icon" => "wiseguys",
5881     "title" => "WiseGuys",
5882     "rule" => array(
5883     "Vagabondo[ /]([0-9.]{1,10})" => "\\1",
5884     "Vagabondo-WAP[ /]([0-9.]{1,10})" => "\\1"
5885     ),
5886     "uri" => ""
5887     ),
5888     "unicorn" => array(
5889     "icon" => "w3c",
5890     "title" => "W3C Unicorn",
5891     "rule" => array(
5892     "Unicorn[ /]([0-9.]{1,10})" => "\\1",
5893     ),
5894     "uri" => "http://validator.w3.org/unicorn/"
5895     ),
5896     "validator" => array(
5897     "icon" => "w3c",
5898     "title" => "W3C Validator",
5899     "rule" => array(
5900     "W3C_Validator[ /]([0-9.]{1,10})" => "\\1"
5901     ),
5902     "uri" => "http://validator.w3.org/"
5903     ),
5904     "validator.nu" => array( // robot signature entry; "rule" maps a user-agent regex to a version backreference ("" = none captured)
5905     "icon" => "validatornu",
5906     "title" => "Validator.nu",
5907     "rule" => array(
5908     "^Validator.nu[ /]([0-9.]{1,10})" => "\\1",
5909     "^Validator.nu/LV" => "" // fallback for the "/LV" form: nothing is captured, so no backreference is valid here
5910     ),
5911     "uri" => "http://validator.nu/"
5912     ),
5913     "verity" => array(
5914     "icon" => "robot",
5915     "title" => "Verity",
5916     "rule" => array(
5917     "^vspider[ /]([0-9.]{1,10})" => "\\1",
5918     "^vspider" => ""
5919     ),
5920     "uri" => "http://www.verity.com/"
5921     ),
5922     "versionsproject" => array(
5923     "icon" => "robot",
5924     "title" => "Versions-project",
5925     "rule" => array(
5926     "InfoFly[ /]([0-9.]{1,10})" => "\\1"
5927     ),
5928     "uri" => "http://www.versions-project.org/"
5929     ),
5930     "verticalmatch" => array(
5931     "icon" => "robot",
5932     "title" => "VerticalMatch",
5933     "rule" => array(
5934     "^VMBot[ /]([0-9.]{1,10})" => "\\1"
5935     ),
5936     "uri" => "http://www.VerticalMatch.com/"
5937     ),
5938     "verzamelgids" => array(
5939     "icon" => "robot",
5940     "title" => "Verzamelgids",
5941     "rule" => array(
5942     "Verzamelgids[ /]([0-9.]{1,10})" => "\\1"
5943     ),
5944     "uri" => "http://www.verzamelgids.nl/"
5945     ),
5946     "vestris" => array(
5947     "icon" => "vestris",
5948     "title" => "Vestris",
5949     "rule" => array(
5950     "AlkalineBOT[ /]([0-9.]{1,10})" => "\\1"
5951     ),
5952     "uri" => "http://alkaline.vestris.com/"
5953     ),
5954     "vindex" => array(
5955     "icon" => "vindex",
5956     "title" => "Vindex",
5957     "rule" => array(
5958     "Vindex[ /]([0-9.]{1,10})" => "\\1"
5959     ),
5960     "uri" => ""
5961     ),
5962     "visvo" => array(
5963     "icon" => "robot",
5964     "title" => "Visvo",
5965     "rule" => array(
5966     "VisBot[ /]([0-9.]{1,10})" => "\\1"
5967     ),
5968     "uri" => "http://www.visvo.com"
5969     ),
5970     "voila" => array(
5971     "icon" => "voila",
5972     "title" => "Voila",
5973     "rule" => array(
5974     "VoilaBot[ /]?[a-z ]*([0-9.]{1,10})" => "\\1",
5975     "VoilaBot;[ /]([0-9.]{1,10})" => "\\1"
5976     ),
5977     "uri" => ""
5978     ),
5979     "vonna" => array(
5980     "icon" => "robot",
5981     "title" => "Vonna",
5982     "rule" => array(
5983     "Vonna.com b o t" => ""
5984     ),
5985     "uri" => ""
5986     ),
5987     "vortex" => array(
5988     "icon" => "robot",
5989     "title" => "Vortex",
5990     "rule" => array(
5991     "Vortex[ /]([0-9.]{1,10})" => "\\1"
5992     ),
5993     "uri" => "http://marty.anstey.ca/robots/vortex/"
5994     ),
5995     "w3sitesearch" => array(
5996     "icon" => "w3sitesearch",
5997     "title" => "W3SiteSearch",
5998     "rule" => array(
5999     "^W3SiteSearch Crawler[\_v]*([0-9.]{1,10})" => "\\1"
6000     ),
6001     "uri" => "http://www.w3sitesearch.de"
6002     ),
6003     "wagger" => array( // robot signature entry; array key left unchanged in case other code or stored data refers to it
6004     "icon" => "robot",
6005     "title" => "Waggr", // display name aligned with the pattern and URI below (was "Wagger")
6006     "rule" => array(
6007     "^Waggr" => ""
6008     ),
6009     "uri" => "http://www.waggr.com/"
6010     ),
6011     "wanadoo" => array(
6012     "icon" => "robot",
6013     "title" => "Wanadoo",
6014     "rule" => array(
6015     "^SurferF3[ /]([0-9./]{1,10})" => "\\1"
6016     ),
6017     "uri" => "http://www.wanadoo.fr/"
6018     ),
6019     "wapalizer" => array(
6020     "icon" => "robot",
6021     "title" => "Wapalizer",
6022     "rule" => array(
6023     "wapalizer[ /]([0-9.]{1,10})" => "\\1"
6024     ),
6025     "uri" => "http://www.wapdrive.com/"
6026     ),
6027     "watson" => array(
6028     "icon" => "addy",
6029     "title" => "Dr.Watson",
6030     "rule" => array(
6031     "Watson[ /]([0-9.]{1,10})" => "\\1",
6032     "watson\.addy\.com" => ""
6033     ),
6034     "uri" => ""
6035     ),
6036     "wavefire" => array(
6037     "icon" => "robot",
6038     "title" => "Wavefire",
6039     "rule" => array(
6040     "^Wavefire[ /]([0-9.]{1,10})" => "\\1"
6041     ),
6042     "uri" => ""
6043     ),
6044     "waypath" => array(
6045     "icon" => "waypath",
6046     "title" => "Waypath",
6047     "rule" => array(
6048     "Waypath[ \-]?Scout" => "",
6049     "Waypath (development )?crawler" => ""
6050     ),
6051     "uri" => ""
6052     ),
6053     "wauuu" => array( // robot signature entry; "rule" maps a user-agent regex to a version backreference ("" = none captured)
6054     "icon" => "wauuu",
6055     "title" => "Wauuu",
6056     "rule" => array(
6057     "Wauuu[/ ]([0-9.]{1,10})" => "\\1" // the version is the only capture group; "\\2" pointed at a nonexistent one
6058     ),
6059     "uri" => "http://www.wauuu.com"
6060     ),
6061     "wdg" => array(
6062     "icon" => "wdg",
6063     "title" => "WDG Validator",
6064     "rule" => array(
6065     "^WDG_(Site)?Validator[/ ]([0-9.]{1,10})" => "\\2"
6066     ),
6067     "uri" => "http://www.htmlhelp.com/tools/validator/"
6068     ),
6069     "webagogo" => array(
6070     "icon" => "webagogo",
6071     "title" => "Webagogo",
6072     "rule" => array(
6073     "^Webagogo" => ""
6074     ),
6075     "uri" => "http://www.webagogo.be/"
6076     ),
6077     "webalta" => array(
6078     "icon" => "webalta",
6079     "title" => "WebAlta",
6080     "rule" => array(
6081     "^WebAlta( Crawler)?[/ ]([0-9.]{1,10})" => "\\2"
6082     ),
6083     "uri" => "http://www.webalta.net/ru/about_webmaster.html"
6084     ),
6085     "webdigity" => array(
6086     "icon" => "robot",
6087     "title" => "Webdigity Whois Service",
6088     "rule" => array(
6089     "^webdigity whois service" => ""
6090     ),
6091     "uri" => "http://www.webdigity.com/ws"
6092     ),
6093     "webelixir" => array(
6094     "icon" => "webelixir",
6095     "title" => "Webelixir",
6096     "rule" => array(
6097     "^webelixir" => ""
6098     ),
6099     "uri" => "http://www.webelixir.net/"
6100     ),
6101     "webbotru" => array(
6102     "icon" => "robot",
6103     "title" => "Webbot.ru",
6104     "rule" => array(
6105     " Webbot[/ ]([0-9.]{1,10})" => "\\1"
6106     ),
6107     "uri" => "http://www.webbot.ru/bot.html"
6108     ),
6109     "webcapture" => array(
6110     "icon" => "robot",
6111     "title" => "WebCapture",
6112     "rule" => array(
6113     "WebCapture[/ ]([0-9.]{1,10})" => "\\1"
6114     ),
6115     "uri" => ""
6116     ),
6117     "webcollage" => array(
6118     "icon" => "robot",
6119     "title" => "Webcollage",
6120     "rule" => array(
6121     "webcollage" => ""
6122     ),
6123     "uri" => ""
6124     ),
6125     "webcopier" => array(
6126     "icon" => "webcopier",
6127     "title" => "WebCopier",
6128     "rule" => array(
6129     "WebCopier[/ ]v?([0-9.]{1,10})" => "\\1"
6130     ),
6131     "uri" => ""
6132     ),
6133     "webcorp" => array(
6134     "icon" => "webcorp",
6135     "title" => "WebCorp",
6136     "rule" => array(
6137     "WebCorp[/ ]+([0-9.]{1,10})" => "\\1"
6138     ),
6139     "uri" => "http://www.webcorp.org.uk/"
6140     ),
6141     "webcrawl" => array(
6142     "icon" => "robot",
6143     "title" => "WebCrawl",
6144     "rule" => array(
6145     "webcrawl\.net" => ""
6146     ),
6147     "uri" => ""
6148     ),
6149     "webdownloader" => array(
6150     "icon" => "robot",
6151     "title" => "Web Downloader",
6152     "rule" => array(
6153     "Web Downloader[/ ]([0-9.]{1,10})" => "\\1"
6154     ),
6155     "uri" => ""
6156     ),
6157     "webfetch" => array(
6158     "icon" => "robot",
6159 matthys 209 "title" => "WebFetch",
6160 joku 63 "rule" => array(
6161     "^webfetch[/ ]([0-9.]{1,10})" => "\\1"
6162     ),
6163     "uri" => ""
6164     ),
6165     "webfind" => array(
6166     "icon" => "robot",
6167 matthys 209 "title" => "WebFind",
6168 joku 63 "rule" => array(
6169     "^WebFindBot" => ""
6170     ),
6171     "uri" => "http://www.web-find.com"
6172     ),
6173     "webglimpse" => array(
6174     "icon" => "robot",
6175     "title" => "Webglimpse",
6176     "rule" => array(
6177     "^Webglimpse[/ ]([0-9.]{1,10})" => "\\1"
6178     ),
6179     "uri" => "http://webglimpse.net"
6180     ),
6181     "webgobbler" => array(
6182     "icon" => "robot",
6183     "title" => "webGobbler",
6184     "rule" => array(
6185     "^webGobbler[/ ]([0-9.]{1,10})" => "\\1"
6186     ),
6187     "uri" => ""
6188     ),
6189     "webimages" => array(
6190     "icon" => "webimages",
6191     "title" => "WebImages",
6192     "rule" => array(
6193     "^WebImages[/ ]([0-9.]{1,10})" => "\\1"
6194     ),
6195     "uri" => "http://herbert.groot.jebbink.nl/"
6196     ),
6197     "weblight" => array(
6198     "icon" => "robot",
6199     "title" => "WebLight",
6200     "rule" => array(
6201     "^WebLight[/ ]([0-9.]{1,10})" => "\\1"
6202     ),
6203     "uri" => "http://www.illumit.com/Products/weblight/"
6204     ),
6205     "weblinks" => array(
6206     "icon" => "robot",
6207     "title" => "WebLink's",
6208     "rule" => array(
6209     "^Weblink.s checker" => ""
6210     ),
6211     "uri" => ""
6212     ),
6213     "webmeasurement" => array(
6214     "icon" => "robot",
6215     "title" => "Webmeasurement",
6216     "rule" => array(
6217     "^webmeasurement-bot" => ""
6218     ),
6219     "uri" => "http://rvs.informatik.uni-leipzig.de"
6220     ),
6221     "webminer" => array(
6222     "icon" => "robot",
6223     "title" => "WebMiner",
6224     "rule" => array(
6225     "^WebMiner[/ ]([0-9.]{1,10})" => "\\1"
6226     ),
6227     "uri" => ""
6228     ),
6229     "webmin" => array(
6230     "icon" => "webmin",
6231     "title" => "Webmin",
6232     "rule" => array(
6233     "^webmin" => ""
6234     ),
6235     "uri" => ""
6236     ),
6237     "webmon" => array(
6238     "icon" => "webmon",
6239     "title" => "Webmon",
6240     "rule" => array(
6241     "WebMon[ /]([0-9.]{1,10})" => "\\1"
6242     ),
6243     "uri" => "http://www.markwell.btinternet.co.uk/webmon/"
6244     ),
6245     "webox" => array( // robot signature entry; "rule" maps a user-agent regex to a version backreference ("" = none captured)
6246     "icon" => "robot",
6247     "title" => "WeBoX", // stray leading space removed from the display name
6248     "rule" => array(
6249     "WeBoX[/ ]([0-9.]{1,10})" => "\\1"
6250     ),
6251     "uri" => ""
6252     ),
6253     "webpatrol" => array(
6254     "icon" => "webpatrol",
6255     "title" => "WebPatrol",
6256     "rule" => array(
6257     "^WebPatrol[ /]([0-9.]{1,10})" => "\\1"
6258     ),
6259     "uri" => "http://soft.macfeeling.com/WebPatrol.html"
6260     ),
6261     "webpix" => array(
6262     "icon" => "webpix",
6263     "title" => "WebPix",
6264     "rule" => array(
6265     "WebPix[/ ]([0-9.]{1,10})" => "\\1"
6266     ),
6267     "uri" => ""
6268     ),
6269     "webrace" => array(
6270     "icon" => "robot",
6271     "title" => "WebRACE",
6272     "rule" => array(
6273     "^WebRACE[/ ]([0-9.]{1,10})" => "\\1"
6274     ),
6275     "uri" => ""
6276     ),
6277     "webreaper" => array(
6278     "icon" => "webreaper",
6279     "title" => "WebReaper",
6280     "rule" => array(
6281     "^WebReaper " => ""
6282     ),
6283     "uri" => "http://www.webreaper.net/"
6284     ),
6285     "webresult" => array(
6286     "icon" => "robot",
6287     "title" => "Webresult",
6288     "rule" => array(
6289     "Der webresult\.de Robot" => ""
6290     ),
6291     "uri" => ""
6292     ),
6293     "webring" => array(
6294     "icon" => "robot",
6295     "title" => "Webring Checker",
6296     "rule" => array(
6297     "WebRingChecker[/ ]([0-9.]{1,10})" => "\\1"
6298     ),
6299     "uri" => ""
6300     ),
6301     "webripper" => array(
6302     "icon" => "webripper",
6303     "title" => "WebRipper",
6304     "rule" => array(
6305     "^WebRipper" => ""
6306     ),
6307     "uri" => "http://calluna-software.com"
6308     ),
6309     "webscaled" => array(
6310     "icon" => "webscaled",
6311     "title" => "Webscaled",
6312     "rule" => array(
6313     "Swarm" => ""
6314     ),
6315     "uri" => "http://webscaled.com/"
6316     ),
6317     "websearchau" => array(
6318     "icon" => "websearchau",
6319     "title" => "WebSearch.COM.AU",
6320     "rule" => array(
6321     "WebSearch.COM.AU[/ ]+([0-9.]{1,10})" => "\\1"
6322     ),
6323     "uri" => "http://WebSearch.com.au/"
6324     ),
6325     "websearchbench" => array(
6326     "icon" => "robot",
6327     "title" => "WebSearchBench",
6328     "rule" => array(
6329     "WebSearchBench WebCrawler[v/ ]+([0-9.]{1,10})" => "\\1"
6330     ),
6331     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6332     ),
6333     "websense" => array(
6334     "icon" => "websense",
6335     "title" => "Websense",
6336     "rule" => array(
6337     "(Sqworm|websense|Konqueror/3\.(0|1)(-rc[1-6])?; i686 Linux; 2002[0-9]{4})" => ""
6338     ),
6339     "uri" => ""
6340     ),
6341     "websiteshadow" => array(
6342     "icon" => "websiteshadow",
6343     "title" => "Websiteshadow",
6344     "rule" => array(
6345     "Websiteshadowbot[ /]([0-9.]{1,10})" => "\\1"
6346     ),
6347     "uri" => "http://websiteshadow.com"
6348     ),
6349     "websiteworth" => array(
6350     "icon" => "robot",
6351     "title" => "WebsiteWorth",
6352     "rule" => array(
6353     "WebsiteWorth[v/ ]+([0-9.]{1,10})" => "\\1"
6354     ),
6355     "uri" => "http://directory.sootle.com/website-worth/tata.php"
6356     ),
6357     "websquash" => array(
6358     "icon" => "websquash",
6359     "title" => "Websquash",
6360     "rule" => array(
6361     "webs(quash\.com|ite[ \-]?Monitor)" => ""
6362     ),
6363     "uri" => ""
6364     ),
6365     "webstripper" => array(
6366     "icon" => "robot",
6367     "title" => "WebStripper",
6368     "rule" => array(
6369     "WebStripper[ /]([0-9.]{1,10})" => "\\1"
6370     ),
6371     "uri" => ""
6372     ),
6373     "webzip" => array(
6374     "icon" => "webzip",
6375     "title" => "WebZIP",
6376     "rule" => array(
6377     "Web[ \-]?ZIP[ /]([0-9.]{1,10})" => "\\1"
6378     ),
6379     "uri" => ""
6380     ),
6381     "wep" => array(
6382     "icon" => "robot",
6383     "title" => "WEP Search",
6384     "rule" => array(
6385     "WEP Search[ /]([0-9.]{1,10})" => "\\1"
6386     ),
6387     "uri" => ""
6388     ),
6389     "westwind" => array(
6390     "icon" => "robot",
6391     "title" => "West Wind Internet Protocols",
6392     "rule" => array(
6393     "^West Wind Internet Protocols[ /]([0-9.]{1,10})" => "\\1"
6394     ),
6395     "uri" => "http://www.west-wind.com/wwipstuff.asp"
6396     ),
6397     "wget" => array(
6398     "icon" => "wget",
6399     "title" => "Wget",
6400     "rule" => array(
6401 joku 308 "Wget[ /]([0-9.]{1,10})" => "\\1",
6402     "Wget" => ""
6403 joku 63 ),
6404     "uri" => ""
6405     ),
6406     "whizbang" => array(
6407     "icon" => "whizbang",
6408     "title" => "WhizBang",
6409     "rule" => array(
6410     "WhizBang" => ""
6411     ),
6412     "uri" => "http://www.whizbang.com/crawler/"
6413     ),
6414     "whois" => array(
6415     "icon" => "whois",
6416     "title" => "Who.is",
6417     "rule" => array(
6418     "Who.is Bot" => ""
6419     ),
6420     "uri" => "http://www.who.is/"
6421     ),
6422     "wikiwix" => array(
6423     "icon" => "wikiwix",
6424     "title" => "Wikiwix",
6425     "rule" => array(
6426     "wikiwix-bot-([0-9.]{1,10})" => "\\1"
6427     ),
6428     "uri" => "http://www.wikiwix.com/"
6429     ),
6430     "wingflyer" => array(
6431     "icon" => "robot",
6432     "title" => "WingFlyer",
6433     "rule" => array(
6434     "^WebFetch" => ""
6435     ),
6436     "uri" => "http://www.wingflyer.com/"
6437     ),
6438     "wininet" => array(
6439     "icon" => "robot",
6440     "title" => "WinInet",
6441     "rule" => array(
6442     "TeamSoft WinInet Component" => ""
6443     ),
6444     "uri" => "http://www.winsoft.sk/wininet.htm"
6445     ),
6446     "winhttp" => array(
6447     "icon" => "robot",
6448     "title" => "WinHTTP",
6449     "rule" => array(
6450     "WinHttp\.WinHttpRequest\.([0-9.]{1,10})" => "\\1"
6451     ),
6452     "uri" => ""
6453     ),
6454     "wire" => array(
6455     "icon" => "robot",
6456     "title" => "WIRE",
6457     "rule" => array(
6458     "^WIRE[ /]([0-9.]{1,10})" => "\\1"
6459     ),
6460     "uri" => ""
6461     ),
6462     "wmp" => array(
6463     "icon" => "robot",
6464     "title" => "WMP",
6465     "rule" => array(
6466     "^WMP" => ""
6467     ),
6468     "uri" => ""
6469     ),
6470     "woozweb" => array(
6471     "icon" => "woozweb",
6472     "title" => "Woozweb",
6473     "rule" => array(
6474     "woozweb" => ""
6475     ),
6476     "uri" => "http://www.woozweb.com/"
6477     ),
6478     "wordchamp" => array(
6479     "icon" => "robot",
6480     "title" => "WordChamp",
6481     "rule" => array(
6482     "^WordChampBot" => ""
6483     ),
6484     "uri" => "http://www.wordchamp.com/"
6485     ),
6486     "wordpress" => array(
6487     "icon" => "wordpress",
6488     "title" => "WordPress",
6489     "rule" => array(
6490     "WordPress[ /]([0-9.]{1,10})" => "\\1"
6491     ),
6492     "uri" => ""
6493     ),
6494     "worio" => array(
6495     "icon" => "worio",
6496     "title" => "Worio",
6497     "rule" => array(
6498     "woriobot" => ""
6499     ),
6500     "uri" => "http://worio.com/"
6501     ),
6502     "worldlight" => array(
6503     "icon" => "worldlight",
6504     "title" => "WorldLight",
6505     "rule" => array(
6506     "^WorldLight" => ""
6507     ),
6508     "uri" => ""
6509     ),
6510     "worqmada" => array(
6511     "icon" => "robot",
6512     "title" => "WorQmada",
6513     "rule" => array(
6514     "WorQmada[ /]([0-9.]{1,10})" => "\\1"
6515     ),
6516     "uri" => ""
6517     ),
6518     "wotbox" => array(
6519     "icon" => "wotbox",
6520     "title" => "Wotbox",
6521     "rule" => array(
6522     "Wotbox[ /]?[a-z]*([0-9.]{1,10})" => "\\1"
6523     ),
6524     "uri" => ""
6525     ),
6526     "wp" => array(
6527     "icon" => "wp",
6528     "title" => "Wirtualna Polska",
6529     "rule" => array(
6530     "NetSprint[ /\-]{1,4}([0-9.]{1,10})" => "\\1"
6531     ),
6532     "uri" => "http://wp.pl"
6533     ),
6534     "wsb" => array(
6535     "icon" => "robot",
6536     "title" => "WebSearchBench",
6537     "rule" => array(
6538     "WSB WebCrawler V([0-9.]{1,10})" => "\\1",
6539     "WSB " => ""
6540     ),
6541     "uri" => "http://websearchbench.cs.uni-dortmund.de/"
6542     ),
6543     "wume" => array(
6544     "icon" => "robot",
6545     "title" => "WUME Lab's",
6546     "rule" => array(
6547     "^wume_crawler[ /]([0-9.]{1,10})" => "\\1",
6548     ),
6549     "uri" => "http://wume.cse.lehigh.edu/~xiq204/crawler/"
6550     ),
6551     "wusage" => array(
6552     "icon" => "wusage",
6553     "title" => "Wusage",
6554     "rule" => array(
6555     "Wusage[ /]([0-9.]{1,10})" => "\\1",
6556     ),
6557     "uri" => "http://www.boutell.com/wusage/"
6558     ),
6559     "wwgrapevine" => array(
6560     "icon" => "wwgrapevine",
6561     "title" => "WWgrapevine",
6562     "rule" => array(
6563     "wwgrapevine[ /]([0-9.]{1,10})" => "\\1"
6564     ),
6565     "uri" => ""
6566     ),
6567     "wws" => array(
6568     "icon" => "robot",
6569     "title" => "WWSBOT",
6570     "rule" => array(
6571     "WWSBOT[ /]([0-9.]{1,10})" => "\\1",
6572     ),
6573     "uri" => "http://www.analyzer.nu"
6574     ),
6575     "www4mail" => array(
6576     "icon" => "robot",
6577 matthys 209 "title" => "WWW4mail",
6578 joku 63 "rule" => array(
6579     "^www4mail[ /]([0-9.]{1,10})" => "\\1"
6580     ),
6581     "uri" => "http://www.www4mail.org/"
6582     ),
6583     "wwwc" => array(
6584     "icon" => "wwwc",
6585     "title" => "WWWC",
6586     "rule" => array(
6587     "^WWWC[ /]([0-9.]{1,10})" => "\\1"
6588     ),
6589     "uri" => ""
6590     ),
6591     "wwwd" => array(
6592     "icon" => "robot",
6593     "title" => "WWWD",
6594     "rule" => array(
6595     "^WWWD[ /]([0-9.]{1,10})" => "\\1"
6596     ),
6597     "uri" => ""
6598     ),
6599     "wwweasel" => array(
6600     "icon" => "wwweasel",
6601     "title" => "WWWeasel",
6602     "rule" => array(
6603     "WWWeasel( Robot)?[/ ]v?([0-9.]{1,10})" => "\\2"
6604     ),
6605     "uri" => ""
6606     ),
6607     "wwwfi" => array(
6608     "icon" => "wwwfi",
6609     "title" => "www.fi",
6610     "rule" => array(
6611     "www\.fi crawler" => ""
6612     ),
6613     "uri" => "http://www.fi/"
6614     ),
6615     "wwwmechanize" => array(
6616     "icon" => "robot",
6617     "title" => "WWW-Mechanize",
6618     "rule" => array(
6619     "^WWW-Mechanize[/ ]([0-9.]{1,10})" => "\\1"
6620     ),
6621     "uri" => ""
6622     ),
6623     "wwwoffle" => array(
6624     "icon" => "robot",
6625     "title" => "WWWoffle",
6626     "rule" => array(
6627     "^wwwoffle[/ ]([0-9.]{1,10})" => "\\1"
6628     ),
6629     "uri" => ""
6630     ),
6631     "wwwster" => array(
6632     "icon" => "robot",
6633     "title" => "WWWster",
6634     "rule" => array(
6635     "^wwwster[/ ]([0-9.]{1,10})" => "\\1"
6636     ),
6637     "uri" => ""
6638     ),
6639     "wysigot" => array(
6640     "icon" => "wysigot",
6641     "title" => "Wysigot",
6642     "rule" => array(
6643     "Wysigot[/ ]([0-9.]{1,10})" => "\\1"
6644     ),
6645     "uri" => ""
6646     ),
6647     "xaldon" => array(
6648     "icon" => "xaldon",
6649     "title" => "Xaldon",
6650     "rule" => array(
6651     "Xaldon WebSpider" => ""
6652     ),
6653     "uri" => "http://www.xaldon.de/"
6654     ),
6655     "xenu" => array( // robot signature entry; "rule" maps a user-agent regex to a version backreference ("" = none captured)
6656     "icon" => "xenu",
6657     "title" => "Xenu Link Sleuth",
6658     "rule" => array(
6659     "Xenu Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\1",
6660     "Xenu(&#039;s)? Link Sleuth[/ ]([0-9a-z.]{1,10})" => "\\2", // group 1 is the optional "&#039;s"; the version is group 2
6661     "Xenu_Link_Sleuth_([0-9a-z.]{1,10})" => "\\1"
6662     ),
6663     "uri" => "http://home.snafu.de/tilman/xenulink.html"
6664     ),
6665     "xerka" => array(
6666     "icon" => "xerka",
6667     "title" => "Xerka",
6668     "rule" => array(
6669     "^Xerka WebBot v([0-9a-z.]{1,10})" => "\\1"
6670     ),
6671     "uri" => "http://www.diana-teknologia.com/www1/english/xerka.htm"
6672     ),
6673     "xirq" => array(
6674     "icon" => "robot",
6675     "title" => "XIRQ",
6676     "rule" => array(
6677     "^xirq[ /]([0-9a-z.]{1,10})" => "\\1"
6678     ),
6679     "uri" => "http://www.xirq.com"
6680     ),
6681     "xmlslurp" => array(
6682     "icon" => "robot",
6683     "title" => "XMLSlurp",
6684     "rule" => array(
6685     "^XMLSlurp[ /]([0-9a-z.]{1,10})" => "\\1"
6686     ),
6687     "uri" => ""
6688     ),
6689     "xml-sitemaps" => array(
6690     "icon" => "xml-sitemaps",
6691     "title" => "XML-Sitemaps",
6692     "rule" => array(
6693     "XML-Sitemaps[ /]([0-9a-z.]{1,10})" => "\\1"
6694     ),
6695     "uri" => ""
6696     ),
6697     "xmlrpc" => array(
6698     "icon" => "robot",
6699     "title" => "Trackback",
6700     "rule" => array(
6701     "XMLRPC" => ""
6702     ),
6703     "uri" => ""
6704     ),
6705 matthys 294 "xovi" => array(
6706     "icon" => "xovi",
6707     "title" => "Xovi",
6708     "rule" => array(
6709     "XoviBot[ /]([0-9a-z.]{1,10})" => "\\1"
6710     ),
6711     "uri" => "http://www.xovibot.net"
6712     ),
6713 joku 63 "yacy" => array(
6714     "icon" => "yacy",
6715     "title" => "Yacy",
6716     "rule" => array(
6717     "yacy\.net" => ""
6718     ),
6719     "uri" => ""
6720     ),
6721     "yahoo" => array(
6722     "icon" => "yahoo",
6723     "title" => "Yahoo",
6724     "rule" => array(
6725     "Yahoo(! ([a-z]{1,3} )?Slurp|-)" => "",
6726     "Yahoo-MMCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6727     "Yahoo-VerticalCrawler-FormerWebCrawler[/ ]([0-9a-z.]{1,10})" => "\\1",
6728     "^AnzwersCrawl[/ ]([0-9a-z.]{1,10})" => "\\1",
6729     "Y!J(-BSC|-SRD)*[/ ]([0-9a-z.]{1,10})" => "\\2",
6730     "Y!OASIS/TEST" => "",
6731     "Harvest-NG[/ ]([0-9a-z.]{1,10})" => "\\1",
6732     "Y!J; for robot study" => "",
6733     "Yahoo Japan; for robot study" => ""
6734     ),
6735     "uri" => "http://www.yahoo.com"
6736     ),
6737     "yahoo-feed" => array(
6738     "icon" => "yahoo",
6739     "title" => "Yahoo Feedseeker",
6740     "rule" => array(
6741     "^YahooFeedSeeker[/ ]([0-9a-z.]{1,10})" => "\\1"
6742     ),
6743     "uri" => "http://www.yahoo.com"
6744     ),
6745     "yandex" => array(
6746     "icon" => "yandex",
6747     "title" => "Yandex",
6748     "rule" => array(
6749     "Yandex[/ ]([0-9.]{1,10})" => "\\1",
6750     "Yandex(Bot|Images|Media|Antivirus)[/ ]([0-9.]{1,10})" => "\\2"
6751     ),
6752     "uri" => "http://yandex.com/bots"
6753     ),
6754     "yanga" => array(
6755     "icon" => "yanga",
6756     "title" => "Yanga",
6757     "rule" => array (
6758     "^Yanga.*v([0-9.]{1,10})" => "\\1"
6759     ),
6760     "uri" => "http://www.yanga.co.uk/"
6761     ),
6762     "yap" => array(
6763     "icon" => "yap",
6764     "title" => "Yap",
6765     "rule" => array(
6766     "^YapBot[_/ ]v([0-9.]{1,10})" => "\\1"
6767     ),
6768     "uri" => "http://www.yapinc.com/"
6769     ),
6770     "yarienavoir" => array(
6771     "icon" => "robot",
6772     "title" => "Yarienavoir",
6773     "rule" => array(
6774     "^yarienavoir.net[/ ]([0-9.]{1,10})" => "\\1"
6775     ),
6776     "uri" => "http://www.yarienavoir.net/"
6777     ),
6778     "yell" => array(
6779     "icon" => "yell",
6780     "title" => "Yell",
6781     "rule" => array(
6782     "YellCrawl[ /]V?([0-9.]{1,10})" => "\\1",
6783     "Yellbot[ /]Nutch-([0-9.]{1,10})" => "\\1",
6784     ),
6785     "uri" => ""
6786     ),
6787     "youdao" => array(
6788     "icon" => "youdao",
6789     "title" => "Youdao",
6790     "rule" => array(
6791     "YodaoBot-(Image|Mobile)?[ /]([0-9.]{1,10})" => "\\2",
6792     "YoudaoBot[ /]([0-9.]{1,10})" => "\\1"
6793     ),
6794     "uri" => "http://www.youdao.com/help/webmaster/spider/"
6795     ),
6796     "yoogli" => array(
6797     "icon" => "yoogli",
6798     "title" => "Yoogli",
6799     "rule" => array(
6800     "yoogliFetchAgent[ /]([0-9.]{1,10})" => "\\1"
6801     ),
6802     "uri" => "http://www.yoogli.com"
6803     ),
6804     "yotta" => array(
6805     "icon" => "robot",
6806     "title" => "Yotta",
6807     "rule" => array(
6808     "Yotta(Shopping|Cars)_Bot[ /]([0-9.]{1,10})" => "\\2",
6809     "OmniExplorer_Bot[ /]([0-9.]{1,10})" => "\\1"
6810     ),
6811     "uri" => "http://www.yottacars.com"
6812     ),
6813     "yoono" => array(
6814     "icon" => "yoono",
6815     "title" => "Yoono",
6816     "rule" => array(
6817     "Yoono" => ""
6818     ),
6819     "uri" => "http://www.yoono.com/"
6820     ),
6821     "yowedo" => array(
6822     "icon" => "robot",
6823     "title" => "Yowedo",
6824     "rule" => array(
6825     "Yowedo[ /]([0-9.]{1,10})" => "\\1"
6826     ),
6827     "uri" => "http://yowedo.com/en/partners.html"
6828     ),
6829     "yuntis" => array(
6830     "icon" => "robot",
6831 matthys 209 "title" => "Yuntis",
6832 joku 63 "rule" => array(
6833     "Gulper Web Bot[ /]([0-9.]{1,10})" => "\\1"
6834     ),
6835     "uri" => "http://yuntis.ecsl.cs.sunysb.edu/help/robot/"
6836     ),
6837     "zao" => array(
6838     "icon" => "robot",
6839     "title" => "Zao",
6840     "rule" => array(
6841     "Zao[ /]([0-9.]{1,10})" => "\\1",
6842     "Zao-crawler" => ""
6843     ),
6844     "uri" => ""
6845     ),
6846     "zealbot" => array(
6847     "icon" => "zeal",
6848     "title" => "ZealBot",
6849     "rule" => array(
6850     "Zealbot[ /]([0-9.]{1,10})" => "\\1"
6851     ),
6852     "uri" => ""
6853     ),
6854     "zearchit" => array(
6855     "icon" => "zearchit",
6856     "title" => "Zearchit",
6857     "rule" => array(
6858     "Zearchit" => ""
6859     ),
6860     "uri" => "http://www.zearchit.de/"
6861     ),
6862     "zebz" => array(
6863     "icon" => "robot",
6864     "title" => "ze.bz",
6865     "rule" => array(
6866     "^ZeBot_(lseek\.net|www\.ze\.bz)" => ""
6867     ),
6868     "uri" => "http://www.ze.bz/"
6869     ),
6870     "zedzo" => array(
6871     "icon" => "robot",
6872     "title" => "Zedzo",
6873     "rule" => array(
6874     "zedzo.digest[ /]([0-9.]{1,10})" => "\\1"
6875     ),
6876     "uri" => "http://www.zedzo.com/"
6877     ),
6878     "zerx" => array(
6879     "icon" => "zerx",
6880     "title" => "Zerx",
6881     "rule" => array(
6882     "^zerxbot[ /](Version|v)*[ /]*([0-9.]{1,10})" => "\\2"
6883     ),
6884     "uri" => "http://www.zerx.com/"
6885     ),
6886     "zeus" => array(
6887     "icon" => "zeus",
6888     "title" => "Zeus",
6889     "rule" => array(
6890     "Zeus" => ""
6891     ),
6892     "uri" => "http://www.zeus.com"
6893     ),
6894     "zippp" => array(
6895     "icon" => "robot",
6896     "title" => "Zippp",
6897     "rule" => array(
6898     "ZipppBot[ /]([0-9.]{1,10})" => "\\1"
6899     ),
6900     "uri" => ""
6901     ),
6902     "zippy" => array(
6903     "icon" => "robot",
6904     "title" => "Zippy",
6905     "rule" => array(
6906     "^Zippy[ v/]*([0-9.]{1,10})" => "\\1"
6907     ),
6908     "uri" => "http://www.zippyfinder.com"
6909     ),
6910     "zoeky" => array(
6911     "icon" => "robot",
6912     "title" => "Zoeky",
6913     "rule" => array(
6914     "Zoekybot[ /]([0-9.]{1,10})" => "\\1"
6915     ),
6916     "uri" => ""
6917     ),
6918     "zoom" => array(
6919     "icon" => "zoom",
6920 matthys 209 "title" => "ZoomSpider",
6921 joku 63 "rule" => array(
6922     "^ZoomSpider" => ""
6923     ),
6924     "uri" => "http://www.wrensoft.com/"
6925     ),
6926     "zspider" => array(
6927     "icon" => "robot",
6928 matthys 209 "title" => "Zspider",
6929 joku 63 "rule" => array(
6930     "zspider[ /]([0-9.a-z]{1,10})" => "\\1"
6931     ),
6932     "uri" => "http://feedback.redkolibri.com/"
6933     ),
6934 matthys 281 "zumbot" => array(
6935     "icon" => "robot",
6936     "title" => "ZUM Search",
6937     "rule" => array(
6938     "ZumBot[ /]([0-9.]{1,10})" => "\\1"
6939     ),
6940     "uri" => "http://help.zum.com/inquiry"
6941     ),
6942 joku 63 "zyborg" => array(
6943     "icon" => "zyborg",
6944     "title" => "WiseNutBot",
6945     "rule" => array(
6946     "(WISE|Zy)bo(rg|t)[ /]([0-9.]{1,10})" => "\\3"
6947     ),
6948     "uri" => ""
6949     ),
6950     // Catch-up entries for the originals; they have to stay in this order.
6951     "blogbot" => array(
6952     "icon" => "blogbot",
6953     "title" => "BlogBot",
6954     "rule" => array(
6955     "Blog[ \-]?Bot" => ""
6956     ),
6957     "uri" => "http://www.blogbot.com/"
6958     ),
6959     "centrum" => array(
6960     "icon" => "centrum",
6961     "title" => "Centrum",
6962     "rule" => array(
6963     "holmes[/ ]([0-9.]{1,10})" => "\\1",
6964     "^Centrum-checker" => ""
6965     ),
6966     "uri" => ""
6967     ),
6968     "httpclient" => array(
6969     "icon" => "robot",
6970     "title" => "HTTPClient",
6971     "rule" => array(
6972     "HTTP[ \-]?Client[ /]([0-9.]{1,10})" => "\\1",
6973     "HTTP[ \-]?Client" => ""
6974     ),
6975     "uri" => "http://www.innovation.ch/java/HTTPClient/"
6976     ),
6977     "incywincy" => array(
6978     "icon" => "robot",
6979     "title" => "IncyWincy",
6980     "rule" => array(
6981     "^IncyWincy[ /]([0-9.]{1,10})" => "\\1",
6982     "^IncyWincy" => ""
6983     ),
6984     "uri" => ""
6985     ),
6986     "java" => array(
6987     "icon" => "java",
6988     "title" => "Java",
6989     "rule" => array(
6990     "^java[ /]*([0-9.a-z]{1,10})" => "\\1"
6991     ),
6992     "uri" => ""
6993     ),
6994     "libfetch" => array(
6995     "icon" => "robot",
6996     "title" => "Libfetch",
6997     "rule" => array(
6998     "^(fetch )?libfetch[ /]([0-9.]{1,10})" => "\\2"
6999     ),
7000     "uri" => "http://www.freebsd.org/"
7001     ),
7002     "libwww" => array(
7003     "icon" => "libwww",
7004 matthys 209 "title" => "LibWWW",
7005 joku 63 "rule" => array(
7006     "^libww(w|w-perl|w-FM)[ /]([0-9.]{1,10})" => "\\2",
7007     "^libww(w|w-perl|w-FM)" => "",
7008     "MyApp.*libww(w|w-perl|w-FM)" => ""
7009     ),
7010     "uri" => ""
7011     ),
7012     "litefinder" => array(
7013     "icon" => "litefinder",
7014     "title" => "LiteFinder",
7015     "rule" => array(
7016     "LiteFinder[ /]([0-9.]{1,10})" => "\\1"
7017     ),
7018     "uri" => "http://www.litefinder.net/about.html"
7019     ),
7020     "nutchorg" => array(
7021     "icon" => "nutchorg",
7022     "title" => "Nutch",
7023     "rule" => array(
7024     "Nutc(hOrg|hCVS|h)?[ /]([0-9.]{1,10})" => "\\2",
7025     "Nutch" => ""
7026     ),
7027     "uri" => "http://lucene.apache.org/nutch/"
7028     ),
7029     "pythonurl" => array(
7030     "icon" => "pythonurl",
7031 joku 419 "title" => "Python",
7032 joku 63 "rule" => array(
7033 joku 418 "python-requests[ /]([0-9.]{1,10})" => "\\1",
7034 joku 63 "Python[ \-]?urllib" => ""
7035     ),
7036     "uri" => ""
7037     ),
7038     // Known robots classified as SPAM BOTS
7039     "SPAM" => array(
7040     "icon" => "robot",
7041     "title" => "SPAM",
7042     "rule" => array(
7043     "NASA Search[/ ]([0-9.]{1,10})" => "\\1",
7044     "^PHOTO CHECK" => "",
7045     "^FOTOCHECKER" => "",
7046     "^IPTC CHECK" => "",
7047     "^DataCha0s" => "",
7048 joku 420 "Expanse" => "",
7049     "CensysInspect[/ ]([0-9.]{1,10})" => "",
7050     "zgrab[/ ]([0-9.]{1,10})" => "",
7051 joku 63 "^Mac Finder" => "",
7052     "^Missigua Locator[ /]([0-9.]{1,10})" => "\\1",
7053     "^Missouri College Browse" => "",
7054     "Email[ \-]?Siphon" => "",
7055     "atSpider" => "",
7056     "autoemailspider" => "",
7057     "^Demo Bot" => "",
7058     "^Program Shareware" => "",
7059     "^Snapbot" => "",
7060     "^snap.com" => "",
7061     "^Guestbook Auto Submitter" => "",
7062     "panscient.com" => "",
7063     ),
7064     "uri" => ""
7065     ),
7066     // Things we don't know yet
7067     "robot" => array(
7068     "icon" => "robot",
7069     "title" => "Robot",
7070     "rule" => array(
7071     "(robot|spider|harvest|(?<!orange)bot|(?<!msie)crawler)" => ""
7072     )
7073     )
7074     );
7075 joku 261 ?>

Properties

Name Value
svn:keywords Id